diff --git a/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/eval_dior/parsed_answers_test/eval_liqingyun@SH-IDC1-10-140-37-21_device0_rank0.log b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/eval_dior/parsed_answers_test/eval_liqingyun@SH-IDC1-10-140-37-21_device0_rank0.log new file mode 100644 index 0000000000000000000000000000000000000000..c512f6ea7abf7d56a153b50afea69c48cd5a9770 --- /dev/null +++ b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/eval_dior/parsed_answers_test/eval_liqingyun@SH-IDC1-10-140-37-21_device0_rank0.log @@ -0,0 +1,42 @@ +2025/01/04 02:50:07 - dior test Evaluation - INFO - -------------------- +2025/01/04 02:50:09 - dior test Evaluation - INFO - Fuzzy matched vehicleicle to vehicle +2025/01/04 02:50:10 - dior test Evaluation - INFO - Fuzzy matched vehicleicle to vehicle +2025/01/04 02:50:11 - dior test Evaluation - INFO - Fuzzy matched groundtrackstation to trainstation +2025/01/04 02:50:12 - dior test Evaluation - INFO - Fuzzy matched tennicle to vehicle +2025/01/04 02:50:13 - dior test Evaluation - INFO - Fuzzy matched tennourt to tenniscourt +2025/01/04 02:50:15 - dior test Evaluation - INFO - Fuzzy matched storgetank to storagetank +2025/01/04 02:50:16 - dior test Evaluation - INFO - Fuzzy matched trainstationstationstation to trainstation +2025/01/04 02:50:16 - dior test Evaluation - INFO - Fuzzy matched storank to storagetank +2025/01/04 02:50:18 - dior test Evaluation - INFO - Fuzzy matched stadiumadiumadium to stadium +2025/01/04 02:50:19 - dior test Evaluation - INFO - Fuzzy matched storadium to stadium +2025/01/04 02:50:22 - dior test Evaluation - INFO - +---------------iou_thr: 0.5--------------- +2025/01/04 02:51:06 - dior test Evaluation - INFO - ++-------------------------+-------+-------+--------+-------+ +| class | gts | dets | recall | ap | ++-------------------------+-------+-------+--------+-------+ +| airplane | 8212 | 7661 | 0.827 | 0.746 | +| airport | 666 | 691 | 0.581 | 0.346 | +| baseballfield | 3434 | 2940 | 0.791 | 0.682 | +| basketballcourt | 2146 | 1951 | 0.832 | 0.758 | +| bridge | 2589 | 2178 | 0.421 | 0.277 | +| chimney | 1031 | 884 | 0.799 | 0.687 | +| expressway-service-area | 1085 | 1063 | 0.846 | 0.722 | +| expressway-toll-station | 688 | 685 | 0.749 | 0.570 | +| dam | 538 | 590 | 0.398 | 0.195 | +| golffield | 575 | 642 | 0.823 | 0.644 | +| groundtrackfield | 1885 | 2179 | 0.836 | 0.636 | +| harbor | 3105 | 3584 | 0.437 | 0.250 | +| overpass | 1782 | 1516 | 0.552 | 0.364 | +| ship | 35184 | 29010 | 0.677 | 0.543 | +| stadium | 672 | 517 | 0.564 | 0.478 | +| storagetank | 23361 | 17806 | 0.627 | 0.544 | +| tenniscourt | 7343 | 6754 | 0.849 | 0.775 | +| trainstation | 509 | 548 | 0.670 | 0.431 | +| vehicle | 26640 | 17384 | 0.471 | 0.355 | +| windmill | 2998 | 3007 | 0.780 | 0.598 | ++-------------------------+-------+-------+--------+-------+ +| mAP | | | | 0.530 | ++-------------------------+-------+-------+--------+-------+ +2025/01/04 02:51:06 - dior test Evaluation - INFO - -------------------- + diff --git a/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/trainer_state.json b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..446a809a3e05e780d23a05a509fa8534b9104b68 --- /dev/null +++ b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/trainer_state.json @@ -0,0 +1,256942 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 100.0, + "eval_steps": 200.0, + "global_step": 36700, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0027247956403269754, + "grad_norm": 40.78464126586914, + "learning_rate": 1.8165304268846506e-08, + "loss": 6.8438, + "step": 1 + }, + { + "epoch": 0.005449591280653951, + "grad_norm": 44.312137603759766, + "learning_rate": 3.633060853769301e-08, + "loss": 6.8809, + "step": 2 + }, + { + "epoch": 0.008174386920980926, + "grad_norm": 44.27949523925781, + "learning_rate": 5.449591280653951e-08, + "loss": 6.8516, + "step": 3 + }, + { + "epoch": 0.010899182561307902, + "grad_norm": 40.63651657104492, + "learning_rate": 7.266121707538602e-08, + "loss": 7.0879, + "step": 4 + }, + { + "epoch": 0.013623978201634877, + "grad_norm": 39.83088302612305, + "learning_rate": 9.082652134423253e-08, + "loss": 6.8555, + "step": 5 + }, + { + "epoch": 0.01634877384196185, + "grad_norm": 38.950218200683594, + "learning_rate": 1.0899182561307902e-07, + "loss": 6.9551, + "step": 6 + }, + { + "epoch": 0.01907356948228883, + "grad_norm": 40.39432144165039, + "learning_rate": 1.2715712988192554e-07, + "loss": 6.9512, + "step": 7 + }, + { + "epoch": 0.021798365122615803, + "grad_norm": 48.991764068603516, + "learning_rate": 1.4532243415077205e-07, + "loss": 7.0898, + "step": 8 + }, + { + "epoch": 0.02452316076294278, + "grad_norm": 49.33735275268555, + "learning_rate": 1.6348773841961852e-07, + "loss": 6.8613, + "step": 9 + }, + { + "epoch": 0.027247956403269755, + "grad_norm": 61.31592559814453, + "learning_rate": 1.8165304268846506e-07, + "loss": 6.8047, + "step": 10 + }, + { + "epoch": 0.02997275204359673, + "grad_norm": 39.412933349609375, + "learning_rate": 1.9981834695731156e-07, + "loss": 6.9297, + "step": 11 + }, + { + "epoch": 0.0326975476839237, + "grad_norm": 39.78142166137695, + "learning_rate": 2.1798365122615804e-07, + "loss": 7.0254, + "step": 12 + }, + { + "epoch": 0.035422343324250684, + "grad_norm": 38.37565994262695, + "learning_rate": 2.3614895549500455e-07, + "loss": 6.9766, + "step": 13 + }, + { + "epoch": 0.03814713896457766, + "grad_norm": 51.07477951049805, + "learning_rate": 2.543142597638511e-07, + "loss": 6.9414, + "step": 14 + }, + { + "epoch": 0.04087193460490463, + "grad_norm": 38.784751892089844, + "learning_rate": 2.7247956403269756e-07, + "loss": 6.8379, + "step": 15 + }, + { + "epoch": 0.043596730245231606, + "grad_norm": 38.25511932373047, + "learning_rate": 2.906448683015441e-07, + "loss": 6.8965, + "step": 16 + }, + { + "epoch": 0.04632152588555858, + "grad_norm": 32.41145324707031, + "learning_rate": 3.0881017257039057e-07, + "loss": 6.9238, + "step": 17 + }, + { + "epoch": 0.04904632152588556, + "grad_norm": 35.66207504272461, + "learning_rate": 3.2697547683923705e-07, + "loss": 6.9258, + "step": 18 + }, + { + "epoch": 0.051771117166212535, + "grad_norm": 57.06675720214844, + "learning_rate": 3.4514078110808363e-07, + "loss": 6.8262, + "step": 19 + }, + { + "epoch": 0.05449591280653951, + "grad_norm": 36.9990119934082, + "learning_rate": 3.633060853769301e-07, + "loss": 6.9121, + "step": 20 + }, + { + "epoch": 0.05722070844686648, + "grad_norm": 56.178890228271484, + "learning_rate": 3.814713896457766e-07, + "loss": 7.1934, + "step": 21 + }, + { + "epoch": 0.05994550408719346, + "grad_norm": 44.32059097290039, + "learning_rate": 3.996366939146231e-07, + "loss": 6.8652, + "step": 22 + }, + { + "epoch": 0.06267029972752043, + "grad_norm": 46.04462432861328, + "learning_rate": 4.178019981834696e-07, + "loss": 7.0117, + "step": 23 + }, + { + "epoch": 0.0653950953678474, + "grad_norm": 57.29674530029297, + "learning_rate": 4.359673024523161e-07, + "loss": 6.8086, + "step": 24 + }, + { + "epoch": 0.0681198910081744, + "grad_norm": 34.19939041137695, + "learning_rate": 4.541326067211626e-07, + "loss": 6.5684, + "step": 25 + }, + { + "epoch": 0.07084468664850137, + "grad_norm": 36.27748107910156, + "learning_rate": 4.722979109900091e-07, + "loss": 6.9805, + "step": 26 + }, + { + "epoch": 0.07356948228882834, + "grad_norm": 33.618751525878906, + "learning_rate": 4.904632152588557e-07, + "loss": 6.873, + "step": 27 + }, + { + "epoch": 0.07629427792915532, + "grad_norm": 38.21268844604492, + "learning_rate": 5.086285195277022e-07, + "loss": 6.7188, + "step": 28 + }, + { + "epoch": 0.07901907356948229, + "grad_norm": 40.83243942260742, + "learning_rate": 5.267938237965486e-07, + "loss": 6.8965, + "step": 29 + }, + { + "epoch": 0.08174386920980926, + "grad_norm": 34.49842071533203, + "learning_rate": 5.449591280653951e-07, + "loss": 7.0137, + "step": 30 + }, + { + "epoch": 0.08446866485013624, + "grad_norm": 41.635982513427734, + "learning_rate": 5.631244323342416e-07, + "loss": 7.0996, + "step": 31 + }, + { + "epoch": 0.08719346049046321, + "grad_norm": 53.25373458862305, + "learning_rate": 5.812897366030882e-07, + "loss": 7.1289, + "step": 32 + }, + { + "epoch": 0.08991825613079019, + "grad_norm": 31.06708526611328, + "learning_rate": 5.994550408719347e-07, + "loss": 6.5547, + "step": 33 + }, + { + "epoch": 0.09264305177111716, + "grad_norm": 53.0910530090332, + "learning_rate": 6.176203451407811e-07, + "loss": 6.9785, + "step": 34 + }, + { + "epoch": 0.09536784741144415, + "grad_norm": 38.88106918334961, + "learning_rate": 6.357856494096276e-07, + "loss": 6.8457, + "step": 35 + }, + { + "epoch": 0.09809264305177112, + "grad_norm": 37.74711608886719, + "learning_rate": 6.539509536784741e-07, + "loss": 6.7148, + "step": 36 + }, + { + "epoch": 0.1008174386920981, + "grad_norm": 63.326045989990234, + "learning_rate": 6.721162579473206e-07, + "loss": 6.7129, + "step": 37 + }, + { + "epoch": 0.10354223433242507, + "grad_norm": 33.27577209472656, + "learning_rate": 6.902815622161673e-07, + "loss": 6.7168, + "step": 38 + }, + { + "epoch": 0.10626702997275204, + "grad_norm": 31.722137451171875, + "learning_rate": 7.084468664850137e-07, + "loss": 6.7754, + "step": 39 + }, + { + "epoch": 0.10899182561307902, + "grad_norm": 44.16450881958008, + "learning_rate": 7.266121707538602e-07, + "loss": 6.8105, + "step": 40 + }, + { + "epoch": 0.11171662125340599, + "grad_norm": 38.69147491455078, + "learning_rate": 7.447774750227067e-07, + "loss": 6.6855, + "step": 41 + }, + { + "epoch": 0.11444141689373297, + "grad_norm": 27.381261825561523, + "learning_rate": 7.629427792915532e-07, + "loss": 6.623, + "step": 42 + }, + { + "epoch": 0.11716621253405994, + "grad_norm": 33.229217529296875, + "learning_rate": 7.811080835603997e-07, + "loss": 6.6211, + "step": 43 + }, + { + "epoch": 0.11989100817438691, + "grad_norm": 42.80620193481445, + "learning_rate": 7.992733878292462e-07, + "loss": 6.8574, + "step": 44 + }, + { + "epoch": 0.1226158038147139, + "grad_norm": 33.26158905029297, + "learning_rate": 8.174386920980927e-07, + "loss": 6.375, + "step": 45 + }, + { + "epoch": 0.12534059945504086, + "grad_norm": 26.46646499633789, + "learning_rate": 8.356039963669392e-07, + "loss": 6.3516, + "step": 46 + }, + { + "epoch": 0.12806539509536785, + "grad_norm": 32.222042083740234, + "learning_rate": 8.537693006357857e-07, + "loss": 6.4531, + "step": 47 + }, + { + "epoch": 0.1307901907356948, + "grad_norm": 38.365352630615234, + "learning_rate": 8.719346049046322e-07, + "loss": 6.6836, + "step": 48 + }, + { + "epoch": 0.1335149863760218, + "grad_norm": 28.54322052001953, + "learning_rate": 8.900999091734786e-07, + "loss": 6.498, + "step": 49 + }, + { + "epoch": 0.1362397820163488, + "grad_norm": 28.877483367919922, + "learning_rate": 9.082652134423252e-07, + "loss": 6.4141, + "step": 50 + }, + { + "epoch": 0.13896457765667575, + "grad_norm": 27.959054946899414, + "learning_rate": 9.264305177111717e-07, + "loss": 6.2188, + "step": 51 + }, + { + "epoch": 0.14168937329700274, + "grad_norm": 23.965312957763672, + "learning_rate": 9.445958219800182e-07, + "loss": 6.3184, + "step": 52 + }, + { + "epoch": 0.1444141689373297, + "grad_norm": 59.07518768310547, + "learning_rate": 9.627611262488648e-07, + "loss": 6.5605, + "step": 53 + }, + { + "epoch": 0.14713896457765668, + "grad_norm": 29.662635803222656, + "learning_rate": 9.809264305177114e-07, + "loss": 6.2461, + "step": 54 + }, + { + "epoch": 0.14986376021798364, + "grad_norm": 29.20414161682129, + "learning_rate": 9.990917347865577e-07, + "loss": 6.3477, + "step": 55 + }, + { + "epoch": 0.15258855585831063, + "grad_norm": 37.64859390258789, + "learning_rate": 1.0172570390554043e-06, + "loss": 6.0879, + "step": 56 + }, + { + "epoch": 0.1553133514986376, + "grad_norm": 30.13629150390625, + "learning_rate": 1.0354223433242507e-06, + "loss": 6.293, + "step": 57 + }, + { + "epoch": 0.15803814713896458, + "grad_norm": 21.255197525024414, + "learning_rate": 1.0535876475930973e-06, + "loss": 6.3887, + "step": 58 + }, + { + "epoch": 0.16076294277929154, + "grad_norm": 29.932714462280273, + "learning_rate": 1.0717529518619439e-06, + "loss": 6.1172, + "step": 59 + }, + { + "epoch": 0.16348773841961853, + "grad_norm": 23.474641799926758, + "learning_rate": 1.0899182561307902e-06, + "loss": 6.1816, + "step": 60 + }, + { + "epoch": 0.16621253405994552, + "grad_norm": 22.93517303466797, + "learning_rate": 1.1080835603996368e-06, + "loss": 6.3008, + "step": 61 + }, + { + "epoch": 0.16893732970027248, + "grad_norm": 19.647396087646484, + "learning_rate": 1.1262488646684832e-06, + "loss": 6.0918, + "step": 62 + }, + { + "epoch": 0.17166212534059946, + "grad_norm": 25.928668975830078, + "learning_rate": 1.1444141689373298e-06, + "loss": 5.9766, + "step": 63 + }, + { + "epoch": 0.17438692098092642, + "grad_norm": 23.329084396362305, + "learning_rate": 1.1625794732061764e-06, + "loss": 5.9316, + "step": 64 + }, + { + "epoch": 0.1771117166212534, + "grad_norm": 28.719526290893555, + "learning_rate": 1.1807447774750227e-06, + "loss": 5.9121, + "step": 65 + }, + { + "epoch": 0.17983651226158037, + "grad_norm": 23.34282112121582, + "learning_rate": 1.1989100817438693e-06, + "loss": 5.7422, + "step": 66 + }, + { + "epoch": 0.18256130790190736, + "grad_norm": 23.170896530151367, + "learning_rate": 1.217075386012716e-06, + "loss": 5.7812, + "step": 67 + }, + { + "epoch": 0.18528610354223432, + "grad_norm": 17.787656784057617, + "learning_rate": 1.2352406902815623e-06, + "loss": 5.9316, + "step": 68 + }, + { + "epoch": 0.1880108991825613, + "grad_norm": 28.331361770629883, + "learning_rate": 1.2534059945504087e-06, + "loss": 5.6387, + "step": 69 + }, + { + "epoch": 0.1907356948228883, + "grad_norm": 20.090055465698242, + "learning_rate": 1.2715712988192552e-06, + "loss": 5.7715, + "step": 70 + }, + { + "epoch": 0.19346049046321526, + "grad_norm": 20.68782615661621, + "learning_rate": 1.2897366030881018e-06, + "loss": 5.457, + "step": 71 + }, + { + "epoch": 0.19618528610354224, + "grad_norm": 16.90093421936035, + "learning_rate": 1.3079019073569482e-06, + "loss": 5.6348, + "step": 72 + }, + { + "epoch": 0.1989100817438692, + "grad_norm": 50.501258850097656, + "learning_rate": 1.3260672116257948e-06, + "loss": 5.5293, + "step": 73 + }, + { + "epoch": 0.2016348773841962, + "grad_norm": 18.65361213684082, + "learning_rate": 1.3442325158946412e-06, + "loss": 5.4395, + "step": 74 + }, + { + "epoch": 0.20435967302452315, + "grad_norm": 32.909339904785156, + "learning_rate": 1.362397820163488e-06, + "loss": 5.5742, + "step": 75 + }, + { + "epoch": 0.20708446866485014, + "grad_norm": 17.824298858642578, + "learning_rate": 1.3805631244323345e-06, + "loss": 5.6914, + "step": 76 + }, + { + "epoch": 0.2098092643051771, + "grad_norm": 20.759225845336914, + "learning_rate": 1.398728428701181e-06, + "loss": 5.418, + "step": 77 + }, + { + "epoch": 0.2125340599455041, + "grad_norm": 20.385583877563477, + "learning_rate": 1.4168937329700275e-06, + "loss": 5.3809, + "step": 78 + }, + { + "epoch": 0.21525885558583105, + "grad_norm": 16.89611053466797, + "learning_rate": 1.4350590372388739e-06, + "loss": 5.4844, + "step": 79 + }, + { + "epoch": 0.21798365122615804, + "grad_norm": 22.670808792114258, + "learning_rate": 1.4532243415077205e-06, + "loss": 5.3105, + "step": 80 + }, + { + "epoch": 0.22070844686648503, + "grad_norm": 20.921186447143555, + "learning_rate": 1.471389645776567e-06, + "loss": 5.2852, + "step": 81 + }, + { + "epoch": 0.22343324250681199, + "grad_norm": 18.31825065612793, + "learning_rate": 1.4895549500454134e-06, + "loss": 5.4473, + "step": 82 + }, + { + "epoch": 0.22615803814713897, + "grad_norm": 17.247661590576172, + "learning_rate": 1.50772025431426e-06, + "loss": 5.2773, + "step": 83 + }, + { + "epoch": 0.22888283378746593, + "grad_norm": 26.34626579284668, + "learning_rate": 1.5258855585831064e-06, + "loss": 5.291, + "step": 84 + }, + { + "epoch": 0.23160762942779292, + "grad_norm": 21.106550216674805, + "learning_rate": 1.544050862851953e-06, + "loss": 5.4531, + "step": 85 + }, + { + "epoch": 0.23433242506811988, + "grad_norm": 25.7116756439209, + "learning_rate": 1.5622161671207993e-06, + "loss": 5.2168, + "step": 86 + }, + { + "epoch": 0.23705722070844687, + "grad_norm": 21.119768142700195, + "learning_rate": 1.580381471389646e-06, + "loss": 5.3438, + "step": 87 + }, + { + "epoch": 0.23978201634877383, + "grad_norm": 20.929882049560547, + "learning_rate": 1.5985467756584925e-06, + "loss": 5.1504, + "step": 88 + }, + { + "epoch": 0.24250681198910082, + "grad_norm": 29.220802307128906, + "learning_rate": 1.6167120799273389e-06, + "loss": 4.918, + "step": 89 + }, + { + "epoch": 0.2452316076294278, + "grad_norm": 35.418941497802734, + "learning_rate": 1.6348773841961855e-06, + "loss": 5.0137, + "step": 90 + }, + { + "epoch": 0.24795640326975477, + "grad_norm": 16.804855346679688, + "learning_rate": 1.6530426884650318e-06, + "loss": 5.1211, + "step": 91 + }, + { + "epoch": 0.2506811989100817, + "grad_norm": 17.878726959228516, + "learning_rate": 1.6712079927338784e-06, + "loss": 5.1953, + "step": 92 + }, + { + "epoch": 0.25340599455040874, + "grad_norm": 18.441425323486328, + "learning_rate": 1.689373297002725e-06, + "loss": 4.7861, + "step": 93 + }, + { + "epoch": 0.2561307901907357, + "grad_norm": 21.388906478881836, + "learning_rate": 1.7075386012715714e-06, + "loss": 4.8379, + "step": 94 + }, + { + "epoch": 0.25885558583106266, + "grad_norm": 19.879146575927734, + "learning_rate": 1.725703905540418e-06, + "loss": 4.7842, + "step": 95 + }, + { + "epoch": 0.2615803814713896, + "grad_norm": 24.641145706176758, + "learning_rate": 1.7438692098092643e-06, + "loss": 4.9785, + "step": 96 + }, + { + "epoch": 0.26430517711171664, + "grad_norm": 13.113323211669922, + "learning_rate": 1.762034514078111e-06, + "loss": 4.6279, + "step": 97 + }, + { + "epoch": 0.2670299727520436, + "grad_norm": 16.05596923828125, + "learning_rate": 1.7801998183469573e-06, + "loss": 4.3711, + "step": 98 + }, + { + "epoch": 0.26975476839237056, + "grad_norm": 14.967947006225586, + "learning_rate": 1.7983651226158039e-06, + "loss": 4.376, + "step": 99 + }, + { + "epoch": 0.2724795640326976, + "grad_norm": 15.026629447937012, + "learning_rate": 1.8165304268846505e-06, + "loss": 5.0801, + "step": 100 + }, + { + "epoch": 0.27520435967302453, + "grad_norm": 15.951396942138672, + "learning_rate": 1.8346957311534968e-06, + "loss": 4.8525, + "step": 101 + }, + { + "epoch": 0.2779291553133515, + "grad_norm": 13.121307373046875, + "learning_rate": 1.8528610354223434e-06, + "loss": 4.4746, + "step": 102 + }, + { + "epoch": 0.28065395095367845, + "grad_norm": 14.952683448791504, + "learning_rate": 1.8710263396911898e-06, + "loss": 4.665, + "step": 103 + }, + { + "epoch": 0.28337874659400547, + "grad_norm": 13.740148544311523, + "learning_rate": 1.8891916439600364e-06, + "loss": 4.3633, + "step": 104 + }, + { + "epoch": 0.28610354223433243, + "grad_norm": 15.738082885742188, + "learning_rate": 1.907356948228883e-06, + "loss": 4.5303, + "step": 105 + }, + { + "epoch": 0.2888283378746594, + "grad_norm": 12.909492492675781, + "learning_rate": 1.9255222524977295e-06, + "loss": 4.3691, + "step": 106 + }, + { + "epoch": 0.29155313351498635, + "grad_norm": 15.026860237121582, + "learning_rate": 1.943687556766576e-06, + "loss": 4.6152, + "step": 107 + }, + { + "epoch": 0.29427792915531337, + "grad_norm": 13.496101379394531, + "learning_rate": 1.9618528610354227e-06, + "loss": 4.2588, + "step": 108 + }, + { + "epoch": 0.2970027247956403, + "grad_norm": 14.526864051818848, + "learning_rate": 1.9800181653042693e-06, + "loss": 4.4912, + "step": 109 + }, + { + "epoch": 0.2997275204359673, + "grad_norm": 12.712934494018555, + "learning_rate": 1.9981834695731155e-06, + "loss": 4.4111, + "step": 110 + }, + { + "epoch": 0.3024523160762943, + "grad_norm": 11.968435287475586, + "learning_rate": 2.016348773841962e-06, + "loss": 4.4316, + "step": 111 + }, + { + "epoch": 0.30517711171662126, + "grad_norm": 13.326701164245605, + "learning_rate": 2.0345140781108086e-06, + "loss": 4.5, + "step": 112 + }, + { + "epoch": 0.3079019073569482, + "grad_norm": 16.02067756652832, + "learning_rate": 2.0526793823796552e-06, + "loss": 4.124, + "step": 113 + }, + { + "epoch": 0.3106267029972752, + "grad_norm": 13.210917472839355, + "learning_rate": 2.0708446866485014e-06, + "loss": 4.3545, + "step": 114 + }, + { + "epoch": 0.3133514986376022, + "grad_norm": 12.205485343933105, + "learning_rate": 2.089009990917348e-06, + "loss": 4.6543, + "step": 115 + }, + { + "epoch": 0.31607629427792916, + "grad_norm": 11.650239944458008, + "learning_rate": 2.1071752951861945e-06, + "loss": 4.3682, + "step": 116 + }, + { + "epoch": 0.3188010899182561, + "grad_norm": 11.849342346191406, + "learning_rate": 2.125340599455041e-06, + "loss": 4.4482, + "step": 117 + }, + { + "epoch": 0.3215258855585831, + "grad_norm": 10.80008316040039, + "learning_rate": 2.1435059037238877e-06, + "loss": 3.9756, + "step": 118 + }, + { + "epoch": 0.3242506811989101, + "grad_norm": 12.67882251739502, + "learning_rate": 2.161671207992734e-06, + "loss": 4.2832, + "step": 119 + }, + { + "epoch": 0.32697547683923706, + "grad_norm": 10.75010871887207, + "learning_rate": 2.1798365122615805e-06, + "loss": 4.3525, + "step": 120 + }, + { + "epoch": 0.329700272479564, + "grad_norm": 10.905150413513184, + "learning_rate": 2.198001816530427e-06, + "loss": 4.3975, + "step": 121 + }, + { + "epoch": 0.33242506811989103, + "grad_norm": 12.39403247833252, + "learning_rate": 2.2161671207992736e-06, + "loss": 4.5381, + "step": 122 + }, + { + "epoch": 0.335149863760218, + "grad_norm": 13.479368209838867, + "learning_rate": 2.2343324250681202e-06, + "loss": 3.8682, + "step": 123 + }, + { + "epoch": 0.33787465940054495, + "grad_norm": 13.995524406433105, + "learning_rate": 2.2524977293369664e-06, + "loss": 4.3496, + "step": 124 + }, + { + "epoch": 0.3405994550408719, + "grad_norm": 12.977371215820312, + "learning_rate": 2.270663033605813e-06, + "loss": 4.0049, + "step": 125 + }, + { + "epoch": 0.34332425068119893, + "grad_norm": 11.538091659545898, + "learning_rate": 2.2888283378746596e-06, + "loss": 4.4365, + "step": 126 + }, + { + "epoch": 0.3460490463215259, + "grad_norm": 12.014766693115234, + "learning_rate": 2.306993642143506e-06, + "loss": 4.0898, + "step": 127 + }, + { + "epoch": 0.34877384196185285, + "grad_norm": 10.364009857177734, + "learning_rate": 2.3251589464123527e-06, + "loss": 4.292, + "step": 128 + }, + { + "epoch": 0.35149863760217986, + "grad_norm": 10.310364723205566, + "learning_rate": 2.343324250681199e-06, + "loss": 3.9658, + "step": 129 + }, + { + "epoch": 0.3542234332425068, + "grad_norm": 14.921072959899902, + "learning_rate": 2.3614895549500455e-06, + "loss": 3.9932, + "step": 130 + }, + { + "epoch": 0.3569482288828338, + "grad_norm": 11.562774658203125, + "learning_rate": 2.379654859218892e-06, + "loss": 4.292, + "step": 131 + }, + { + "epoch": 0.35967302452316074, + "grad_norm": 12.198079109191895, + "learning_rate": 2.3978201634877386e-06, + "loss": 4.2441, + "step": 132 + }, + { + "epoch": 0.36239782016348776, + "grad_norm": 12.380412101745605, + "learning_rate": 2.415985467756585e-06, + "loss": 4.2373, + "step": 133 + }, + { + "epoch": 0.3651226158038147, + "grad_norm": 11.048654556274414, + "learning_rate": 2.434150772025432e-06, + "loss": 3.998, + "step": 134 + }, + { + "epoch": 0.3678474114441417, + "grad_norm": 17.524181365966797, + "learning_rate": 2.4523160762942784e-06, + "loss": 4.0967, + "step": 135 + }, + { + "epoch": 0.37057220708446864, + "grad_norm": 12.678315162658691, + "learning_rate": 2.4704813805631246e-06, + "loss": 4.1025, + "step": 136 + }, + { + "epoch": 0.37329700272479566, + "grad_norm": 10.025920867919922, + "learning_rate": 2.488646684831971e-06, + "loss": 4.0293, + "step": 137 + }, + { + "epoch": 0.3760217983651226, + "grad_norm": 14.001442909240723, + "learning_rate": 2.5068119891008173e-06, + "loss": 4.0107, + "step": 138 + }, + { + "epoch": 0.3787465940054496, + "grad_norm": 13.694280624389648, + "learning_rate": 2.5249772933696643e-06, + "loss": 3.9805, + "step": 139 + }, + { + "epoch": 0.3814713896457766, + "grad_norm": 10.68122673034668, + "learning_rate": 2.5431425976385105e-06, + "loss": 3.8984, + "step": 140 + }, + { + "epoch": 0.38419618528610355, + "grad_norm": 17.292200088500977, + "learning_rate": 2.561307901907357e-06, + "loss": 3.8594, + "step": 141 + }, + { + "epoch": 0.3869209809264305, + "grad_norm": 11.216814041137695, + "learning_rate": 2.5794732061762036e-06, + "loss": 3.9932, + "step": 142 + }, + { + "epoch": 0.3896457765667575, + "grad_norm": 11.111741065979004, + "learning_rate": 2.5976385104450502e-06, + "loss": 3.8643, + "step": 143 + }, + { + "epoch": 0.3923705722070845, + "grad_norm": 12.438227653503418, + "learning_rate": 2.6158038147138964e-06, + "loss": 3.7656, + "step": 144 + }, + { + "epoch": 0.39509536784741145, + "grad_norm": 11.749055862426758, + "learning_rate": 2.6339691189827434e-06, + "loss": 3.8945, + "step": 145 + }, + { + "epoch": 0.3978201634877384, + "grad_norm": 12.600846290588379, + "learning_rate": 2.6521344232515896e-06, + "loss": 4.1074, + "step": 146 + }, + { + "epoch": 0.40054495912806537, + "grad_norm": 10.880453109741211, + "learning_rate": 2.670299727520436e-06, + "loss": 4.0225, + "step": 147 + }, + { + "epoch": 0.4032697547683924, + "grad_norm": 10.751895904541016, + "learning_rate": 2.6884650317892823e-06, + "loss": 4.0391, + "step": 148 + }, + { + "epoch": 0.40599455040871935, + "grad_norm": 12.65353775024414, + "learning_rate": 2.7066303360581293e-06, + "loss": 4.0244, + "step": 149 + }, + { + "epoch": 0.4087193460490463, + "grad_norm": 13.534128189086914, + "learning_rate": 2.724795640326976e-06, + "loss": 3.7412, + "step": 150 + }, + { + "epoch": 0.4114441416893733, + "grad_norm": 13.41270923614502, + "learning_rate": 2.742960944595822e-06, + "loss": 3.8105, + "step": 151 + }, + { + "epoch": 0.4141689373297003, + "grad_norm": 11.690704345703125, + "learning_rate": 2.761126248864669e-06, + "loss": 4.0684, + "step": 152 + }, + { + "epoch": 0.41689373297002724, + "grad_norm": 12.114771842956543, + "learning_rate": 2.7792915531335152e-06, + "loss": 3.751, + "step": 153 + }, + { + "epoch": 0.4196185286103542, + "grad_norm": 46.29283142089844, + "learning_rate": 2.797456857402362e-06, + "loss": 3.875, + "step": 154 + }, + { + "epoch": 0.4223433242506812, + "grad_norm": 15.252677917480469, + "learning_rate": 2.815622161671208e-06, + "loss": 3.8926, + "step": 155 + }, + { + "epoch": 0.4250681198910082, + "grad_norm": 9.994403839111328, + "learning_rate": 2.833787465940055e-06, + "loss": 3.6943, + "step": 156 + }, + { + "epoch": 0.42779291553133514, + "grad_norm": 12.046945571899414, + "learning_rate": 2.851952770208901e-06, + "loss": 3.8477, + "step": 157 + }, + { + "epoch": 0.4305177111716621, + "grad_norm": 10.81486701965332, + "learning_rate": 2.8701180744777477e-06, + "loss": 3.9033, + "step": 158 + }, + { + "epoch": 0.4332425068119891, + "grad_norm": 10.982769966125488, + "learning_rate": 2.8882833787465943e-06, + "loss": 3.707, + "step": 159 + }, + { + "epoch": 0.4359673024523161, + "grad_norm": 21.560009002685547, + "learning_rate": 2.906448683015441e-06, + "loss": 3.709, + "step": 160 + }, + { + "epoch": 0.43869209809264303, + "grad_norm": 10.339600563049316, + "learning_rate": 2.924613987284287e-06, + "loss": 3.6982, + "step": 161 + }, + { + "epoch": 0.44141689373297005, + "grad_norm": 12.688766479492188, + "learning_rate": 2.942779291553134e-06, + "loss": 3.7021, + "step": 162 + }, + { + "epoch": 0.444141689373297, + "grad_norm": 13.196794509887695, + "learning_rate": 2.9609445958219802e-06, + "loss": 3.5156, + "step": 163 + }, + { + "epoch": 0.44686648501362397, + "grad_norm": 11.564620971679688, + "learning_rate": 2.979109900090827e-06, + "loss": 3.8828, + "step": 164 + }, + { + "epoch": 0.44959128065395093, + "grad_norm": 10.873297691345215, + "learning_rate": 2.997275204359673e-06, + "loss": 3.7412, + "step": 165 + }, + { + "epoch": 0.45231607629427795, + "grad_norm": 11.341376304626465, + "learning_rate": 3.01544050862852e-06, + "loss": 3.7471, + "step": 166 + }, + { + "epoch": 0.4550408719346049, + "grad_norm": 12.239847183227539, + "learning_rate": 3.033605812897366e-06, + "loss": 3.6182, + "step": 167 + }, + { + "epoch": 0.45776566757493187, + "grad_norm": 10.07335376739502, + "learning_rate": 3.0517711171662127e-06, + "loss": 3.5586, + "step": 168 + }, + { + "epoch": 0.4604904632152589, + "grad_norm": 12.485919952392578, + "learning_rate": 3.069936421435059e-06, + "loss": 3.7471, + "step": 169 + }, + { + "epoch": 0.46321525885558584, + "grad_norm": 13.17069149017334, + "learning_rate": 3.088101725703906e-06, + "loss": 3.79, + "step": 170 + }, + { + "epoch": 0.4659400544959128, + "grad_norm": 10.066970825195312, + "learning_rate": 3.106267029972752e-06, + "loss": 3.8877, + "step": 171 + }, + { + "epoch": 0.46866485013623976, + "grad_norm": 10.02057933807373, + "learning_rate": 3.1244323342415987e-06, + "loss": 3.8125, + "step": 172 + }, + { + "epoch": 0.4713896457765668, + "grad_norm": 9.856107711791992, + "learning_rate": 3.1425976385104452e-06, + "loss": 3.46, + "step": 173 + }, + { + "epoch": 0.47411444141689374, + "grad_norm": 9.71706771850586, + "learning_rate": 3.160762942779292e-06, + "loss": 3.7637, + "step": 174 + }, + { + "epoch": 0.4768392370572207, + "grad_norm": 10.88630199432373, + "learning_rate": 3.178928247048138e-06, + "loss": 3.6582, + "step": 175 + }, + { + "epoch": 0.47956403269754766, + "grad_norm": 14.558564186096191, + "learning_rate": 3.197093551316985e-06, + "loss": 3.7422, + "step": 176 + }, + { + "epoch": 0.4822888283378747, + "grad_norm": 16.139097213745117, + "learning_rate": 3.215258855585831e-06, + "loss": 3.7441, + "step": 177 + }, + { + "epoch": 0.48501362397820164, + "grad_norm": 9.087676048278809, + "learning_rate": 3.2334241598546777e-06, + "loss": 3.6074, + "step": 178 + }, + { + "epoch": 0.4877384196185286, + "grad_norm": 11.948226928710938, + "learning_rate": 3.2515894641235247e-06, + "loss": 3.5625, + "step": 179 + }, + { + "epoch": 0.4904632152588556, + "grad_norm": 10.44946002960205, + "learning_rate": 3.269754768392371e-06, + "loss": 3.6328, + "step": 180 + }, + { + "epoch": 0.49318801089918257, + "grad_norm": 13.133516311645508, + "learning_rate": 3.2879200726612175e-06, + "loss": 3.7539, + "step": 181 + }, + { + "epoch": 0.49591280653950953, + "grad_norm": 9.692259788513184, + "learning_rate": 3.3060853769300637e-06, + "loss": 3.4502, + "step": 182 + }, + { + "epoch": 0.4986376021798365, + "grad_norm": 14.369646072387695, + "learning_rate": 3.3242506811989107e-06, + "loss": 3.4297, + "step": 183 + }, + { + "epoch": 0.5013623978201635, + "grad_norm": 14.707884788513184, + "learning_rate": 3.342415985467757e-06, + "loss": 3.4756, + "step": 184 + }, + { + "epoch": 0.5040871934604905, + "grad_norm": 11.313895225524902, + "learning_rate": 3.3605812897366034e-06, + "loss": 3.7871, + "step": 185 + }, + { + "epoch": 0.5068119891008175, + "grad_norm": 12.058860778808594, + "learning_rate": 3.37874659400545e-06, + "loss": 3.4521, + "step": 186 + }, + { + "epoch": 0.5095367847411444, + "grad_norm": 9.204839706420898, + "learning_rate": 3.3969118982742966e-06, + "loss": 3.623, + "step": 187 + }, + { + "epoch": 0.5122615803814714, + "grad_norm": 16.05647087097168, + "learning_rate": 3.4150772025431427e-06, + "loss": 3.5137, + "step": 188 + }, + { + "epoch": 0.5149863760217984, + "grad_norm": 11.145015716552734, + "learning_rate": 3.4332425068119898e-06, + "loss": 3.5723, + "step": 189 + }, + { + "epoch": 0.5177111716621253, + "grad_norm": 10.855523109436035, + "learning_rate": 3.451407811080836e-06, + "loss": 3.2344, + "step": 190 + }, + { + "epoch": 0.5204359673024523, + "grad_norm": 10.985532760620117, + "learning_rate": 3.4695731153496825e-06, + "loss": 3.6309, + "step": 191 + }, + { + "epoch": 0.5231607629427792, + "grad_norm": 12.266671180725098, + "learning_rate": 3.4877384196185287e-06, + "loss": 3.3369, + "step": 192 + }, + { + "epoch": 0.5258855585831063, + "grad_norm": 10.597880363464355, + "learning_rate": 3.5059037238873757e-06, + "loss": 3.4443, + "step": 193 + }, + { + "epoch": 0.5286103542234333, + "grad_norm": 19.650754928588867, + "learning_rate": 3.524069028156222e-06, + "loss": 3.5801, + "step": 194 + }, + { + "epoch": 0.5313351498637602, + "grad_norm": 11.14974308013916, + "learning_rate": 3.5422343324250684e-06, + "loss": 3.4766, + "step": 195 + }, + { + "epoch": 0.5340599455040872, + "grad_norm": 11.0927734375, + "learning_rate": 3.5603996366939146e-06, + "loss": 3.3281, + "step": 196 + }, + { + "epoch": 0.5367847411444142, + "grad_norm": 10.628003120422363, + "learning_rate": 3.5785649409627616e-06, + "loss": 3.293, + "step": 197 + }, + { + "epoch": 0.5395095367847411, + "grad_norm": 10.564107894897461, + "learning_rate": 3.5967302452316077e-06, + "loss": 3.1475, + "step": 198 + }, + { + "epoch": 0.5422343324250681, + "grad_norm": 13.25076961517334, + "learning_rate": 3.6148955495004543e-06, + "loss": 3.4648, + "step": 199 + }, + { + "epoch": 0.5449591280653951, + "grad_norm": 14.788480758666992, + "learning_rate": 3.633060853769301e-06, + "loss": 3.4941, + "step": 200 + }, + { + "epoch": 0.547683923705722, + "grad_norm": 9.797980308532715, + "learning_rate": 3.6512261580381475e-06, + "loss": 3.1133, + "step": 201 + }, + { + "epoch": 0.5504087193460491, + "grad_norm": 13.813182830810547, + "learning_rate": 3.6693914623069937e-06, + "loss": 3.3164, + "step": 202 + }, + { + "epoch": 0.553133514986376, + "grad_norm": 15.10222053527832, + "learning_rate": 3.6875567665758407e-06, + "loss": 3.5234, + "step": 203 + }, + { + "epoch": 0.555858310626703, + "grad_norm": 12.306085586547852, + "learning_rate": 3.705722070844687e-06, + "loss": 3.334, + "step": 204 + }, + { + "epoch": 0.55858310626703, + "grad_norm": 9.715800285339355, + "learning_rate": 3.7238873751135334e-06, + "loss": 3.4756, + "step": 205 + }, + { + "epoch": 0.5613079019073569, + "grad_norm": 12.598706245422363, + "learning_rate": 3.7420526793823796e-06, + "loss": 3.4111, + "step": 206 + }, + { + "epoch": 0.5640326975476839, + "grad_norm": 8.66494369506836, + "learning_rate": 3.7602179836512266e-06, + "loss": 3.4951, + "step": 207 + }, + { + "epoch": 0.5667574931880109, + "grad_norm": 9.56230354309082, + "learning_rate": 3.7783832879200728e-06, + "loss": 3.624, + "step": 208 + }, + { + "epoch": 0.5694822888283378, + "grad_norm": 10.649101257324219, + "learning_rate": 3.7965485921889193e-06, + "loss": 3.3105, + "step": 209 + }, + { + "epoch": 0.5722070844686649, + "grad_norm": 12.988601684570312, + "learning_rate": 3.814713896457766e-06, + "loss": 3.1914, + "step": 210 + }, + { + "epoch": 0.5749318801089919, + "grad_norm": 10.908307075500488, + "learning_rate": 3.832879200726612e-06, + "loss": 3.752, + "step": 211 + }, + { + "epoch": 0.5776566757493188, + "grad_norm": 20.07297706604004, + "learning_rate": 3.851044504995459e-06, + "loss": 3.5322, + "step": 212 + }, + { + "epoch": 0.5803814713896458, + "grad_norm": 11.026345252990723, + "learning_rate": 3.869209809264305e-06, + "loss": 3.6133, + "step": 213 + }, + { + "epoch": 0.5831062670299727, + "grad_norm": 11.130549430847168, + "learning_rate": 3.887375113533152e-06, + "loss": 3.3799, + "step": 214 + }, + { + "epoch": 0.5858310626702997, + "grad_norm": 12.440305709838867, + "learning_rate": 3.9055404178019984e-06, + "loss": 3.1426, + "step": 215 + }, + { + "epoch": 0.5885558583106267, + "grad_norm": 10.083247184753418, + "learning_rate": 3.9237057220708454e-06, + "loss": 3.4043, + "step": 216 + }, + { + "epoch": 0.5912806539509536, + "grad_norm": 10.952589988708496, + "learning_rate": 3.941871026339692e-06, + "loss": 3.7031, + "step": 217 + }, + { + "epoch": 0.5940054495912807, + "grad_norm": 12.696151733398438, + "learning_rate": 3.960036330608539e-06, + "loss": 3.3369, + "step": 218 + }, + { + "epoch": 0.5967302452316077, + "grad_norm": 11.99606990814209, + "learning_rate": 3.978201634877385e-06, + "loss": 3.4512, + "step": 219 + }, + { + "epoch": 0.5994550408719346, + "grad_norm": 10.46695613861084, + "learning_rate": 3.996366939146231e-06, + "loss": 3.3955, + "step": 220 + }, + { + "epoch": 0.6021798365122616, + "grad_norm": 10.558157920837402, + "learning_rate": 4.014532243415077e-06, + "loss": 3.4482, + "step": 221 + }, + { + "epoch": 0.6049046321525886, + "grad_norm": 8.639076232910156, + "learning_rate": 4.032697547683924e-06, + "loss": 3.1802, + "step": 222 + }, + { + "epoch": 0.6076294277929155, + "grad_norm": 9.703048706054688, + "learning_rate": 4.05086285195277e-06, + "loss": 3.374, + "step": 223 + }, + { + "epoch": 0.6103542234332425, + "grad_norm": 14.701447486877441, + "learning_rate": 4.069028156221617e-06, + "loss": 3.2822, + "step": 224 + }, + { + "epoch": 0.6130790190735694, + "grad_norm": 12.3848237991333, + "learning_rate": 4.0871934604904634e-06, + "loss": 3.2939, + "step": 225 + }, + { + "epoch": 0.6158038147138964, + "grad_norm": 9.180680274963379, + "learning_rate": 4.1053587647593104e-06, + "loss": 3.4766, + "step": 226 + }, + { + "epoch": 0.6185286103542235, + "grad_norm": 10.701723098754883, + "learning_rate": 4.123524069028157e-06, + "loss": 3.2617, + "step": 227 + }, + { + "epoch": 0.6212534059945504, + "grad_norm": 9.880071640014648, + "learning_rate": 4.141689373297003e-06, + "loss": 3.5107, + "step": 228 + }, + { + "epoch": 0.6239782016348774, + "grad_norm": 9.402396202087402, + "learning_rate": 4.15985467756585e-06, + "loss": 3.0391, + "step": 229 + }, + { + "epoch": 0.6267029972752044, + "grad_norm": 12.24167251586914, + "learning_rate": 4.178019981834696e-06, + "loss": 3.1533, + "step": 230 + }, + { + "epoch": 0.6294277929155313, + "grad_norm": 12.463957786560059, + "learning_rate": 4.196185286103542e-06, + "loss": 3.4404, + "step": 231 + }, + { + "epoch": 0.6321525885558583, + "grad_norm": 9.269294738769531, + "learning_rate": 4.214350590372389e-06, + "loss": 3.3408, + "step": 232 + }, + { + "epoch": 0.6348773841961853, + "grad_norm": 10.651533126831055, + "learning_rate": 4.232515894641235e-06, + "loss": 3.4043, + "step": 233 + }, + { + "epoch": 0.6376021798365122, + "grad_norm": 10.966300010681152, + "learning_rate": 4.250681198910082e-06, + "loss": 3.4717, + "step": 234 + }, + { + "epoch": 0.6403269754768393, + "grad_norm": 8.606398582458496, + "learning_rate": 4.2688465031789284e-06, + "loss": 3.2646, + "step": 235 + }, + { + "epoch": 0.6430517711171662, + "grad_norm": 11.82869815826416, + "learning_rate": 4.2870118074477754e-06, + "loss": 3.1846, + "step": 236 + }, + { + "epoch": 0.6457765667574932, + "grad_norm": 11.79569149017334, + "learning_rate": 4.305177111716622e-06, + "loss": 3.2842, + "step": 237 + }, + { + "epoch": 0.6485013623978202, + "grad_norm": 11.205436706542969, + "learning_rate": 4.323342415985468e-06, + "loss": 3.4346, + "step": 238 + }, + { + "epoch": 0.6512261580381471, + "grad_norm": 8.987303733825684, + "learning_rate": 4.341507720254315e-06, + "loss": 3.0576, + "step": 239 + }, + { + "epoch": 0.6539509536784741, + "grad_norm": 9.633455276489258, + "learning_rate": 4.359673024523161e-06, + "loss": 3.2197, + "step": 240 + }, + { + "epoch": 0.6566757493188011, + "grad_norm": 11.276183128356934, + "learning_rate": 4.377838328792008e-06, + "loss": 3.04, + "step": 241 + }, + { + "epoch": 0.659400544959128, + "grad_norm": 11.363617897033691, + "learning_rate": 4.396003633060854e-06, + "loss": 3.2559, + "step": 242 + }, + { + "epoch": 0.662125340599455, + "grad_norm": 11.577837944030762, + "learning_rate": 4.414168937329701e-06, + "loss": 3.2891, + "step": 243 + }, + { + "epoch": 0.6648501362397821, + "grad_norm": 8.874040603637695, + "learning_rate": 4.432334241598547e-06, + "loss": 3.1104, + "step": 244 + }, + { + "epoch": 0.667574931880109, + "grad_norm": 10.832159042358398, + "learning_rate": 4.4504995458673934e-06, + "loss": 3.0151, + "step": 245 + }, + { + "epoch": 0.670299727520436, + "grad_norm": 11.228150367736816, + "learning_rate": 4.4686648501362404e-06, + "loss": 3.2842, + "step": 246 + }, + { + "epoch": 0.6730245231607629, + "grad_norm": 9.785909652709961, + "learning_rate": 4.486830154405087e-06, + "loss": 3.4727, + "step": 247 + }, + { + "epoch": 0.6757493188010899, + "grad_norm": 9.006978034973145, + "learning_rate": 4.504995458673933e-06, + "loss": 3.3057, + "step": 248 + }, + { + "epoch": 0.6784741144414169, + "grad_norm": 9.31069278717041, + "learning_rate": 4.52316076294278e-06, + "loss": 3.1445, + "step": 249 + }, + { + "epoch": 0.6811989100817438, + "grad_norm": 14.589471817016602, + "learning_rate": 4.541326067211626e-06, + "loss": 3.0654, + "step": 250 + }, + { + "epoch": 0.6839237057220708, + "grad_norm": 9.290428161621094, + "learning_rate": 4.559491371480473e-06, + "loss": 3.127, + "step": 251 + }, + { + "epoch": 0.6866485013623979, + "grad_norm": 10.998537063598633, + "learning_rate": 4.577656675749319e-06, + "loss": 2.8945, + "step": 252 + }, + { + "epoch": 0.6893732970027248, + "grad_norm": 13.25707721710205, + "learning_rate": 4.595821980018166e-06, + "loss": 3.3193, + "step": 253 + }, + { + "epoch": 0.6920980926430518, + "grad_norm": 9.896824836730957, + "learning_rate": 4.613987284287012e-06, + "loss": 3.3301, + "step": 254 + }, + { + "epoch": 0.6948228882833788, + "grad_norm": 10.812071800231934, + "learning_rate": 4.6321525885558584e-06, + "loss": 3.2236, + "step": 255 + }, + { + "epoch": 0.6975476839237057, + "grad_norm": 10.396222114562988, + "learning_rate": 4.6503178928247054e-06, + "loss": 3.1211, + "step": 256 + }, + { + "epoch": 0.7002724795640327, + "grad_norm": 9.00611686706543, + "learning_rate": 4.668483197093552e-06, + "loss": 3.2051, + "step": 257 + }, + { + "epoch": 0.7029972752043597, + "grad_norm": 9.797375679016113, + "learning_rate": 4.686648501362398e-06, + "loss": 3.1797, + "step": 258 + }, + { + "epoch": 0.7057220708446866, + "grad_norm": 10.615898132324219, + "learning_rate": 4.704813805631245e-06, + "loss": 2.9658, + "step": 259 + }, + { + "epoch": 0.7084468664850136, + "grad_norm": 11.570025444030762, + "learning_rate": 4.722979109900091e-06, + "loss": 3.0869, + "step": 260 + }, + { + "epoch": 0.7111716621253406, + "grad_norm": 11.155060768127441, + "learning_rate": 4.741144414168938e-06, + "loss": 3.3213, + "step": 261 + }, + { + "epoch": 0.7138964577656676, + "grad_norm": 13.674558639526367, + "learning_rate": 4.759309718437784e-06, + "loss": 3.5439, + "step": 262 + }, + { + "epoch": 0.7166212534059946, + "grad_norm": 10.254398345947266, + "learning_rate": 4.777475022706631e-06, + "loss": 3.3672, + "step": 263 + }, + { + "epoch": 0.7193460490463215, + "grad_norm": 10.633976936340332, + "learning_rate": 4.795640326975477e-06, + "loss": 3.1436, + "step": 264 + }, + { + "epoch": 0.7220708446866485, + "grad_norm": 13.250679016113281, + "learning_rate": 4.8138056312443234e-06, + "loss": 3.0303, + "step": 265 + }, + { + "epoch": 0.7247956403269755, + "grad_norm": 10.197409629821777, + "learning_rate": 4.83197093551317e-06, + "loss": 3.0986, + "step": 266 + }, + { + "epoch": 0.7275204359673024, + "grad_norm": 12.010652542114258, + "learning_rate": 4.850136239782017e-06, + "loss": 3.0781, + "step": 267 + }, + { + "epoch": 0.7302452316076294, + "grad_norm": 10.654179573059082, + "learning_rate": 4.868301544050864e-06, + "loss": 3.2129, + "step": 268 + }, + { + "epoch": 0.7329700272479565, + "grad_norm": 10.578466415405273, + "learning_rate": 4.88646684831971e-06, + "loss": 3.3418, + "step": 269 + }, + { + "epoch": 0.7356948228882834, + "grad_norm": 11.487197875976562, + "learning_rate": 4.904632152588557e-06, + "loss": 3.1787, + "step": 270 + }, + { + "epoch": 0.7384196185286104, + "grad_norm": 8.67462158203125, + "learning_rate": 4.922797456857403e-06, + "loss": 3.0166, + "step": 271 + }, + { + "epoch": 0.7411444141689373, + "grad_norm": 10.115763664245605, + "learning_rate": 4.940962761126249e-06, + "loss": 2.9932, + "step": 272 + }, + { + "epoch": 0.7438692098092643, + "grad_norm": 10.159469604492188, + "learning_rate": 4.959128065395096e-06, + "loss": 3.0356, + "step": 273 + }, + { + "epoch": 0.7465940054495913, + "grad_norm": 10.377588272094727, + "learning_rate": 4.977293369663942e-06, + "loss": 3.043, + "step": 274 + }, + { + "epoch": 0.7493188010899182, + "grad_norm": 11.266051292419434, + "learning_rate": 4.9954586739327884e-06, + "loss": 3.1914, + "step": 275 + }, + { + "epoch": 0.7520435967302452, + "grad_norm": 12.121461868286133, + "learning_rate": 5.013623978201635e-06, + "loss": 2.8984, + "step": 276 + }, + { + "epoch": 0.7547683923705722, + "grad_norm": 10.40197467803955, + "learning_rate": 5.031789282470482e-06, + "loss": 2.6602, + "step": 277 + }, + { + "epoch": 0.7574931880108992, + "grad_norm": 10.558917999267578, + "learning_rate": 5.049954586739329e-06, + "loss": 3.043, + "step": 278 + }, + { + "epoch": 0.7602179836512262, + "grad_norm": 9.786828994750977, + "learning_rate": 5.068119891008176e-06, + "loss": 3.1069, + "step": 279 + }, + { + "epoch": 0.7629427792915532, + "grad_norm": 11.263306617736816, + "learning_rate": 5.086285195277021e-06, + "loss": 3.0688, + "step": 280 + }, + { + "epoch": 0.7656675749318801, + "grad_norm": 8.676852226257324, + "learning_rate": 5.104450499545868e-06, + "loss": 2.9199, + "step": 281 + }, + { + "epoch": 0.7683923705722071, + "grad_norm": 10.780664443969727, + "learning_rate": 5.122615803814714e-06, + "loss": 3.0317, + "step": 282 + }, + { + "epoch": 0.771117166212534, + "grad_norm": 12.283220291137695, + "learning_rate": 5.140781108083561e-06, + "loss": 3.1592, + "step": 283 + }, + { + "epoch": 0.773841961852861, + "grad_norm": 9.572271347045898, + "learning_rate": 5.158946412352407e-06, + "loss": 3.1748, + "step": 284 + }, + { + "epoch": 0.776566757493188, + "grad_norm": 13.599047660827637, + "learning_rate": 5.1771117166212534e-06, + "loss": 2.9395, + "step": 285 + }, + { + "epoch": 0.779291553133515, + "grad_norm": 12.397294998168945, + "learning_rate": 5.1952770208901005e-06, + "loss": 3.0732, + "step": 286 + }, + { + "epoch": 0.782016348773842, + "grad_norm": 10.11894416809082, + "learning_rate": 5.2134423251589475e-06, + "loss": 3.2109, + "step": 287 + }, + { + "epoch": 0.784741144414169, + "grad_norm": 9.713980674743652, + "learning_rate": 5.231607629427793e-06, + "loss": 3.002, + "step": 288 + }, + { + "epoch": 0.7874659400544959, + "grad_norm": 12.788566589355469, + "learning_rate": 5.24977293369664e-06, + "loss": 3.125, + "step": 289 + }, + { + "epoch": 0.7901907356948229, + "grad_norm": 10.20035171508789, + "learning_rate": 5.267938237965487e-06, + "loss": 3.1172, + "step": 290 + }, + { + "epoch": 0.7929155313351499, + "grad_norm": 9.050313949584961, + "learning_rate": 5.286103542234333e-06, + "loss": 3.1074, + "step": 291 + }, + { + "epoch": 0.7956403269754768, + "grad_norm": 12.593305587768555, + "learning_rate": 5.304268846503179e-06, + "loss": 3.2715, + "step": 292 + }, + { + "epoch": 0.7983651226158038, + "grad_norm": 9.735793113708496, + "learning_rate": 5.322434150772025e-06, + "loss": 3.1445, + "step": 293 + }, + { + "epoch": 0.8010899182561307, + "grad_norm": 13.674619674682617, + "learning_rate": 5.340599455040872e-06, + "loss": 3.1611, + "step": 294 + }, + { + "epoch": 0.8038147138964578, + "grad_norm": 11.066041946411133, + "learning_rate": 5.358764759309719e-06, + "loss": 2.8115, + "step": 295 + }, + { + "epoch": 0.8065395095367848, + "grad_norm": 10.592111587524414, + "learning_rate": 5.376930063578565e-06, + "loss": 2.9028, + "step": 296 + }, + { + "epoch": 0.8092643051771117, + "grad_norm": 10.814714431762695, + "learning_rate": 5.395095367847412e-06, + "loss": 2.8428, + "step": 297 + }, + { + "epoch": 0.8119891008174387, + "grad_norm": 9.773011207580566, + "learning_rate": 5.413260672116259e-06, + "loss": 2.8975, + "step": 298 + }, + { + "epoch": 0.8147138964577657, + "grad_norm": 9.989364624023438, + "learning_rate": 5.431425976385105e-06, + "loss": 2.8833, + "step": 299 + }, + { + "epoch": 0.8174386920980926, + "grad_norm": 10.806577682495117, + "learning_rate": 5.449591280653952e-06, + "loss": 3.3301, + "step": 300 + }, + { + "epoch": 0.8201634877384196, + "grad_norm": 11.721353530883789, + "learning_rate": 5.467756584922798e-06, + "loss": 3.0889, + "step": 301 + }, + { + "epoch": 0.8228882833787466, + "grad_norm": 11.272564888000488, + "learning_rate": 5.485921889191644e-06, + "loss": 3.25, + "step": 302 + }, + { + "epoch": 0.8256130790190735, + "grad_norm": 9.646610260009766, + "learning_rate": 5.504087193460491e-06, + "loss": 3.0498, + "step": 303 + }, + { + "epoch": 0.8283378746594006, + "grad_norm": 10.122640609741211, + "learning_rate": 5.522252497729338e-06, + "loss": 2.8525, + "step": 304 + }, + { + "epoch": 0.8310626702997275, + "grad_norm": 11.975621223449707, + "learning_rate": 5.5404178019981835e-06, + "loss": 2.98, + "step": 305 + }, + { + "epoch": 0.8337874659400545, + "grad_norm": 9.96011734008789, + "learning_rate": 5.5585831062670305e-06, + "loss": 3.1787, + "step": 306 + }, + { + "epoch": 0.8365122615803815, + "grad_norm": 11.059173583984375, + "learning_rate": 5.5767484105358775e-06, + "loss": 3.2861, + "step": 307 + }, + { + "epoch": 0.8392370572207084, + "grad_norm": 10.573100090026855, + "learning_rate": 5.594913714804724e-06, + "loss": 2.9976, + "step": 308 + }, + { + "epoch": 0.8419618528610354, + "grad_norm": 11.470596313476562, + "learning_rate": 5.61307901907357e-06, + "loss": 2.9238, + "step": 309 + }, + { + "epoch": 0.8446866485013624, + "grad_norm": 11.162026405334473, + "learning_rate": 5.631244323342416e-06, + "loss": 3.2871, + "step": 310 + }, + { + "epoch": 0.8474114441416893, + "grad_norm": 10.692909240722656, + "learning_rate": 5.649409627611263e-06, + "loss": 3.252, + "step": 311 + }, + { + "epoch": 0.8501362397820164, + "grad_norm": 11.107943534851074, + "learning_rate": 5.66757493188011e-06, + "loss": 3.2139, + "step": 312 + }, + { + "epoch": 0.8528610354223434, + "grad_norm": 9.772025108337402, + "learning_rate": 5.685740236148955e-06, + "loss": 2.8848, + "step": 313 + }, + { + "epoch": 0.8555858310626703, + "grad_norm": 10.775506019592285, + "learning_rate": 5.703905540417802e-06, + "loss": 3.0908, + "step": 314 + }, + { + "epoch": 0.8583106267029973, + "grad_norm": 14.792106628417969, + "learning_rate": 5.722070844686649e-06, + "loss": 2.8691, + "step": 315 + }, + { + "epoch": 0.8610354223433242, + "grad_norm": 10.167881965637207, + "learning_rate": 5.7402361489554955e-06, + "loss": 3.0137, + "step": 316 + }, + { + "epoch": 0.8637602179836512, + "grad_norm": 11.682990074157715, + "learning_rate": 5.758401453224342e-06, + "loss": 3.2441, + "step": 317 + }, + { + "epoch": 0.8664850136239782, + "grad_norm": 10.642148971557617, + "learning_rate": 5.776566757493189e-06, + "loss": 2.9629, + "step": 318 + }, + { + "epoch": 0.8692098092643051, + "grad_norm": 13.177349090576172, + "learning_rate": 5.794732061762035e-06, + "loss": 3.1973, + "step": 319 + }, + { + "epoch": 0.8719346049046321, + "grad_norm": 10.01991081237793, + "learning_rate": 5.812897366030882e-06, + "loss": 2.9751, + "step": 320 + }, + { + "epoch": 0.8746594005449592, + "grad_norm": 11.585193634033203, + "learning_rate": 5.831062670299727e-06, + "loss": 3.249, + "step": 321 + }, + { + "epoch": 0.8773841961852861, + "grad_norm": 9.34164047241211, + "learning_rate": 5.849227974568574e-06, + "loss": 2.9863, + "step": 322 + }, + { + "epoch": 0.8801089918256131, + "grad_norm": 10.178692817687988, + "learning_rate": 5.867393278837421e-06, + "loss": 2.9072, + "step": 323 + }, + { + "epoch": 0.8828337874659401, + "grad_norm": 10.652539253234863, + "learning_rate": 5.885558583106268e-06, + "loss": 2.9502, + "step": 324 + }, + { + "epoch": 0.885558583106267, + "grad_norm": 9.648669242858887, + "learning_rate": 5.9037238873751135e-06, + "loss": 3.0527, + "step": 325 + }, + { + "epoch": 0.888283378746594, + "grad_norm": 8.94349193572998, + "learning_rate": 5.9218891916439605e-06, + "loss": 3.1143, + "step": 326 + }, + { + "epoch": 0.8910081743869209, + "grad_norm": 9.749101638793945, + "learning_rate": 5.940054495912807e-06, + "loss": 2.957, + "step": 327 + }, + { + "epoch": 0.8937329700272479, + "grad_norm": 10.487102508544922, + "learning_rate": 5.958219800181654e-06, + "loss": 2.7764, + "step": 328 + }, + { + "epoch": 0.896457765667575, + "grad_norm": 11.558155059814453, + "learning_rate": 5.976385104450501e-06, + "loss": 3.0679, + "step": 329 + }, + { + "epoch": 0.8991825613079019, + "grad_norm": 8.687368392944336, + "learning_rate": 5.994550408719346e-06, + "loss": 2.8779, + "step": 330 + }, + { + "epoch": 0.9019073569482289, + "grad_norm": 11.50344181060791, + "learning_rate": 6.012715712988193e-06, + "loss": 2.8945, + "step": 331 + }, + { + "epoch": 0.9046321525885559, + "grad_norm": 8.328307151794434, + "learning_rate": 6.03088101725704e-06, + "loss": 2.8618, + "step": 332 + }, + { + "epoch": 0.9073569482288828, + "grad_norm": 10.823127746582031, + "learning_rate": 6.049046321525886e-06, + "loss": 3.085, + "step": 333 + }, + { + "epoch": 0.9100817438692098, + "grad_norm": 9.42167854309082, + "learning_rate": 6.067211625794732e-06, + "loss": 2.7568, + "step": 334 + }, + { + "epoch": 0.9128065395095368, + "grad_norm": 9.684298515319824, + "learning_rate": 6.085376930063579e-06, + "loss": 2.9136, + "step": 335 + }, + { + "epoch": 0.9155313351498637, + "grad_norm": 10.575213432312012, + "learning_rate": 6.1035422343324255e-06, + "loss": 3.1797, + "step": 336 + }, + { + "epoch": 0.9182561307901907, + "grad_norm": 9.206254959106445, + "learning_rate": 6.1217075386012725e-06, + "loss": 3.084, + "step": 337 + }, + { + "epoch": 0.9209809264305178, + "grad_norm": 10.56982135772705, + "learning_rate": 6.139872842870118e-06, + "loss": 2.7876, + "step": 338 + }, + { + "epoch": 0.9237057220708447, + "grad_norm": 9.894237518310547, + "learning_rate": 6.158038147138965e-06, + "loss": 2.9077, + "step": 339 + }, + { + "epoch": 0.9264305177111717, + "grad_norm": 8.02868366241455, + "learning_rate": 6.176203451407812e-06, + "loss": 2.8062, + "step": 340 + }, + { + "epoch": 0.9291553133514986, + "grad_norm": 8.86514663696289, + "learning_rate": 6.194368755676659e-06, + "loss": 2.9062, + "step": 341 + }, + { + "epoch": 0.9318801089918256, + "grad_norm": 15.095792770385742, + "learning_rate": 6.212534059945504e-06, + "loss": 2.9209, + "step": 342 + }, + { + "epoch": 0.9346049046321526, + "grad_norm": 10.972758293151855, + "learning_rate": 6.230699364214351e-06, + "loss": 2.9863, + "step": 343 + }, + { + "epoch": 0.9373297002724795, + "grad_norm": 9.462160110473633, + "learning_rate": 6.248864668483197e-06, + "loss": 2.9688, + "step": 344 + }, + { + "epoch": 0.9400544959128065, + "grad_norm": 8.696920394897461, + "learning_rate": 6.267029972752044e-06, + "loss": 2.96, + "step": 345 + }, + { + "epoch": 0.9427792915531336, + "grad_norm": 12.647309303283691, + "learning_rate": 6.2851952770208905e-06, + "loss": 3.0645, + "step": 346 + }, + { + "epoch": 0.9455040871934605, + "grad_norm": 10.608399391174316, + "learning_rate": 6.303360581289737e-06, + "loss": 2.8242, + "step": 347 + }, + { + "epoch": 0.9482288828337875, + "grad_norm": 11.65522289276123, + "learning_rate": 6.321525885558584e-06, + "loss": 3.1382, + "step": 348 + }, + { + "epoch": 0.9509536784741145, + "grad_norm": 8.824722290039062, + "learning_rate": 6.339691189827431e-06, + "loss": 2.917, + "step": 349 + }, + { + "epoch": 0.9536784741144414, + "grad_norm": 11.027289390563965, + "learning_rate": 6.357856494096276e-06, + "loss": 3.0371, + "step": 350 + }, + { + "epoch": 0.9564032697547684, + "grad_norm": 12.124699592590332, + "learning_rate": 6.376021798365123e-06, + "loss": 3.1348, + "step": 351 + }, + { + "epoch": 0.9591280653950953, + "grad_norm": 11.385178565979004, + "learning_rate": 6.39418710263397e-06, + "loss": 2.9229, + "step": 352 + }, + { + "epoch": 0.9618528610354223, + "grad_norm": 11.994840621948242, + "learning_rate": 6.412352406902816e-06, + "loss": 3.1709, + "step": 353 + }, + { + "epoch": 0.9645776566757494, + "grad_norm": 8.85571002960205, + "learning_rate": 6.430517711171662e-06, + "loss": 2.7881, + "step": 354 + }, + { + "epoch": 0.9673024523160763, + "grad_norm": 11.468720436096191, + "learning_rate": 6.448683015440509e-06, + "loss": 2.7666, + "step": 355 + }, + { + "epoch": 0.9700272479564033, + "grad_norm": 9.187004089355469, + "learning_rate": 6.4668483197093555e-06, + "loss": 3.0547, + "step": 356 + }, + { + "epoch": 0.9727520435967303, + "grad_norm": 11.031088829040527, + "learning_rate": 6.4850136239782025e-06, + "loss": 3.1611, + "step": 357 + }, + { + "epoch": 0.9754768392370572, + "grad_norm": 10.66789436340332, + "learning_rate": 6.5031789282470495e-06, + "loss": 2.8545, + "step": 358 + }, + { + "epoch": 0.9782016348773842, + "grad_norm": 12.648036003112793, + "learning_rate": 6.521344232515895e-06, + "loss": 2.9009, + "step": 359 + }, + { + "epoch": 0.9809264305177112, + "grad_norm": 9.666924476623535, + "learning_rate": 6.539509536784742e-06, + "loss": 2.9673, + "step": 360 + }, + { + "epoch": 0.9836512261580381, + "grad_norm": 11.903847694396973, + "learning_rate": 6.557674841053589e-06, + "loss": 2.6465, + "step": 361 + }, + { + "epoch": 0.9863760217983651, + "grad_norm": 14.617626190185547, + "learning_rate": 6.575840145322435e-06, + "loss": 3.0, + "step": 362 + }, + { + "epoch": 0.989100817438692, + "grad_norm": 17.167770385742188, + "learning_rate": 6.594005449591281e-06, + "loss": 3.041, + "step": 363 + }, + { + "epoch": 0.9918256130790191, + "grad_norm": 12.77061653137207, + "learning_rate": 6.612170753860127e-06, + "loss": 2.9688, + "step": 364 + }, + { + "epoch": 0.9945504087193461, + "grad_norm": 10.30443286895752, + "learning_rate": 6.630336058128974e-06, + "loss": 2.7344, + "step": 365 + }, + { + "epoch": 0.997275204359673, + "grad_norm": 14.379679679870605, + "learning_rate": 6.648501362397821e-06, + "loss": 2.8291, + "step": 366 + }, + { + "epoch": 1.0, + "grad_norm": 10.28809928894043, + "learning_rate": 6.666666666666667e-06, + "loss": 2.9424, + "step": 367 + }, + { + "epoch": 1.002724795640327, + "grad_norm": 10.779088973999023, + "learning_rate": 6.684831970935514e-06, + "loss": 2.9834, + "step": 368 + }, + { + "epoch": 1.005449591280654, + "grad_norm": 11.226832389831543, + "learning_rate": 6.702997275204361e-06, + "loss": 2.9473, + "step": 369 + }, + { + "epoch": 1.008174386920981, + "grad_norm": 9.997020721435547, + "learning_rate": 6.721162579473207e-06, + "loss": 2.7344, + "step": 370 + }, + { + "epoch": 1.0108991825613078, + "grad_norm": 11.764245986938477, + "learning_rate": 6.739327883742053e-06, + "loss": 2.8877, + "step": 371 + }, + { + "epoch": 1.013623978201635, + "grad_norm": 11.373870849609375, + "learning_rate": 6.7574931880109e-06, + "loss": 3.1035, + "step": 372 + }, + { + "epoch": 1.0163487738419619, + "grad_norm": 12.055533409118652, + "learning_rate": 6.775658492279746e-06, + "loss": 2.8447, + "step": 373 + }, + { + "epoch": 1.0190735694822888, + "grad_norm": 31.768789291381836, + "learning_rate": 6.793823796548593e-06, + "loss": 2.8325, + "step": 374 + }, + { + "epoch": 1.021798365122616, + "grad_norm": 10.671889305114746, + "learning_rate": 6.8119891008174385e-06, + "loss": 2.96, + "step": 375 + }, + { + "epoch": 1.0245231607629428, + "grad_norm": 11.033255577087402, + "learning_rate": 6.8301544050862855e-06, + "loss": 2.8223, + "step": 376 + }, + { + "epoch": 1.0272479564032697, + "grad_norm": 11.364258766174316, + "learning_rate": 6.8483197093551325e-06, + "loss": 2.9634, + "step": 377 + }, + { + "epoch": 1.0299727520435966, + "grad_norm": 8.979849815368652, + "learning_rate": 6.8664850136239795e-06, + "loss": 2.9229, + "step": 378 + }, + { + "epoch": 1.0326975476839237, + "grad_norm": 10.40015697479248, + "learning_rate": 6.884650317892825e-06, + "loss": 2.8232, + "step": 379 + }, + { + "epoch": 1.0354223433242506, + "grad_norm": 8.893531799316406, + "learning_rate": 6.902815622161672e-06, + "loss": 2.8813, + "step": 380 + }, + { + "epoch": 1.0381471389645776, + "grad_norm": 11.417078018188477, + "learning_rate": 6.920980926430518e-06, + "loss": 2.7207, + "step": 381 + }, + { + "epoch": 1.0408719346049047, + "grad_norm": 10.525177955627441, + "learning_rate": 6.939146230699365e-06, + "loss": 2.9854, + "step": 382 + }, + { + "epoch": 1.0435967302452316, + "grad_norm": 9.927412033081055, + "learning_rate": 6.957311534968211e-06, + "loss": 2.8262, + "step": 383 + }, + { + "epoch": 1.0463215258855585, + "grad_norm": 12.706193923950195, + "learning_rate": 6.975476839237057e-06, + "loss": 3.0049, + "step": 384 + }, + { + "epoch": 1.0490463215258856, + "grad_norm": 10.498812675476074, + "learning_rate": 6.993642143505904e-06, + "loss": 2.7578, + "step": 385 + }, + { + "epoch": 1.0517711171662125, + "grad_norm": 10.719517707824707, + "learning_rate": 7.011807447774751e-06, + "loss": 2.8618, + "step": 386 + }, + { + "epoch": 1.0544959128065394, + "grad_norm": 12.072530746459961, + "learning_rate": 7.0299727520435975e-06, + "loss": 2.7798, + "step": 387 + }, + { + "epoch": 1.0572207084468666, + "grad_norm": 9.507881164550781, + "learning_rate": 7.048138056312444e-06, + "loss": 2.6548, + "step": 388 + }, + { + "epoch": 1.0599455040871935, + "grad_norm": 12.026369094848633, + "learning_rate": 7.066303360581291e-06, + "loss": 2.7642, + "step": 389 + }, + { + "epoch": 1.0626702997275204, + "grad_norm": 11.388680458068848, + "learning_rate": 7.084468664850137e-06, + "loss": 2.749, + "step": 390 + }, + { + "epoch": 1.0653950953678475, + "grad_norm": 12.096214294433594, + "learning_rate": 7.102633969118984e-06, + "loss": 2.6499, + "step": 391 + }, + { + "epoch": 1.0681198910081744, + "grad_norm": 12.473118782043457, + "learning_rate": 7.120799273387829e-06, + "loss": 2.9619, + "step": 392 + }, + { + "epoch": 1.0708446866485013, + "grad_norm": 10.778851509094238, + "learning_rate": 7.138964577656676e-06, + "loss": 2.7432, + "step": 393 + }, + { + "epoch": 1.0735694822888284, + "grad_norm": 12.79310417175293, + "learning_rate": 7.157129881925523e-06, + "loss": 2.8647, + "step": 394 + }, + { + "epoch": 1.0762942779291553, + "grad_norm": 12.59657096862793, + "learning_rate": 7.17529518619437e-06, + "loss": 2.689, + "step": 395 + }, + { + "epoch": 1.0790190735694822, + "grad_norm": 11.395380973815918, + "learning_rate": 7.1934604904632155e-06, + "loss": 2.9043, + "step": 396 + }, + { + "epoch": 1.0817438692098094, + "grad_norm": 12.513686180114746, + "learning_rate": 7.2116257947320625e-06, + "loss": 2.8154, + "step": 397 + }, + { + "epoch": 1.0844686648501363, + "grad_norm": 10.173294067382812, + "learning_rate": 7.229791099000909e-06, + "loss": 2.6123, + "step": 398 + }, + { + "epoch": 1.0871934604904632, + "grad_norm": 9.681666374206543, + "learning_rate": 7.247956403269756e-06, + "loss": 2.4634, + "step": 399 + }, + { + "epoch": 1.0899182561307903, + "grad_norm": 11.721431732177734, + "learning_rate": 7.266121707538602e-06, + "loss": 2.8311, + "step": 400 + }, + { + "epoch": 1.0926430517711172, + "grad_norm": 9.718865394592285, + "learning_rate": 7.284287011807448e-06, + "loss": 2.7515, + "step": 401 + }, + { + "epoch": 1.095367847411444, + "grad_norm": 13.524134635925293, + "learning_rate": 7.302452316076295e-06, + "loss": 2.6484, + "step": 402 + }, + { + "epoch": 1.0980926430517712, + "grad_norm": 8.978958129882812, + "learning_rate": 7.320617620345142e-06, + "loss": 2.8022, + "step": 403 + }, + { + "epoch": 1.1008174386920981, + "grad_norm": 10.181389808654785, + "learning_rate": 7.338782924613987e-06, + "loss": 2.8721, + "step": 404 + }, + { + "epoch": 1.103542234332425, + "grad_norm": 9.95703125, + "learning_rate": 7.356948228882834e-06, + "loss": 2.9873, + "step": 405 + }, + { + "epoch": 1.106267029972752, + "grad_norm": 9.80728530883789, + "learning_rate": 7.375113533151681e-06, + "loss": 2.5879, + "step": 406 + }, + { + "epoch": 1.108991825613079, + "grad_norm": 11.94822883605957, + "learning_rate": 7.3932788374205275e-06, + "loss": 2.6226, + "step": 407 + }, + { + "epoch": 1.111716621253406, + "grad_norm": 10.268418312072754, + "learning_rate": 7.411444141689374e-06, + "loss": 2.6157, + "step": 408 + }, + { + "epoch": 1.1144414168937329, + "grad_norm": 13.16259765625, + "learning_rate": 7.42960944595822e-06, + "loss": 2.6309, + "step": 409 + }, + { + "epoch": 1.11716621253406, + "grad_norm": 9.806975364685059, + "learning_rate": 7.447774750227067e-06, + "loss": 2.5195, + "step": 410 + }, + { + "epoch": 1.119891008174387, + "grad_norm": 11.498656272888184, + "learning_rate": 7.465940054495914e-06, + "loss": 2.9082, + "step": 411 + }, + { + "epoch": 1.1226158038147138, + "grad_norm": 10.164894104003906, + "learning_rate": 7.484105358764759e-06, + "loss": 2.7812, + "step": 412 + }, + { + "epoch": 1.125340599455041, + "grad_norm": 16.40764808654785, + "learning_rate": 7.502270663033606e-06, + "loss": 2.5967, + "step": 413 + }, + { + "epoch": 1.1280653950953679, + "grad_norm": 13.020524024963379, + "learning_rate": 7.520435967302453e-06, + "loss": 2.793, + "step": 414 + }, + { + "epoch": 1.1307901907356948, + "grad_norm": 9.52269458770752, + "learning_rate": 7.538601271571299e-06, + "loss": 2.4224, + "step": 415 + }, + { + "epoch": 1.1335149863760219, + "grad_norm": 13.420445442199707, + "learning_rate": 7.5567665758401455e-06, + "loss": 2.6089, + "step": 416 + }, + { + "epoch": 1.1362397820163488, + "grad_norm": 10.215398788452148, + "learning_rate": 7.5749318801089925e-06, + "loss": 2.9336, + "step": 417 + }, + { + "epoch": 1.1389645776566757, + "grad_norm": 11.343588829040527, + "learning_rate": 7.593097184377839e-06, + "loss": 2.8281, + "step": 418 + }, + { + "epoch": 1.1416893732970028, + "grad_norm": 11.341489791870117, + "learning_rate": 7.611262488646686e-06, + "loss": 2.8442, + "step": 419 + }, + { + "epoch": 1.1444141689373297, + "grad_norm": 13.097975730895996, + "learning_rate": 7.629427792915532e-06, + "loss": 2.897, + "step": 420 + }, + { + "epoch": 1.1471389645776566, + "grad_norm": 15.45946216583252, + "learning_rate": 7.647593097184378e-06, + "loss": 2.4253, + "step": 421 + }, + { + "epoch": 1.1498637602179835, + "grad_norm": 9.48956298828125, + "learning_rate": 7.665758401453224e-06, + "loss": 2.501, + "step": 422 + }, + { + "epoch": 1.1525885558583107, + "grad_norm": 14.140972137451172, + "learning_rate": 7.683923705722072e-06, + "loss": 2.6108, + "step": 423 + }, + { + "epoch": 1.1553133514986376, + "grad_norm": 12.59040641784668, + "learning_rate": 7.702089009990918e-06, + "loss": 2.7061, + "step": 424 + }, + { + "epoch": 1.1580381471389645, + "grad_norm": 11.303720474243164, + "learning_rate": 7.720254314259764e-06, + "loss": 2.6416, + "step": 425 + }, + { + "epoch": 1.1607629427792916, + "grad_norm": 9.568498611450195, + "learning_rate": 7.73841961852861e-06, + "loss": 2.6787, + "step": 426 + }, + { + "epoch": 1.1634877384196185, + "grad_norm": 9.496077537536621, + "learning_rate": 7.756584922797458e-06, + "loss": 2.918, + "step": 427 + }, + { + "epoch": 1.1662125340599454, + "grad_norm": 11.773557662963867, + "learning_rate": 7.774750227066305e-06, + "loss": 2.9116, + "step": 428 + }, + { + "epoch": 1.1689373297002725, + "grad_norm": 10.357346534729004, + "learning_rate": 7.79291553133515e-06, + "loss": 2.627, + "step": 429 + }, + { + "epoch": 1.1716621253405994, + "grad_norm": 12.790385246276855, + "learning_rate": 7.811080835603997e-06, + "loss": 2.6235, + "step": 430 + }, + { + "epoch": 1.1743869209809263, + "grad_norm": 13.647273063659668, + "learning_rate": 7.829246139872843e-06, + "loss": 3.248, + "step": 431 + }, + { + "epoch": 1.1771117166212535, + "grad_norm": 12.220288276672363, + "learning_rate": 7.847411444141691e-06, + "loss": 2.769, + "step": 432 + }, + { + "epoch": 1.1798365122615804, + "grad_norm": 11.686890602111816, + "learning_rate": 7.865576748410535e-06, + "loss": 2.3706, + "step": 433 + }, + { + "epoch": 1.1825613079019073, + "grad_norm": 12.022626876831055, + "learning_rate": 7.883742052679383e-06, + "loss": 2.5293, + "step": 434 + }, + { + "epoch": 1.1852861035422344, + "grad_norm": 9.241992950439453, + "learning_rate": 7.90190735694823e-06, + "loss": 2.5386, + "step": 435 + }, + { + "epoch": 1.1880108991825613, + "grad_norm": 9.880123138427734, + "learning_rate": 7.920072661217077e-06, + "loss": 2.687, + "step": 436 + }, + { + "epoch": 1.1907356948228882, + "grad_norm": 11.03382396697998, + "learning_rate": 7.938237965485922e-06, + "loss": 2.7334, + "step": 437 + }, + { + "epoch": 1.1934604904632153, + "grad_norm": 11.051270484924316, + "learning_rate": 7.95640326975477e-06, + "loss": 2.7217, + "step": 438 + }, + { + "epoch": 1.1961852861035422, + "grad_norm": 13.074309349060059, + "learning_rate": 7.974568574023616e-06, + "loss": 2.7139, + "step": 439 + }, + { + "epoch": 1.1989100817438691, + "grad_norm": 11.242266654968262, + "learning_rate": 7.992733878292462e-06, + "loss": 2.6152, + "step": 440 + }, + { + "epoch": 1.2016348773841963, + "grad_norm": 11.25084400177002, + "learning_rate": 8.010899182561308e-06, + "loss": 2.6558, + "step": 441 + }, + { + "epoch": 1.2043596730245232, + "grad_norm": 10.377076148986816, + "learning_rate": 8.029064486830154e-06, + "loss": 2.6245, + "step": 442 + }, + { + "epoch": 1.20708446866485, + "grad_norm": 10.222033500671387, + "learning_rate": 8.047229791099002e-06, + "loss": 3.0137, + "step": 443 + }, + { + "epoch": 1.2098092643051772, + "grad_norm": 9.710803031921387, + "learning_rate": 8.065395095367848e-06, + "loss": 2.8018, + "step": 444 + }, + { + "epoch": 1.2125340599455041, + "grad_norm": 12.02476692199707, + "learning_rate": 8.083560399636694e-06, + "loss": 2.7852, + "step": 445 + }, + { + "epoch": 1.215258855585831, + "grad_norm": 11.377335548400879, + "learning_rate": 8.10172570390554e-06, + "loss": 2.6895, + "step": 446 + }, + { + "epoch": 1.2179836512261581, + "grad_norm": 9.653413772583008, + "learning_rate": 8.119891008174388e-06, + "loss": 2.5435, + "step": 447 + }, + { + "epoch": 1.220708446866485, + "grad_norm": 10.20368480682373, + "learning_rate": 8.138056312443235e-06, + "loss": 2.71, + "step": 448 + }, + { + "epoch": 1.223433242506812, + "grad_norm": 10.484225273132324, + "learning_rate": 8.15622161671208e-06, + "loss": 2.5337, + "step": 449 + }, + { + "epoch": 1.226158038147139, + "grad_norm": 13.753677368164062, + "learning_rate": 8.174386920980927e-06, + "loss": 2.7847, + "step": 450 + }, + { + "epoch": 1.228882833787466, + "grad_norm": 11.210610389709473, + "learning_rate": 8.192552225249773e-06, + "loss": 2.6738, + "step": 451 + }, + { + "epoch": 1.231607629427793, + "grad_norm": 10.580645561218262, + "learning_rate": 8.210717529518621e-06, + "loss": 2.6934, + "step": 452 + }, + { + "epoch": 1.2343324250681198, + "grad_norm": 10.421024322509766, + "learning_rate": 8.228882833787467e-06, + "loss": 2.7798, + "step": 453 + }, + { + "epoch": 1.237057220708447, + "grad_norm": 11.129182815551758, + "learning_rate": 8.247048138056313e-06, + "loss": 2.6597, + "step": 454 + }, + { + "epoch": 1.2397820163487738, + "grad_norm": 11.662261009216309, + "learning_rate": 8.26521344232516e-06, + "loss": 2.6504, + "step": 455 + }, + { + "epoch": 1.2425068119891007, + "grad_norm": 29.719701766967773, + "learning_rate": 8.283378746594006e-06, + "loss": 2.9678, + "step": 456 + }, + { + "epoch": 1.2452316076294279, + "grad_norm": 10.148482322692871, + "learning_rate": 8.301544050862853e-06, + "loss": 2.5928, + "step": 457 + }, + { + "epoch": 1.2479564032697548, + "grad_norm": 10.919842720031738, + "learning_rate": 8.3197093551317e-06, + "loss": 2.6074, + "step": 458 + }, + { + "epoch": 1.2506811989100817, + "grad_norm": 11.2857027053833, + "learning_rate": 8.337874659400546e-06, + "loss": 2.7573, + "step": 459 + }, + { + "epoch": 1.2534059945504088, + "grad_norm": 10.820455551147461, + "learning_rate": 8.356039963669392e-06, + "loss": 2.4141, + "step": 460 + }, + { + "epoch": 1.2561307901907357, + "grad_norm": 14.457060813903809, + "learning_rate": 8.37420526793824e-06, + "loss": 2.8892, + "step": 461 + }, + { + "epoch": 1.2588555858310626, + "grad_norm": 8.9891939163208, + "learning_rate": 8.392370572207084e-06, + "loss": 2.8398, + "step": 462 + }, + { + "epoch": 1.2615803814713895, + "grad_norm": 11.050307273864746, + "learning_rate": 8.410535876475932e-06, + "loss": 2.6924, + "step": 463 + }, + { + "epoch": 1.2643051771117166, + "grad_norm": 10.814742088317871, + "learning_rate": 8.428701180744778e-06, + "loss": 2.6929, + "step": 464 + }, + { + "epoch": 1.2670299727520435, + "grad_norm": 11.274110794067383, + "learning_rate": 8.446866485013624e-06, + "loss": 2.5933, + "step": 465 + }, + { + "epoch": 1.2697547683923704, + "grad_norm": 13.799680709838867, + "learning_rate": 8.46503178928247e-06, + "loss": 2.6382, + "step": 466 + }, + { + "epoch": 1.2724795640326976, + "grad_norm": 11.533510208129883, + "learning_rate": 8.483197093551317e-06, + "loss": 2.7002, + "step": 467 + }, + { + "epoch": 1.2752043596730245, + "grad_norm": 11.78360366821289, + "learning_rate": 8.501362397820165e-06, + "loss": 2.5723, + "step": 468 + }, + { + "epoch": 1.2779291553133514, + "grad_norm": 14.222066879272461, + "learning_rate": 8.51952770208901e-06, + "loss": 2.7705, + "step": 469 + }, + { + "epoch": 1.2806539509536785, + "grad_norm": 12.54738712310791, + "learning_rate": 8.537693006357857e-06, + "loss": 2.4131, + "step": 470 + }, + { + "epoch": 1.2833787465940054, + "grad_norm": 11.072205543518066, + "learning_rate": 8.555858310626703e-06, + "loss": 2.7427, + "step": 471 + }, + { + "epoch": 1.2861035422343323, + "grad_norm": 11.79690170288086, + "learning_rate": 8.574023614895551e-06, + "loss": 2.7095, + "step": 472 + }, + { + "epoch": 1.2888283378746594, + "grad_norm": 11.124776840209961, + "learning_rate": 8.592188919164397e-06, + "loss": 2.624, + "step": 473 + }, + { + "epoch": 1.2915531335149864, + "grad_norm": 10.043506622314453, + "learning_rate": 8.610354223433243e-06, + "loss": 2.4404, + "step": 474 + }, + { + "epoch": 1.2942779291553133, + "grad_norm": 15.051888465881348, + "learning_rate": 8.62851952770209e-06, + "loss": 2.833, + "step": 475 + }, + { + "epoch": 1.2970027247956404, + "grad_norm": 9.278153419494629, + "learning_rate": 8.646684831970936e-06, + "loss": 2.5469, + "step": 476 + }, + { + "epoch": 1.2997275204359673, + "grad_norm": 12.055374145507812, + "learning_rate": 8.664850136239783e-06, + "loss": 2.5098, + "step": 477 + }, + { + "epoch": 1.3024523160762942, + "grad_norm": 9.819018363952637, + "learning_rate": 8.68301544050863e-06, + "loss": 2.522, + "step": 478 + }, + { + "epoch": 1.3051771117166213, + "grad_norm": 10.395660400390625, + "learning_rate": 8.701180744777476e-06, + "loss": 2.6792, + "step": 479 + }, + { + "epoch": 1.3079019073569482, + "grad_norm": 12.166010856628418, + "learning_rate": 8.719346049046322e-06, + "loss": 2.5669, + "step": 480 + }, + { + "epoch": 1.3106267029972751, + "grad_norm": 23.176393508911133, + "learning_rate": 8.73751135331517e-06, + "loss": 2.7007, + "step": 481 + }, + { + "epoch": 1.3133514986376023, + "grad_norm": 11.619187355041504, + "learning_rate": 8.755676657584016e-06, + "loss": 2.6953, + "step": 482 + }, + { + "epoch": 1.3160762942779292, + "grad_norm": 10.351978302001953, + "learning_rate": 8.773841961852862e-06, + "loss": 2.6812, + "step": 483 + }, + { + "epoch": 1.318801089918256, + "grad_norm": 10.137228012084961, + "learning_rate": 8.792007266121708e-06, + "loss": 2.4609, + "step": 484 + }, + { + "epoch": 1.3215258855585832, + "grad_norm": 11.376115798950195, + "learning_rate": 8.810172570390554e-06, + "loss": 2.5933, + "step": 485 + }, + { + "epoch": 1.32425068119891, + "grad_norm": 10.707823753356934, + "learning_rate": 8.828337874659402e-06, + "loss": 2.7358, + "step": 486 + }, + { + "epoch": 1.326975476839237, + "grad_norm": 11.9663724899292, + "learning_rate": 8.846503178928247e-06, + "loss": 2.5566, + "step": 487 + }, + { + "epoch": 1.3297002724795641, + "grad_norm": 10.451996803283691, + "learning_rate": 8.864668483197095e-06, + "loss": 2.6133, + "step": 488 + }, + { + "epoch": 1.332425068119891, + "grad_norm": 10.462884902954102, + "learning_rate": 8.88283378746594e-06, + "loss": 2.373, + "step": 489 + }, + { + "epoch": 1.335149863760218, + "grad_norm": 11.319975852966309, + "learning_rate": 8.900999091734787e-06, + "loss": 2.4707, + "step": 490 + }, + { + "epoch": 1.337874659400545, + "grad_norm": 11.024785995483398, + "learning_rate": 8.919164396003633e-06, + "loss": 2.7427, + "step": 491 + }, + { + "epoch": 1.340599455040872, + "grad_norm": 12.764436721801758, + "learning_rate": 8.937329700272481e-06, + "loss": 2.8945, + "step": 492 + }, + { + "epoch": 1.3433242506811989, + "grad_norm": 12.335233688354492, + "learning_rate": 8.955495004541327e-06, + "loss": 2.7842, + "step": 493 + }, + { + "epoch": 1.346049046321526, + "grad_norm": 10.881226539611816, + "learning_rate": 8.973660308810173e-06, + "loss": 2.6929, + "step": 494 + }, + { + "epoch": 1.348773841961853, + "grad_norm": 13.029730796813965, + "learning_rate": 8.99182561307902e-06, + "loss": 2.416, + "step": 495 + }, + { + "epoch": 1.3514986376021798, + "grad_norm": 9.454353332519531, + "learning_rate": 9.009990917347866e-06, + "loss": 2.395, + "step": 496 + }, + { + "epoch": 1.354223433242507, + "grad_norm": 10.588221549987793, + "learning_rate": 9.028156221616713e-06, + "loss": 2.3359, + "step": 497 + }, + { + "epoch": 1.3569482288828338, + "grad_norm": 10.198881149291992, + "learning_rate": 9.04632152588556e-06, + "loss": 2.7339, + "step": 498 + }, + { + "epoch": 1.3596730245231607, + "grad_norm": 10.493569374084473, + "learning_rate": 9.064486830154406e-06, + "loss": 2.769, + "step": 499 + }, + { + "epoch": 1.3623978201634879, + "grad_norm": 13.529339790344238, + "learning_rate": 9.082652134423252e-06, + "loss": 2.6699, + "step": 500 + }, + { + "epoch": 1.3651226158038148, + "grad_norm": 12.325822830200195, + "learning_rate": 9.1008174386921e-06, + "loss": 2.5801, + "step": 501 + }, + { + "epoch": 1.3678474114441417, + "grad_norm": 10.57773494720459, + "learning_rate": 9.118982742960946e-06, + "loss": 2.8398, + "step": 502 + }, + { + "epoch": 1.3705722070844686, + "grad_norm": 10.800013542175293, + "learning_rate": 9.137148047229792e-06, + "loss": 2.7549, + "step": 503 + }, + { + "epoch": 1.3732970027247957, + "grad_norm": 12.23603343963623, + "learning_rate": 9.155313351498638e-06, + "loss": 2.625, + "step": 504 + }, + { + "epoch": 1.3760217983651226, + "grad_norm": 10.985679626464844, + "learning_rate": 9.173478655767484e-06, + "loss": 2.5469, + "step": 505 + }, + { + "epoch": 1.3787465940054495, + "grad_norm": 10.75507926940918, + "learning_rate": 9.191643960036332e-06, + "loss": 2.4526, + "step": 506 + }, + { + "epoch": 1.3814713896457766, + "grad_norm": 11.696499824523926, + "learning_rate": 9.209809264305178e-06, + "loss": 2.5278, + "step": 507 + }, + { + "epoch": 1.3841961852861036, + "grad_norm": 12.926390647888184, + "learning_rate": 9.227974568574025e-06, + "loss": 2.752, + "step": 508 + }, + { + "epoch": 1.3869209809264305, + "grad_norm": 9.957062721252441, + "learning_rate": 9.24613987284287e-06, + "loss": 2.6543, + "step": 509 + }, + { + "epoch": 1.3896457765667574, + "grad_norm": 11.469195365905762, + "learning_rate": 9.264305177111717e-06, + "loss": 2.5161, + "step": 510 + }, + { + "epoch": 1.3923705722070845, + "grad_norm": 13.082963943481445, + "learning_rate": 9.282470481380565e-06, + "loss": 2.6533, + "step": 511 + }, + { + "epoch": 1.3950953678474114, + "grad_norm": 8.906614303588867, + "learning_rate": 9.300635785649411e-06, + "loss": 2.4404, + "step": 512 + }, + { + "epoch": 1.3978201634877383, + "grad_norm": 11.93236255645752, + "learning_rate": 9.318801089918257e-06, + "loss": 2.8286, + "step": 513 + }, + { + "epoch": 1.4005449591280654, + "grad_norm": 11.915575981140137, + "learning_rate": 9.336966394187103e-06, + "loss": 2.6279, + "step": 514 + }, + { + "epoch": 1.4032697547683923, + "grad_norm": 10.185914039611816, + "learning_rate": 9.355131698455951e-06, + "loss": 2.6211, + "step": 515 + }, + { + "epoch": 1.4059945504087192, + "grad_norm": 8.432724952697754, + "learning_rate": 9.373297002724796e-06, + "loss": 2.4209, + "step": 516 + }, + { + "epoch": 1.4087193460490464, + "grad_norm": 11.576340675354004, + "learning_rate": 9.391462306993643e-06, + "loss": 2.8804, + "step": 517 + }, + { + "epoch": 1.4114441416893733, + "grad_norm": 14.05243968963623, + "learning_rate": 9.40962761126249e-06, + "loss": 2.749, + "step": 518 + }, + { + "epoch": 1.4141689373297002, + "grad_norm": 13.364104270935059, + "learning_rate": 9.427792915531336e-06, + "loss": 2.5923, + "step": 519 + }, + { + "epoch": 1.4168937329700273, + "grad_norm": 11.277190208435059, + "learning_rate": 9.445958219800182e-06, + "loss": 2.5156, + "step": 520 + }, + { + "epoch": 1.4196185286103542, + "grad_norm": 10.909285545349121, + "learning_rate": 9.464123524069028e-06, + "loss": 2.4678, + "step": 521 + }, + { + "epoch": 1.422343324250681, + "grad_norm": 11.696632385253906, + "learning_rate": 9.482288828337876e-06, + "loss": 2.8662, + "step": 522 + }, + { + "epoch": 1.4250681198910082, + "grad_norm": 11.566356658935547, + "learning_rate": 9.500454132606722e-06, + "loss": 2.5601, + "step": 523 + }, + { + "epoch": 1.4277929155313351, + "grad_norm": 10.315143585205078, + "learning_rate": 9.518619436875568e-06, + "loss": 2.5898, + "step": 524 + }, + { + "epoch": 1.430517711171662, + "grad_norm": 10.548094749450684, + "learning_rate": 9.536784741144414e-06, + "loss": 2.7236, + "step": 525 + }, + { + "epoch": 1.4332425068119892, + "grad_norm": 11.040914535522461, + "learning_rate": 9.554950045413262e-06, + "loss": 2.4258, + "step": 526 + }, + { + "epoch": 1.435967302452316, + "grad_norm": 9.996368408203125, + "learning_rate": 9.573115349682108e-06, + "loss": 2.3677, + "step": 527 + }, + { + "epoch": 1.438692098092643, + "grad_norm": 10.326546669006348, + "learning_rate": 9.591280653950955e-06, + "loss": 2.5425, + "step": 528 + }, + { + "epoch": 1.44141689373297, + "grad_norm": 13.101269721984863, + "learning_rate": 9.6094459582198e-06, + "loss": 2.8428, + "step": 529 + }, + { + "epoch": 1.444141689373297, + "grad_norm": 12.325589179992676, + "learning_rate": 9.627611262488647e-06, + "loss": 2.6436, + "step": 530 + }, + { + "epoch": 1.446866485013624, + "grad_norm": 10.933701515197754, + "learning_rate": 9.645776566757495e-06, + "loss": 2.3931, + "step": 531 + }, + { + "epoch": 1.449591280653951, + "grad_norm": 9.500052452087402, + "learning_rate": 9.66394187102634e-06, + "loss": 2.3345, + "step": 532 + }, + { + "epoch": 1.452316076294278, + "grad_norm": 13.047250747680664, + "learning_rate": 9.682107175295187e-06, + "loss": 2.7686, + "step": 533 + }, + { + "epoch": 1.4550408719346049, + "grad_norm": 12.109979629516602, + "learning_rate": 9.700272479564033e-06, + "loss": 2.501, + "step": 534 + }, + { + "epoch": 1.457765667574932, + "grad_norm": 12.179343223571777, + "learning_rate": 9.718437783832881e-06, + "loss": 2.5972, + "step": 535 + }, + { + "epoch": 1.4604904632152589, + "grad_norm": 9.693185806274414, + "learning_rate": 9.736603088101727e-06, + "loss": 2.437, + "step": 536 + }, + { + "epoch": 1.4632152588555858, + "grad_norm": 12.021675109863281, + "learning_rate": 9.754768392370573e-06, + "loss": 2.7832, + "step": 537 + }, + { + "epoch": 1.465940054495913, + "grad_norm": 13.525501251220703, + "learning_rate": 9.77293369663942e-06, + "loss": 2.7178, + "step": 538 + }, + { + "epoch": 1.4686648501362398, + "grad_norm": 10.672472953796387, + "learning_rate": 9.791099000908266e-06, + "loss": 2.7441, + "step": 539 + }, + { + "epoch": 1.4713896457765667, + "grad_norm": 11.792448043823242, + "learning_rate": 9.809264305177114e-06, + "loss": 2.4883, + "step": 540 + }, + { + "epoch": 1.4741144414168939, + "grad_norm": 11.761456489562988, + "learning_rate": 9.827429609445958e-06, + "loss": 2.3374, + "step": 541 + }, + { + "epoch": 1.4768392370572208, + "grad_norm": 9.928813934326172, + "learning_rate": 9.845594913714806e-06, + "loss": 2.3564, + "step": 542 + }, + { + "epoch": 1.4795640326975477, + "grad_norm": 9.164095878601074, + "learning_rate": 9.863760217983652e-06, + "loss": 2.2881, + "step": 543 + }, + { + "epoch": 1.4822888283378748, + "grad_norm": 8.395923614501953, + "learning_rate": 9.881925522252498e-06, + "loss": 2.5308, + "step": 544 + }, + { + "epoch": 1.4850136239782017, + "grad_norm": 11.917168617248535, + "learning_rate": 9.900090826521344e-06, + "loss": 2.4995, + "step": 545 + }, + { + "epoch": 1.4877384196185286, + "grad_norm": 10.364140510559082, + "learning_rate": 9.918256130790192e-06, + "loss": 2.5234, + "step": 546 + }, + { + "epoch": 1.4904632152588557, + "grad_norm": 9.905284881591797, + "learning_rate": 9.936421435059038e-06, + "loss": 2.6123, + "step": 547 + }, + { + "epoch": 1.4931880108991826, + "grad_norm": 10.341503143310547, + "learning_rate": 9.954586739327885e-06, + "loss": 2.6328, + "step": 548 + }, + { + "epoch": 1.4959128065395095, + "grad_norm": 9.595457077026367, + "learning_rate": 9.97275204359673e-06, + "loss": 2.4976, + "step": 549 + }, + { + "epoch": 1.4986376021798364, + "grad_norm": 8.586732864379883, + "learning_rate": 9.990917347865577e-06, + "loss": 2.3501, + "step": 550 + }, + { + "epoch": 1.5013623978201633, + "grad_norm": 10.91036605834961, + "learning_rate": 1.0009082652134423e-05, + "loss": 2.5, + "step": 551 + }, + { + "epoch": 1.5040871934604905, + "grad_norm": 10.423352241516113, + "learning_rate": 1.002724795640327e-05, + "loss": 2.6089, + "step": 552 + }, + { + "epoch": 1.5068119891008176, + "grad_norm": 9.540590286254883, + "learning_rate": 1.0045413260672117e-05, + "loss": 2.4922, + "step": 553 + }, + { + "epoch": 1.5095367847411443, + "grad_norm": 11.419909477233887, + "learning_rate": 1.0063578564940963e-05, + "loss": 2.6396, + "step": 554 + }, + { + "epoch": 1.5122615803814714, + "grad_norm": 14.756720542907715, + "learning_rate": 1.008174386920981e-05, + "loss": 2.7812, + "step": 555 + }, + { + "epoch": 1.5149863760217985, + "grad_norm": 10.618692398071289, + "learning_rate": 1.0099909173478657e-05, + "loss": 2.5645, + "step": 556 + }, + { + "epoch": 1.5177111716621252, + "grad_norm": 9.123624801635742, + "learning_rate": 1.0118074477747503e-05, + "loss": 2.6064, + "step": 557 + }, + { + "epoch": 1.5204359673024523, + "grad_norm": 10.515607833862305, + "learning_rate": 1.0136239782016351e-05, + "loss": 2.5498, + "step": 558 + }, + { + "epoch": 1.5231607629427792, + "grad_norm": 15.523499488830566, + "learning_rate": 1.0154405086285196e-05, + "loss": 2.4937, + "step": 559 + }, + { + "epoch": 1.5258855585831061, + "grad_norm": 13.398969650268555, + "learning_rate": 1.0172570390554042e-05, + "loss": 2.667, + "step": 560 + }, + { + "epoch": 1.5286103542234333, + "grad_norm": 9.918622970581055, + "learning_rate": 1.0190735694822888e-05, + "loss": 2.4619, + "step": 561 + }, + { + "epoch": 1.5313351498637602, + "grad_norm": 11.595111846923828, + "learning_rate": 1.0208900999091736e-05, + "loss": 2.4878, + "step": 562 + }, + { + "epoch": 1.534059945504087, + "grad_norm": 9.246755599975586, + "learning_rate": 1.0227066303360582e-05, + "loss": 2.5894, + "step": 563 + }, + { + "epoch": 1.5367847411444142, + "grad_norm": 13.432228088378906, + "learning_rate": 1.0245231607629428e-05, + "loss": 2.7573, + "step": 564 + }, + { + "epoch": 1.5395095367847411, + "grad_norm": 10.047687530517578, + "learning_rate": 1.0263396911898276e-05, + "loss": 2.25, + "step": 565 + }, + { + "epoch": 1.542234332425068, + "grad_norm": 13.986072540283203, + "learning_rate": 1.0281562216167122e-05, + "loss": 2.6641, + "step": 566 + }, + { + "epoch": 1.5449591280653951, + "grad_norm": 11.353102684020996, + "learning_rate": 1.0299727520435968e-05, + "loss": 2.6831, + "step": 567 + }, + { + "epoch": 1.547683923705722, + "grad_norm": 11.442963600158691, + "learning_rate": 1.0317892824704815e-05, + "loss": 2.3428, + "step": 568 + }, + { + "epoch": 1.550408719346049, + "grad_norm": 10.155078887939453, + "learning_rate": 1.033605812897366e-05, + "loss": 2.4673, + "step": 569 + }, + { + "epoch": 1.553133514986376, + "grad_norm": 9.572172164916992, + "learning_rate": 1.0354223433242507e-05, + "loss": 2.606, + "step": 570 + }, + { + "epoch": 1.555858310626703, + "grad_norm": 11.651671409606934, + "learning_rate": 1.0372388737511355e-05, + "loss": 2.5181, + "step": 571 + }, + { + "epoch": 1.55858310626703, + "grad_norm": 10.545559883117676, + "learning_rate": 1.0390554041780201e-05, + "loss": 2.3989, + "step": 572 + }, + { + "epoch": 1.561307901907357, + "grad_norm": 11.466548919677734, + "learning_rate": 1.0408719346049047e-05, + "loss": 2.5503, + "step": 573 + }, + { + "epoch": 1.564032697547684, + "grad_norm": 11.771925926208496, + "learning_rate": 1.0426884650317895e-05, + "loss": 2.6226, + "step": 574 + }, + { + "epoch": 1.5667574931880108, + "grad_norm": 9.880620956420898, + "learning_rate": 1.0445049954586741e-05, + "loss": 2.4404, + "step": 575 + }, + { + "epoch": 1.569482288828338, + "grad_norm": 11.97048568725586, + "learning_rate": 1.0463215258855586e-05, + "loss": 2.6875, + "step": 576 + }, + { + "epoch": 1.5722070844686649, + "grad_norm": 13.414999008178711, + "learning_rate": 1.0481380563124432e-05, + "loss": 2.6855, + "step": 577 + }, + { + "epoch": 1.5749318801089918, + "grad_norm": 11.781789779663086, + "learning_rate": 1.049954586739328e-05, + "loss": 2.4966, + "step": 578 + }, + { + "epoch": 1.577656675749319, + "grad_norm": 18.100326538085938, + "learning_rate": 1.0517711171662126e-05, + "loss": 2.6426, + "step": 579 + }, + { + "epoch": 1.5803814713896458, + "grad_norm": 11.263434410095215, + "learning_rate": 1.0535876475930974e-05, + "loss": 2.5903, + "step": 580 + }, + { + "epoch": 1.5831062670299727, + "grad_norm": 11.495070457458496, + "learning_rate": 1.055404178019982e-05, + "loss": 2.4575, + "step": 581 + }, + { + "epoch": 1.5858310626702998, + "grad_norm": 9.964534759521484, + "learning_rate": 1.0572207084468666e-05, + "loss": 2.5522, + "step": 582 + }, + { + "epoch": 1.5885558583106267, + "grad_norm": 11.702447891235352, + "learning_rate": 1.0590372388737514e-05, + "loss": 2.3389, + "step": 583 + }, + { + "epoch": 1.5912806539509536, + "grad_norm": 9.268019676208496, + "learning_rate": 1.0608537693006358e-05, + "loss": 2.269, + "step": 584 + }, + { + "epoch": 1.5940054495912808, + "grad_norm": 15.74026870727539, + "learning_rate": 1.0626702997275204e-05, + "loss": 2.3662, + "step": 585 + }, + { + "epoch": 1.5967302452316077, + "grad_norm": 10.973413467407227, + "learning_rate": 1.064486830154405e-05, + "loss": 2.6699, + "step": 586 + }, + { + "epoch": 1.5994550408719346, + "grad_norm": 13.940545082092285, + "learning_rate": 1.0663033605812898e-05, + "loss": 2.668, + "step": 587 + }, + { + "epoch": 1.6021798365122617, + "grad_norm": 9.798370361328125, + "learning_rate": 1.0681198910081745e-05, + "loss": 2.5801, + "step": 588 + }, + { + "epoch": 1.6049046321525886, + "grad_norm": 10.114641189575195, + "learning_rate": 1.069936421435059e-05, + "loss": 2.3628, + "step": 589 + }, + { + "epoch": 1.6076294277929155, + "grad_norm": 13.61198616027832, + "learning_rate": 1.0717529518619439e-05, + "loss": 2.3149, + "step": 590 + }, + { + "epoch": 1.6103542234332426, + "grad_norm": 11.84930419921875, + "learning_rate": 1.0735694822888285e-05, + "loss": 2.1602, + "step": 591 + }, + { + "epoch": 1.6130790190735693, + "grad_norm": 11.23861026763916, + "learning_rate": 1.075386012715713e-05, + "loss": 2.5112, + "step": 592 + }, + { + "epoch": 1.6158038147138964, + "grad_norm": 12.049510955810547, + "learning_rate": 1.0772025431425977e-05, + "loss": 2.499, + "step": 593 + }, + { + "epoch": 1.6185286103542236, + "grad_norm": 11.305673599243164, + "learning_rate": 1.0790190735694823e-05, + "loss": 2.4512, + "step": 594 + }, + { + "epoch": 1.6212534059945503, + "grad_norm": 8.980688095092773, + "learning_rate": 1.080835603996367e-05, + "loss": 2.2471, + "step": 595 + }, + { + "epoch": 1.6239782016348774, + "grad_norm": 13.167588233947754, + "learning_rate": 1.0826521344232517e-05, + "loss": 2.4492, + "step": 596 + }, + { + "epoch": 1.6267029972752045, + "grad_norm": 13.362232208251953, + "learning_rate": 1.0844686648501363e-05, + "loss": 2.3589, + "step": 597 + }, + { + "epoch": 1.6294277929155312, + "grad_norm": 13.432881355285645, + "learning_rate": 1.086285195277021e-05, + "loss": 2.3999, + "step": 598 + }, + { + "epoch": 1.6321525885558583, + "grad_norm": 10.197798728942871, + "learning_rate": 1.0881017257039057e-05, + "loss": 2.4595, + "step": 599 + }, + { + "epoch": 1.6348773841961854, + "grad_norm": 12.196104049682617, + "learning_rate": 1.0899182561307904e-05, + "loss": 2.5488, + "step": 600 + }, + { + "epoch": 1.6376021798365121, + "grad_norm": 10.602243423461914, + "learning_rate": 1.0917347865576748e-05, + "loss": 2.6128, + "step": 601 + }, + { + "epoch": 1.6403269754768393, + "grad_norm": 11.960326194763184, + "learning_rate": 1.0935513169845596e-05, + "loss": 2.6465, + "step": 602 + }, + { + "epoch": 1.6430517711171662, + "grad_norm": 12.77395248413086, + "learning_rate": 1.0953678474114442e-05, + "loss": 2.7295, + "step": 603 + }, + { + "epoch": 1.645776566757493, + "grad_norm": 14.705750465393066, + "learning_rate": 1.0971843778383288e-05, + "loss": 2.5347, + "step": 604 + }, + { + "epoch": 1.6485013623978202, + "grad_norm": 9.935203552246094, + "learning_rate": 1.0990009082652136e-05, + "loss": 2.1514, + "step": 605 + }, + { + "epoch": 1.651226158038147, + "grad_norm": 11.95473575592041, + "learning_rate": 1.1008174386920982e-05, + "loss": 2.5923, + "step": 606 + }, + { + "epoch": 1.653950953678474, + "grad_norm": 14.375449180603027, + "learning_rate": 1.1026339691189828e-05, + "loss": 2.6475, + "step": 607 + }, + { + "epoch": 1.6566757493188011, + "grad_norm": 10.64272689819336, + "learning_rate": 1.1044504995458676e-05, + "loss": 2.4312, + "step": 608 + }, + { + "epoch": 1.659400544959128, + "grad_norm": 12.748344421386719, + "learning_rate": 1.106267029972752e-05, + "loss": 2.4067, + "step": 609 + }, + { + "epoch": 1.662125340599455, + "grad_norm": 10.088484764099121, + "learning_rate": 1.1080835603996367e-05, + "loss": 2.4624, + "step": 610 + }, + { + "epoch": 1.664850136239782, + "grad_norm": 11.537372589111328, + "learning_rate": 1.1099000908265215e-05, + "loss": 2.3145, + "step": 611 + }, + { + "epoch": 1.667574931880109, + "grad_norm": 10.860895156860352, + "learning_rate": 1.1117166212534061e-05, + "loss": 2.4912, + "step": 612 + }, + { + "epoch": 1.6702997275204359, + "grad_norm": 11.544546127319336, + "learning_rate": 1.1135331516802907e-05, + "loss": 2.6802, + "step": 613 + }, + { + "epoch": 1.673024523160763, + "grad_norm": 12.035743713378906, + "learning_rate": 1.1153496821071755e-05, + "loss": 2.3105, + "step": 614 + }, + { + "epoch": 1.67574931880109, + "grad_norm": 11.289690971374512, + "learning_rate": 1.1171662125340601e-05, + "loss": 2.3843, + "step": 615 + }, + { + "epoch": 1.6784741144414168, + "grad_norm": 10.212812423706055, + "learning_rate": 1.1189827429609447e-05, + "loss": 2.7515, + "step": 616 + }, + { + "epoch": 1.681198910081744, + "grad_norm": 11.834221839904785, + "learning_rate": 1.1207992733878292e-05, + "loss": 2.6309, + "step": 617 + }, + { + "epoch": 1.6839237057220708, + "grad_norm": 10.995518684387207, + "learning_rate": 1.122615803814714e-05, + "loss": 2.4917, + "step": 618 + }, + { + "epoch": 1.6866485013623977, + "grad_norm": 11.77338695526123, + "learning_rate": 1.1244323342415986e-05, + "loss": 2.6064, + "step": 619 + }, + { + "epoch": 1.6893732970027249, + "grad_norm": 11.592185020446777, + "learning_rate": 1.1262488646684832e-05, + "loss": 2.4995, + "step": 620 + }, + { + "epoch": 1.6920980926430518, + "grad_norm": 10.184931755065918, + "learning_rate": 1.128065395095368e-05, + "loss": 2.3975, + "step": 621 + }, + { + "epoch": 1.6948228882833787, + "grad_norm": 9.818941116333008, + "learning_rate": 1.1298819255222526e-05, + "loss": 2.5396, + "step": 622 + }, + { + "epoch": 1.6975476839237058, + "grad_norm": 12.17223834991455, + "learning_rate": 1.1316984559491374e-05, + "loss": 2.4321, + "step": 623 + }, + { + "epoch": 1.7002724795640327, + "grad_norm": 10.2310152053833, + "learning_rate": 1.133514986376022e-05, + "loss": 2.3984, + "step": 624 + }, + { + "epoch": 1.7029972752043596, + "grad_norm": 11.413909912109375, + "learning_rate": 1.1353315168029066e-05, + "loss": 2.5557, + "step": 625 + }, + { + "epoch": 1.7057220708446867, + "grad_norm": 10.546042442321777, + "learning_rate": 1.137148047229791e-05, + "loss": 2.6455, + "step": 626 + }, + { + "epoch": 1.7084468664850136, + "grad_norm": 13.648941040039062, + "learning_rate": 1.1389645776566758e-05, + "loss": 2.5625, + "step": 627 + }, + { + "epoch": 1.7111716621253406, + "grad_norm": 14.775775909423828, + "learning_rate": 1.1407811080835605e-05, + "loss": 2.4966, + "step": 628 + }, + { + "epoch": 1.7138964577656677, + "grad_norm": 20.476844787597656, + "learning_rate": 1.142597638510445e-05, + "loss": 2.479, + "step": 629 + }, + { + "epoch": 1.7166212534059946, + "grad_norm": 10.364046096801758, + "learning_rate": 1.1444141689373299e-05, + "loss": 2.6875, + "step": 630 + }, + { + "epoch": 1.7193460490463215, + "grad_norm": 8.582182884216309, + "learning_rate": 1.1462306993642145e-05, + "loss": 2.144, + "step": 631 + }, + { + "epoch": 1.7220708446866486, + "grad_norm": 10.024995803833008, + "learning_rate": 1.1480472297910991e-05, + "loss": 2.4619, + "step": 632 + }, + { + "epoch": 1.7247956403269755, + "grad_norm": 8.943358421325684, + "learning_rate": 1.1498637602179839e-05, + "loss": 2.4033, + "step": 633 + }, + { + "epoch": 1.7275204359673024, + "grad_norm": 12.314430236816406, + "learning_rate": 1.1516802906448683e-05, + "loss": 2.3384, + "step": 634 + }, + { + "epoch": 1.7302452316076296, + "grad_norm": 11.263984680175781, + "learning_rate": 1.153496821071753e-05, + "loss": 2.6621, + "step": 635 + }, + { + "epoch": 1.7329700272479565, + "grad_norm": 11.925774574279785, + "learning_rate": 1.1553133514986377e-05, + "loss": 2.1382, + "step": 636 + }, + { + "epoch": 1.7356948228882834, + "grad_norm": 10.014432907104492, + "learning_rate": 1.1571298819255223e-05, + "loss": 2.1636, + "step": 637 + }, + { + "epoch": 1.7384196185286105, + "grad_norm": 11.657225608825684, + "learning_rate": 1.158946412352407e-05, + "loss": 2.458, + "step": 638 + }, + { + "epoch": 1.7411444141689372, + "grad_norm": 20.94296646118164, + "learning_rate": 1.1607629427792917e-05, + "loss": 2.6333, + "step": 639 + }, + { + "epoch": 1.7438692098092643, + "grad_norm": 12.757229804992676, + "learning_rate": 1.1625794732061764e-05, + "loss": 2.3477, + "step": 640 + }, + { + "epoch": 1.7465940054495914, + "grad_norm": 12.054852485656738, + "learning_rate": 1.164396003633061e-05, + "loss": 2.4404, + "step": 641 + }, + { + "epoch": 1.749318801089918, + "grad_norm": 14.641657829284668, + "learning_rate": 1.1662125340599454e-05, + "loss": 2.3457, + "step": 642 + }, + { + "epoch": 1.7520435967302452, + "grad_norm": 10.225979804992676, + "learning_rate": 1.1680290644868302e-05, + "loss": 2.481, + "step": 643 + }, + { + "epoch": 1.7547683923705724, + "grad_norm": 13.0012788772583, + "learning_rate": 1.1698455949137148e-05, + "loss": 2.375, + "step": 644 + }, + { + "epoch": 1.757493188010899, + "grad_norm": 12.893733978271484, + "learning_rate": 1.1716621253405996e-05, + "loss": 2.7119, + "step": 645 + }, + { + "epoch": 1.7602179836512262, + "grad_norm": 10.805425643920898, + "learning_rate": 1.1734786557674842e-05, + "loss": 2.4614, + "step": 646 + }, + { + "epoch": 1.7629427792915533, + "grad_norm": 11.27730941772461, + "learning_rate": 1.1752951861943688e-05, + "loss": 2.4028, + "step": 647 + }, + { + "epoch": 1.76566757493188, + "grad_norm": 10.970818519592285, + "learning_rate": 1.1771117166212536e-05, + "loss": 2.4282, + "step": 648 + }, + { + "epoch": 1.768392370572207, + "grad_norm": 10.74846076965332, + "learning_rate": 1.1789282470481382e-05, + "loss": 2.2319, + "step": 649 + }, + { + "epoch": 1.771117166212534, + "grad_norm": 11.724044799804688, + "learning_rate": 1.1807447774750227e-05, + "loss": 2.583, + "step": 650 + }, + { + "epoch": 1.773841961852861, + "grad_norm": 11.138653755187988, + "learning_rate": 1.1825613079019073e-05, + "loss": 2.3076, + "step": 651 + }, + { + "epoch": 1.776566757493188, + "grad_norm": 14.40742015838623, + "learning_rate": 1.1843778383287921e-05, + "loss": 2.4297, + "step": 652 + }, + { + "epoch": 1.779291553133515, + "grad_norm": 10.167417526245117, + "learning_rate": 1.1861943687556767e-05, + "loss": 2.4209, + "step": 653 + }, + { + "epoch": 1.7820163487738419, + "grad_norm": 11.244752883911133, + "learning_rate": 1.1880108991825613e-05, + "loss": 2.3984, + "step": 654 + }, + { + "epoch": 1.784741144414169, + "grad_norm": 7.9195685386657715, + "learning_rate": 1.1898274296094461e-05, + "loss": 2.1392, + "step": 655 + }, + { + "epoch": 1.7874659400544959, + "grad_norm": 12.2032470703125, + "learning_rate": 1.1916439600363307e-05, + "loss": 2.3579, + "step": 656 + }, + { + "epoch": 1.7901907356948228, + "grad_norm": 9.648261070251465, + "learning_rate": 1.1934604904632155e-05, + "loss": 2.2925, + "step": 657 + }, + { + "epoch": 1.79291553133515, + "grad_norm": 12.435829162597656, + "learning_rate": 1.1952770208901001e-05, + "loss": 2.5117, + "step": 658 + }, + { + "epoch": 1.7956403269754768, + "grad_norm": 13.42502498626709, + "learning_rate": 1.1970935513169846e-05, + "loss": 2.6919, + "step": 659 + }, + { + "epoch": 1.7983651226158037, + "grad_norm": 13.266587257385254, + "learning_rate": 1.1989100817438692e-05, + "loss": 2.3936, + "step": 660 + }, + { + "epoch": 1.8010899182561309, + "grad_norm": 11.673394203186035, + "learning_rate": 1.200726612170754e-05, + "loss": 2.2725, + "step": 661 + }, + { + "epoch": 1.8038147138964578, + "grad_norm": 10.024274826049805, + "learning_rate": 1.2025431425976386e-05, + "loss": 2.4785, + "step": 662 + }, + { + "epoch": 1.8065395095367847, + "grad_norm": 8.943089485168457, + "learning_rate": 1.2043596730245232e-05, + "loss": 2.3887, + "step": 663 + }, + { + "epoch": 1.8092643051771118, + "grad_norm": 12.43687629699707, + "learning_rate": 1.206176203451408e-05, + "loss": 2.355, + "step": 664 + }, + { + "epoch": 1.8119891008174387, + "grad_norm": 8.887104988098145, + "learning_rate": 1.2079927338782926e-05, + "loss": 2.3379, + "step": 665 + }, + { + "epoch": 1.8147138964577656, + "grad_norm": 16.104576110839844, + "learning_rate": 1.2098092643051772e-05, + "loss": 2.4424, + "step": 666 + }, + { + "epoch": 1.8174386920980927, + "grad_norm": 15.355511665344238, + "learning_rate": 1.2116257947320618e-05, + "loss": 2.4673, + "step": 667 + }, + { + "epoch": 1.8201634877384196, + "grad_norm": 18.361045837402344, + "learning_rate": 1.2134423251589465e-05, + "loss": 2.6831, + "step": 668 + }, + { + "epoch": 1.8228882833787465, + "grad_norm": 9.65218448638916, + "learning_rate": 1.215258855585831e-05, + "loss": 2.4902, + "step": 669 + }, + { + "epoch": 1.8256130790190737, + "grad_norm": 10.684483528137207, + "learning_rate": 1.2170753860127159e-05, + "loss": 2.3867, + "step": 670 + }, + { + "epoch": 1.8283378746594006, + "grad_norm": 9.706910133361816, + "learning_rate": 1.2188919164396005e-05, + "loss": 2.2607, + "step": 671 + }, + { + "epoch": 1.8310626702997275, + "grad_norm": 11.646918296813965, + "learning_rate": 1.2207084468664851e-05, + "loss": 2.2642, + "step": 672 + }, + { + "epoch": 1.8337874659400546, + "grad_norm": 11.801918029785156, + "learning_rate": 1.2225249772933699e-05, + "loss": 2.3691, + "step": 673 + }, + { + "epoch": 1.8365122615803815, + "grad_norm": 11.345173835754395, + "learning_rate": 1.2243415077202545e-05, + "loss": 2.4072, + "step": 674 + }, + { + "epoch": 1.8392370572207084, + "grad_norm": 11.49028205871582, + "learning_rate": 1.226158038147139e-05, + "loss": 2.4395, + "step": 675 + }, + { + "epoch": 1.8419618528610355, + "grad_norm": 11.581648826599121, + "learning_rate": 1.2279745685740236e-05, + "loss": 2.1338, + "step": 676 + }, + { + "epoch": 1.8446866485013624, + "grad_norm": 9.466208457946777, + "learning_rate": 1.2297910990009083e-05, + "loss": 2.29, + "step": 677 + }, + { + "epoch": 1.8474114441416893, + "grad_norm": 10.945378303527832, + "learning_rate": 1.231607629427793e-05, + "loss": 2.4863, + "step": 678 + }, + { + "epoch": 1.8501362397820165, + "grad_norm": 11.229761123657227, + "learning_rate": 1.2334241598546777e-05, + "loss": 2.4067, + "step": 679 + }, + { + "epoch": 1.8528610354223434, + "grad_norm": 13.484183311462402, + "learning_rate": 1.2352406902815624e-05, + "loss": 2.4678, + "step": 680 + }, + { + "epoch": 1.8555858310626703, + "grad_norm": 12.50755500793457, + "learning_rate": 1.237057220708447e-05, + "loss": 2.7646, + "step": 681 + }, + { + "epoch": 1.8583106267029974, + "grad_norm": 12.71037769317627, + "learning_rate": 1.2388737511353318e-05, + "loss": 2.2935, + "step": 682 + }, + { + "epoch": 1.861035422343324, + "grad_norm": 9.98797607421875, + "learning_rate": 1.2406902815622162e-05, + "loss": 2.1328, + "step": 683 + }, + { + "epoch": 1.8637602179836512, + "grad_norm": 10.682023048400879, + "learning_rate": 1.2425068119891008e-05, + "loss": 2.1211, + "step": 684 + }, + { + "epoch": 1.8664850136239783, + "grad_norm": 10.15453815460205, + "learning_rate": 1.2443233424159854e-05, + "loss": 2.3521, + "step": 685 + }, + { + "epoch": 1.869209809264305, + "grad_norm": 10.65381908416748, + "learning_rate": 1.2461398728428702e-05, + "loss": 2.3804, + "step": 686 + }, + { + "epoch": 1.8719346049046321, + "grad_norm": 12.174696922302246, + "learning_rate": 1.2479564032697548e-05, + "loss": 2.4795, + "step": 687 + }, + { + "epoch": 1.8746594005449593, + "grad_norm": 10.093709945678711, + "learning_rate": 1.2497729336966395e-05, + "loss": 2.3071, + "step": 688 + }, + { + "epoch": 1.877384196185286, + "grad_norm": 9.991334915161133, + "learning_rate": 1.2515894641235242e-05, + "loss": 2.2856, + "step": 689 + }, + { + "epoch": 1.880108991825613, + "grad_norm": 10.812753677368164, + "learning_rate": 1.2534059945504089e-05, + "loss": 2.314, + "step": 690 + }, + { + "epoch": 1.8828337874659402, + "grad_norm": 10.286032676696777, + "learning_rate": 1.2552225249772936e-05, + "loss": 2.3818, + "step": 691 + }, + { + "epoch": 1.885558583106267, + "grad_norm": 9.558748245239258, + "learning_rate": 1.2570390554041781e-05, + "loss": 2.2256, + "step": 692 + }, + { + "epoch": 1.888283378746594, + "grad_norm": 12.837057113647461, + "learning_rate": 1.2588555858310627e-05, + "loss": 2.5161, + "step": 693 + }, + { + "epoch": 1.891008174386921, + "grad_norm": 12.383069038391113, + "learning_rate": 1.2606721162579473e-05, + "loss": 2.6084, + "step": 694 + }, + { + "epoch": 1.8937329700272478, + "grad_norm": 12.400851249694824, + "learning_rate": 1.2624886466848321e-05, + "loss": 2.2778, + "step": 695 + }, + { + "epoch": 1.896457765667575, + "grad_norm": 9.855324745178223, + "learning_rate": 1.2643051771117167e-05, + "loss": 2.3657, + "step": 696 + }, + { + "epoch": 1.8991825613079019, + "grad_norm": 12.803309440612793, + "learning_rate": 1.2661217075386013e-05, + "loss": 2.3423, + "step": 697 + }, + { + "epoch": 1.9019073569482288, + "grad_norm": 11.03612232208252, + "learning_rate": 1.2679382379654861e-05, + "loss": 2.583, + "step": 698 + }, + { + "epoch": 1.904632152588556, + "grad_norm": 10.573287010192871, + "learning_rate": 1.2697547683923707e-05, + "loss": 2.5322, + "step": 699 + }, + { + "epoch": 1.9073569482288828, + "grad_norm": 11.009425163269043, + "learning_rate": 1.2715712988192552e-05, + "loss": 2.4336, + "step": 700 + }, + { + "epoch": 1.9100817438692097, + "grad_norm": 10.598993301391602, + "learning_rate": 1.27338782924614e-05, + "loss": 2.2759, + "step": 701 + }, + { + "epoch": 1.9128065395095368, + "grad_norm": 10.426955223083496, + "learning_rate": 1.2752043596730246e-05, + "loss": 2.1611, + "step": 702 + }, + { + "epoch": 1.9155313351498637, + "grad_norm": 10.571686744689941, + "learning_rate": 1.2770208900999092e-05, + "loss": 2.3501, + "step": 703 + }, + { + "epoch": 1.9182561307901906, + "grad_norm": 13.263895988464355, + "learning_rate": 1.278837420526794e-05, + "loss": 2.2925, + "step": 704 + }, + { + "epoch": 1.9209809264305178, + "grad_norm": 9.810479164123535, + "learning_rate": 1.2806539509536786e-05, + "loss": 2.5063, + "step": 705 + }, + { + "epoch": 1.9237057220708447, + "grad_norm": 11.980880737304688, + "learning_rate": 1.2824704813805632e-05, + "loss": 2.4922, + "step": 706 + }, + { + "epoch": 1.9264305177111716, + "grad_norm": 11.019759178161621, + "learning_rate": 1.284287011807448e-05, + "loss": 2.3877, + "step": 707 + }, + { + "epoch": 1.9291553133514987, + "grad_norm": 9.92830753326416, + "learning_rate": 1.2861035422343325e-05, + "loss": 2.0889, + "step": 708 + }, + { + "epoch": 1.9318801089918256, + "grad_norm": 12.595752716064453, + "learning_rate": 1.287920072661217e-05, + "loss": 2.249, + "step": 709 + }, + { + "epoch": 1.9346049046321525, + "grad_norm": 12.465704917907715, + "learning_rate": 1.2897366030881019e-05, + "loss": 2.2461, + "step": 710 + }, + { + "epoch": 1.9373297002724796, + "grad_norm": 9.215608596801758, + "learning_rate": 1.2915531335149865e-05, + "loss": 2.208, + "step": 711 + }, + { + "epoch": 1.9400544959128065, + "grad_norm": 9.664246559143066, + "learning_rate": 1.2933696639418711e-05, + "loss": 2.1519, + "step": 712 + }, + { + "epoch": 1.9427792915531334, + "grad_norm": 10.005195617675781, + "learning_rate": 1.2951861943687559e-05, + "loss": 2.5396, + "step": 713 + }, + { + "epoch": 1.9455040871934606, + "grad_norm": 12.706524848937988, + "learning_rate": 1.2970027247956405e-05, + "loss": 2.3086, + "step": 714 + }, + { + "epoch": 1.9482288828337875, + "grad_norm": 10.416522979736328, + "learning_rate": 1.2988192552225251e-05, + "loss": 2.3281, + "step": 715 + }, + { + "epoch": 1.9509536784741144, + "grad_norm": 8.217157363891602, + "learning_rate": 1.3006357856494099e-05, + "loss": 2.3672, + "step": 716 + }, + { + "epoch": 1.9536784741144415, + "grad_norm": 11.214954376220703, + "learning_rate": 1.3024523160762943e-05, + "loss": 2.2183, + "step": 717 + }, + { + "epoch": 1.9564032697547684, + "grad_norm": 11.53817081451416, + "learning_rate": 1.304268846503179e-05, + "loss": 2.2422, + "step": 718 + }, + { + "epoch": 1.9591280653950953, + "grad_norm": 8.654513359069824, + "learning_rate": 1.3060853769300636e-05, + "loss": 2.4492, + "step": 719 + }, + { + "epoch": 1.9618528610354224, + "grad_norm": 12.240690231323242, + "learning_rate": 1.3079019073569484e-05, + "loss": 2.3838, + "step": 720 + }, + { + "epoch": 1.9645776566757494, + "grad_norm": 10.855642318725586, + "learning_rate": 1.309718437783833e-05, + "loss": 2.4893, + "step": 721 + }, + { + "epoch": 1.9673024523160763, + "grad_norm": 10.994941711425781, + "learning_rate": 1.3115349682107178e-05, + "loss": 2.3906, + "step": 722 + }, + { + "epoch": 1.9700272479564034, + "grad_norm": 10.279187202453613, + "learning_rate": 1.3133514986376024e-05, + "loss": 2.1851, + "step": 723 + }, + { + "epoch": 1.9727520435967303, + "grad_norm": 10.290560722351074, + "learning_rate": 1.315168029064487e-05, + "loss": 2.2305, + "step": 724 + }, + { + "epoch": 1.9754768392370572, + "grad_norm": 8.804238319396973, + "learning_rate": 1.3169845594913714e-05, + "loss": 2.3457, + "step": 725 + }, + { + "epoch": 1.9782016348773843, + "grad_norm": 20.067276000976562, + "learning_rate": 1.3188010899182562e-05, + "loss": 2.3394, + "step": 726 + }, + { + "epoch": 1.9809264305177112, + "grad_norm": 8.709736824035645, + "learning_rate": 1.3206176203451408e-05, + "loss": 2.147, + "step": 727 + }, + { + "epoch": 1.9836512261580381, + "grad_norm": 9.862410545349121, + "learning_rate": 1.3224341507720255e-05, + "loss": 2.3857, + "step": 728 + }, + { + "epoch": 1.9863760217983653, + "grad_norm": 13.235732078552246, + "learning_rate": 1.3242506811989102e-05, + "loss": 2.2124, + "step": 729 + }, + { + "epoch": 1.989100817438692, + "grad_norm": 10.813942909240723, + "learning_rate": 1.3260672116257949e-05, + "loss": 2.5288, + "step": 730 + }, + { + "epoch": 1.991825613079019, + "grad_norm": 10.577856063842773, + "learning_rate": 1.3278837420526795e-05, + "loss": 2.1875, + "step": 731 + }, + { + "epoch": 1.9945504087193462, + "grad_norm": 11.54691219329834, + "learning_rate": 1.3297002724795643e-05, + "loss": 2.4673, + "step": 732 + }, + { + "epoch": 1.9972752043596729, + "grad_norm": 11.1182279586792, + "learning_rate": 1.3315168029064487e-05, + "loss": 2.2476, + "step": 733 + }, + { + "epoch": 2.0, + "grad_norm": 10.508315086364746, + "learning_rate": 1.3333333333333333e-05, + "loss": 2.2329, + "step": 734 + }, + { + "epoch": 2.002724795640327, + "grad_norm": 9.416644096374512, + "learning_rate": 1.3351498637602181e-05, + "loss": 2.3159, + "step": 735 + }, + { + "epoch": 2.005449591280654, + "grad_norm": 11.600786209106445, + "learning_rate": 1.3369663941871027e-05, + "loss": 2.3403, + "step": 736 + }, + { + "epoch": 2.008174386920981, + "grad_norm": 10.866864204406738, + "learning_rate": 1.3387829246139873e-05, + "loss": 2.3638, + "step": 737 + }, + { + "epoch": 2.010899182561308, + "grad_norm": 9.856853485107422, + "learning_rate": 1.3405994550408721e-05, + "loss": 2.1553, + "step": 738 + }, + { + "epoch": 2.0136239782016347, + "grad_norm": 12.677173614501953, + "learning_rate": 1.3424159854677567e-05, + "loss": 2.3608, + "step": 739 + }, + { + "epoch": 2.016348773841962, + "grad_norm": 13.566946983337402, + "learning_rate": 1.3442325158946414e-05, + "loss": 2.2056, + "step": 740 + }, + { + "epoch": 2.019073569482289, + "grad_norm": 11.25836181640625, + "learning_rate": 1.3460490463215258e-05, + "loss": 2.2539, + "step": 741 + }, + { + "epoch": 2.0217983651226157, + "grad_norm": 9.697957992553711, + "learning_rate": 1.3478655767484106e-05, + "loss": 2.1094, + "step": 742 + }, + { + "epoch": 2.024523160762943, + "grad_norm": 11.091008186340332, + "learning_rate": 1.3496821071752952e-05, + "loss": 2.3203, + "step": 743 + }, + { + "epoch": 2.02724795640327, + "grad_norm": 8.965106010437012, + "learning_rate": 1.35149863760218e-05, + "loss": 2.1367, + "step": 744 + }, + { + "epoch": 2.0299727520435966, + "grad_norm": 9.569092750549316, + "learning_rate": 1.3533151680290646e-05, + "loss": 2.2056, + "step": 745 + }, + { + "epoch": 2.0326975476839237, + "grad_norm": 11.248583793640137, + "learning_rate": 1.3551316984559492e-05, + "loss": 2.2119, + "step": 746 + }, + { + "epoch": 2.035422343324251, + "grad_norm": 10.267621994018555, + "learning_rate": 1.356948228882834e-05, + "loss": 2.0845, + "step": 747 + }, + { + "epoch": 2.0381471389645776, + "grad_norm": 13.887840270996094, + "learning_rate": 1.3587647593097186e-05, + "loss": 2.1733, + "step": 748 + }, + { + "epoch": 2.0408719346049047, + "grad_norm": 17.721181869506836, + "learning_rate": 1.3605812897366032e-05, + "loss": 2.3569, + "step": 749 + }, + { + "epoch": 2.043596730245232, + "grad_norm": 15.872747421264648, + "learning_rate": 1.3623978201634877e-05, + "loss": 2.3384, + "step": 750 + }, + { + "epoch": 2.0463215258855585, + "grad_norm": 12.283638000488281, + "learning_rate": 1.3642143505903725e-05, + "loss": 2.1323, + "step": 751 + }, + { + "epoch": 2.0490463215258856, + "grad_norm": 11.33743667602539, + "learning_rate": 1.3660308810172571e-05, + "loss": 2.3105, + "step": 752 + }, + { + "epoch": 2.0517711171662127, + "grad_norm": 9.7986421585083, + "learning_rate": 1.3678474114441417e-05, + "loss": 2.1245, + "step": 753 + }, + { + "epoch": 2.0544959128065394, + "grad_norm": 14.31638240814209, + "learning_rate": 1.3696639418710265e-05, + "loss": 2.5381, + "step": 754 + }, + { + "epoch": 2.0572207084468666, + "grad_norm": 10.74636459350586, + "learning_rate": 1.3714804722979111e-05, + "loss": 2.2754, + "step": 755 + }, + { + "epoch": 2.0599455040871932, + "grad_norm": 11.772139549255371, + "learning_rate": 1.3732970027247959e-05, + "loss": 2.3711, + "step": 756 + }, + { + "epoch": 2.0626702997275204, + "grad_norm": 10.804475784301758, + "learning_rate": 1.3751135331516805e-05, + "loss": 2.3838, + "step": 757 + }, + { + "epoch": 2.0653950953678475, + "grad_norm": 11.526287078857422, + "learning_rate": 1.376930063578565e-05, + "loss": 2.1738, + "step": 758 + }, + { + "epoch": 2.068119891008174, + "grad_norm": 11.430591583251953, + "learning_rate": 1.3787465940054496e-05, + "loss": 2.27, + "step": 759 + }, + { + "epoch": 2.0708446866485013, + "grad_norm": 90.60478210449219, + "learning_rate": 1.3805631244323344e-05, + "loss": 2.106, + "step": 760 + }, + { + "epoch": 2.0735694822888284, + "grad_norm": 12.474735260009766, + "learning_rate": 1.382379654859219e-05, + "loss": 2.2876, + "step": 761 + }, + { + "epoch": 2.076294277929155, + "grad_norm": 13.374337196350098, + "learning_rate": 1.3841961852861036e-05, + "loss": 2.4697, + "step": 762 + }, + { + "epoch": 2.0790190735694822, + "grad_norm": 13.265146255493164, + "learning_rate": 1.3860127157129884e-05, + "loss": 2.2998, + "step": 763 + }, + { + "epoch": 2.0817438692098094, + "grad_norm": 11.40599536895752, + "learning_rate": 1.387829246139873e-05, + "loss": 2.2158, + "step": 764 + }, + { + "epoch": 2.084468664850136, + "grad_norm": 12.681764602661133, + "learning_rate": 1.3896457765667576e-05, + "loss": 2.1958, + "step": 765 + }, + { + "epoch": 2.087193460490463, + "grad_norm": 15.120609283447266, + "learning_rate": 1.3914623069936422e-05, + "loss": 2.582, + "step": 766 + }, + { + "epoch": 2.0899182561307903, + "grad_norm": 20.23128318786621, + "learning_rate": 1.3932788374205268e-05, + "loss": 2.5552, + "step": 767 + }, + { + "epoch": 2.092643051771117, + "grad_norm": 20.257232666015625, + "learning_rate": 1.3950953678474115e-05, + "loss": 2.4346, + "step": 768 + }, + { + "epoch": 2.095367847411444, + "grad_norm": 12.688992500305176, + "learning_rate": 1.3969118982742963e-05, + "loss": 2.1992, + "step": 769 + }, + { + "epoch": 2.0980926430517712, + "grad_norm": 14.45832633972168, + "learning_rate": 1.3987284287011809e-05, + "loss": 2.3193, + "step": 770 + }, + { + "epoch": 2.100817438692098, + "grad_norm": 13.274530410766602, + "learning_rate": 1.4005449591280655e-05, + "loss": 2.2349, + "step": 771 + }, + { + "epoch": 2.103542234332425, + "grad_norm": 15.1006441116333, + "learning_rate": 1.4023614895549503e-05, + "loss": 2.3721, + "step": 772 + }, + { + "epoch": 2.106267029972752, + "grad_norm": 12.727002143859863, + "learning_rate": 1.4041780199818349e-05, + "loss": 2.2393, + "step": 773 + }, + { + "epoch": 2.108991825613079, + "grad_norm": 15.004621505737305, + "learning_rate": 1.4059945504087195e-05, + "loss": 2.2686, + "step": 774 + }, + { + "epoch": 2.111716621253406, + "grad_norm": 13.299857139587402, + "learning_rate": 1.407811080835604e-05, + "loss": 2.334, + "step": 775 + }, + { + "epoch": 2.114441416893733, + "grad_norm": 14.570548057556152, + "learning_rate": 1.4096276112624887e-05, + "loss": 2.208, + "step": 776 + }, + { + "epoch": 2.11716621253406, + "grad_norm": 10.870620727539062, + "learning_rate": 1.4114441416893733e-05, + "loss": 2.2275, + "step": 777 + }, + { + "epoch": 2.119891008174387, + "grad_norm": 11.548524856567383, + "learning_rate": 1.4132606721162581e-05, + "loss": 2.1538, + "step": 778 + }, + { + "epoch": 2.122615803814714, + "grad_norm": 10.89322280883789, + "learning_rate": 1.4150772025431428e-05, + "loss": 2.3955, + "step": 779 + }, + { + "epoch": 2.1253405994550407, + "grad_norm": 13.28118896484375, + "learning_rate": 1.4168937329700274e-05, + "loss": 2.3999, + "step": 780 + }, + { + "epoch": 2.128065395095368, + "grad_norm": 13.44669246673584, + "learning_rate": 1.4187102633969122e-05, + "loss": 2.2476, + "step": 781 + }, + { + "epoch": 2.130790190735695, + "grad_norm": 13.213591575622559, + "learning_rate": 1.4205267938237968e-05, + "loss": 2.0225, + "step": 782 + }, + { + "epoch": 2.1335149863760217, + "grad_norm": 11.242518424987793, + "learning_rate": 1.4223433242506812e-05, + "loss": 2.3213, + "step": 783 + }, + { + "epoch": 2.136239782016349, + "grad_norm": 11.51584243774414, + "learning_rate": 1.4241598546775658e-05, + "loss": 2.2988, + "step": 784 + }, + { + "epoch": 2.138964577656676, + "grad_norm": 13.992745399475098, + "learning_rate": 1.4259763851044506e-05, + "loss": 2.3643, + "step": 785 + }, + { + "epoch": 2.1416893732970026, + "grad_norm": 12.655274391174316, + "learning_rate": 1.4277929155313352e-05, + "loss": 2.5439, + "step": 786 + }, + { + "epoch": 2.1444141689373297, + "grad_norm": 12.481905937194824, + "learning_rate": 1.4296094459582198e-05, + "loss": 2.2559, + "step": 787 + }, + { + "epoch": 2.147138964577657, + "grad_norm": 15.663750648498535, + "learning_rate": 1.4314259763851046e-05, + "loss": 2.311, + "step": 788 + }, + { + "epoch": 2.1498637602179835, + "grad_norm": 12.196157455444336, + "learning_rate": 1.4332425068119893e-05, + "loss": 2.1567, + "step": 789 + }, + { + "epoch": 2.1525885558583107, + "grad_norm": 11.681686401367188, + "learning_rate": 1.435059037238874e-05, + "loss": 2.4229, + "step": 790 + }, + { + "epoch": 2.155313351498638, + "grad_norm": 9.554698944091797, + "learning_rate": 1.4368755676657585e-05, + "loss": 2.0493, + "step": 791 + }, + { + "epoch": 2.1580381471389645, + "grad_norm": 11.352317810058594, + "learning_rate": 1.4386920980926431e-05, + "loss": 2.4033, + "step": 792 + }, + { + "epoch": 2.1607629427792916, + "grad_norm": 9.571414947509766, + "learning_rate": 1.4405086285195277e-05, + "loss": 2.2031, + "step": 793 + }, + { + "epoch": 2.1634877384196187, + "grad_norm": 14.849584579467773, + "learning_rate": 1.4423251589464125e-05, + "loss": 2.0972, + "step": 794 + }, + { + "epoch": 2.1662125340599454, + "grad_norm": 11.889425277709961, + "learning_rate": 1.4441416893732971e-05, + "loss": 2.1924, + "step": 795 + }, + { + "epoch": 2.1689373297002725, + "grad_norm": 10.594819068908691, + "learning_rate": 1.4459582198001817e-05, + "loss": 2.1279, + "step": 796 + }, + { + "epoch": 2.1716621253405997, + "grad_norm": 14.0387544631958, + "learning_rate": 1.4477747502270665e-05, + "loss": 2.4731, + "step": 797 + }, + { + "epoch": 2.1743869209809263, + "grad_norm": 12.90074348449707, + "learning_rate": 1.4495912806539511e-05, + "loss": 2.4609, + "step": 798 + }, + { + "epoch": 2.1771117166212535, + "grad_norm": 11.694089889526367, + "learning_rate": 1.4514078110808356e-05, + "loss": 2.1475, + "step": 799 + }, + { + "epoch": 2.1798365122615806, + "grad_norm": 12.369209289550781, + "learning_rate": 1.4532243415077204e-05, + "loss": 2.2612, + "step": 800 + }, + { + "epoch": 2.1825613079019073, + "grad_norm": 16.08076286315918, + "learning_rate": 1.455040871934605e-05, + "loss": 2.3594, + "step": 801 + }, + { + "epoch": 2.1852861035422344, + "grad_norm": 12.111376762390137, + "learning_rate": 1.4568574023614896e-05, + "loss": 2.2886, + "step": 802 + }, + { + "epoch": 2.1880108991825615, + "grad_norm": 9.426592826843262, + "learning_rate": 1.4586739327883744e-05, + "loss": 1.9961, + "step": 803 + }, + { + "epoch": 2.190735694822888, + "grad_norm": 19.973569869995117, + "learning_rate": 1.460490463215259e-05, + "loss": 2.3408, + "step": 804 + }, + { + "epoch": 2.1934604904632153, + "grad_norm": 8.401344299316406, + "learning_rate": 1.4623069936421436e-05, + "loss": 2.0479, + "step": 805 + }, + { + "epoch": 2.1961852861035425, + "grad_norm": 9.423659324645996, + "learning_rate": 1.4641235240690284e-05, + "loss": 2.0825, + "step": 806 + }, + { + "epoch": 2.198910081743869, + "grad_norm": 11.838205337524414, + "learning_rate": 1.465940054495913e-05, + "loss": 2.3599, + "step": 807 + }, + { + "epoch": 2.2016348773841963, + "grad_norm": 12.468666076660156, + "learning_rate": 1.4677565849227975e-05, + "loss": 2.2124, + "step": 808 + }, + { + "epoch": 2.204359673024523, + "grad_norm": 15.283005714416504, + "learning_rate": 1.469573115349682e-05, + "loss": 2.1201, + "step": 809 + }, + { + "epoch": 2.20708446866485, + "grad_norm": 12.136519432067871, + "learning_rate": 1.4713896457765669e-05, + "loss": 2.3779, + "step": 810 + }, + { + "epoch": 2.209809264305177, + "grad_norm": 9.63491439819336, + "learning_rate": 1.4732061762034515e-05, + "loss": 2.0181, + "step": 811 + }, + { + "epoch": 2.212534059945504, + "grad_norm": 11.01519775390625, + "learning_rate": 1.4750227066303363e-05, + "loss": 1.9985, + "step": 812 + }, + { + "epoch": 2.215258855585831, + "grad_norm": 10.398948669433594, + "learning_rate": 1.4768392370572209e-05, + "loss": 2.2524, + "step": 813 + }, + { + "epoch": 2.217983651226158, + "grad_norm": 10.20798110961914, + "learning_rate": 1.4786557674841055e-05, + "loss": 2.0015, + "step": 814 + }, + { + "epoch": 2.220708446866485, + "grad_norm": 12.424089431762695, + "learning_rate": 1.4804722979109903e-05, + "loss": 2.355, + "step": 815 + }, + { + "epoch": 2.223433242506812, + "grad_norm": 12.882838249206543, + "learning_rate": 1.4822888283378747e-05, + "loss": 2.2236, + "step": 816 + }, + { + "epoch": 2.226158038147139, + "grad_norm": 13.038334846496582, + "learning_rate": 1.4841053587647594e-05, + "loss": 2.5132, + "step": 817 + }, + { + "epoch": 2.2288828337874658, + "grad_norm": 10.221287727355957, + "learning_rate": 1.485921889191644e-05, + "loss": 2.1704, + "step": 818 + }, + { + "epoch": 2.231607629427793, + "grad_norm": 13.483091354370117, + "learning_rate": 1.4877384196185288e-05, + "loss": 2.519, + "step": 819 + }, + { + "epoch": 2.23433242506812, + "grad_norm": 12.316015243530273, + "learning_rate": 1.4895549500454134e-05, + "loss": 2.144, + "step": 820 + }, + { + "epoch": 2.2370572207084467, + "grad_norm": 10.261295318603516, + "learning_rate": 1.4913714804722982e-05, + "loss": 2.186, + "step": 821 + }, + { + "epoch": 2.239782016348774, + "grad_norm": 11.669163703918457, + "learning_rate": 1.4931880108991828e-05, + "loss": 2.166, + "step": 822 + }, + { + "epoch": 2.242506811989101, + "grad_norm": 12.902145385742188, + "learning_rate": 1.4950045413260674e-05, + "loss": 2.2456, + "step": 823 + }, + { + "epoch": 2.2452316076294276, + "grad_norm": 11.576069831848145, + "learning_rate": 1.4968210717529518e-05, + "loss": 2.2324, + "step": 824 + }, + { + "epoch": 2.2479564032697548, + "grad_norm": 11.665193557739258, + "learning_rate": 1.4986376021798366e-05, + "loss": 2.0337, + "step": 825 + }, + { + "epoch": 2.250681198910082, + "grad_norm": 11.684881210327148, + "learning_rate": 1.5004541326067212e-05, + "loss": 2.3325, + "step": 826 + }, + { + "epoch": 2.2534059945504086, + "grad_norm": 10.821648597717285, + "learning_rate": 1.5022706630336059e-05, + "loss": 2.1533, + "step": 827 + }, + { + "epoch": 2.2561307901907357, + "grad_norm": 12.104910850524902, + "learning_rate": 1.5040871934604906e-05, + "loss": 2.104, + "step": 828 + }, + { + "epoch": 2.258855585831063, + "grad_norm": 15.326925277709961, + "learning_rate": 1.5059037238873753e-05, + "loss": 2.1938, + "step": 829 + }, + { + "epoch": 2.2615803814713895, + "grad_norm": 15.872440338134766, + "learning_rate": 1.5077202543142599e-05, + "loss": 2.0366, + "step": 830 + }, + { + "epoch": 2.2643051771117166, + "grad_norm": 19.063030242919922, + "learning_rate": 1.5095367847411447e-05, + "loss": 2.4019, + "step": 831 + }, + { + "epoch": 2.2670299727520438, + "grad_norm": 14.302577018737793, + "learning_rate": 1.5113533151680291e-05, + "loss": 2.2896, + "step": 832 + }, + { + "epoch": 2.2697547683923704, + "grad_norm": 9.565779685974121, + "learning_rate": 1.5131698455949137e-05, + "loss": 2.2368, + "step": 833 + }, + { + "epoch": 2.2724795640326976, + "grad_norm": 10.099272727966309, + "learning_rate": 1.5149863760217985e-05, + "loss": 2.2588, + "step": 834 + }, + { + "epoch": 2.2752043596730247, + "grad_norm": 10.54786491394043, + "learning_rate": 1.5168029064486831e-05, + "loss": 1.916, + "step": 835 + }, + { + "epoch": 2.2779291553133514, + "grad_norm": 8.687639236450195, + "learning_rate": 1.5186194368755677e-05, + "loss": 2.1084, + "step": 836 + }, + { + "epoch": 2.2806539509536785, + "grad_norm": 10.300875663757324, + "learning_rate": 1.5204359673024525e-05, + "loss": 2.4204, + "step": 837 + }, + { + "epoch": 2.2833787465940056, + "grad_norm": 10.761526107788086, + "learning_rate": 1.5222524977293371e-05, + "loss": 2.1538, + "step": 838 + }, + { + "epoch": 2.2861035422343323, + "grad_norm": 10.05339527130127, + "learning_rate": 1.5240690281562218e-05, + "loss": 2.1846, + "step": 839 + }, + { + "epoch": 2.2888283378746594, + "grad_norm": 10.227608680725098, + "learning_rate": 1.5258855585831064e-05, + "loss": 2.2031, + "step": 840 + }, + { + "epoch": 2.291553133514986, + "grad_norm": 9.570499420166016, + "learning_rate": 1.5277020890099908e-05, + "loss": 1.9465, + "step": 841 + }, + { + "epoch": 2.2942779291553133, + "grad_norm": 11.354101181030273, + "learning_rate": 1.5295186194368756e-05, + "loss": 2.1499, + "step": 842 + }, + { + "epoch": 2.2970027247956404, + "grad_norm": 11.209668159484863, + "learning_rate": 1.5313351498637604e-05, + "loss": 2.1768, + "step": 843 + }, + { + "epoch": 2.299727520435967, + "grad_norm": 14.012726783752441, + "learning_rate": 1.533151680290645e-05, + "loss": 2.4834, + "step": 844 + }, + { + "epoch": 2.302452316076294, + "grad_norm": 13.252918243408203, + "learning_rate": 1.5349682107175296e-05, + "loss": 2.4282, + "step": 845 + }, + { + "epoch": 2.3051771117166213, + "grad_norm": 13.012864112854004, + "learning_rate": 1.5367847411444144e-05, + "loss": 2.0635, + "step": 846 + }, + { + "epoch": 2.307901907356948, + "grad_norm": 10.489202499389648, + "learning_rate": 1.538601271571299e-05, + "loss": 2.0771, + "step": 847 + }, + { + "epoch": 2.310626702997275, + "grad_norm": 9.56246280670166, + "learning_rate": 1.5404178019981836e-05, + "loss": 2.0532, + "step": 848 + }, + { + "epoch": 2.3133514986376023, + "grad_norm": 11.222508430480957, + "learning_rate": 1.542234332425068e-05, + "loss": 2.3257, + "step": 849 + }, + { + "epoch": 2.316076294277929, + "grad_norm": 14.687914848327637, + "learning_rate": 1.544050862851953e-05, + "loss": 2.3257, + "step": 850 + }, + { + "epoch": 2.318801089918256, + "grad_norm": 12.809759140014648, + "learning_rate": 1.5458673932788377e-05, + "loss": 2.2896, + "step": 851 + }, + { + "epoch": 2.321525885558583, + "grad_norm": 10.033246994018555, + "learning_rate": 1.547683923705722e-05, + "loss": 2.1733, + "step": 852 + }, + { + "epoch": 2.32425068119891, + "grad_norm": 10.335433959960938, + "learning_rate": 1.549500454132607e-05, + "loss": 2.0479, + "step": 853 + }, + { + "epoch": 2.326975476839237, + "grad_norm": 14.753990173339844, + "learning_rate": 1.5513169845594917e-05, + "loss": 2.082, + "step": 854 + }, + { + "epoch": 2.329700272479564, + "grad_norm": 10.427779197692871, + "learning_rate": 1.553133514986376e-05, + "loss": 2.1675, + "step": 855 + }, + { + "epoch": 2.332425068119891, + "grad_norm": 11.808363914489746, + "learning_rate": 1.554950045413261e-05, + "loss": 2.1299, + "step": 856 + }, + { + "epoch": 2.335149863760218, + "grad_norm": 12.636821746826172, + "learning_rate": 1.5567665758401454e-05, + "loss": 2.3027, + "step": 857 + }, + { + "epoch": 2.337874659400545, + "grad_norm": 10.85216999053955, + "learning_rate": 1.55858310626703e-05, + "loss": 2.1714, + "step": 858 + }, + { + "epoch": 2.3405994550408717, + "grad_norm": 14.7868070602417, + "learning_rate": 1.5603996366939146e-05, + "loss": 2.2993, + "step": 859 + }, + { + "epoch": 2.343324250681199, + "grad_norm": 13.12626838684082, + "learning_rate": 1.5622161671207994e-05, + "loss": 2.3159, + "step": 860 + }, + { + "epoch": 2.346049046321526, + "grad_norm": 27.119937896728516, + "learning_rate": 1.564032697547684e-05, + "loss": 2.1138, + "step": 861 + }, + { + "epoch": 2.3487738419618527, + "grad_norm": 11.369824409484863, + "learning_rate": 1.5658492279745686e-05, + "loss": 2.1289, + "step": 862 + }, + { + "epoch": 2.35149863760218, + "grad_norm": 11.388385772705078, + "learning_rate": 1.5676657584014534e-05, + "loss": 2.125, + "step": 863 + }, + { + "epoch": 2.354223433242507, + "grad_norm": 9.750898361206055, + "learning_rate": 1.5694822888283382e-05, + "loss": 1.9927, + "step": 864 + }, + { + "epoch": 2.3569482288828336, + "grad_norm": 13.13124942779541, + "learning_rate": 1.5712988192552226e-05, + "loss": 2.062, + "step": 865 + }, + { + "epoch": 2.3596730245231607, + "grad_norm": 11.438236236572266, + "learning_rate": 1.573115349682107e-05, + "loss": 2.0923, + "step": 866 + }, + { + "epoch": 2.362397820163488, + "grad_norm": 12.381810188293457, + "learning_rate": 1.574931880108992e-05, + "loss": 2.1172, + "step": 867 + }, + { + "epoch": 2.3651226158038146, + "grad_norm": 12.36788558959961, + "learning_rate": 1.5767484105358766e-05, + "loss": 2.3823, + "step": 868 + }, + { + "epoch": 2.3678474114441417, + "grad_norm": 11.918746948242188, + "learning_rate": 1.578564940962761e-05, + "loss": 2.3428, + "step": 869 + }, + { + "epoch": 2.370572207084469, + "grad_norm": 11.873290061950684, + "learning_rate": 1.580381471389646e-05, + "loss": 1.9648, + "step": 870 + }, + { + "epoch": 2.3732970027247955, + "grad_norm": 9.237068176269531, + "learning_rate": 1.5821980018165307e-05, + "loss": 2.1528, + "step": 871 + }, + { + "epoch": 2.3760217983651226, + "grad_norm": 11.43176555633545, + "learning_rate": 1.5840145322434154e-05, + "loss": 2.3501, + "step": 872 + }, + { + "epoch": 2.3787465940054497, + "grad_norm": 11.239076614379883, + "learning_rate": 1.5858310626703e-05, + "loss": 2.1973, + "step": 873 + }, + { + "epoch": 2.3814713896457764, + "grad_norm": 9.229157447814941, + "learning_rate": 1.5876475930971843e-05, + "loss": 2.1504, + "step": 874 + }, + { + "epoch": 2.3841961852861036, + "grad_norm": 10.20166301727295, + "learning_rate": 1.589464123524069e-05, + "loss": 1.9539, + "step": 875 + }, + { + "epoch": 2.3869209809264307, + "grad_norm": 13.474658012390137, + "learning_rate": 1.591280653950954e-05, + "loss": 2.1465, + "step": 876 + }, + { + "epoch": 2.3896457765667574, + "grad_norm": 9.529938697814941, + "learning_rate": 1.5930971843778384e-05, + "loss": 2.1045, + "step": 877 + }, + { + "epoch": 2.3923705722070845, + "grad_norm": 9.707219123840332, + "learning_rate": 1.594913714804723e-05, + "loss": 2.0859, + "step": 878 + }, + { + "epoch": 2.3950953678474116, + "grad_norm": 10.575519561767578, + "learning_rate": 1.596730245231608e-05, + "loss": 2.3926, + "step": 879 + }, + { + "epoch": 2.3978201634877383, + "grad_norm": 9.208884239196777, + "learning_rate": 1.5985467756584924e-05, + "loss": 2.2114, + "step": 880 + }, + { + "epoch": 2.4005449591280654, + "grad_norm": 11.017399787902832, + "learning_rate": 1.600363306085377e-05, + "loss": 2.4048, + "step": 881 + }, + { + "epoch": 2.4032697547683926, + "grad_norm": 11.70709228515625, + "learning_rate": 1.6021798365122616e-05, + "loss": 2.1816, + "step": 882 + }, + { + "epoch": 2.4059945504087192, + "grad_norm": 13.651061058044434, + "learning_rate": 1.6039963669391464e-05, + "loss": 2.0396, + "step": 883 + }, + { + "epoch": 2.4087193460490464, + "grad_norm": 12.736273765563965, + "learning_rate": 1.605812897366031e-05, + "loss": 2.397, + "step": 884 + }, + { + "epoch": 2.4114441416893735, + "grad_norm": 10.983773231506348, + "learning_rate": 1.6076294277929156e-05, + "loss": 2.0938, + "step": 885 + }, + { + "epoch": 2.4141689373297, + "grad_norm": 10.832428932189941, + "learning_rate": 1.6094459582198004e-05, + "loss": 2.0327, + "step": 886 + }, + { + "epoch": 2.4168937329700273, + "grad_norm": 11.225357055664062, + "learning_rate": 1.611262488646685e-05, + "loss": 1.9614, + "step": 887 + }, + { + "epoch": 2.4196185286103544, + "grad_norm": 12.462913513183594, + "learning_rate": 1.6130790190735696e-05, + "loss": 2.0, + "step": 888 + }, + { + "epoch": 2.422343324250681, + "grad_norm": 10.41214370727539, + "learning_rate": 1.6148955495004544e-05, + "loss": 2.1411, + "step": 889 + }, + { + "epoch": 2.4250681198910082, + "grad_norm": 11.749297142028809, + "learning_rate": 1.616712079927339e-05, + "loss": 2.25, + "step": 890 + }, + { + "epoch": 2.4277929155313354, + "grad_norm": 11.546613693237305, + "learning_rate": 1.6185286103542233e-05, + "loss": 2.0762, + "step": 891 + }, + { + "epoch": 2.430517711171662, + "grad_norm": 11.366194725036621, + "learning_rate": 1.620345140781108e-05, + "loss": 2.2031, + "step": 892 + }, + { + "epoch": 2.433242506811989, + "grad_norm": 13.148904800415039, + "learning_rate": 1.622161671207993e-05, + "loss": 2.1274, + "step": 893 + }, + { + "epoch": 2.4359673024523163, + "grad_norm": 21.143726348876953, + "learning_rate": 1.6239782016348777e-05, + "loss": 2.1182, + "step": 894 + }, + { + "epoch": 2.438692098092643, + "grad_norm": 11.426177978515625, + "learning_rate": 1.625794732061762e-05, + "loss": 2.2329, + "step": 895 + }, + { + "epoch": 2.44141689373297, + "grad_norm": 11.629473686218262, + "learning_rate": 1.627611262488647e-05, + "loss": 2.1201, + "step": 896 + }, + { + "epoch": 2.4441416893732972, + "grad_norm": 12.553741455078125, + "learning_rate": 1.6294277929155317e-05, + "loss": 2.1685, + "step": 897 + }, + { + "epoch": 2.446866485013624, + "grad_norm": 10.176178932189941, + "learning_rate": 1.631244323342416e-05, + "loss": 2.0972, + "step": 898 + }, + { + "epoch": 2.449591280653951, + "grad_norm": 12.827268600463867, + "learning_rate": 1.6330608537693006e-05, + "loss": 2.3735, + "step": 899 + }, + { + "epoch": 2.452316076294278, + "grad_norm": 17.78833770751953, + "learning_rate": 1.6348773841961854e-05, + "loss": 1.9966, + "step": 900 + }, + { + "epoch": 2.455040871934605, + "grad_norm": 10.53470516204834, + "learning_rate": 1.63669391462307e-05, + "loss": 2.2173, + "step": 901 + }, + { + "epoch": 2.457765667574932, + "grad_norm": 12.696940422058105, + "learning_rate": 1.6385104450499546e-05, + "loss": 2.1294, + "step": 902 + }, + { + "epoch": 2.460490463215259, + "grad_norm": 10.315053939819336, + "learning_rate": 1.6403269754768394e-05, + "loss": 2.0537, + "step": 903 + }, + { + "epoch": 2.463215258855586, + "grad_norm": 10.008761405944824, + "learning_rate": 1.6421435059037242e-05, + "loss": 2.2856, + "step": 904 + }, + { + "epoch": 2.465940054495913, + "grad_norm": 11.975059509277344, + "learning_rate": 1.6439600363306086e-05, + "loss": 2.105, + "step": 905 + }, + { + "epoch": 2.4686648501362396, + "grad_norm": 12.422130584716797, + "learning_rate": 1.6457765667574934e-05, + "loss": 2.2124, + "step": 906 + }, + { + "epoch": 2.4713896457765667, + "grad_norm": 11.444618225097656, + "learning_rate": 1.647593097184378e-05, + "loss": 2.1665, + "step": 907 + }, + { + "epoch": 2.474114441416894, + "grad_norm": 13.179655075073242, + "learning_rate": 1.6494096276112626e-05, + "loss": 2.6147, + "step": 908 + }, + { + "epoch": 2.4768392370572205, + "grad_norm": 10.262988090515137, + "learning_rate": 1.651226158038147e-05, + "loss": 2.4829, + "step": 909 + }, + { + "epoch": 2.4795640326975477, + "grad_norm": 9.67646598815918, + "learning_rate": 1.653042688465032e-05, + "loss": 2.0737, + "step": 910 + }, + { + "epoch": 2.482288828337875, + "grad_norm": 8.827295303344727, + "learning_rate": 1.6548592188919167e-05, + "loss": 1.8481, + "step": 911 + }, + { + "epoch": 2.4850136239782015, + "grad_norm": 9.027557373046875, + "learning_rate": 1.656675749318801e-05, + "loss": 2.3447, + "step": 912 + }, + { + "epoch": 2.4877384196185286, + "grad_norm": 13.08642292022705, + "learning_rate": 1.658492279745686e-05, + "loss": 2.3794, + "step": 913 + }, + { + "epoch": 2.4904632152588557, + "grad_norm": 14.326387405395508, + "learning_rate": 1.6603088101725707e-05, + "loss": 2.0713, + "step": 914 + }, + { + "epoch": 2.4931880108991824, + "grad_norm": 10.7723970413208, + "learning_rate": 1.662125340599455e-05, + "loss": 2.2383, + "step": 915 + }, + { + "epoch": 2.4959128065395095, + "grad_norm": 11.671551704406738, + "learning_rate": 1.66394187102634e-05, + "loss": 2.3242, + "step": 916 + }, + { + "epoch": 2.4986376021798367, + "grad_norm": 9.647505760192871, + "learning_rate": 1.6657584014532244e-05, + "loss": 2.1035, + "step": 917 + }, + { + "epoch": 2.5013623978201633, + "grad_norm": 10.872794151306152, + "learning_rate": 1.667574931880109e-05, + "loss": 2.1948, + "step": 918 + }, + { + "epoch": 2.5040871934604905, + "grad_norm": 11.074483871459961, + "learning_rate": 1.669391462306994e-05, + "loss": 2.0283, + "step": 919 + }, + { + "epoch": 2.5068119891008176, + "grad_norm": 10.048798561096191, + "learning_rate": 1.6712079927338784e-05, + "loss": 2.1079, + "step": 920 + }, + { + "epoch": 2.5095367847411443, + "grad_norm": 16.10767936706543, + "learning_rate": 1.673024523160763e-05, + "loss": 2.3203, + "step": 921 + }, + { + "epoch": 2.5122615803814714, + "grad_norm": 10.057881355285645, + "learning_rate": 1.674841053587648e-05, + "loss": 1.9272, + "step": 922 + }, + { + "epoch": 2.5149863760217985, + "grad_norm": 10.424790382385254, + "learning_rate": 1.6766575840145324e-05, + "loss": 1.8945, + "step": 923 + }, + { + "epoch": 2.517711171662125, + "grad_norm": 8.450881958007812, + "learning_rate": 1.678474114441417e-05, + "loss": 2.0601, + "step": 924 + }, + { + "epoch": 2.5204359673024523, + "grad_norm": 8.487282752990723, + "learning_rate": 1.6802906448683016e-05, + "loss": 1.9404, + "step": 925 + }, + { + "epoch": 2.523160762942779, + "grad_norm": 12.343279838562012, + "learning_rate": 1.6821071752951864e-05, + "loss": 2.1753, + "step": 926 + }, + { + "epoch": 2.525885558583106, + "grad_norm": 10.701006889343262, + "learning_rate": 1.683923705722071e-05, + "loss": 2.0884, + "step": 927 + }, + { + "epoch": 2.5286103542234333, + "grad_norm": 12.124945640563965, + "learning_rate": 1.6857402361489556e-05, + "loss": 2.2012, + "step": 928 + }, + { + "epoch": 2.53133514986376, + "grad_norm": 12.241605758666992, + "learning_rate": 1.6875567665758404e-05, + "loss": 2.0977, + "step": 929 + }, + { + "epoch": 2.534059945504087, + "grad_norm": 12.198929786682129, + "learning_rate": 1.689373297002725e-05, + "loss": 2.1514, + "step": 930 + }, + { + "epoch": 2.536784741144414, + "grad_norm": 10.598546028137207, + "learning_rate": 1.6911898274296097e-05, + "loss": 2.1274, + "step": 931 + }, + { + "epoch": 2.539509536784741, + "grad_norm": 10.838115692138672, + "learning_rate": 1.693006357856494e-05, + "loss": 2.1362, + "step": 932 + }, + { + "epoch": 2.542234332425068, + "grad_norm": 12.07777214050293, + "learning_rate": 1.694822888283379e-05, + "loss": 2.1733, + "step": 933 + }, + { + "epoch": 2.544959128065395, + "grad_norm": 12.838855743408203, + "learning_rate": 1.6966394187102633e-05, + "loss": 2.3003, + "step": 934 + }, + { + "epoch": 2.547683923705722, + "grad_norm": 15.405717849731445, + "learning_rate": 1.698455949137148e-05, + "loss": 2.0708, + "step": 935 + }, + { + "epoch": 2.550408719346049, + "grad_norm": 12.793071746826172, + "learning_rate": 1.700272479564033e-05, + "loss": 2.1646, + "step": 936 + }, + { + "epoch": 2.553133514986376, + "grad_norm": 13.155274391174316, + "learning_rate": 1.7020890099909177e-05, + "loss": 1.9976, + "step": 937 + }, + { + "epoch": 2.5558583106267028, + "grad_norm": 11.268887519836426, + "learning_rate": 1.703905540417802e-05, + "loss": 2.2085, + "step": 938 + }, + { + "epoch": 2.55858310626703, + "grad_norm": 10.742142677307129, + "learning_rate": 1.705722070844687e-05, + "loss": 2.3872, + "step": 939 + }, + { + "epoch": 2.561307901907357, + "grad_norm": 9.933159828186035, + "learning_rate": 1.7075386012715714e-05, + "loss": 2.1978, + "step": 940 + }, + { + "epoch": 2.5640326975476837, + "grad_norm": 13.011128425598145, + "learning_rate": 1.709355131698456e-05, + "loss": 2.3154, + "step": 941 + }, + { + "epoch": 2.566757493188011, + "grad_norm": 11.067089080810547, + "learning_rate": 1.7111716621253406e-05, + "loss": 2.207, + "step": 942 + }, + { + "epoch": 2.569482288828338, + "grad_norm": 9.70608139038086, + "learning_rate": 1.7129881925522254e-05, + "loss": 2.1768, + "step": 943 + }, + { + "epoch": 2.5722070844686646, + "grad_norm": 11.981213569641113, + "learning_rate": 1.7148047229791102e-05, + "loss": 2.0952, + "step": 944 + }, + { + "epoch": 2.5749318801089918, + "grad_norm": 12.573433876037598, + "learning_rate": 1.7166212534059946e-05, + "loss": 2.2168, + "step": 945 + }, + { + "epoch": 2.577656675749319, + "grad_norm": 12.08493423461914, + "learning_rate": 1.7184377838328794e-05, + "loss": 1.9185, + "step": 946 + }, + { + "epoch": 2.5803814713896456, + "grad_norm": 13.089865684509277, + "learning_rate": 1.7202543142597642e-05, + "loss": 2.186, + "step": 947 + }, + { + "epoch": 2.5831062670299727, + "grad_norm": 13.027048110961914, + "learning_rate": 1.7220708446866486e-05, + "loss": 1.9521, + "step": 948 + }, + { + "epoch": 2.5858310626703, + "grad_norm": 11.275967597961426, + "learning_rate": 1.723887375113533e-05, + "loss": 2.0278, + "step": 949 + }, + { + "epoch": 2.5885558583106265, + "grad_norm": 11.945215225219727, + "learning_rate": 1.725703905540418e-05, + "loss": 2.0869, + "step": 950 + }, + { + "epoch": 2.5912806539509536, + "grad_norm": 13.042049407958984, + "learning_rate": 1.7275204359673027e-05, + "loss": 2.1851, + "step": 951 + }, + { + "epoch": 2.5940054495912808, + "grad_norm": 12.437920570373535, + "learning_rate": 1.729336966394187e-05, + "loss": 2.189, + "step": 952 + }, + { + "epoch": 2.5967302452316074, + "grad_norm": 10.772150039672852, + "learning_rate": 1.731153496821072e-05, + "loss": 2.0439, + "step": 953 + }, + { + "epoch": 2.5994550408719346, + "grad_norm": 9.490487098693848, + "learning_rate": 1.7329700272479567e-05, + "loss": 2.2412, + "step": 954 + }, + { + "epoch": 2.6021798365122617, + "grad_norm": 11.776585578918457, + "learning_rate": 1.734786557674841e-05, + "loss": 2.2949, + "step": 955 + }, + { + "epoch": 2.6049046321525884, + "grad_norm": 11.594934463500977, + "learning_rate": 1.736603088101726e-05, + "loss": 2.4121, + "step": 956 + }, + { + "epoch": 2.6076294277929155, + "grad_norm": 10.30360221862793, + "learning_rate": 1.7384196185286104e-05, + "loss": 2.2046, + "step": 957 + }, + { + "epoch": 2.6103542234332426, + "grad_norm": 10.74131965637207, + "learning_rate": 1.740236148955495e-05, + "loss": 2.0342, + "step": 958 + }, + { + "epoch": 2.6130790190735693, + "grad_norm": 14.043535232543945, + "learning_rate": 1.74205267938238e-05, + "loss": 2.0068, + "step": 959 + }, + { + "epoch": 2.6158038147138964, + "grad_norm": 15.56317138671875, + "learning_rate": 1.7438692098092644e-05, + "loss": 2.3081, + "step": 960 + }, + { + "epoch": 2.6185286103542236, + "grad_norm": 11.279816627502441, + "learning_rate": 1.745685740236149e-05, + "loss": 2.1792, + "step": 961 + }, + { + "epoch": 2.6212534059945503, + "grad_norm": 10.112878799438477, + "learning_rate": 1.747502270663034e-05, + "loss": 2.0562, + "step": 962 + }, + { + "epoch": 2.6239782016348774, + "grad_norm": 9.889863967895508, + "learning_rate": 1.7493188010899184e-05, + "loss": 2.0547, + "step": 963 + }, + { + "epoch": 2.6267029972752045, + "grad_norm": 11.233699798583984, + "learning_rate": 1.7511353315168032e-05, + "loss": 2.0146, + "step": 964 + }, + { + "epoch": 2.629427792915531, + "grad_norm": 11.08191204071045, + "learning_rate": 1.7529518619436876e-05, + "loss": 2.1846, + "step": 965 + }, + { + "epoch": 2.6321525885558583, + "grad_norm": 10.609518051147461, + "learning_rate": 1.7547683923705724e-05, + "loss": 2.0576, + "step": 966 + }, + { + "epoch": 2.6348773841961854, + "grad_norm": 10.003273010253906, + "learning_rate": 1.756584922797457e-05, + "loss": 2.064, + "step": 967 + }, + { + "epoch": 2.637602179836512, + "grad_norm": 11.615416526794434, + "learning_rate": 1.7584014532243416e-05, + "loss": 2.1299, + "step": 968 + }, + { + "epoch": 2.6403269754768393, + "grad_norm": 9.684825897216797, + "learning_rate": 1.7602179836512264e-05, + "loss": 2.0669, + "step": 969 + }, + { + "epoch": 2.6430517711171664, + "grad_norm": 9.547039985656738, + "learning_rate": 1.762034514078111e-05, + "loss": 2.3301, + "step": 970 + }, + { + "epoch": 2.645776566757493, + "grad_norm": 16.897127151489258, + "learning_rate": 1.7638510445049957e-05, + "loss": 2.1841, + "step": 971 + }, + { + "epoch": 2.64850136239782, + "grad_norm": 10.307887077331543, + "learning_rate": 1.7656675749318804e-05, + "loss": 2.0186, + "step": 972 + }, + { + "epoch": 2.6512261580381473, + "grad_norm": 10.339676856994629, + "learning_rate": 1.767484105358765e-05, + "loss": 1.9565, + "step": 973 + }, + { + "epoch": 2.653950953678474, + "grad_norm": 11.42247200012207, + "learning_rate": 1.7693006357856493e-05, + "loss": 2.1255, + "step": 974 + }, + { + "epoch": 2.656675749318801, + "grad_norm": 14.291765213012695, + "learning_rate": 1.771117166212534e-05, + "loss": 2.1147, + "step": 975 + }, + { + "epoch": 2.6594005449591283, + "grad_norm": 11.153193473815918, + "learning_rate": 1.772933696639419e-05, + "loss": 2.2563, + "step": 976 + }, + { + "epoch": 2.662125340599455, + "grad_norm": 21.198802947998047, + "learning_rate": 1.7747502270663034e-05, + "loss": 2.0952, + "step": 977 + }, + { + "epoch": 2.664850136239782, + "grad_norm": 8.79081916809082, + "learning_rate": 1.776566757493188e-05, + "loss": 1.9707, + "step": 978 + }, + { + "epoch": 2.667574931880109, + "grad_norm": 10.3134126663208, + "learning_rate": 1.778383287920073e-05, + "loss": 2.3716, + "step": 979 + }, + { + "epoch": 2.670299727520436, + "grad_norm": 11.59449577331543, + "learning_rate": 1.7801998183469574e-05, + "loss": 2.1514, + "step": 980 + }, + { + "epoch": 2.673024523160763, + "grad_norm": 11.302346229553223, + "learning_rate": 1.782016348773842e-05, + "loss": 2.1157, + "step": 981 + }, + { + "epoch": 2.67574931880109, + "grad_norm": 9.75825309753418, + "learning_rate": 1.7838328792007266e-05, + "loss": 2.0571, + "step": 982 + }, + { + "epoch": 2.678474114441417, + "grad_norm": 10.609179496765137, + "learning_rate": 1.7856494096276114e-05, + "loss": 2.1133, + "step": 983 + }, + { + "epoch": 2.681198910081744, + "grad_norm": 11.286617279052734, + "learning_rate": 1.7874659400544962e-05, + "loss": 2.3467, + "step": 984 + }, + { + "epoch": 2.683923705722071, + "grad_norm": 9.509994506835938, + "learning_rate": 1.7892824704813806e-05, + "loss": 1.9917, + "step": 985 + }, + { + "epoch": 2.6866485013623977, + "grad_norm": 14.678549766540527, + "learning_rate": 1.7910990009082654e-05, + "loss": 2.0366, + "step": 986 + }, + { + "epoch": 2.689373297002725, + "grad_norm": 11.929479598999023, + "learning_rate": 1.7929155313351502e-05, + "loss": 2.2295, + "step": 987 + }, + { + "epoch": 2.692098092643052, + "grad_norm": 17.15774917602539, + "learning_rate": 1.7947320617620346e-05, + "loss": 2.1348, + "step": 988 + }, + { + "epoch": 2.6948228882833787, + "grad_norm": 10.941985130310059, + "learning_rate": 1.7965485921889194e-05, + "loss": 2.0767, + "step": 989 + }, + { + "epoch": 2.697547683923706, + "grad_norm": 12.462225914001465, + "learning_rate": 1.798365122615804e-05, + "loss": 2.1367, + "step": 990 + }, + { + "epoch": 2.700272479564033, + "grad_norm": 11.844996452331543, + "learning_rate": 1.8001816530426887e-05, + "loss": 2.1934, + "step": 991 + }, + { + "epoch": 2.7029972752043596, + "grad_norm": 14.804704666137695, + "learning_rate": 1.801998183469573e-05, + "loss": 2.395, + "step": 992 + }, + { + "epoch": 2.7057220708446867, + "grad_norm": 11.517407417297363, + "learning_rate": 1.803814713896458e-05, + "loss": 2.3286, + "step": 993 + }, + { + "epoch": 2.708446866485014, + "grad_norm": 14.478534698486328, + "learning_rate": 1.8056312443233427e-05, + "loss": 2.1533, + "step": 994 + }, + { + "epoch": 2.7111716621253406, + "grad_norm": 9.946856498718262, + "learning_rate": 1.807447774750227e-05, + "loss": 1.96, + "step": 995 + }, + { + "epoch": 2.7138964577656677, + "grad_norm": 13.665610313415527, + "learning_rate": 1.809264305177112e-05, + "loss": 2.2798, + "step": 996 + }, + { + "epoch": 2.716621253405995, + "grad_norm": 10.038129806518555, + "learning_rate": 1.8110808356039967e-05, + "loss": 2.1304, + "step": 997 + }, + { + "epoch": 2.7193460490463215, + "grad_norm": 11.260223388671875, + "learning_rate": 1.812897366030881e-05, + "loss": 1.9653, + "step": 998 + }, + { + "epoch": 2.7220708446866486, + "grad_norm": 15.872689247131348, + "learning_rate": 1.8147138964577656e-05, + "loss": 2.145, + "step": 999 + }, + { + "epoch": 2.7247956403269757, + "grad_norm": 11.008293151855469, + "learning_rate": 1.8165304268846504e-05, + "loss": 1.9932, + "step": 1000 + }, + { + "epoch": 2.7275204359673024, + "grad_norm": 21.713911056518555, + "learning_rate": 1.818346957311535e-05, + "loss": 2.1406, + "step": 1001 + }, + { + "epoch": 2.7302452316076296, + "grad_norm": 10.877911567687988, + "learning_rate": 1.82016348773842e-05, + "loss": 1.8789, + "step": 1002 + }, + { + "epoch": 2.7329700272479567, + "grad_norm": 9.547883033752441, + "learning_rate": 1.8219800181653044e-05, + "loss": 1.9058, + "step": 1003 + }, + { + "epoch": 2.7356948228882834, + "grad_norm": 10.755492210388184, + "learning_rate": 1.8237965485921892e-05, + "loss": 2.2559, + "step": 1004 + }, + { + "epoch": 2.7384196185286105, + "grad_norm": 14.680377006530762, + "learning_rate": 1.825613079019074e-05, + "loss": 2.1792, + "step": 1005 + }, + { + "epoch": 2.741144414168937, + "grad_norm": 11.496443748474121, + "learning_rate": 1.8274296094459584e-05, + "loss": 1.8442, + "step": 1006 + }, + { + "epoch": 2.7438692098092643, + "grad_norm": 10.433564186096191, + "learning_rate": 1.829246139872843e-05, + "loss": 2.0632, + "step": 1007 + }, + { + "epoch": 2.7465940054495914, + "grad_norm": 13.286279678344727, + "learning_rate": 1.8310626702997276e-05, + "loss": 2.0337, + "step": 1008 + }, + { + "epoch": 2.749318801089918, + "grad_norm": 12.263654708862305, + "learning_rate": 1.8328792007266124e-05, + "loss": 2.2349, + "step": 1009 + }, + { + "epoch": 2.7520435967302452, + "grad_norm": 12.426753997802734, + "learning_rate": 1.834695731153497e-05, + "loss": 2.1875, + "step": 1010 + }, + { + "epoch": 2.7547683923705724, + "grad_norm": 11.248434066772461, + "learning_rate": 1.8365122615803817e-05, + "loss": 2.3296, + "step": 1011 + }, + { + "epoch": 2.757493188010899, + "grad_norm": 9.859634399414062, + "learning_rate": 1.8383287920072664e-05, + "loss": 2.0513, + "step": 1012 + }, + { + "epoch": 2.760217983651226, + "grad_norm": 14.553107261657715, + "learning_rate": 1.840145322434151e-05, + "loss": 1.9404, + "step": 1013 + }, + { + "epoch": 2.7629427792915533, + "grad_norm": 12.255064010620117, + "learning_rate": 1.8419618528610357e-05, + "loss": 2.0938, + "step": 1014 + }, + { + "epoch": 2.76566757493188, + "grad_norm": 9.135375022888184, + "learning_rate": 1.84377838328792e-05, + "loss": 1.9819, + "step": 1015 + }, + { + "epoch": 2.768392370572207, + "grad_norm": 9.41851806640625, + "learning_rate": 1.845594913714805e-05, + "loss": 2.1963, + "step": 1016 + }, + { + "epoch": 2.771117166212534, + "grad_norm": 10.326286315917969, + "learning_rate": 1.8474114441416894e-05, + "loss": 2.0601, + "step": 1017 + }, + { + "epoch": 2.773841961852861, + "grad_norm": 10.37588119506836, + "learning_rate": 1.849227974568574e-05, + "loss": 2.0913, + "step": 1018 + }, + { + "epoch": 2.776566757493188, + "grad_norm": 11.31806755065918, + "learning_rate": 1.851044504995459e-05, + "loss": 1.9868, + "step": 1019 + }, + { + "epoch": 2.7792915531335147, + "grad_norm": 11.349784851074219, + "learning_rate": 1.8528610354223434e-05, + "loss": 2.0552, + "step": 1020 + }, + { + "epoch": 2.782016348773842, + "grad_norm": 14.040486335754395, + "learning_rate": 1.854677565849228e-05, + "loss": 2.0845, + "step": 1021 + }, + { + "epoch": 2.784741144414169, + "grad_norm": 13.191317558288574, + "learning_rate": 1.856494096276113e-05, + "loss": 2.1899, + "step": 1022 + }, + { + "epoch": 2.7874659400544957, + "grad_norm": 9.923206329345703, + "learning_rate": 1.8583106267029974e-05, + "loss": 1.9409, + "step": 1023 + }, + { + "epoch": 2.790190735694823, + "grad_norm": 10.722381591796875, + "learning_rate": 1.8601271571298822e-05, + "loss": 2.0586, + "step": 1024 + }, + { + "epoch": 2.79291553133515, + "grad_norm": 17.646202087402344, + "learning_rate": 1.8619436875567666e-05, + "loss": 2.1035, + "step": 1025 + }, + { + "epoch": 2.7956403269754766, + "grad_norm": 9.694844245910645, + "learning_rate": 1.8637602179836514e-05, + "loss": 2.0835, + "step": 1026 + }, + { + "epoch": 2.7983651226158037, + "grad_norm": 12.24616813659668, + "learning_rate": 1.8655767484105362e-05, + "loss": 2.1138, + "step": 1027 + }, + { + "epoch": 2.801089918256131, + "grad_norm": 9.930631637573242, + "learning_rate": 1.8673932788374206e-05, + "loss": 2.0835, + "step": 1028 + }, + { + "epoch": 2.8038147138964575, + "grad_norm": 10.830024719238281, + "learning_rate": 1.8692098092643054e-05, + "loss": 2.0444, + "step": 1029 + }, + { + "epoch": 2.8065395095367847, + "grad_norm": 10.865161895751953, + "learning_rate": 1.8710263396911902e-05, + "loss": 2.0405, + "step": 1030 + }, + { + "epoch": 2.809264305177112, + "grad_norm": 14.24614429473877, + "learning_rate": 1.8728428701180747e-05, + "loss": 2.0142, + "step": 1031 + }, + { + "epoch": 2.8119891008174385, + "grad_norm": 11.228114128112793, + "learning_rate": 1.874659400544959e-05, + "loss": 2.0884, + "step": 1032 + }, + { + "epoch": 2.8147138964577656, + "grad_norm": 10.059917449951172, + "learning_rate": 1.876475930971844e-05, + "loss": 2.1763, + "step": 1033 + }, + { + "epoch": 2.8174386920980927, + "grad_norm": 11.651665687561035, + "learning_rate": 1.8782924613987287e-05, + "loss": 2.0122, + "step": 1034 + }, + { + "epoch": 2.8201634877384194, + "grad_norm": 11.106765747070312, + "learning_rate": 1.880108991825613e-05, + "loss": 2.2271, + "step": 1035 + }, + { + "epoch": 2.8228882833787465, + "grad_norm": 15.006171226501465, + "learning_rate": 1.881925522252498e-05, + "loss": 2.1875, + "step": 1036 + }, + { + "epoch": 2.8256130790190737, + "grad_norm": 15.874217987060547, + "learning_rate": 1.8837420526793827e-05, + "loss": 2.2461, + "step": 1037 + }, + { + "epoch": 2.8283378746594003, + "grad_norm": 10.447962760925293, + "learning_rate": 1.885558583106267e-05, + "loss": 2.252, + "step": 1038 + }, + { + "epoch": 2.8310626702997275, + "grad_norm": 10.36314868927002, + "learning_rate": 1.8873751135331516e-05, + "loss": 1.9971, + "step": 1039 + }, + { + "epoch": 2.8337874659400546, + "grad_norm": 10.244414329528809, + "learning_rate": 1.8891916439600364e-05, + "loss": 2.1052, + "step": 1040 + }, + { + "epoch": 2.8365122615803813, + "grad_norm": 10.732833862304688, + "learning_rate": 1.891008174386921e-05, + "loss": 2.0864, + "step": 1041 + }, + { + "epoch": 2.8392370572207084, + "grad_norm": 8.79423999786377, + "learning_rate": 1.8928247048138056e-05, + "loss": 1.834, + "step": 1042 + }, + { + "epoch": 2.8419618528610355, + "grad_norm": 10.455263137817383, + "learning_rate": 1.8946412352406904e-05, + "loss": 2.1279, + "step": 1043 + }, + { + "epoch": 2.844686648501362, + "grad_norm": 10.553400039672852, + "learning_rate": 1.8964577656675752e-05, + "loss": 2.1826, + "step": 1044 + }, + { + "epoch": 2.8474114441416893, + "grad_norm": 14.043966293334961, + "learning_rate": 1.8982742960944596e-05, + "loss": 2.1504, + "step": 1045 + }, + { + "epoch": 2.8501362397820165, + "grad_norm": 9.35976505279541, + "learning_rate": 1.9000908265213444e-05, + "loss": 1.9067, + "step": 1046 + }, + { + "epoch": 2.852861035422343, + "grad_norm": 10.658482551574707, + "learning_rate": 1.9019073569482292e-05, + "loss": 1.834, + "step": 1047 + }, + { + "epoch": 2.8555858310626703, + "grad_norm": 13.526549339294434, + "learning_rate": 1.9037238873751136e-05, + "loss": 2.0977, + "step": 1048 + }, + { + "epoch": 2.8583106267029974, + "grad_norm": 12.88541316986084, + "learning_rate": 1.9055404178019984e-05, + "loss": 2.0054, + "step": 1049 + }, + { + "epoch": 2.861035422343324, + "grad_norm": 10.029620170593262, + "learning_rate": 1.907356948228883e-05, + "loss": 2.1782, + "step": 1050 + }, + { + "epoch": 2.863760217983651, + "grad_norm": 9.453518867492676, + "learning_rate": 1.9091734786557677e-05, + "loss": 1.9761, + "step": 1051 + }, + { + "epoch": 2.8664850136239783, + "grad_norm": 11.48316764831543, + "learning_rate": 1.9109900090826524e-05, + "loss": 2.0508, + "step": 1052 + }, + { + "epoch": 2.869209809264305, + "grad_norm": 11.313542366027832, + "learning_rate": 1.912806539509537e-05, + "loss": 2.2388, + "step": 1053 + }, + { + "epoch": 2.871934604904632, + "grad_norm": 9.777838706970215, + "learning_rate": 1.9146230699364217e-05, + "loss": 2.0586, + "step": 1054 + }, + { + "epoch": 2.8746594005449593, + "grad_norm": 10.812276840209961, + "learning_rate": 1.9164396003633065e-05, + "loss": 2.29, + "step": 1055 + }, + { + "epoch": 2.877384196185286, + "grad_norm": 12.773347854614258, + "learning_rate": 1.918256130790191e-05, + "loss": 1.9983, + "step": 1056 + }, + { + "epoch": 2.880108991825613, + "grad_norm": 11.323981285095215, + "learning_rate": 1.9200726612170754e-05, + "loss": 2.0874, + "step": 1057 + }, + { + "epoch": 2.88283378746594, + "grad_norm": 11.521679878234863, + "learning_rate": 1.92188919164396e-05, + "loss": 2.1499, + "step": 1058 + }, + { + "epoch": 2.885558583106267, + "grad_norm": 9.209939956665039, + "learning_rate": 1.923705722070845e-05, + "loss": 1.978, + "step": 1059 + }, + { + "epoch": 2.888283378746594, + "grad_norm": 10.25390625, + "learning_rate": 1.9255222524977294e-05, + "loss": 2.0332, + "step": 1060 + }, + { + "epoch": 2.891008174386921, + "grad_norm": 10.265666961669922, + "learning_rate": 1.927338782924614e-05, + "loss": 2.1875, + "step": 1061 + }, + { + "epoch": 2.893732970027248, + "grad_norm": 9.984662055969238, + "learning_rate": 1.929155313351499e-05, + "loss": 2.1362, + "step": 1062 + }, + { + "epoch": 2.896457765667575, + "grad_norm": 9.017266273498535, + "learning_rate": 1.9309718437783834e-05, + "loss": 2.0161, + "step": 1063 + }, + { + "epoch": 2.899182561307902, + "grad_norm": 9.564297676086426, + "learning_rate": 1.932788374205268e-05, + "loss": 2.0894, + "step": 1064 + }, + { + "epoch": 2.9019073569482288, + "grad_norm": 10.540470123291016, + "learning_rate": 1.9346049046321526e-05, + "loss": 1.9082, + "step": 1065 + }, + { + "epoch": 2.904632152588556, + "grad_norm": 11.878788948059082, + "learning_rate": 1.9364214350590374e-05, + "loss": 2.2153, + "step": 1066 + }, + { + "epoch": 2.907356948228883, + "grad_norm": 9.226091384887695, + "learning_rate": 1.938237965485922e-05, + "loss": 2.0347, + "step": 1067 + }, + { + "epoch": 2.9100817438692097, + "grad_norm": 11.214638710021973, + "learning_rate": 1.9400544959128066e-05, + "loss": 1.9736, + "step": 1068 + }, + { + "epoch": 2.912806539509537, + "grad_norm": 10.410806655883789, + "learning_rate": 1.9418710263396914e-05, + "loss": 1.8379, + "step": 1069 + }, + { + "epoch": 2.915531335149864, + "grad_norm": 9.997007369995117, + "learning_rate": 1.9436875567665762e-05, + "loss": 1.9756, + "step": 1070 + }, + { + "epoch": 2.9182561307901906, + "grad_norm": 8.648539543151855, + "learning_rate": 1.9455040871934607e-05, + "loss": 2.0698, + "step": 1071 + }, + { + "epoch": 2.9209809264305178, + "grad_norm": 9.715324401855469, + "learning_rate": 1.9473206176203454e-05, + "loss": 2.1509, + "step": 1072 + }, + { + "epoch": 2.923705722070845, + "grad_norm": 11.68460464477539, + "learning_rate": 1.94913714804723e-05, + "loss": 2.1602, + "step": 1073 + }, + { + "epoch": 2.9264305177111716, + "grad_norm": 8.657852172851562, + "learning_rate": 1.9509536784741147e-05, + "loss": 1.9038, + "step": 1074 + }, + { + "epoch": 2.9291553133514987, + "grad_norm": 12.567237854003906, + "learning_rate": 1.952770208900999e-05, + "loss": 2.1553, + "step": 1075 + }, + { + "epoch": 2.931880108991826, + "grad_norm": 10.17682933807373, + "learning_rate": 1.954586739327884e-05, + "loss": 1.9727, + "step": 1076 + }, + { + "epoch": 2.9346049046321525, + "grad_norm": 25.757490158081055, + "learning_rate": 1.9564032697547687e-05, + "loss": 2.1606, + "step": 1077 + }, + { + "epoch": 2.9373297002724796, + "grad_norm": 11.21967887878418, + "learning_rate": 1.958219800181653e-05, + "loss": 2.0835, + "step": 1078 + }, + { + "epoch": 2.9400544959128068, + "grad_norm": 11.750326156616211, + "learning_rate": 1.960036330608538e-05, + "loss": 1.7771, + "step": 1079 + }, + { + "epoch": 2.9427792915531334, + "grad_norm": 10.967148780822754, + "learning_rate": 1.9618528610354227e-05, + "loss": 2.0957, + "step": 1080 + }, + { + "epoch": 2.9455040871934606, + "grad_norm": 14.189801216125488, + "learning_rate": 1.963669391462307e-05, + "loss": 2.0962, + "step": 1081 + }, + { + "epoch": 2.9482288828337877, + "grad_norm": 10.641090393066406, + "learning_rate": 1.9654859218891916e-05, + "loss": 2.1592, + "step": 1082 + }, + { + "epoch": 2.9509536784741144, + "grad_norm": 12.17349910736084, + "learning_rate": 1.9673024523160764e-05, + "loss": 2.1245, + "step": 1083 + }, + { + "epoch": 2.9536784741144415, + "grad_norm": 10.572559356689453, + "learning_rate": 1.9691189827429612e-05, + "loss": 2.0898, + "step": 1084 + }, + { + "epoch": 2.9564032697547686, + "grad_norm": 9.885048866271973, + "learning_rate": 1.9709355131698456e-05, + "loss": 2.1226, + "step": 1085 + }, + { + "epoch": 2.9591280653950953, + "grad_norm": 9.901043891906738, + "learning_rate": 1.9727520435967304e-05, + "loss": 1.8735, + "step": 1086 + }, + { + "epoch": 2.9618528610354224, + "grad_norm": 15.233263969421387, + "learning_rate": 1.9745685740236152e-05, + "loss": 1.9155, + "step": 1087 + }, + { + "epoch": 2.9645776566757496, + "grad_norm": 16.466659545898438, + "learning_rate": 1.9763851044504996e-05, + "loss": 2.1514, + "step": 1088 + }, + { + "epoch": 2.9673024523160763, + "grad_norm": 12.63900089263916, + "learning_rate": 1.978201634877384e-05, + "loss": 2.1035, + "step": 1089 + }, + { + "epoch": 2.9700272479564034, + "grad_norm": 9.711353302001953, + "learning_rate": 1.980018165304269e-05, + "loss": 2.2021, + "step": 1090 + }, + { + "epoch": 2.9727520435967305, + "grad_norm": 10.527975082397461, + "learning_rate": 1.9818346957311537e-05, + "loss": 1.9062, + "step": 1091 + }, + { + "epoch": 2.975476839237057, + "grad_norm": 10.087246894836426, + "learning_rate": 1.9836512261580384e-05, + "loss": 1.9131, + "step": 1092 + }, + { + "epoch": 2.9782016348773843, + "grad_norm": 9.904088973999023, + "learning_rate": 1.985467756584923e-05, + "loss": 2.3457, + "step": 1093 + }, + { + "epoch": 2.9809264305177114, + "grad_norm": 10.21497631072998, + "learning_rate": 1.9872842870118077e-05, + "loss": 1.9922, + "step": 1094 + }, + { + "epoch": 2.983651226158038, + "grad_norm": 10.031513214111328, + "learning_rate": 1.9891008174386925e-05, + "loss": 1.8799, + "step": 1095 + }, + { + "epoch": 2.9863760217983653, + "grad_norm": 18.525638580322266, + "learning_rate": 1.990917347865577e-05, + "loss": 2.0332, + "step": 1096 + }, + { + "epoch": 2.989100817438692, + "grad_norm": 9.667322158813477, + "learning_rate": 1.9927338782924614e-05, + "loss": 1.969, + "step": 1097 + }, + { + "epoch": 2.991825613079019, + "grad_norm": 10.101297378540039, + "learning_rate": 1.994550408719346e-05, + "loss": 2.1143, + "step": 1098 + }, + { + "epoch": 2.994550408719346, + "grad_norm": 9.766504287719727, + "learning_rate": 1.996366939146231e-05, + "loss": 1.9966, + "step": 1099 + }, + { + "epoch": 2.997275204359673, + "grad_norm": 10.17359733581543, + "learning_rate": 1.9981834695731154e-05, + "loss": 2.2192, + "step": 1100 + }, + { + "epoch": 3.0, + "grad_norm": 11.143439292907715, + "learning_rate": 2e-05, + "loss": 2.041, + "step": 1101 + }, + { + "epoch": 3.002724795640327, + "grad_norm": 10.33942699432373, + "learning_rate": 1.9999999961060162e-05, + "loss": 1.875, + "step": 1102 + }, + { + "epoch": 3.005449591280654, + "grad_norm": 11.492137908935547, + "learning_rate": 1.9999999844240644e-05, + "loss": 2.2, + "step": 1103 + }, + { + "epoch": 3.008174386920981, + "grad_norm": 10.473490715026855, + "learning_rate": 1.999999964954145e-05, + "loss": 1.8848, + "step": 1104 + }, + { + "epoch": 3.010899182561308, + "grad_norm": 12.820694923400879, + "learning_rate": 1.9999999376962583e-05, + "loss": 2.1724, + "step": 1105 + }, + { + "epoch": 3.0136239782016347, + "grad_norm": 14.527670860290527, + "learning_rate": 1.999999902650404e-05, + "loss": 2.0332, + "step": 1106 + }, + { + "epoch": 3.016348773841962, + "grad_norm": 9.247108459472656, + "learning_rate": 1.9999998598165827e-05, + "loss": 1.8853, + "step": 1107 + }, + { + "epoch": 3.019073569482289, + "grad_norm": 12.707825660705566, + "learning_rate": 1.9999998091947947e-05, + "loss": 2.231, + "step": 1108 + }, + { + "epoch": 3.0217983651226157, + "grad_norm": 11.171661376953125, + "learning_rate": 1.9999997507850404e-05, + "loss": 1.8789, + "step": 1109 + }, + { + "epoch": 3.024523160762943, + "grad_norm": 11.998929023742676, + "learning_rate": 1.99999968458732e-05, + "loss": 1.9287, + "step": 1110 + }, + { + "epoch": 3.02724795640327, + "grad_norm": 10.787744522094727, + "learning_rate": 1.9999996106016345e-05, + "loss": 2.0576, + "step": 1111 + }, + { + "epoch": 3.0299727520435966, + "grad_norm": 14.347358703613281, + "learning_rate": 1.999999528827984e-05, + "loss": 1.9194, + "step": 1112 + }, + { + "epoch": 3.0326975476839237, + "grad_norm": 10.398091316223145, + "learning_rate": 1.9999994392663697e-05, + "loss": 1.9146, + "step": 1113 + }, + { + "epoch": 3.035422343324251, + "grad_norm": 10.237173080444336, + "learning_rate": 1.9999993419167914e-05, + "loss": 1.9946, + "step": 1114 + }, + { + "epoch": 3.0381471389645776, + "grad_norm": 10.289793968200684, + "learning_rate": 1.999999236779251e-05, + "loss": 1.9805, + "step": 1115 + }, + { + "epoch": 3.0408719346049047, + "grad_norm": 10.29628849029541, + "learning_rate": 1.9999991238537482e-05, + "loss": 2.0688, + "step": 1116 + }, + { + "epoch": 3.043596730245232, + "grad_norm": 10.019878387451172, + "learning_rate": 1.999999003140285e-05, + "loss": 1.8232, + "step": 1117 + }, + { + "epoch": 3.0463215258855585, + "grad_norm": 9.181999206542969, + "learning_rate": 1.9999988746388613e-05, + "loss": 1.8823, + "step": 1118 + }, + { + "epoch": 3.0490463215258856, + "grad_norm": 10.890800476074219, + "learning_rate": 1.9999987383494786e-05, + "loss": 1.8945, + "step": 1119 + }, + { + "epoch": 3.0517711171662127, + "grad_norm": 11.722890853881836, + "learning_rate": 1.999998594272138e-05, + "loss": 1.9785, + "step": 1120 + }, + { + "epoch": 3.0544959128065394, + "grad_norm": 11.116331100463867, + "learning_rate": 1.9999984424068405e-05, + "loss": 1.8101, + "step": 1121 + }, + { + "epoch": 3.0572207084468666, + "grad_norm": 12.051642417907715, + "learning_rate": 1.9999982827535874e-05, + "loss": 2.0015, + "step": 1122 + }, + { + "epoch": 3.0599455040871932, + "grad_norm": 10.866436004638672, + "learning_rate": 1.9999981153123797e-05, + "loss": 1.8687, + "step": 1123 + }, + { + "epoch": 3.0626702997275204, + "grad_norm": 10.616351127624512, + "learning_rate": 1.999997940083219e-05, + "loss": 1.9897, + "step": 1124 + }, + { + "epoch": 3.0653950953678475, + "grad_norm": 11.926887512207031, + "learning_rate": 1.9999977570661064e-05, + "loss": 1.8184, + "step": 1125 + }, + { + "epoch": 3.068119891008174, + "grad_norm": 9.511907577514648, + "learning_rate": 1.9999975662610435e-05, + "loss": 2.0708, + "step": 1126 + }, + { + "epoch": 3.0708446866485013, + "grad_norm": 11.440744400024414, + "learning_rate": 1.9999973676680318e-05, + "loss": 1.9248, + "step": 1127 + }, + { + "epoch": 3.0735694822888284, + "grad_norm": 10.463530540466309, + "learning_rate": 1.999997161287073e-05, + "loss": 2.0166, + "step": 1128 + }, + { + "epoch": 3.076294277929155, + "grad_norm": 13.820565223693848, + "learning_rate": 1.999996947118168e-05, + "loss": 1.9067, + "step": 1129 + }, + { + "epoch": 3.0790190735694822, + "grad_norm": 8.525996208190918, + "learning_rate": 1.999996725161319e-05, + "loss": 1.9385, + "step": 1130 + }, + { + "epoch": 3.0817438692098094, + "grad_norm": 13.830317497253418, + "learning_rate": 1.999996495416528e-05, + "loss": 2.0405, + "step": 1131 + }, + { + "epoch": 3.084468664850136, + "grad_norm": 11.075336456298828, + "learning_rate": 1.9999962578837967e-05, + "loss": 1.9897, + "step": 1132 + }, + { + "epoch": 3.087193460490463, + "grad_norm": 16.12899398803711, + "learning_rate": 1.999996012563126e-05, + "loss": 1.8789, + "step": 1133 + }, + { + "epoch": 3.0899182561307903, + "grad_norm": 10.055564880371094, + "learning_rate": 1.9999957594545193e-05, + "loss": 2.0825, + "step": 1134 + }, + { + "epoch": 3.092643051771117, + "grad_norm": 14.070582389831543, + "learning_rate": 1.9999954985579774e-05, + "loss": 1.8477, + "step": 1135 + }, + { + "epoch": 3.095367847411444, + "grad_norm": 10.774489402770996, + "learning_rate": 1.999995229873503e-05, + "loss": 1.9692, + "step": 1136 + }, + { + "epoch": 3.0980926430517712, + "grad_norm": 11.93801498413086, + "learning_rate": 1.9999949534010975e-05, + "loss": 2.0947, + "step": 1137 + }, + { + "epoch": 3.100817438692098, + "grad_norm": 9.086506843566895, + "learning_rate": 1.9999946691407635e-05, + "loss": 1.7251, + "step": 1138 + }, + { + "epoch": 3.103542234332425, + "grad_norm": 11.340764999389648, + "learning_rate": 1.9999943770925037e-05, + "loss": 1.9004, + "step": 1139 + }, + { + "epoch": 3.106267029972752, + "grad_norm": 11.077136039733887, + "learning_rate": 1.9999940772563194e-05, + "loss": 1.9233, + "step": 1140 + }, + { + "epoch": 3.108991825613079, + "grad_norm": 10.375553131103516, + "learning_rate": 1.9999937696322136e-05, + "loss": 1.8062, + "step": 1141 + }, + { + "epoch": 3.111716621253406, + "grad_norm": 10.730899810791016, + "learning_rate": 1.9999934542201888e-05, + "loss": 2.04, + "step": 1142 + }, + { + "epoch": 3.114441416893733, + "grad_norm": 12.8143310546875, + "learning_rate": 1.999993131020247e-05, + "loss": 2.1177, + "step": 1143 + }, + { + "epoch": 3.11716621253406, + "grad_norm": 12.750884056091309, + "learning_rate": 1.9999928000323903e-05, + "loss": 1.9541, + "step": 1144 + }, + { + "epoch": 3.119891008174387, + "grad_norm": 11.579204559326172, + "learning_rate": 1.9999924612566225e-05, + "loss": 2.0874, + "step": 1145 + }, + { + "epoch": 3.122615803814714, + "grad_norm": 11.029909133911133, + "learning_rate": 1.9999921146929454e-05, + "loss": 1.7896, + "step": 1146 + }, + { + "epoch": 3.1253405994550407, + "grad_norm": 11.410332679748535, + "learning_rate": 1.9999917603413618e-05, + "loss": 2.0469, + "step": 1147 + }, + { + "epoch": 3.128065395095368, + "grad_norm": 11.27589225769043, + "learning_rate": 1.9999913982018747e-05, + "loss": 1.9707, + "step": 1148 + }, + { + "epoch": 3.130790190735695, + "grad_norm": 10.249436378479004, + "learning_rate": 1.9999910282744865e-05, + "loss": 1.9133, + "step": 1149 + }, + { + "epoch": 3.1335149863760217, + "grad_norm": 12.009215354919434, + "learning_rate": 1.999990650559201e-05, + "loss": 1.978, + "step": 1150 + }, + { + "epoch": 3.136239782016349, + "grad_norm": 12.450786590576172, + "learning_rate": 1.99999026505602e-05, + "loss": 1.9531, + "step": 1151 + }, + { + "epoch": 3.138964577656676, + "grad_norm": 10.915098190307617, + "learning_rate": 1.999989871764947e-05, + "loss": 1.7954, + "step": 1152 + }, + { + "epoch": 3.1416893732970026, + "grad_norm": 10.478048324584961, + "learning_rate": 1.9999894706859852e-05, + "loss": 1.9912, + "step": 1153 + }, + { + "epoch": 3.1444141689373297, + "grad_norm": 22.394235610961914, + "learning_rate": 1.9999890618191375e-05, + "loss": 1.8711, + "step": 1154 + }, + { + "epoch": 3.147138964577657, + "grad_norm": 24.724218368530273, + "learning_rate": 1.999988645164407e-05, + "loss": 2.0547, + "step": 1155 + }, + { + "epoch": 3.1498637602179835, + "grad_norm": 9.987106323242188, + "learning_rate": 1.9999882207217976e-05, + "loss": 2.0884, + "step": 1156 + }, + { + "epoch": 3.1525885558583107, + "grad_norm": 10.89595890045166, + "learning_rate": 1.9999877884913116e-05, + "loss": 1.9312, + "step": 1157 + }, + { + "epoch": 3.155313351498638, + "grad_norm": 11.442464828491211, + "learning_rate": 1.9999873484729533e-05, + "loss": 2.0894, + "step": 1158 + }, + { + "epoch": 3.1580381471389645, + "grad_norm": 13.294852256774902, + "learning_rate": 1.9999869006667254e-05, + "loss": 1.8687, + "step": 1159 + }, + { + "epoch": 3.1607629427792916, + "grad_norm": 10.252835273742676, + "learning_rate": 1.999986445072632e-05, + "loss": 1.8933, + "step": 1160 + }, + { + "epoch": 3.1634877384196187, + "grad_norm": 12.676876068115234, + "learning_rate": 1.9999859816906763e-05, + "loss": 1.8652, + "step": 1161 + }, + { + "epoch": 3.1662125340599454, + "grad_norm": 18.203889846801758, + "learning_rate": 1.9999855105208616e-05, + "loss": 1.9907, + "step": 1162 + }, + { + "epoch": 3.1689373297002725, + "grad_norm": 11.438253402709961, + "learning_rate": 1.9999850315631925e-05, + "loss": 2.1001, + "step": 1163 + }, + { + "epoch": 3.1716621253405997, + "grad_norm": 11.49427318572998, + "learning_rate": 1.9999845448176717e-05, + "loss": 1.9683, + "step": 1164 + }, + { + "epoch": 3.1743869209809263, + "grad_norm": 24.44009780883789, + "learning_rate": 1.9999840502843034e-05, + "loss": 1.8289, + "step": 1165 + }, + { + "epoch": 3.1771117166212535, + "grad_norm": 11.613852500915527, + "learning_rate": 1.999983547963092e-05, + "loss": 1.9341, + "step": 1166 + }, + { + "epoch": 3.1798365122615806, + "grad_norm": 11.840388298034668, + "learning_rate": 1.9999830378540403e-05, + "loss": 1.9385, + "step": 1167 + }, + { + "epoch": 3.1825613079019073, + "grad_norm": 15.055170059204102, + "learning_rate": 1.9999825199571533e-05, + "loss": 1.9922, + "step": 1168 + }, + { + "epoch": 3.1852861035422344, + "grad_norm": 9.82111644744873, + "learning_rate": 1.9999819942724343e-05, + "loss": 2.0317, + "step": 1169 + }, + { + "epoch": 3.1880108991825615, + "grad_norm": 11.261125564575195, + "learning_rate": 1.9999814607998884e-05, + "loss": 2.0488, + "step": 1170 + }, + { + "epoch": 3.190735694822888, + "grad_norm": 14.382711410522461, + "learning_rate": 1.9999809195395182e-05, + "loss": 2.064, + "step": 1171 + }, + { + "epoch": 3.1934604904632153, + "grad_norm": 11.627882957458496, + "learning_rate": 1.9999803704913293e-05, + "loss": 2.0542, + "step": 1172 + }, + { + "epoch": 3.1961852861035425, + "grad_norm": 11.54857349395752, + "learning_rate": 1.9999798136553253e-05, + "loss": 2.0269, + "step": 1173 + }, + { + "epoch": 3.198910081743869, + "grad_norm": 11.140435218811035, + "learning_rate": 1.9999792490315107e-05, + "loss": 2.2227, + "step": 1174 + }, + { + "epoch": 3.2016348773841963, + "grad_norm": 14.964839935302734, + "learning_rate": 1.9999786766198902e-05, + "loss": 1.8779, + "step": 1175 + }, + { + "epoch": 3.204359673024523, + "grad_norm": 10.240537643432617, + "learning_rate": 1.9999780964204675e-05, + "loss": 1.9644, + "step": 1176 + }, + { + "epoch": 3.20708446866485, + "grad_norm": 14.842936515808105, + "learning_rate": 1.9999775084332477e-05, + "loss": 2.063, + "step": 1177 + }, + { + "epoch": 3.209809264305177, + "grad_norm": 8.813994407653809, + "learning_rate": 1.999976912658235e-05, + "loss": 2.0947, + "step": 1178 + }, + { + "epoch": 3.212534059945504, + "grad_norm": 9.20219612121582, + "learning_rate": 1.999976309095435e-05, + "loss": 2.0005, + "step": 1179 + }, + { + "epoch": 3.215258855585831, + "grad_norm": 12.575230598449707, + "learning_rate": 1.999975697744851e-05, + "loss": 2.0859, + "step": 1180 + }, + { + "epoch": 3.217983651226158, + "grad_norm": 10.840344429016113, + "learning_rate": 1.999975078606489e-05, + "loss": 1.7068, + "step": 1181 + }, + { + "epoch": 3.220708446866485, + "grad_norm": 10.119123458862305, + "learning_rate": 1.9999744516803527e-05, + "loss": 2.1094, + "step": 1182 + }, + { + "epoch": 3.223433242506812, + "grad_norm": 11.109670639038086, + "learning_rate": 1.999973816966448e-05, + "loss": 2.104, + "step": 1183 + }, + { + "epoch": 3.226158038147139, + "grad_norm": 15.738182067871094, + "learning_rate": 1.999973174464779e-05, + "loss": 1.9448, + "step": 1184 + }, + { + "epoch": 3.2288828337874658, + "grad_norm": 9.035996437072754, + "learning_rate": 1.9999725241753516e-05, + "loss": 1.8745, + "step": 1185 + }, + { + "epoch": 3.231607629427793, + "grad_norm": 12.854116439819336, + "learning_rate": 1.9999718660981703e-05, + "loss": 2.1528, + "step": 1186 + }, + { + "epoch": 3.23433242506812, + "grad_norm": 14.7183837890625, + "learning_rate": 1.9999712002332397e-05, + "loss": 1.9351, + "step": 1187 + }, + { + "epoch": 3.2370572207084467, + "grad_norm": 11.334243774414062, + "learning_rate": 1.9999705265805662e-05, + "loss": 2.042, + "step": 1188 + }, + { + "epoch": 3.239782016348774, + "grad_norm": 9.695436477661133, + "learning_rate": 1.9999698451401542e-05, + "loss": 1.855, + "step": 1189 + }, + { + "epoch": 3.242506811989101, + "grad_norm": 12.386056900024414, + "learning_rate": 1.9999691559120092e-05, + "loss": 2.0366, + "step": 1190 + }, + { + "epoch": 3.2452316076294276, + "grad_norm": 11.660694122314453, + "learning_rate": 1.999968458896137e-05, + "loss": 1.9668, + "step": 1191 + }, + { + "epoch": 3.2479564032697548, + "grad_norm": 10.674187660217285, + "learning_rate": 1.9999677540925416e-05, + "loss": 1.6982, + "step": 1192 + }, + { + "epoch": 3.250681198910082, + "grad_norm": 13.024900436401367, + "learning_rate": 1.9999670415012306e-05, + "loss": 1.8032, + "step": 1193 + }, + { + "epoch": 3.2534059945504086, + "grad_norm": 10.894378662109375, + "learning_rate": 1.9999663211222078e-05, + "loss": 2.0825, + "step": 1194 + }, + { + "epoch": 3.2561307901907357, + "grad_norm": 10.457403182983398, + "learning_rate": 1.9999655929554798e-05, + "loss": 1.9355, + "step": 1195 + }, + { + "epoch": 3.258855585831063, + "grad_norm": 10.54038143157959, + "learning_rate": 1.999964857001052e-05, + "loss": 2.0415, + "step": 1196 + }, + { + "epoch": 3.2615803814713895, + "grad_norm": 9.038063049316406, + "learning_rate": 1.99996411325893e-05, + "loss": 1.9448, + "step": 1197 + }, + { + "epoch": 3.2643051771117166, + "grad_norm": 9.49393081665039, + "learning_rate": 1.9999633617291196e-05, + "loss": 1.7476, + "step": 1198 + }, + { + "epoch": 3.2670299727520438, + "grad_norm": 10.450029373168945, + "learning_rate": 1.9999626024116267e-05, + "loss": 1.9834, + "step": 1199 + }, + { + "epoch": 3.2697547683923704, + "grad_norm": 9.543033599853516, + "learning_rate": 1.999961835306457e-05, + "loss": 1.9922, + "step": 1200 + }, + { + "epoch": 3.2724795640326976, + "grad_norm": 9.017727851867676, + "learning_rate": 1.999961060413617e-05, + "loss": 1.8706, + "step": 1201 + }, + { + "epoch": 3.2752043596730247, + "grad_norm": 11.66344928741455, + "learning_rate": 1.9999602777331124e-05, + "loss": 2.1118, + "step": 1202 + }, + { + "epoch": 3.2779291553133514, + "grad_norm": 9.141104698181152, + "learning_rate": 1.9999594872649495e-05, + "loss": 1.8687, + "step": 1203 + }, + { + "epoch": 3.2806539509536785, + "grad_norm": 9.666121482849121, + "learning_rate": 1.999958689009134e-05, + "loss": 2.0581, + "step": 1204 + }, + { + "epoch": 3.2833787465940056, + "grad_norm": 11.769775390625, + "learning_rate": 1.9999578829656724e-05, + "loss": 1.9629, + "step": 1205 + }, + { + "epoch": 3.2861035422343323, + "grad_norm": 9.261898040771484, + "learning_rate": 1.9999570691345712e-05, + "loss": 2.0469, + "step": 1206 + }, + { + "epoch": 3.2888283378746594, + "grad_norm": 12.135587692260742, + "learning_rate": 1.9999562475158365e-05, + "loss": 1.9556, + "step": 1207 + }, + { + "epoch": 3.291553133514986, + "grad_norm": 9.376842498779297, + "learning_rate": 1.9999554181094748e-05, + "loss": 1.728, + "step": 1208 + }, + { + "epoch": 3.2942779291553133, + "grad_norm": 13.119425773620605, + "learning_rate": 1.9999545809154925e-05, + "loss": 2.1191, + "step": 1209 + }, + { + "epoch": 3.2970027247956404, + "grad_norm": 10.199698448181152, + "learning_rate": 1.9999537359338957e-05, + "loss": 2.0723, + "step": 1210 + }, + { + "epoch": 3.299727520435967, + "grad_norm": 9.926660537719727, + "learning_rate": 1.999952883164692e-05, + "loss": 1.9331, + "step": 1211 + }, + { + "epoch": 3.302452316076294, + "grad_norm": 9.661992073059082, + "learning_rate": 1.9999520226078872e-05, + "loss": 2.2212, + "step": 1212 + }, + { + "epoch": 3.3051771117166213, + "grad_norm": 8.763089179992676, + "learning_rate": 1.999951154263488e-05, + "loss": 1.6157, + "step": 1213 + }, + { + "epoch": 3.307901907356948, + "grad_norm": 10.265016555786133, + "learning_rate": 1.9999502781315018e-05, + "loss": 1.9888, + "step": 1214 + }, + { + "epoch": 3.310626702997275, + "grad_norm": 8.20125961303711, + "learning_rate": 1.9999493942119346e-05, + "loss": 1.8853, + "step": 1215 + }, + { + "epoch": 3.3133514986376023, + "grad_norm": 9.446121215820312, + "learning_rate": 1.999948502504794e-05, + "loss": 1.8525, + "step": 1216 + }, + { + "epoch": 3.316076294277929, + "grad_norm": 10.643209457397461, + "learning_rate": 1.9999476030100862e-05, + "loss": 1.9517, + "step": 1217 + }, + { + "epoch": 3.318801089918256, + "grad_norm": 11.535621643066406, + "learning_rate": 1.999946695727819e-05, + "loss": 1.9863, + "step": 1218 + }, + { + "epoch": 3.321525885558583, + "grad_norm": 11.043972969055176, + "learning_rate": 1.999945780657999e-05, + "loss": 1.979, + "step": 1219 + }, + { + "epoch": 3.32425068119891, + "grad_norm": 11.173770904541016, + "learning_rate": 1.9999448578006337e-05, + "loss": 1.8547, + "step": 1220 + }, + { + "epoch": 3.326975476839237, + "grad_norm": 9.972723960876465, + "learning_rate": 1.9999439271557296e-05, + "loss": 2.0645, + "step": 1221 + }, + { + "epoch": 3.329700272479564, + "grad_norm": 12.643669128417969, + "learning_rate": 1.9999429887232948e-05, + "loss": 1.9204, + "step": 1222 + }, + { + "epoch": 3.332425068119891, + "grad_norm": 10.223214149475098, + "learning_rate": 1.999942042503336e-05, + "loss": 1.8872, + "step": 1223 + }, + { + "epoch": 3.335149863760218, + "grad_norm": 12.952620506286621, + "learning_rate": 1.9999410884958608e-05, + "loss": 1.7798, + "step": 1224 + }, + { + "epoch": 3.337874659400545, + "grad_norm": 11.56080150604248, + "learning_rate": 1.9999401267008766e-05, + "loss": 1.9966, + "step": 1225 + }, + { + "epoch": 3.3405994550408717, + "grad_norm": 8.708621978759766, + "learning_rate": 1.9999391571183907e-05, + "loss": 1.9858, + "step": 1226 + }, + { + "epoch": 3.343324250681199, + "grad_norm": 16.07501792907715, + "learning_rate": 1.9999381797484113e-05, + "loss": 1.937, + "step": 1227 + }, + { + "epoch": 3.346049046321526, + "grad_norm": 19.36942481994629, + "learning_rate": 1.999937194590945e-05, + "loss": 2.2212, + "step": 1228 + }, + { + "epoch": 3.3487738419618527, + "grad_norm": 9.319982528686523, + "learning_rate": 1.9999362016460005e-05, + "loss": 1.8535, + "step": 1229 + }, + { + "epoch": 3.35149863760218, + "grad_norm": 12.806680679321289, + "learning_rate": 1.9999352009135846e-05, + "loss": 2.0532, + "step": 1230 + }, + { + "epoch": 3.354223433242507, + "grad_norm": 8.694989204406738, + "learning_rate": 1.9999341923937056e-05, + "loss": 1.7805, + "step": 1231 + }, + { + "epoch": 3.3569482288828336, + "grad_norm": 11.847393989562988, + "learning_rate": 1.9999331760863715e-05, + "loss": 1.9702, + "step": 1232 + }, + { + "epoch": 3.3596730245231607, + "grad_norm": 17.723541259765625, + "learning_rate": 1.99993215199159e-05, + "loss": 1.8906, + "step": 1233 + }, + { + "epoch": 3.362397820163488, + "grad_norm": 10.759478569030762, + "learning_rate": 1.999931120109369e-05, + "loss": 2.1333, + "step": 1234 + }, + { + "epoch": 3.3651226158038146, + "grad_norm": 10.469283103942871, + "learning_rate": 1.9999300804397164e-05, + "loss": 2.0376, + "step": 1235 + }, + { + "epoch": 3.3678474114441417, + "grad_norm": 9.429465293884277, + "learning_rate": 1.9999290329826406e-05, + "loss": 1.7695, + "step": 1236 + }, + { + "epoch": 3.370572207084469, + "grad_norm": 10.218581199645996, + "learning_rate": 1.99992797773815e-05, + "loss": 1.8613, + "step": 1237 + }, + { + "epoch": 3.3732970027247955, + "grad_norm": 11.13946533203125, + "learning_rate": 1.999926914706252e-05, + "loss": 1.9194, + "step": 1238 + }, + { + "epoch": 3.3760217983651226, + "grad_norm": 10.5692138671875, + "learning_rate": 1.9999258438869558e-05, + "loss": 2.1162, + "step": 1239 + }, + { + "epoch": 3.3787465940054497, + "grad_norm": 10.036789894104004, + "learning_rate": 1.999924765280269e-05, + "loss": 1.9028, + "step": 1240 + }, + { + "epoch": 3.3814713896457764, + "grad_norm": 14.0789794921875, + "learning_rate": 1.9999236788862006e-05, + "loss": 1.7881, + "step": 1241 + }, + { + "epoch": 3.3841961852861036, + "grad_norm": 14.197346687316895, + "learning_rate": 1.999922584704759e-05, + "loss": 1.9946, + "step": 1242 + }, + { + "epoch": 3.3869209809264307, + "grad_norm": 8.973702430725098, + "learning_rate": 1.9999214827359518e-05, + "loss": 2.2031, + "step": 1243 + }, + { + "epoch": 3.3896457765667574, + "grad_norm": 10.881900787353516, + "learning_rate": 1.9999203729797887e-05, + "loss": 2.0522, + "step": 1244 + }, + { + "epoch": 3.3923705722070845, + "grad_norm": 10.742246627807617, + "learning_rate": 1.9999192554362777e-05, + "loss": 2.0303, + "step": 1245 + }, + { + "epoch": 3.3950953678474116, + "grad_norm": 9.714658737182617, + "learning_rate": 1.999918130105428e-05, + "loss": 1.7964, + "step": 1246 + }, + { + "epoch": 3.3978201634877383, + "grad_norm": 12.210956573486328, + "learning_rate": 1.999916996987248e-05, + "loss": 1.9883, + "step": 1247 + }, + { + "epoch": 3.4005449591280654, + "grad_norm": 9.146660804748535, + "learning_rate": 1.9999158560817463e-05, + "loss": 1.7617, + "step": 1248 + }, + { + "epoch": 3.4032697547683926, + "grad_norm": 10.378352165222168, + "learning_rate": 1.9999147073889325e-05, + "loss": 2.0044, + "step": 1249 + }, + { + "epoch": 3.4059945504087192, + "grad_norm": 10.546966552734375, + "learning_rate": 1.999913550908815e-05, + "loss": 2.3315, + "step": 1250 + }, + { + "epoch": 3.4087193460490464, + "grad_norm": 10.025370597839355, + "learning_rate": 1.9999123866414026e-05, + "loss": 1.8623, + "step": 1251 + }, + { + "epoch": 3.4114441416893735, + "grad_norm": 11.024093627929688, + "learning_rate": 1.9999112145867055e-05, + "loss": 2.0156, + "step": 1252 + }, + { + "epoch": 3.4141689373297, + "grad_norm": 8.24333667755127, + "learning_rate": 1.9999100347447314e-05, + "loss": 1.8171, + "step": 1253 + }, + { + "epoch": 3.4168937329700273, + "grad_norm": 10.128952980041504, + "learning_rate": 1.9999088471154904e-05, + "loss": 2.0664, + "step": 1254 + }, + { + "epoch": 3.4196185286103544, + "grad_norm": 9.902071952819824, + "learning_rate": 1.999907651698991e-05, + "loss": 2.292, + "step": 1255 + }, + { + "epoch": 3.422343324250681, + "grad_norm": 10.431514739990234, + "learning_rate": 1.999906448495244e-05, + "loss": 1.9111, + "step": 1256 + }, + { + "epoch": 3.4250681198910082, + "grad_norm": 11.33655071258545, + "learning_rate": 1.999905237504257e-05, + "loss": 1.8418, + "step": 1257 + }, + { + "epoch": 3.4277929155313354, + "grad_norm": 12.280555725097656, + "learning_rate": 1.9999040187260403e-05, + "loss": 1.9412, + "step": 1258 + }, + { + "epoch": 3.430517711171662, + "grad_norm": 9.858194351196289, + "learning_rate": 1.9999027921606033e-05, + "loss": 1.9077, + "step": 1259 + }, + { + "epoch": 3.433242506811989, + "grad_norm": 13.029343605041504, + "learning_rate": 1.9999015578079553e-05, + "loss": 1.9226, + "step": 1260 + }, + { + "epoch": 3.4359673024523163, + "grad_norm": 10.973852157592773, + "learning_rate": 1.9999003156681066e-05, + "loss": 2.0513, + "step": 1261 + }, + { + "epoch": 3.438692098092643, + "grad_norm": 9.369585037231445, + "learning_rate": 1.999899065741066e-05, + "loss": 1.9302, + "step": 1262 + }, + { + "epoch": 3.44141689373297, + "grad_norm": 10.328851699829102, + "learning_rate": 1.999897808026844e-05, + "loss": 2.0688, + "step": 1263 + }, + { + "epoch": 3.4441416893732972, + "grad_norm": 11.273093223571777, + "learning_rate": 1.99989654252545e-05, + "loss": 1.9956, + "step": 1264 + }, + { + "epoch": 3.446866485013624, + "grad_norm": 9.876923561096191, + "learning_rate": 1.9998952692368937e-05, + "loss": 2.0557, + "step": 1265 + }, + { + "epoch": 3.449591280653951, + "grad_norm": 10.082348823547363, + "learning_rate": 1.9998939881611857e-05, + "loss": 1.8853, + "step": 1266 + }, + { + "epoch": 3.452316076294278, + "grad_norm": 11.63476848602295, + "learning_rate": 1.9998926992983348e-05, + "loss": 2.0076, + "step": 1267 + }, + { + "epoch": 3.455040871934605, + "grad_norm": 12.106552124023438, + "learning_rate": 1.9998914026483526e-05, + "loss": 1.8557, + "step": 1268 + }, + { + "epoch": 3.457765667574932, + "grad_norm": 12.849235534667969, + "learning_rate": 1.9998900982112475e-05, + "loss": 1.9768, + "step": 1269 + }, + { + "epoch": 3.460490463215259, + "grad_norm": 12.221293449401855, + "learning_rate": 1.999888785987031e-05, + "loss": 2.2651, + "step": 1270 + }, + { + "epoch": 3.463215258855586, + "grad_norm": 12.192943572998047, + "learning_rate": 1.9998874659757125e-05, + "loss": 2.1226, + "step": 1271 + }, + { + "epoch": 3.465940054495913, + "grad_norm": 12.493210792541504, + "learning_rate": 1.999886138177303e-05, + "loss": 1.8794, + "step": 1272 + }, + { + "epoch": 3.4686648501362396, + "grad_norm": 14.664477348327637, + "learning_rate": 1.999884802591812e-05, + "loss": 1.6948, + "step": 1273 + }, + { + "epoch": 3.4713896457765667, + "grad_norm": 12.013493537902832, + "learning_rate": 1.999883459219251e-05, + "loss": 2.0154, + "step": 1274 + }, + { + "epoch": 3.474114441416894, + "grad_norm": 10.768638610839844, + "learning_rate": 1.999882108059629e-05, + "loss": 1.9712, + "step": 1275 + }, + { + "epoch": 3.4768392370572205, + "grad_norm": 13.831929206848145, + "learning_rate": 1.9998807491129576e-05, + "loss": 1.8254, + "step": 1276 + }, + { + "epoch": 3.4795640326975477, + "grad_norm": 11.40987777709961, + "learning_rate": 1.9998793823792474e-05, + "loss": 2.1958, + "step": 1277 + }, + { + "epoch": 3.482288828337875, + "grad_norm": 9.788375854492188, + "learning_rate": 1.9998780078585085e-05, + "loss": 1.9473, + "step": 1278 + }, + { + "epoch": 3.4850136239782015, + "grad_norm": 11.829399108886719, + "learning_rate": 1.999876625550752e-05, + "loss": 1.9839, + "step": 1279 + }, + { + "epoch": 3.4877384196185286, + "grad_norm": 10.215336799621582, + "learning_rate": 1.999875235455988e-05, + "loss": 1.7559, + "step": 1280 + }, + { + "epoch": 3.4904632152588557, + "grad_norm": 13.019379615783691, + "learning_rate": 1.9998738375742283e-05, + "loss": 2.0889, + "step": 1281 + }, + { + "epoch": 3.4931880108991824, + "grad_norm": 10.324209213256836, + "learning_rate": 1.9998724319054836e-05, + "loss": 2.1416, + "step": 1282 + }, + { + "epoch": 3.4959128065395095, + "grad_norm": 10.5282621383667, + "learning_rate": 1.999871018449764e-05, + "loss": 1.7649, + "step": 1283 + }, + { + "epoch": 3.4986376021798367, + "grad_norm": 9.629287719726562, + "learning_rate": 1.9998695972070814e-05, + "loss": 1.7354, + "step": 1284 + }, + { + "epoch": 3.5013623978201633, + "grad_norm": 18.714492797851562, + "learning_rate": 1.9998681681774465e-05, + "loss": 1.7544, + "step": 1285 + }, + { + "epoch": 3.5040871934604905, + "grad_norm": 11.829867362976074, + "learning_rate": 1.9998667313608706e-05, + "loss": 1.8809, + "step": 1286 + }, + { + "epoch": 3.5068119891008176, + "grad_norm": 18.325145721435547, + "learning_rate": 1.9998652867573646e-05, + "loss": 1.856, + "step": 1287 + }, + { + "epoch": 3.5095367847411443, + "grad_norm": 16.493732452392578, + "learning_rate": 1.99986383436694e-05, + "loss": 2.0933, + "step": 1288 + }, + { + "epoch": 3.5122615803814714, + "grad_norm": 9.553417205810547, + "learning_rate": 1.9998623741896082e-05, + "loss": 2.0122, + "step": 1289 + }, + { + "epoch": 3.5149863760217985, + "grad_norm": 15.020279884338379, + "learning_rate": 1.99986090622538e-05, + "loss": 2.272, + "step": 1290 + }, + { + "epoch": 3.517711171662125, + "grad_norm": 8.37663459777832, + "learning_rate": 1.9998594304742677e-05, + "loss": 1.8589, + "step": 1291 + }, + { + "epoch": 3.5204359673024523, + "grad_norm": 12.794005393981934, + "learning_rate": 1.999857946936282e-05, + "loss": 1.917, + "step": 1292 + }, + { + "epoch": 3.523160762942779, + "grad_norm": 9.891209602355957, + "learning_rate": 1.999856455611435e-05, + "loss": 1.8281, + "step": 1293 + }, + { + "epoch": 3.525885558583106, + "grad_norm": 10.598015785217285, + "learning_rate": 1.999854956499738e-05, + "loss": 1.8079, + "step": 1294 + }, + { + "epoch": 3.5286103542234333, + "grad_norm": 9.42640209197998, + "learning_rate": 1.9998534496012026e-05, + "loss": 2.0293, + "step": 1295 + }, + { + "epoch": 3.53133514986376, + "grad_norm": 10.417404174804688, + "learning_rate": 1.999851934915841e-05, + "loss": 2.031, + "step": 1296 + }, + { + "epoch": 3.534059945504087, + "grad_norm": 11.727996826171875, + "learning_rate": 1.9998504124436647e-05, + "loss": 2.1621, + "step": 1297 + }, + { + "epoch": 3.536784741144414, + "grad_norm": 9.807804107666016, + "learning_rate": 1.9998488821846855e-05, + "loss": 1.7075, + "step": 1298 + }, + { + "epoch": 3.539509536784741, + "grad_norm": 9.008427619934082, + "learning_rate": 1.999847344138915e-05, + "loss": 1.9229, + "step": 1299 + }, + { + "epoch": 3.542234332425068, + "grad_norm": 11.610631942749023, + "learning_rate": 1.999845798306366e-05, + "loss": 1.7598, + "step": 1300 + }, + { + "epoch": 3.544959128065395, + "grad_norm": 13.851554870605469, + "learning_rate": 1.9998442446870503e-05, + "loss": 1.9463, + "step": 1301 + }, + { + "epoch": 3.547683923705722, + "grad_norm": 10.183866500854492, + "learning_rate": 1.9998426832809796e-05, + "loss": 1.9863, + "step": 1302 + }, + { + "epoch": 3.550408719346049, + "grad_norm": 10.200240135192871, + "learning_rate": 1.9998411140881662e-05, + "loss": 2.0298, + "step": 1303 + }, + { + "epoch": 3.553133514986376, + "grad_norm": 14.371204376220703, + "learning_rate": 1.9998395371086223e-05, + "loss": 2.1377, + "step": 1304 + }, + { + "epoch": 3.5558583106267028, + "grad_norm": 9.169516563415527, + "learning_rate": 1.9998379523423604e-05, + "loss": 1.8818, + "step": 1305 + }, + { + "epoch": 3.55858310626703, + "grad_norm": 10.059884071350098, + "learning_rate": 1.9998363597893927e-05, + "loss": 1.875, + "step": 1306 + }, + { + "epoch": 3.561307901907357, + "grad_norm": 13.294024467468262, + "learning_rate": 1.9998347594497314e-05, + "loss": 2.2129, + "step": 1307 + }, + { + "epoch": 3.5640326975476837, + "grad_norm": 10.252388000488281, + "learning_rate": 1.9998331513233894e-05, + "loss": 1.9248, + "step": 1308 + }, + { + "epoch": 3.566757493188011, + "grad_norm": 11.85957145690918, + "learning_rate": 1.9998315354103793e-05, + "loss": 1.9844, + "step": 1309 + }, + { + "epoch": 3.569482288828338, + "grad_norm": 12.752264022827148, + "learning_rate": 1.9998299117107128e-05, + "loss": 2.0601, + "step": 1310 + }, + { + "epoch": 3.5722070844686646, + "grad_norm": 10.488571166992188, + "learning_rate": 1.9998282802244032e-05, + "loss": 1.9507, + "step": 1311 + }, + { + "epoch": 3.5749318801089918, + "grad_norm": 9.606192588806152, + "learning_rate": 1.9998266409514634e-05, + "loss": 1.8174, + "step": 1312 + }, + { + "epoch": 3.577656675749319, + "grad_norm": 10.860569953918457, + "learning_rate": 1.9998249938919056e-05, + "loss": 1.8677, + "step": 1313 + }, + { + "epoch": 3.5803814713896456, + "grad_norm": 10.547423362731934, + "learning_rate": 1.9998233390457433e-05, + "loss": 1.9253, + "step": 1314 + }, + { + "epoch": 3.5831062670299727, + "grad_norm": 10.076347351074219, + "learning_rate": 1.9998216764129887e-05, + "loss": 2.1001, + "step": 1315 + }, + { + "epoch": 3.5858310626703, + "grad_norm": 10.426956176757812, + "learning_rate": 1.9998200059936554e-05, + "loss": 1.9341, + "step": 1316 + }, + { + "epoch": 3.5885558583106265, + "grad_norm": 9.54003620147705, + "learning_rate": 1.9998183277877555e-05, + "loss": 2.0928, + "step": 1317 + }, + { + "epoch": 3.5912806539509536, + "grad_norm": 10.653057098388672, + "learning_rate": 1.9998166417953034e-05, + "loss": 1.8672, + "step": 1318 + }, + { + "epoch": 3.5940054495912808, + "grad_norm": 9.184635162353516, + "learning_rate": 1.9998149480163108e-05, + "loss": 1.9121, + "step": 1319 + }, + { + "epoch": 3.5967302452316074, + "grad_norm": 12.25539779663086, + "learning_rate": 1.999813246450792e-05, + "loss": 1.9648, + "step": 1320 + }, + { + "epoch": 3.5994550408719346, + "grad_norm": 12.260258674621582, + "learning_rate": 1.9998115370987595e-05, + "loss": 2.0103, + "step": 1321 + }, + { + "epoch": 3.6021798365122617, + "grad_norm": 9.864540100097656, + "learning_rate": 1.9998098199602273e-05, + "loss": 1.7336, + "step": 1322 + }, + { + "epoch": 3.6049046321525884, + "grad_norm": 10.197954177856445, + "learning_rate": 1.999808095035208e-05, + "loss": 1.8735, + "step": 1323 + }, + { + "epoch": 3.6076294277929155, + "grad_norm": 12.28921127319336, + "learning_rate": 1.9998063623237156e-05, + "loss": 2.1064, + "step": 1324 + }, + { + "epoch": 3.6103542234332426, + "grad_norm": 11.340349197387695, + "learning_rate": 1.9998046218257636e-05, + "loss": 1.8403, + "step": 1325 + }, + { + "epoch": 3.6130790190735693, + "grad_norm": 11.287467002868652, + "learning_rate": 1.9998028735413653e-05, + "loss": 1.978, + "step": 1326 + }, + { + "epoch": 3.6158038147138964, + "grad_norm": 9.40659236907959, + "learning_rate": 1.9998011174705344e-05, + "loss": 1.6609, + "step": 1327 + }, + { + "epoch": 3.6185286103542236, + "grad_norm": 10.861719131469727, + "learning_rate": 1.9997993536132846e-05, + "loss": 1.9077, + "step": 1328 + }, + { + "epoch": 3.6212534059945503, + "grad_norm": 9.687219619750977, + "learning_rate": 1.9997975819696293e-05, + "loss": 1.9351, + "step": 1329 + }, + { + "epoch": 3.6239782016348774, + "grad_norm": 9.664878845214844, + "learning_rate": 1.9997958025395826e-05, + "loss": 1.7739, + "step": 1330 + }, + { + "epoch": 3.6267029972752045, + "grad_norm": 14.998048782348633, + "learning_rate": 1.999794015323159e-05, + "loss": 1.9653, + "step": 1331 + }, + { + "epoch": 3.629427792915531, + "grad_norm": 15.942357063293457, + "learning_rate": 1.9997922203203713e-05, + "loss": 1.9585, + "step": 1332 + }, + { + "epoch": 3.6321525885558583, + "grad_norm": 11.56669807434082, + "learning_rate": 1.999790417531234e-05, + "loss": 1.927, + "step": 1333 + }, + { + "epoch": 3.6348773841961854, + "grad_norm": 9.04844856262207, + "learning_rate": 1.999788606955761e-05, + "loss": 1.8101, + "step": 1334 + }, + { + "epoch": 3.637602179836512, + "grad_norm": 11.053104400634766, + "learning_rate": 1.9997867885939668e-05, + "loss": 1.7412, + "step": 1335 + }, + { + "epoch": 3.6403269754768393, + "grad_norm": 13.446556091308594, + "learning_rate": 1.999784962445865e-05, + "loss": 2.2373, + "step": 1336 + }, + { + "epoch": 3.6430517711171664, + "grad_norm": 9.99754810333252, + "learning_rate": 1.9997831285114704e-05, + "loss": 1.8184, + "step": 1337 + }, + { + "epoch": 3.645776566757493, + "grad_norm": 10.847136497497559, + "learning_rate": 1.9997812867907966e-05, + "loss": 1.812, + "step": 1338 + }, + { + "epoch": 3.64850136239782, + "grad_norm": 10.042104721069336, + "learning_rate": 1.9997794372838584e-05, + "loss": 1.9033, + "step": 1339 + }, + { + "epoch": 3.6512261580381473, + "grad_norm": 10.487390518188477, + "learning_rate": 1.9997775799906706e-05, + "loss": 1.875, + "step": 1340 + }, + { + "epoch": 3.653950953678474, + "grad_norm": 9.03159236907959, + "learning_rate": 1.9997757149112465e-05, + "loss": 1.8364, + "step": 1341 + }, + { + "epoch": 3.656675749318801, + "grad_norm": 9.386551856994629, + "learning_rate": 1.9997738420456015e-05, + "loss": 1.8049, + "step": 1342 + }, + { + "epoch": 3.6594005449591283, + "grad_norm": 13.503704071044922, + "learning_rate": 1.9997719613937505e-05, + "loss": 2.0244, + "step": 1343 + }, + { + "epoch": 3.662125340599455, + "grad_norm": 8.827006340026855, + "learning_rate": 1.9997700729557074e-05, + "loss": 1.8726, + "step": 1344 + }, + { + "epoch": 3.664850136239782, + "grad_norm": 7.889685153961182, + "learning_rate": 1.999768176731487e-05, + "loss": 1.8403, + "step": 1345 + }, + { + "epoch": 3.667574931880109, + "grad_norm": 11.514538764953613, + "learning_rate": 1.999766272721104e-05, + "loss": 1.9133, + "step": 1346 + }, + { + "epoch": 3.670299727520436, + "grad_norm": 9.46600341796875, + "learning_rate": 1.9997643609245738e-05, + "loss": 1.7549, + "step": 1347 + }, + { + "epoch": 3.673024523160763, + "grad_norm": 10.599994659423828, + "learning_rate": 1.9997624413419108e-05, + "loss": 1.8149, + "step": 1348 + }, + { + "epoch": 3.67574931880109, + "grad_norm": 14.27822208404541, + "learning_rate": 1.99976051397313e-05, + "loss": 1.9634, + "step": 1349 + }, + { + "epoch": 3.678474114441417, + "grad_norm": 10.638948440551758, + "learning_rate": 1.999758578818247e-05, + "loss": 1.8379, + "step": 1350 + }, + { + "epoch": 3.681198910081744, + "grad_norm": 11.049464225769043, + "learning_rate": 1.9997566358772755e-05, + "loss": 1.9204, + "step": 1351 + }, + { + "epoch": 3.683923705722071, + "grad_norm": 21.863615036010742, + "learning_rate": 1.9997546851502322e-05, + "loss": 1.8022, + "step": 1352 + }, + { + "epoch": 3.6866485013623977, + "grad_norm": 12.01803970336914, + "learning_rate": 1.999752726637131e-05, + "loss": 1.9214, + "step": 1353 + }, + { + "epoch": 3.689373297002725, + "grad_norm": 11.750845909118652, + "learning_rate": 1.9997507603379883e-05, + "loss": 1.9639, + "step": 1354 + }, + { + "epoch": 3.692098092643052, + "grad_norm": 11.37834358215332, + "learning_rate": 1.9997487862528186e-05, + "loss": 2.0659, + "step": 1355 + }, + { + "epoch": 3.6948228882833787, + "grad_norm": 11.896803855895996, + "learning_rate": 1.9997468043816376e-05, + "loss": 1.7285, + "step": 1356 + }, + { + "epoch": 3.697547683923706, + "grad_norm": 10.095005989074707, + "learning_rate": 1.9997448147244607e-05, + "loss": 2.0884, + "step": 1357 + }, + { + "epoch": 3.700272479564033, + "grad_norm": 9.361732482910156, + "learning_rate": 1.999742817281303e-05, + "loss": 1.9331, + "step": 1358 + }, + { + "epoch": 3.7029972752043596, + "grad_norm": 10.310089111328125, + "learning_rate": 1.999740812052181e-05, + "loss": 1.8679, + "step": 1359 + }, + { + "epoch": 3.7057220708446867, + "grad_norm": 9.957247734069824, + "learning_rate": 1.9997387990371092e-05, + "loss": 1.8501, + "step": 1360 + }, + { + "epoch": 3.708446866485014, + "grad_norm": 9.856657028198242, + "learning_rate": 1.9997367782361042e-05, + "loss": 2.0308, + "step": 1361 + }, + { + "epoch": 3.7111716621253406, + "grad_norm": 8.72819709777832, + "learning_rate": 1.9997347496491812e-05, + "loss": 1.9629, + "step": 1362 + }, + { + "epoch": 3.7138964577656677, + "grad_norm": 9.658805847167969, + "learning_rate": 1.999732713276356e-05, + "loss": 1.9346, + "step": 1363 + }, + { + "epoch": 3.716621253405995, + "grad_norm": 12.807863235473633, + "learning_rate": 1.9997306691176448e-05, + "loss": 1.8555, + "step": 1364 + }, + { + "epoch": 3.7193460490463215, + "grad_norm": 8.534314155578613, + "learning_rate": 1.9997286171730632e-05, + "loss": 1.8364, + "step": 1365 + }, + { + "epoch": 3.7220708446866486, + "grad_norm": 8.962367057800293, + "learning_rate": 1.9997265574426276e-05, + "loss": 1.5764, + "step": 1366 + }, + { + "epoch": 3.7247956403269757, + "grad_norm": 12.41026782989502, + "learning_rate": 1.9997244899263536e-05, + "loss": 2.0601, + "step": 1367 + }, + { + "epoch": 3.7275204359673024, + "grad_norm": 11.09547233581543, + "learning_rate": 1.999722414624257e-05, + "loss": 1.9697, + "step": 1368 + }, + { + "epoch": 3.7302452316076296, + "grad_norm": 10.84226131439209, + "learning_rate": 1.999720331536355e-05, + "loss": 2.1177, + "step": 1369 + }, + { + "epoch": 3.7329700272479567, + "grad_norm": 10.707548141479492, + "learning_rate": 1.999718240662663e-05, + "loss": 1.9673, + "step": 1370 + }, + { + "epoch": 3.7356948228882834, + "grad_norm": 8.57364273071289, + "learning_rate": 1.9997161420031975e-05, + "loss": 1.9062, + "step": 1371 + }, + { + "epoch": 3.7384196185286105, + "grad_norm": 10.687947273254395, + "learning_rate": 1.999714035557975e-05, + "loss": 1.9863, + "step": 1372 + }, + { + "epoch": 3.741144414168937, + "grad_norm": 18.90679931640625, + "learning_rate": 1.9997119213270117e-05, + "loss": 1.9587, + "step": 1373 + }, + { + "epoch": 3.7438692098092643, + "grad_norm": 11.410531997680664, + "learning_rate": 1.999709799310324e-05, + "loss": 1.8726, + "step": 1374 + }, + { + "epoch": 3.7465940054495914, + "grad_norm": 10.942984580993652, + "learning_rate": 1.999707669507929e-05, + "loss": 1.9067, + "step": 1375 + }, + { + "epoch": 3.749318801089918, + "grad_norm": 9.907876968383789, + "learning_rate": 1.9997055319198422e-05, + "loss": 1.9297, + "step": 1376 + }, + { + "epoch": 3.7520435967302452, + "grad_norm": 13.171777725219727, + "learning_rate": 1.9997033865460812e-05, + "loss": 1.7925, + "step": 1377 + }, + { + "epoch": 3.7547683923705724, + "grad_norm": 10.019922256469727, + "learning_rate": 1.9997012333866623e-05, + "loss": 1.8657, + "step": 1378 + }, + { + "epoch": 3.757493188010899, + "grad_norm": 9.188364028930664, + "learning_rate": 1.9996990724416022e-05, + "loss": 1.8369, + "step": 1379 + }, + { + "epoch": 3.760217983651226, + "grad_norm": 12.900765419006348, + "learning_rate": 1.9996969037109185e-05, + "loss": 1.8818, + "step": 1380 + }, + { + "epoch": 3.7629427792915533, + "grad_norm": 9.810148239135742, + "learning_rate": 1.999694727194627e-05, + "loss": 1.6636, + "step": 1381 + }, + { + "epoch": 3.76566757493188, + "grad_norm": 12.080660820007324, + "learning_rate": 1.9996925428927456e-05, + "loss": 1.9839, + "step": 1382 + }, + { + "epoch": 3.768392370572207, + "grad_norm": 10.132020950317383, + "learning_rate": 1.9996903508052903e-05, + "loss": 1.8198, + "step": 1383 + }, + { + "epoch": 3.771117166212534, + "grad_norm": 10.986047744750977, + "learning_rate": 1.999688150932279e-05, + "loss": 1.873, + "step": 1384 + }, + { + "epoch": 3.773841961852861, + "grad_norm": 11.753776550292969, + "learning_rate": 1.9996859432737287e-05, + "loss": 1.9746, + "step": 1385 + }, + { + "epoch": 3.776566757493188, + "grad_norm": 9.40007209777832, + "learning_rate": 1.999683727829656e-05, + "loss": 1.7588, + "step": 1386 + }, + { + "epoch": 3.7792915531335147, + "grad_norm": 10.014466285705566, + "learning_rate": 1.999681504600079e-05, + "loss": 1.8784, + "step": 1387 + }, + { + "epoch": 3.782016348773842, + "grad_norm": 12.4912109375, + "learning_rate": 1.9996792735850145e-05, + "loss": 1.9907, + "step": 1388 + }, + { + "epoch": 3.784741144414169, + "grad_norm": 19.946182250976562, + "learning_rate": 1.99967703478448e-05, + "loss": 1.7798, + "step": 1389 + }, + { + "epoch": 3.7874659400544957, + "grad_norm": 14.574756622314453, + "learning_rate": 1.9996747881984928e-05, + "loss": 1.9358, + "step": 1390 + }, + { + "epoch": 3.790190735694823, + "grad_norm": 9.037312507629395, + "learning_rate": 1.9996725338270705e-05, + "loss": 2.0122, + "step": 1391 + }, + { + "epoch": 3.79291553133515, + "grad_norm": 11.350050926208496, + "learning_rate": 1.999670271670231e-05, + "loss": 1.834, + "step": 1392 + }, + { + "epoch": 3.7956403269754766, + "grad_norm": 9.058762550354004, + "learning_rate": 1.9996680017279916e-05, + "loss": 1.7659, + "step": 1393 + }, + { + "epoch": 3.7983651226158037, + "grad_norm": 9.022266387939453, + "learning_rate": 1.9996657240003692e-05, + "loss": 1.6792, + "step": 1394 + }, + { + "epoch": 3.801089918256131, + "grad_norm": 12.156946182250977, + "learning_rate": 1.9996634384873832e-05, + "loss": 1.7554, + "step": 1395 + }, + { + "epoch": 3.8038147138964575, + "grad_norm": 10.579151153564453, + "learning_rate": 1.9996611451890503e-05, + "loss": 1.8132, + "step": 1396 + }, + { + "epoch": 3.8065395095367847, + "grad_norm": 14.65162181854248, + "learning_rate": 1.9996588441053886e-05, + "loss": 2.0186, + "step": 1397 + }, + { + "epoch": 3.809264305177112, + "grad_norm": 9.863320350646973, + "learning_rate": 1.9996565352364156e-05, + "loss": 1.9731, + "step": 1398 + }, + { + "epoch": 3.8119891008174385, + "grad_norm": 13.058857917785645, + "learning_rate": 1.99965421858215e-05, + "loss": 1.9751, + "step": 1399 + }, + { + "epoch": 3.8147138964577656, + "grad_norm": 9.648780822753906, + "learning_rate": 1.9996518941426096e-05, + "loss": 1.9312, + "step": 1400 + }, + { + "epoch": 3.8174386920980927, + "grad_norm": 10.973150253295898, + "learning_rate": 1.9996495619178124e-05, + "loss": 1.9189, + "step": 1401 + }, + { + "epoch": 3.8201634877384194, + "grad_norm": 8.606739044189453, + "learning_rate": 1.999647221907776e-05, + "loss": 1.9082, + "step": 1402 + }, + { + "epoch": 3.8228882833787465, + "grad_norm": 11.51412582397461, + "learning_rate": 1.99964487411252e-05, + "loss": 1.9651, + "step": 1403 + }, + { + "epoch": 3.8256130790190737, + "grad_norm": 10.558756828308105, + "learning_rate": 1.9996425185320616e-05, + "loss": 1.9688, + "step": 1404 + }, + { + "epoch": 3.8283378746594003, + "grad_norm": 9.094059944152832, + "learning_rate": 1.9996401551664197e-05, + "loss": 1.7271, + "step": 1405 + }, + { + "epoch": 3.8310626702997275, + "grad_norm": 11.738804817199707, + "learning_rate": 1.999637784015612e-05, + "loss": 1.8857, + "step": 1406 + }, + { + "epoch": 3.8337874659400546, + "grad_norm": 11.302565574645996, + "learning_rate": 1.9996354050796577e-05, + "loss": 1.7378, + "step": 1407 + }, + { + "epoch": 3.8365122615803813, + "grad_norm": 11.154184341430664, + "learning_rate": 1.9996330183585747e-05, + "loss": 1.9048, + "step": 1408 + }, + { + "epoch": 3.8392370572207084, + "grad_norm": 12.222970008850098, + "learning_rate": 1.999630623852382e-05, + "loss": 1.9839, + "step": 1409 + }, + { + "epoch": 3.8419618528610355, + "grad_norm": 7.918453216552734, + "learning_rate": 1.9996282215610984e-05, + "loss": 1.6953, + "step": 1410 + }, + { + "epoch": 3.844686648501362, + "grad_norm": 10.142660140991211, + "learning_rate": 1.9996258114847427e-05, + "loss": 1.7627, + "step": 1411 + }, + { + "epoch": 3.8474114441416893, + "grad_norm": 10.53038501739502, + "learning_rate": 1.999623393623333e-05, + "loss": 2.0444, + "step": 1412 + }, + { + "epoch": 3.8501362397820165, + "grad_norm": 15.396425247192383, + "learning_rate": 1.999620967976888e-05, + "loss": 1.8823, + "step": 1413 + }, + { + "epoch": 3.852861035422343, + "grad_norm": 11.912347793579102, + "learning_rate": 1.999618534545428e-05, + "loss": 1.7593, + "step": 1414 + }, + { + "epoch": 3.8555858310626703, + "grad_norm": 9.395650863647461, + "learning_rate": 1.9996160933289704e-05, + "loss": 1.9619, + "step": 1415 + }, + { + "epoch": 3.8583106267029974, + "grad_norm": 14.379075050354004, + "learning_rate": 1.999613644327535e-05, + "loss": 1.729, + "step": 1416 + }, + { + "epoch": 3.861035422343324, + "grad_norm": 10.086915969848633, + "learning_rate": 1.9996111875411407e-05, + "loss": 1.9634, + "step": 1417 + }, + { + "epoch": 3.863760217983651, + "grad_norm": 10.041367530822754, + "learning_rate": 1.9996087229698064e-05, + "loss": 1.8315, + "step": 1418 + }, + { + "epoch": 3.8664850136239783, + "grad_norm": 9.252388954162598, + "learning_rate": 1.9996062506135518e-05, + "loss": 1.6943, + "step": 1419 + }, + { + "epoch": 3.869209809264305, + "grad_norm": 14.204264640808105, + "learning_rate": 1.999603770472396e-05, + "loss": 1.6887, + "step": 1420 + }, + { + "epoch": 3.871934604904632, + "grad_norm": 9.889179229736328, + "learning_rate": 1.999601282546358e-05, + "loss": 1.9517, + "step": 1421 + }, + { + "epoch": 3.8746594005449593, + "grad_norm": 12.913715362548828, + "learning_rate": 1.9995987868354577e-05, + "loss": 1.998, + "step": 1422 + }, + { + "epoch": 3.877384196185286, + "grad_norm": 11.989314079284668, + "learning_rate": 1.999596283339714e-05, + "loss": 1.9199, + "step": 1423 + }, + { + "epoch": 3.880108991825613, + "grad_norm": 11.67672061920166, + "learning_rate": 1.9995937720591464e-05, + "loss": 1.9343, + "step": 1424 + }, + { + "epoch": 3.88283378746594, + "grad_norm": 14.26172924041748, + "learning_rate": 1.999591252993775e-05, + "loss": 1.8789, + "step": 1425 + }, + { + "epoch": 3.885558583106267, + "grad_norm": 13.25046157836914, + "learning_rate": 1.9995887261436188e-05, + "loss": 1.9683, + "step": 1426 + }, + { + "epoch": 3.888283378746594, + "grad_norm": 15.621968269348145, + "learning_rate": 1.999586191508698e-05, + "loss": 1.7803, + "step": 1427 + }, + { + "epoch": 3.891008174386921, + "grad_norm": 12.299283027648926, + "learning_rate": 1.999583649089032e-05, + "loss": 1.9829, + "step": 1428 + }, + { + "epoch": 3.893732970027248, + "grad_norm": 14.862947463989258, + "learning_rate": 1.999581098884641e-05, + "loss": 1.7683, + "step": 1429 + }, + { + "epoch": 3.896457765667575, + "grad_norm": 8.998908042907715, + "learning_rate": 1.999578540895544e-05, + "loss": 1.8333, + "step": 1430 + }, + { + "epoch": 3.899182561307902, + "grad_norm": 10.61571979522705, + "learning_rate": 1.9995759751217617e-05, + "loss": 1.9771, + "step": 1431 + }, + { + "epoch": 3.9019073569482288, + "grad_norm": 14.07432746887207, + "learning_rate": 1.999573401563314e-05, + "loss": 1.8696, + "step": 1432 + }, + { + "epoch": 3.904632152588556, + "grad_norm": 13.334297180175781, + "learning_rate": 1.9995708202202212e-05, + "loss": 1.7495, + "step": 1433 + }, + { + "epoch": 3.907356948228883, + "grad_norm": 14.014077186584473, + "learning_rate": 1.9995682310925025e-05, + "loss": 2.0635, + "step": 1434 + }, + { + "epoch": 3.9100817438692097, + "grad_norm": 14.566712379455566, + "learning_rate": 1.9995656341801788e-05, + "loss": 1.832, + "step": 1435 + }, + { + "epoch": 3.912806539509537, + "grad_norm": 15.380060195922852, + "learning_rate": 1.9995630294832698e-05, + "loss": 1.9287, + "step": 1436 + }, + { + "epoch": 3.915531335149864, + "grad_norm": 13.439238548278809, + "learning_rate": 1.9995604170017967e-05, + "loss": 1.7549, + "step": 1437 + }, + { + "epoch": 3.9182561307901906, + "grad_norm": 14.134620666503906, + "learning_rate": 1.9995577967357788e-05, + "loss": 2.042, + "step": 1438 + }, + { + "epoch": 3.9209809264305178, + "grad_norm": 10.96253490447998, + "learning_rate": 1.999555168685237e-05, + "loss": 1.7932, + "step": 1439 + }, + { + "epoch": 3.923705722070845, + "grad_norm": 12.898005485534668, + "learning_rate": 1.999552532850192e-05, + "loss": 2.0718, + "step": 1440 + }, + { + "epoch": 3.9264305177111716, + "grad_norm": 13.486254692077637, + "learning_rate": 1.9995498892306634e-05, + "loss": 1.7651, + "step": 1441 + }, + { + "epoch": 3.9291553133514987, + "grad_norm": 17.048885345458984, + "learning_rate": 1.999547237826673e-05, + "loss": 1.605, + "step": 1442 + }, + { + "epoch": 3.931880108991826, + "grad_norm": 11.592516899108887, + "learning_rate": 1.9995445786382408e-05, + "loss": 1.853, + "step": 1443 + }, + { + "epoch": 3.9346049046321525, + "grad_norm": 11.45778751373291, + "learning_rate": 1.9995419116653876e-05, + "loss": 1.8711, + "step": 1444 + }, + { + "epoch": 3.9373297002724796, + "grad_norm": 13.221013069152832, + "learning_rate": 1.999539236908134e-05, + "loss": 2.1187, + "step": 1445 + }, + { + "epoch": 3.9400544959128068, + "grad_norm": 11.306771278381348, + "learning_rate": 1.999536554366501e-05, + "loss": 1.9995, + "step": 1446 + }, + { + "epoch": 3.9427792915531334, + "grad_norm": 13.746538162231445, + "learning_rate": 1.9995338640405096e-05, + "loss": 1.9072, + "step": 1447 + }, + { + "epoch": 3.9455040871934606, + "grad_norm": 9.49048900604248, + "learning_rate": 1.9995311659301804e-05, + "loss": 1.7983, + "step": 1448 + }, + { + "epoch": 3.9482288828337877, + "grad_norm": 9.7013578414917, + "learning_rate": 1.9995284600355348e-05, + "loss": 1.8359, + "step": 1449 + }, + { + "epoch": 3.9509536784741144, + "grad_norm": 11.810276985168457, + "learning_rate": 1.9995257463565937e-05, + "loss": 1.5774, + "step": 1450 + }, + { + "epoch": 3.9536784741144415, + "grad_norm": 12.751311302185059, + "learning_rate": 1.9995230248933784e-05, + "loss": 1.7988, + "step": 1451 + }, + { + "epoch": 3.9564032697547686, + "grad_norm": 11.19675064086914, + "learning_rate": 1.99952029564591e-05, + "loss": 1.8022, + "step": 1452 + }, + { + "epoch": 3.9591280653950953, + "grad_norm": 12.150336265563965, + "learning_rate": 1.9995175586142096e-05, + "loss": 2.0386, + "step": 1453 + }, + { + "epoch": 3.9618528610354224, + "grad_norm": 12.408337593078613, + "learning_rate": 1.9995148137982984e-05, + "loss": 1.8091, + "step": 1454 + }, + { + "epoch": 3.9645776566757496, + "grad_norm": 13.837706565856934, + "learning_rate": 1.9995120611981984e-05, + "loss": 1.98, + "step": 1455 + }, + { + "epoch": 3.9673024523160763, + "grad_norm": 10.49660587310791, + "learning_rate": 1.9995093008139304e-05, + "loss": 1.6807, + "step": 1456 + }, + { + "epoch": 3.9700272479564034, + "grad_norm": 11.55453872680664, + "learning_rate": 1.999506532645516e-05, + "loss": 1.9268, + "step": 1457 + }, + { + "epoch": 3.9727520435967305, + "grad_norm": 9.677781105041504, + "learning_rate": 1.9995037566929772e-05, + "loss": 1.9014, + "step": 1458 + }, + { + "epoch": 3.975476839237057, + "grad_norm": 10.551101684570312, + "learning_rate": 1.999500972956335e-05, + "loss": 1.6968, + "step": 1459 + }, + { + "epoch": 3.9782016348773843, + "grad_norm": 16.66094398498535, + "learning_rate": 1.9994981814356116e-05, + "loss": 1.7231, + "step": 1460 + }, + { + "epoch": 3.9809264305177114, + "grad_norm": 11.6234712600708, + "learning_rate": 1.9994953821308284e-05, + "loss": 1.7451, + "step": 1461 + }, + { + "epoch": 3.983651226158038, + "grad_norm": 13.92747688293457, + "learning_rate": 1.9994925750420077e-05, + "loss": 1.8594, + "step": 1462 + }, + { + "epoch": 3.9863760217983653, + "grad_norm": 9.083030700683594, + "learning_rate": 1.9994897601691706e-05, + "loss": 1.7178, + "step": 1463 + }, + { + "epoch": 3.989100817438692, + "grad_norm": 11.762439727783203, + "learning_rate": 1.9994869375123397e-05, + "loss": 1.7671, + "step": 1464 + }, + { + "epoch": 3.991825613079019, + "grad_norm": 37.79829025268555, + "learning_rate": 1.9994841070715365e-05, + "loss": 1.9292, + "step": 1465 + }, + { + "epoch": 3.994550408719346, + "grad_norm": 9.897245407104492, + "learning_rate": 1.999481268846783e-05, + "loss": 1.7383, + "step": 1466 + }, + { + "epoch": 3.997275204359673, + "grad_norm": 13.566228866577148, + "learning_rate": 1.9994784228381018e-05, + "loss": 1.9771, + "step": 1467 + }, + { + "epoch": 4.0, + "grad_norm": 16.183984756469727, + "learning_rate": 1.9994755690455154e-05, + "loss": 1.8462, + "step": 1468 + }, + { + "epoch": 4.002724795640327, + "grad_norm": 12.495182991027832, + "learning_rate": 1.9994727074690444e-05, + "loss": 1.8105, + "step": 1469 + }, + { + "epoch": 4.005449591280654, + "grad_norm": 11.816779136657715, + "learning_rate": 1.9994698381087128e-05, + "loss": 1.8804, + "step": 1470 + }, + { + "epoch": 4.008174386920981, + "grad_norm": 17.457576751708984, + "learning_rate": 1.999466960964542e-05, + "loss": 1.8481, + "step": 1471 + }, + { + "epoch": 4.010899182561308, + "grad_norm": 12.753191947937012, + "learning_rate": 1.9994640760365545e-05, + "loss": 1.9683, + "step": 1472 + }, + { + "epoch": 4.013623978201635, + "grad_norm": 10.090810775756836, + "learning_rate": 1.9994611833247733e-05, + "loss": 1.5667, + "step": 1473 + }, + { + "epoch": 4.016348773841962, + "grad_norm": 14.633957862854004, + "learning_rate": 1.9994582828292205e-05, + "loss": 1.6045, + "step": 1474 + }, + { + "epoch": 4.0190735694822886, + "grad_norm": 8.889056205749512, + "learning_rate": 1.9994553745499187e-05, + "loss": 1.8618, + "step": 1475 + }, + { + "epoch": 4.021798365122616, + "grad_norm": 13.44864559173584, + "learning_rate": 1.9994524584868907e-05, + "loss": 1.8105, + "step": 1476 + }, + { + "epoch": 4.024523160762943, + "grad_norm": 10.613789558410645, + "learning_rate": 1.999449534640159e-05, + "loss": 1.8403, + "step": 1477 + }, + { + "epoch": 4.0272479564032695, + "grad_norm": 12.439909934997559, + "learning_rate": 1.9994466030097466e-05, + "loss": 1.7319, + "step": 1478 + }, + { + "epoch": 4.029972752043597, + "grad_norm": 9.766961097717285, + "learning_rate": 1.9994436635956763e-05, + "loss": 1.8823, + "step": 1479 + }, + { + "epoch": 4.032697547683924, + "grad_norm": 11.173598289489746, + "learning_rate": 1.999440716397971e-05, + "loss": 1.895, + "step": 1480 + }, + { + "epoch": 4.03542234332425, + "grad_norm": 9.04456615447998, + "learning_rate": 1.999437761416653e-05, + "loss": 1.8838, + "step": 1481 + }, + { + "epoch": 4.038147138964578, + "grad_norm": 11.515022277832031, + "learning_rate": 1.9994347986517462e-05, + "loss": 1.9326, + "step": 1482 + }, + { + "epoch": 4.040871934604905, + "grad_norm": 13.177966117858887, + "learning_rate": 1.9994318281032733e-05, + "loss": 1.8623, + "step": 1483 + }, + { + "epoch": 4.043596730245231, + "grad_norm": 10.89008617401123, + "learning_rate": 1.9994288497712575e-05, + "loss": 2.1519, + "step": 1484 + }, + { + "epoch": 4.046321525885559, + "grad_norm": 11.134393692016602, + "learning_rate": 1.999425863655722e-05, + "loss": 1.8154, + "step": 1485 + }, + { + "epoch": 4.049046321525886, + "grad_norm": 13.724608421325684, + "learning_rate": 1.9994228697566905e-05, + "loss": 1.7354, + "step": 1486 + }, + { + "epoch": 4.051771117166212, + "grad_norm": 9.587696075439453, + "learning_rate": 1.999419868074185e-05, + "loss": 1.9072, + "step": 1487 + }, + { + "epoch": 4.05449591280654, + "grad_norm": 15.846437454223633, + "learning_rate": 1.9994168586082305e-05, + "loss": 1.658, + "step": 1488 + }, + { + "epoch": 4.0572207084468666, + "grad_norm": 9.667086601257324, + "learning_rate": 1.999413841358849e-05, + "loss": 1.7827, + "step": 1489 + }, + { + "epoch": 4.059945504087193, + "grad_norm": 19.252283096313477, + "learning_rate": 1.999410816326065e-05, + "loss": 1.5791, + "step": 1490 + }, + { + "epoch": 4.062670299727521, + "grad_norm": 9.600749015808105, + "learning_rate": 1.999407783509902e-05, + "loss": 1.8931, + "step": 1491 + }, + { + "epoch": 4.0653950953678475, + "grad_norm": 8.026127815246582, + "learning_rate": 1.9994047429103832e-05, + "loss": 1.6411, + "step": 1492 + }, + { + "epoch": 4.068119891008174, + "grad_norm": 11.90536117553711, + "learning_rate": 1.9994016945275324e-05, + "loss": 1.9187, + "step": 1493 + }, + { + "epoch": 4.070844686648502, + "grad_norm": 10.286707878112793, + "learning_rate": 1.999398638361373e-05, + "loss": 1.7402, + "step": 1494 + }, + { + "epoch": 4.073569482288828, + "grad_norm": 11.354410171508789, + "learning_rate": 1.9993955744119297e-05, + "loss": 1.7849, + "step": 1495 + }, + { + "epoch": 4.076294277929155, + "grad_norm": 11.293846130371094, + "learning_rate": 1.9993925026792252e-05, + "loss": 1.8325, + "step": 1496 + }, + { + "epoch": 4.079019073569483, + "grad_norm": 9.793984413146973, + "learning_rate": 1.9993894231632847e-05, + "loss": 1.9243, + "step": 1497 + }, + { + "epoch": 4.081743869209809, + "grad_norm": 11.538467407226562, + "learning_rate": 1.9993863358641313e-05, + "loss": 1.7949, + "step": 1498 + }, + { + "epoch": 4.084468664850136, + "grad_norm": 9.210892677307129, + "learning_rate": 1.9993832407817893e-05, + "loss": 1.6348, + "step": 1499 + }, + { + "epoch": 4.087193460490464, + "grad_norm": 9.606528282165527, + "learning_rate": 1.999380137916283e-05, + "loss": 1.8218, + "step": 1500 + }, + { + "epoch": 4.08991825613079, + "grad_norm": 12.650059700012207, + "learning_rate": 1.9993770272676358e-05, + "loss": 1.8882, + "step": 1501 + }, + { + "epoch": 4.092643051771117, + "grad_norm": 11.155830383300781, + "learning_rate": 1.9993739088358728e-05, + "loss": 1.7227, + "step": 1502 + }, + { + "epoch": 4.0953678474114446, + "grad_norm": 11.9778413772583, + "learning_rate": 1.999370782621018e-05, + "loss": 1.9614, + "step": 1503 + }, + { + "epoch": 4.098092643051771, + "grad_norm": 16.51782989501953, + "learning_rate": 1.9993676486230958e-05, + "loss": 1.8359, + "step": 1504 + }, + { + "epoch": 4.100817438692098, + "grad_norm": 11.23696231842041, + "learning_rate": 1.99936450684213e-05, + "loss": 1.7964, + "step": 1505 + }, + { + "epoch": 4.1035422343324255, + "grad_norm": 12.84441089630127, + "learning_rate": 1.9993613572781463e-05, + "loss": 1.6553, + "step": 1506 + }, + { + "epoch": 4.106267029972752, + "grad_norm": 9.473592758178711, + "learning_rate": 1.9993581999311683e-05, + "loss": 1.7896, + "step": 1507 + }, + { + "epoch": 4.108991825613079, + "grad_norm": 16.464216232299805, + "learning_rate": 1.9993550348012202e-05, + "loss": 1.8044, + "step": 1508 + }, + { + "epoch": 4.111716621253406, + "grad_norm": 19.52264976501465, + "learning_rate": 1.9993518618883278e-05, + "loss": 1.6797, + "step": 1509 + }, + { + "epoch": 4.114441416893733, + "grad_norm": 15.042317390441895, + "learning_rate": 1.9993486811925152e-05, + "loss": 1.9888, + "step": 1510 + }, + { + "epoch": 4.11716621253406, + "grad_norm": 11.100996971130371, + "learning_rate": 1.9993454927138075e-05, + "loss": 1.7837, + "step": 1511 + }, + { + "epoch": 4.1198910081743865, + "grad_norm": 13.300409317016602, + "learning_rate": 1.999342296452229e-05, + "loss": 1.9468, + "step": 1512 + }, + { + "epoch": 4.122615803814714, + "grad_norm": 13.411114692687988, + "learning_rate": 1.9993390924078048e-05, + "loss": 1.7124, + "step": 1513 + }, + { + "epoch": 4.125340599455041, + "grad_norm": 14.598684310913086, + "learning_rate": 1.99933588058056e-05, + "loss": 1.644, + "step": 1514 + }, + { + "epoch": 4.128065395095367, + "grad_norm": 14.471258163452148, + "learning_rate": 1.9993326609705193e-05, + "loss": 1.8794, + "step": 1515 + }, + { + "epoch": 4.130790190735695, + "grad_norm": 12.10798168182373, + "learning_rate": 1.999329433577708e-05, + "loss": 1.6577, + "step": 1516 + }, + { + "epoch": 4.133514986376022, + "grad_norm": 16.480541229248047, + "learning_rate": 1.9993261984021516e-05, + "loss": 1.9307, + "step": 1517 + }, + { + "epoch": 4.136239782016348, + "grad_norm": 18.721946716308594, + "learning_rate": 1.9993229554438748e-05, + "loss": 1.7847, + "step": 1518 + }, + { + "epoch": 4.138964577656676, + "grad_norm": 16.204620361328125, + "learning_rate": 1.999319704702903e-05, + "loss": 2.0347, + "step": 1519 + }, + { + "epoch": 4.141689373297003, + "grad_norm": 13.440073013305664, + "learning_rate": 1.9993164461792617e-05, + "loss": 1.5464, + "step": 1520 + }, + { + "epoch": 4.144414168937329, + "grad_norm": 12.055974960327148, + "learning_rate": 1.9993131798729757e-05, + "loss": 1.8345, + "step": 1521 + }, + { + "epoch": 4.147138964577657, + "grad_norm": 27.193063735961914, + "learning_rate": 1.999309905784071e-05, + "loss": 1.6394, + "step": 1522 + }, + { + "epoch": 4.1498637602179835, + "grad_norm": 36.53542709350586, + "learning_rate": 1.9993066239125726e-05, + "loss": 1.7129, + "step": 1523 + }, + { + "epoch": 4.15258855585831, + "grad_norm": 11.463371276855469, + "learning_rate": 1.9993033342585068e-05, + "loss": 1.5171, + "step": 1524 + }, + { + "epoch": 4.155313351498638, + "grad_norm": 13.343096733093262, + "learning_rate": 1.9993000368218985e-05, + "loss": 1.8806, + "step": 1525 + }, + { + "epoch": 4.1580381471389645, + "grad_norm": 14.698657035827637, + "learning_rate": 1.9992967316027738e-05, + "loss": 1.7224, + "step": 1526 + }, + { + "epoch": 4.160762942779291, + "grad_norm": 15.240327835083008, + "learning_rate": 1.9992934186011582e-05, + "loss": 1.792, + "step": 1527 + }, + { + "epoch": 4.163487738419619, + "grad_norm": 19.695175170898438, + "learning_rate": 1.999290097817078e-05, + "loss": 1.9006, + "step": 1528 + }, + { + "epoch": 4.166212534059945, + "grad_norm": 14.388656616210938, + "learning_rate": 1.9992867692505582e-05, + "loss": 1.7368, + "step": 1529 + }, + { + "epoch": 4.168937329700272, + "grad_norm": 18.168359756469727, + "learning_rate": 1.9992834329016256e-05, + "loss": 1.8735, + "step": 1530 + }, + { + "epoch": 4.1716621253406, + "grad_norm": 158.9042510986328, + "learning_rate": 1.9992800887703057e-05, + "loss": 1.8633, + "step": 1531 + }, + { + "epoch": 4.174386920980926, + "grad_norm": 20.479694366455078, + "learning_rate": 1.9992767368566244e-05, + "loss": 1.8296, + "step": 1532 + }, + { + "epoch": 4.177111716621253, + "grad_norm": 26.53901481628418, + "learning_rate": 1.9992733771606082e-05, + "loss": 1.7979, + "step": 1533 + }, + { + "epoch": 4.179836512261581, + "grad_norm": 16.466264724731445, + "learning_rate": 1.999270009682283e-05, + "loss": 1.7959, + "step": 1534 + }, + { + "epoch": 4.182561307901907, + "grad_norm": 13.911393165588379, + "learning_rate": 1.9992666344216754e-05, + "loss": 1.96, + "step": 1535 + }, + { + "epoch": 4.185286103542234, + "grad_norm": 24.931947708129883, + "learning_rate": 1.999263251378811e-05, + "loss": 1.8481, + "step": 1536 + }, + { + "epoch": 4.1880108991825615, + "grad_norm": 17.262683868408203, + "learning_rate": 1.999259860553717e-05, + "loss": 1.7502, + "step": 1537 + }, + { + "epoch": 4.190735694822888, + "grad_norm": 28.27671241760254, + "learning_rate": 1.999256461946419e-05, + "loss": 1.7588, + "step": 1538 + }, + { + "epoch": 4.193460490463215, + "grad_norm": 21.149972915649414, + "learning_rate": 1.999253055556944e-05, + "loss": 1.9121, + "step": 1539 + }, + { + "epoch": 4.1961852861035425, + "grad_norm": 15.513473510742188, + "learning_rate": 1.999249641385318e-05, + "loss": 1.7434, + "step": 1540 + }, + { + "epoch": 4.198910081743869, + "grad_norm": 14.91957950592041, + "learning_rate": 1.9992462194315685e-05, + "loss": 1.8267, + "step": 1541 + }, + { + "epoch": 4.201634877384196, + "grad_norm": 18.212005615234375, + "learning_rate": 1.9992427896957214e-05, + "loss": 1.6914, + "step": 1542 + }, + { + "epoch": 4.204359673024523, + "grad_norm": 14.364083290100098, + "learning_rate": 1.9992393521778038e-05, + "loss": 1.8149, + "step": 1543 + }, + { + "epoch": 4.20708446866485, + "grad_norm": 23.741731643676758, + "learning_rate": 1.999235906877842e-05, + "loss": 1.8225, + "step": 1544 + }, + { + "epoch": 4.209809264305177, + "grad_norm": 20.84150505065918, + "learning_rate": 1.9992324537958628e-05, + "loss": 1.7402, + "step": 1545 + }, + { + "epoch": 4.212534059945504, + "grad_norm": 43.37743377685547, + "learning_rate": 1.9992289929318944e-05, + "loss": 1.7632, + "step": 1546 + }, + { + "epoch": 4.215258855585831, + "grad_norm": 14.563302993774414, + "learning_rate": 1.9992255242859618e-05, + "loss": 1.7861, + "step": 1547 + }, + { + "epoch": 4.217983651226158, + "grad_norm": 18.320777893066406, + "learning_rate": 1.9992220478580936e-05, + "loss": 2.0103, + "step": 1548 + }, + { + "epoch": 4.220708446866485, + "grad_norm": 17.307558059692383, + "learning_rate": 1.999218563648316e-05, + "loss": 1.8047, + "step": 1549 + }, + { + "epoch": 4.223433242506812, + "grad_norm": 14.111106872558594, + "learning_rate": 1.9992150716566564e-05, + "loss": 1.9575, + "step": 1550 + }, + { + "epoch": 4.226158038147139, + "grad_norm": 27.04886245727539, + "learning_rate": 1.9992115718831416e-05, + "loss": 1.6965, + "step": 1551 + }, + { + "epoch": 4.228882833787466, + "grad_norm": 20.34300994873047, + "learning_rate": 1.9992080643278e-05, + "loss": 1.7808, + "step": 1552 + }, + { + "epoch": 4.231607629427793, + "grad_norm": 12.827519416809082, + "learning_rate": 1.9992045489906578e-05, + "loss": 1.8965, + "step": 1553 + }, + { + "epoch": 4.23433242506812, + "grad_norm": 10.950469970703125, + "learning_rate": 1.9992010258717423e-05, + "loss": 1.6541, + "step": 1554 + }, + { + "epoch": 4.237057220708447, + "grad_norm": 15.466451644897461, + "learning_rate": 1.9991974949710823e-05, + "loss": 2.0952, + "step": 1555 + }, + { + "epoch": 4.239782016348774, + "grad_norm": 15.410811424255371, + "learning_rate": 1.9991939562887035e-05, + "loss": 1.999, + "step": 1556 + }, + { + "epoch": 4.2425068119891005, + "grad_norm": 15.858236312866211, + "learning_rate": 1.9991904098246347e-05, + "loss": 1.7847, + "step": 1557 + }, + { + "epoch": 4.245231607629428, + "grad_norm": 18.37849235534668, + "learning_rate": 1.999186855578903e-05, + "loss": 1.9233, + "step": 1558 + }, + { + "epoch": 4.247956403269755, + "grad_norm": 21.132099151611328, + "learning_rate": 1.9991832935515366e-05, + "loss": 1.7544, + "step": 1559 + }, + { + "epoch": 4.2506811989100814, + "grad_norm": 11.251901626586914, + "learning_rate": 1.9991797237425625e-05, + "loss": 1.9648, + "step": 1560 + }, + { + "epoch": 4.253405994550409, + "grad_norm": 10.464017868041992, + "learning_rate": 1.9991761461520088e-05, + "loss": 1.7173, + "step": 1561 + }, + { + "epoch": 4.256130790190736, + "grad_norm": 15.851114273071289, + "learning_rate": 1.9991725607799037e-05, + "loss": 1.8613, + "step": 1562 + }, + { + "epoch": 4.258855585831062, + "grad_norm": 12.207009315490723, + "learning_rate": 1.999168967626275e-05, + "loss": 1.7659, + "step": 1563 + }, + { + "epoch": 4.26158038147139, + "grad_norm": 16.404396057128906, + "learning_rate": 1.99916536669115e-05, + "loss": 1.9849, + "step": 1564 + }, + { + "epoch": 4.264305177111717, + "grad_norm": 19.986793518066406, + "learning_rate": 1.999161757974558e-05, + "loss": 2.0391, + "step": 1565 + }, + { + "epoch": 4.267029972752043, + "grad_norm": 12.699073791503906, + "learning_rate": 1.9991581414765256e-05, + "loss": 1.7935, + "step": 1566 + }, + { + "epoch": 4.269754768392371, + "grad_norm": 10.729422569274902, + "learning_rate": 1.9991545171970822e-05, + "loss": 1.7974, + "step": 1567 + }, + { + "epoch": 4.272479564032698, + "grad_norm": 11.770853996276855, + "learning_rate": 1.9991508851362555e-05, + "loss": 1.77, + "step": 1568 + }, + { + "epoch": 4.275204359673024, + "grad_norm": 17.789634704589844, + "learning_rate": 1.9991472452940738e-05, + "loss": 1.9048, + "step": 1569 + }, + { + "epoch": 4.277929155313352, + "grad_norm": 16.31340217590332, + "learning_rate": 1.9991435976705657e-05, + "loss": 1.8638, + "step": 1570 + }, + { + "epoch": 4.2806539509536785, + "grad_norm": 16.50969123840332, + "learning_rate": 1.9991399422657593e-05, + "loss": 2.0146, + "step": 1571 + }, + { + "epoch": 4.283378746594005, + "grad_norm": 14.991809844970703, + "learning_rate": 1.999136279079683e-05, + "loss": 1.9717, + "step": 1572 + }, + { + "epoch": 4.286103542234333, + "grad_norm": 20.145408630371094, + "learning_rate": 1.999132608112366e-05, + "loss": 1.8589, + "step": 1573 + }, + { + "epoch": 4.2888283378746594, + "grad_norm": 16.198291778564453, + "learning_rate": 1.999128929363836e-05, + "loss": 1.8687, + "step": 1574 + }, + { + "epoch": 4.291553133514986, + "grad_norm": 11.562917709350586, + "learning_rate": 1.9991252428341222e-05, + "loss": 1.7009, + "step": 1575 + }, + { + "epoch": 4.294277929155314, + "grad_norm": 8.705707550048828, + "learning_rate": 1.999121548523253e-05, + "loss": 1.7183, + "step": 1576 + }, + { + "epoch": 4.29700272479564, + "grad_norm": 10.386330604553223, + "learning_rate": 1.9991178464312575e-05, + "loss": 1.801, + "step": 1577 + }, + { + "epoch": 4.299727520435967, + "grad_norm": 13.204593658447266, + "learning_rate": 1.9991141365581644e-05, + "loss": 1.7529, + "step": 1578 + }, + { + "epoch": 4.302452316076295, + "grad_norm": 11.083606719970703, + "learning_rate": 1.9991104189040024e-05, + "loss": 1.7524, + "step": 1579 + }, + { + "epoch": 4.305177111716621, + "grad_norm": 12.340747833251953, + "learning_rate": 1.999106693468801e-05, + "loss": 1.8311, + "step": 1580 + }, + { + "epoch": 4.307901907356948, + "grad_norm": 11.777390480041504, + "learning_rate": 1.9991029602525884e-05, + "loss": 2.0127, + "step": 1581 + }, + { + "epoch": 4.310626702997276, + "grad_norm": 12.502350807189941, + "learning_rate": 1.999099219255394e-05, + "loss": 2.0781, + "step": 1582 + }, + { + "epoch": 4.313351498637602, + "grad_norm": 12.655232429504395, + "learning_rate": 1.9990954704772473e-05, + "loss": 1.7717, + "step": 1583 + }, + { + "epoch": 4.316076294277929, + "grad_norm": 12.700472831726074, + "learning_rate": 1.9990917139181772e-05, + "loss": 2.0933, + "step": 1584 + }, + { + "epoch": 4.3188010899182565, + "grad_norm": 11.673563003540039, + "learning_rate": 1.999087949578213e-05, + "loss": 1.6792, + "step": 1585 + }, + { + "epoch": 4.321525885558583, + "grad_norm": 13.173969268798828, + "learning_rate": 1.9990841774573843e-05, + "loss": 1.9663, + "step": 1586 + }, + { + "epoch": 4.32425068119891, + "grad_norm": 13.962111473083496, + "learning_rate": 1.9990803975557197e-05, + "loss": 1.9666, + "step": 1587 + }, + { + "epoch": 4.3269754768392374, + "grad_norm": 15.190113067626953, + "learning_rate": 1.9990766098732493e-05, + "loss": 1.7192, + "step": 1588 + }, + { + "epoch": 4.329700272479564, + "grad_norm": 14.03504467010498, + "learning_rate": 1.9990728144100025e-05, + "loss": 1.8108, + "step": 1589 + }, + { + "epoch": 4.332425068119891, + "grad_norm": 10.579913139343262, + "learning_rate": 1.999069011166009e-05, + "loss": 1.8877, + "step": 1590 + }, + { + "epoch": 4.335149863760218, + "grad_norm": 12.852388381958008, + "learning_rate": 1.9990652001412973e-05, + "loss": 1.9597, + "step": 1591 + }, + { + "epoch": 4.337874659400545, + "grad_norm": 11.49439525604248, + "learning_rate": 1.9990613813358987e-05, + "loss": 1.894, + "step": 1592 + }, + { + "epoch": 4.340599455040872, + "grad_norm": 10.72061538696289, + "learning_rate": 1.999057554749842e-05, + "loss": 1.8101, + "step": 1593 + }, + { + "epoch": 4.343324250681199, + "grad_norm": 11.686420440673828, + "learning_rate": 1.9990537203831573e-05, + "loss": 2.0156, + "step": 1594 + }, + { + "epoch": 4.346049046321526, + "grad_norm": 13.056648254394531, + "learning_rate": 1.9990498782358745e-05, + "loss": 1.9202, + "step": 1595 + }, + { + "epoch": 4.348773841961853, + "grad_norm": 12.927536964416504, + "learning_rate": 1.9990460283080232e-05, + "loss": 1.9849, + "step": 1596 + }, + { + "epoch": 4.35149863760218, + "grad_norm": 10.1175537109375, + "learning_rate": 1.9990421705996336e-05, + "loss": 1.8677, + "step": 1597 + }, + { + "epoch": 4.354223433242507, + "grad_norm": 10.478602409362793, + "learning_rate": 1.999038305110736e-05, + "loss": 1.9634, + "step": 1598 + }, + { + "epoch": 4.356948228882834, + "grad_norm": 13.643245697021484, + "learning_rate": 1.9990344318413598e-05, + "loss": 1.7224, + "step": 1599 + }, + { + "epoch": 4.359673024523161, + "grad_norm": 10.597620010375977, + "learning_rate": 1.999030550791536e-05, + "loss": 1.8633, + "step": 1600 + }, + { + "epoch": 4.362397820163488, + "grad_norm": 18.982633590698242, + "learning_rate": 1.999026661961294e-05, + "loss": 1.7788, + "step": 1601 + }, + { + "epoch": 4.3651226158038146, + "grad_norm": 14.29390811920166, + "learning_rate": 1.999022765350665e-05, + "loss": 1.8198, + "step": 1602 + }, + { + "epoch": 4.367847411444142, + "grad_norm": 14.045916557312012, + "learning_rate": 1.9990188609596786e-05, + "loss": 1.6416, + "step": 1603 + }, + { + "epoch": 4.370572207084469, + "grad_norm": 9.716156005859375, + "learning_rate": 1.9990149487883653e-05, + "loss": 2.0276, + "step": 1604 + }, + { + "epoch": 4.3732970027247955, + "grad_norm": 12.709885597229004, + "learning_rate": 1.999011028836756e-05, + "loss": 1.804, + "step": 1605 + }, + { + "epoch": 4.376021798365123, + "grad_norm": 13.103960037231445, + "learning_rate": 1.9990071011048807e-05, + "loss": 1.8384, + "step": 1606 + }, + { + "epoch": 4.37874659400545, + "grad_norm": 11.972681999206543, + "learning_rate": 1.999003165592771e-05, + "loss": 1.9453, + "step": 1607 + }, + { + "epoch": 4.381471389645776, + "grad_norm": 23.582698822021484, + "learning_rate": 1.998999222300456e-05, + "loss": 1.6707, + "step": 1608 + }, + { + "epoch": 4.384196185286104, + "grad_norm": 11.656493186950684, + "learning_rate": 1.9989952712279674e-05, + "loss": 1.8208, + "step": 1609 + }, + { + "epoch": 4.386920980926431, + "grad_norm": 10.497620582580566, + "learning_rate": 1.998991312375336e-05, + "loss": 1.8674, + "step": 1610 + }, + { + "epoch": 4.389645776566757, + "grad_norm": 12.55628776550293, + "learning_rate": 1.9989873457425922e-05, + "loss": 1.7979, + "step": 1611 + }, + { + "epoch": 4.392370572207085, + "grad_norm": 12.809096336364746, + "learning_rate": 1.998983371329767e-05, + "loss": 1.9019, + "step": 1612 + }, + { + "epoch": 4.395095367847412, + "grad_norm": 15.382226943969727, + "learning_rate": 1.9989793891368915e-05, + "loss": 1.7056, + "step": 1613 + }, + { + "epoch": 4.397820163487738, + "grad_norm": 11.492066383361816, + "learning_rate": 1.9989753991639968e-05, + "loss": 1.814, + "step": 1614 + }, + { + "epoch": 4.400544959128065, + "grad_norm": 14.366987228393555, + "learning_rate": 1.998971401411114e-05, + "loss": 1.7908, + "step": 1615 + }, + { + "epoch": 4.4032697547683926, + "grad_norm": 13.31606388092041, + "learning_rate": 1.9989673958782735e-05, + "loss": 1.802, + "step": 1616 + }, + { + "epoch": 4.405994550408719, + "grad_norm": 26.214847564697266, + "learning_rate": 1.998963382565508e-05, + "loss": 1.8096, + "step": 1617 + }, + { + "epoch": 4.408719346049046, + "grad_norm": 12.695902824401855, + "learning_rate": 1.998959361472847e-05, + "loss": 1.7192, + "step": 1618 + }, + { + "epoch": 4.4114441416893735, + "grad_norm": 14.11608600616455, + "learning_rate": 1.9989553326003226e-05, + "loss": 1.8149, + "step": 1619 + }, + { + "epoch": 4.4141689373297, + "grad_norm": 14.843645095825195, + "learning_rate": 1.9989512959479666e-05, + "loss": 1.8113, + "step": 1620 + }, + { + "epoch": 4.416893732970027, + "grad_norm": 12.413495063781738, + "learning_rate": 1.9989472515158102e-05, + "loss": 2.0884, + "step": 1621 + }, + { + "epoch": 4.419618528610354, + "grad_norm": 14.569469451904297, + "learning_rate": 1.9989431993038842e-05, + "loss": 1.9043, + "step": 1622 + }, + { + "epoch": 4.422343324250681, + "grad_norm": 13.531723976135254, + "learning_rate": 1.998939139312221e-05, + "loss": 1.7754, + "step": 1623 + }, + { + "epoch": 4.425068119891008, + "grad_norm": 15.61850643157959, + "learning_rate": 1.9989350715408525e-05, + "loss": 1.7192, + "step": 1624 + }, + { + "epoch": 4.427792915531335, + "grad_norm": 12.612687110900879, + "learning_rate": 1.998930995989809e-05, + "loss": 1.8931, + "step": 1625 + }, + { + "epoch": 4.430517711171662, + "grad_norm": 13.903953552246094, + "learning_rate": 1.9989269126591236e-05, + "loss": 2.0015, + "step": 1626 + }, + { + "epoch": 4.433242506811989, + "grad_norm": 11.026742935180664, + "learning_rate": 1.9989228215488273e-05, + "loss": 1.5745, + "step": 1627 + }, + { + "epoch": 4.435967302452316, + "grad_norm": 22.10861587524414, + "learning_rate": 1.9989187226589522e-05, + "loss": 1.916, + "step": 1628 + }, + { + "epoch": 4.438692098092643, + "grad_norm": 21.367530822753906, + "learning_rate": 1.9989146159895305e-05, + "loss": 1.9092, + "step": 1629 + }, + { + "epoch": 4.44141689373297, + "grad_norm": 12.559633255004883, + "learning_rate": 1.9989105015405935e-05, + "loss": 1.8308, + "step": 1630 + }, + { + "epoch": 4.444141689373297, + "grad_norm": 15.54616928100586, + "learning_rate": 1.9989063793121736e-05, + "loss": 2.0679, + "step": 1631 + }, + { + "epoch": 4.446866485013624, + "grad_norm": 12.716418266296387, + "learning_rate": 1.9989022493043033e-05, + "loss": 1.7646, + "step": 1632 + }, + { + "epoch": 4.449591280653951, + "grad_norm": 16.063173294067383, + "learning_rate": 1.9988981115170144e-05, + "loss": 1.9248, + "step": 1633 + }, + { + "epoch": 4.452316076294278, + "grad_norm": 22.75617027282715, + "learning_rate": 1.998893965950339e-05, + "loss": 2.1328, + "step": 1634 + }, + { + "epoch": 4.455040871934605, + "grad_norm": 14.810853004455566, + "learning_rate": 1.99888981260431e-05, + "loss": 1.6895, + "step": 1635 + }, + { + "epoch": 4.4577656675749315, + "grad_norm": 23.45295524597168, + "learning_rate": 1.998885651478959e-05, + "loss": 1.8169, + "step": 1636 + }, + { + "epoch": 4.460490463215259, + "grad_norm": 23.975677490234375, + "learning_rate": 1.9988814825743183e-05, + "loss": 1.7471, + "step": 1637 + }, + { + "epoch": 4.463215258855586, + "grad_norm": 18.05084800720215, + "learning_rate": 1.9988773058904213e-05, + "loss": 1.6943, + "step": 1638 + }, + { + "epoch": 4.4659400544959125, + "grad_norm": 17.506332397460938, + "learning_rate": 1.9988731214272995e-05, + "loss": 1.9805, + "step": 1639 + }, + { + "epoch": 4.46866485013624, + "grad_norm": 45.82698059082031, + "learning_rate": 1.9988689291849865e-05, + "loss": 1.8711, + "step": 1640 + }, + { + "epoch": 4.471389645776567, + "grad_norm": 20.599950790405273, + "learning_rate": 1.9988647291635143e-05, + "loss": 2.0127, + "step": 1641 + }, + { + "epoch": 4.474114441416893, + "grad_norm": 27.706125259399414, + "learning_rate": 1.9988605213629157e-05, + "loss": 1.7874, + "step": 1642 + }, + { + "epoch": 4.476839237057221, + "grad_norm": 26.521753311157227, + "learning_rate": 1.9988563057832234e-05, + "loss": 1.834, + "step": 1643 + }, + { + "epoch": 4.479564032697548, + "grad_norm": 28.991363525390625, + "learning_rate": 1.9988520824244703e-05, + "loss": 1.8335, + "step": 1644 + }, + { + "epoch": 4.482288828337874, + "grad_norm": 13.267407417297363, + "learning_rate": 1.9988478512866893e-05, + "loss": 1.8252, + "step": 1645 + }, + { + "epoch": 4.485013623978202, + "grad_norm": 15.971419334411621, + "learning_rate": 1.9988436123699135e-05, + "loss": 1.6104, + "step": 1646 + }, + { + "epoch": 4.487738419618529, + "grad_norm": 12.338957786560059, + "learning_rate": 1.998839365674176e-05, + "loss": 1.9094, + "step": 1647 + }, + { + "epoch": 4.490463215258855, + "grad_norm": 12.820110321044922, + "learning_rate": 1.9988351111995095e-05, + "loss": 1.7393, + "step": 1648 + }, + { + "epoch": 4.493188010899183, + "grad_norm": 20.78042221069336, + "learning_rate": 1.998830848945947e-05, + "loss": 1.9839, + "step": 1649 + }, + { + "epoch": 4.4959128065395095, + "grad_norm": 15.028311729431152, + "learning_rate": 1.9988265789135224e-05, + "loss": 1.853, + "step": 1650 + }, + { + "epoch": 4.498637602179836, + "grad_norm": 16.6220645904541, + "learning_rate": 1.9988223011022686e-05, + "loss": 1.7827, + "step": 1651 + }, + { + "epoch": 4.501362397820164, + "grad_norm": 17.394527435302734, + "learning_rate": 1.9988180155122187e-05, + "loss": 1.8818, + "step": 1652 + }, + { + "epoch": 4.5040871934604905, + "grad_norm": 19.727069854736328, + "learning_rate": 1.998813722143406e-05, + "loss": 1.9028, + "step": 1653 + }, + { + "epoch": 4.506811989100817, + "grad_norm": 18.605106353759766, + "learning_rate": 1.9988094209958644e-05, + "loss": 1.8357, + "step": 1654 + }, + { + "epoch": 4.509536784741145, + "grad_norm": 14.147246360778809, + "learning_rate": 1.998805112069627e-05, + "loss": 1.7061, + "step": 1655 + }, + { + "epoch": 4.512261580381471, + "grad_norm": 14.222494125366211, + "learning_rate": 1.9988007953647278e-05, + "loss": 1.6477, + "step": 1656 + }, + { + "epoch": 4.514986376021798, + "grad_norm": 16.673221588134766, + "learning_rate": 1.9987964708812e-05, + "loss": 1.802, + "step": 1657 + }, + { + "epoch": 4.517711171662126, + "grad_norm": 13.81769847869873, + "learning_rate": 1.9987921386190777e-05, + "loss": 1.8066, + "step": 1658 + }, + { + "epoch": 4.520435967302452, + "grad_norm": 11.60045337677002, + "learning_rate": 1.998787798578394e-05, + "loss": 1.8171, + "step": 1659 + }, + { + "epoch": 4.523160762942779, + "grad_norm": 14.101318359375, + "learning_rate": 1.9987834507591834e-05, + "loss": 1.8599, + "step": 1660 + }, + { + "epoch": 4.525885558583107, + "grad_norm": 32.92286682128906, + "learning_rate": 1.9987790951614792e-05, + "loss": 2.0098, + "step": 1661 + }, + { + "epoch": 4.528610354223433, + "grad_norm": 14.645931243896484, + "learning_rate": 1.9987747317853156e-05, + "loss": 1.7949, + "step": 1662 + }, + { + "epoch": 4.53133514986376, + "grad_norm": 13.726556777954102, + "learning_rate": 1.9987703606307268e-05, + "loss": 1.8081, + "step": 1663 + }, + { + "epoch": 4.5340599455040875, + "grad_norm": 14.259086608886719, + "learning_rate": 1.998765981697746e-05, + "loss": 1.9502, + "step": 1664 + }, + { + "epoch": 4.536784741144414, + "grad_norm": 13.587321281433105, + "learning_rate": 1.9987615949864085e-05, + "loss": 2.0098, + "step": 1665 + }, + { + "epoch": 4.539509536784741, + "grad_norm": 17.23871612548828, + "learning_rate": 1.9987572004967474e-05, + "loss": 1.9043, + "step": 1666 + }, + { + "epoch": 4.5422343324250685, + "grad_norm": 11.833878517150879, + "learning_rate": 1.9987527982287977e-05, + "loss": 1.8086, + "step": 1667 + }, + { + "epoch": 4.544959128065395, + "grad_norm": 14.381035804748535, + "learning_rate": 1.9987483881825928e-05, + "loss": 1.8198, + "step": 1668 + }, + { + "epoch": 4.547683923705722, + "grad_norm": 13.35680103302002, + "learning_rate": 1.998743970358168e-05, + "loss": 1.7485, + "step": 1669 + }, + { + "epoch": 4.550408719346049, + "grad_norm": 9.395089149475098, + "learning_rate": 1.9987395447555574e-05, + "loss": 1.551, + "step": 1670 + }, + { + "epoch": 4.553133514986376, + "grad_norm": 11.275160789489746, + "learning_rate": 1.9987351113747953e-05, + "loss": 1.7605, + "step": 1671 + }, + { + "epoch": 4.555858310626703, + "grad_norm": 37.18361282348633, + "learning_rate": 1.998730670215916e-05, + "loss": 1.7385, + "step": 1672 + }, + { + "epoch": 4.55858310626703, + "grad_norm": 15.461226463317871, + "learning_rate": 1.9987262212789547e-05, + "loss": 1.7046, + "step": 1673 + }, + { + "epoch": 4.561307901907357, + "grad_norm": 11.419524192810059, + "learning_rate": 1.998721764563946e-05, + "loss": 1.6311, + "step": 1674 + }, + { + "epoch": 4.564032697547684, + "grad_norm": 11.717555046081543, + "learning_rate": 1.9987173000709238e-05, + "loss": 1.9062, + "step": 1675 + }, + { + "epoch": 4.566757493188011, + "grad_norm": 11.768439292907715, + "learning_rate": 1.9987128277999236e-05, + "loss": 1.8047, + "step": 1676 + }, + { + "epoch": 4.569482288828338, + "grad_norm": 11.077784538269043, + "learning_rate": 1.99870834775098e-05, + "loss": 1.8286, + "step": 1677 + }, + { + "epoch": 4.572207084468665, + "grad_norm": 9.806815147399902, + "learning_rate": 1.998703859924128e-05, + "loss": 1.8022, + "step": 1678 + }, + { + "epoch": 4.574931880108992, + "grad_norm": 21.835113525390625, + "learning_rate": 1.9986993643194022e-05, + "loss": 1.8, + "step": 1679 + }, + { + "epoch": 4.577656675749319, + "grad_norm": 11.922440528869629, + "learning_rate": 1.9986948609368385e-05, + "loss": 1.959, + "step": 1680 + }, + { + "epoch": 4.580381471389646, + "grad_norm": 12.709155082702637, + "learning_rate": 1.998690349776471e-05, + "loss": 1.7598, + "step": 1681 + }, + { + "epoch": 4.583106267029972, + "grad_norm": 12.793139457702637, + "learning_rate": 1.998685830838335e-05, + "loss": 1.7505, + "step": 1682 + }, + { + "epoch": 4.5858310626703, + "grad_norm": 12.681434631347656, + "learning_rate": 1.9986813041224662e-05, + "loss": 1.75, + "step": 1683 + }, + { + "epoch": 4.5885558583106265, + "grad_norm": 10.861709594726562, + "learning_rate": 1.9986767696288997e-05, + "loss": 1.9194, + "step": 1684 + }, + { + "epoch": 4.591280653950953, + "grad_norm": 10.562196731567383, + "learning_rate": 1.9986722273576703e-05, + "loss": 1.8896, + "step": 1685 + }, + { + "epoch": 4.594005449591281, + "grad_norm": 10.61209487915039, + "learning_rate": 1.9986676773088137e-05, + "loss": 1.6443, + "step": 1686 + }, + { + "epoch": 4.5967302452316074, + "grad_norm": 11.602971076965332, + "learning_rate": 1.9986631194823657e-05, + "loss": 1.7312, + "step": 1687 + }, + { + "epoch": 4.599455040871934, + "grad_norm": 11.791472434997559, + "learning_rate": 1.998658553878361e-05, + "loss": 1.6738, + "step": 1688 + }, + { + "epoch": 4.602179836512262, + "grad_norm": 10.37132740020752, + "learning_rate": 1.998653980496836e-05, + "loss": 1.6467, + "step": 1689 + }, + { + "epoch": 4.604904632152588, + "grad_norm": 11.563543319702148, + "learning_rate": 1.998649399337826e-05, + "loss": 2.0576, + "step": 1690 + }, + { + "epoch": 4.607629427792915, + "grad_norm": 11.379239082336426, + "learning_rate": 1.9986448104013664e-05, + "loss": 1.6252, + "step": 1691 + }, + { + "epoch": 4.610354223433243, + "grad_norm": 16.69204330444336, + "learning_rate": 1.998640213687493e-05, + "loss": 1.8271, + "step": 1692 + }, + { + "epoch": 4.613079019073569, + "grad_norm": 11.283498764038086, + "learning_rate": 1.9986356091962423e-05, + "loss": 1.7749, + "step": 1693 + }, + { + "epoch": 4.615803814713896, + "grad_norm": 11.236751556396484, + "learning_rate": 1.998630996927649e-05, + "loss": 1.9575, + "step": 1694 + }, + { + "epoch": 4.618528610354224, + "grad_norm": 9.967838287353516, + "learning_rate": 1.9986263768817502e-05, + "loss": 1.8423, + "step": 1695 + }, + { + "epoch": 4.62125340599455, + "grad_norm": 10.786258697509766, + "learning_rate": 1.998621749058581e-05, + "loss": 1.7085, + "step": 1696 + }, + { + "epoch": 4.623978201634877, + "grad_norm": 10.914759635925293, + "learning_rate": 1.9986171134581778e-05, + "loss": 1.7256, + "step": 1697 + }, + { + "epoch": 4.6267029972752045, + "grad_norm": 10.664731979370117, + "learning_rate": 1.9986124700805764e-05, + "loss": 1.644, + "step": 1698 + }, + { + "epoch": 4.629427792915531, + "grad_norm": 11.085412979125977, + "learning_rate": 1.998607818925814e-05, + "loss": 1.7568, + "step": 1699 + }, + { + "epoch": 4.632152588555858, + "grad_norm": 9.910640716552734, + "learning_rate": 1.9986031599939253e-05, + "loss": 1.7383, + "step": 1700 + }, + { + "epoch": 4.6348773841961854, + "grad_norm": 11.176325798034668, + "learning_rate": 1.9985984932849475e-05, + "loss": 1.5896, + "step": 1701 + }, + { + "epoch": 4.637602179836512, + "grad_norm": 11.895498275756836, + "learning_rate": 1.998593818798917e-05, + "loss": 1.9604, + "step": 1702 + }, + { + "epoch": 4.640326975476839, + "grad_norm": 10.814287185668945, + "learning_rate": 1.9985891365358697e-05, + "loss": 1.5288, + "step": 1703 + }, + { + "epoch": 4.643051771117166, + "grad_norm": 13.177926063537598, + "learning_rate": 1.9985844464958423e-05, + "loss": 2.0076, + "step": 1704 + }, + { + "epoch": 4.645776566757493, + "grad_norm": 12.39803695678711, + "learning_rate": 1.998579748678872e-05, + "loss": 2.041, + "step": 1705 + }, + { + "epoch": 4.64850136239782, + "grad_norm": 12.203011512756348, + "learning_rate": 1.998575043084994e-05, + "loss": 1.865, + "step": 1706 + }, + { + "epoch": 4.651226158038147, + "grad_norm": 14.263901710510254, + "learning_rate": 1.998570329714246e-05, + "loss": 1.8115, + "step": 1707 + }, + { + "epoch": 4.653950953678474, + "grad_norm": 11.454439163208008, + "learning_rate": 1.9985656085666646e-05, + "loss": 1.8589, + "step": 1708 + }, + { + "epoch": 4.656675749318801, + "grad_norm": 10.870101928710938, + "learning_rate": 1.9985608796422863e-05, + "loss": 1.5823, + "step": 1709 + }, + { + "epoch": 4.659400544959128, + "grad_norm": 10.731388092041016, + "learning_rate": 1.9985561429411478e-05, + "loss": 1.603, + "step": 1710 + }, + { + "epoch": 4.662125340599455, + "grad_norm": 11.784908294677734, + "learning_rate": 1.998551398463286e-05, + "loss": 1.7156, + "step": 1711 + }, + { + "epoch": 4.664850136239782, + "grad_norm": 11.44052505493164, + "learning_rate": 1.9985466462087383e-05, + "loss": 1.7234, + "step": 1712 + }, + { + "epoch": 4.667574931880109, + "grad_norm": 9.635643005371094, + "learning_rate": 1.9985418861775416e-05, + "loss": 1.7871, + "step": 1713 + }, + { + "epoch": 4.670299727520436, + "grad_norm": 10.105297088623047, + "learning_rate": 1.9985371183697327e-05, + "loss": 1.7383, + "step": 1714 + }, + { + "epoch": 4.6730245231607626, + "grad_norm": 11.22205638885498, + "learning_rate": 1.9985323427853492e-05, + "loss": 1.8931, + "step": 1715 + }, + { + "epoch": 4.67574931880109, + "grad_norm": 9.009623527526855, + "learning_rate": 1.9985275594244277e-05, + "loss": 1.6968, + "step": 1716 + }, + { + "epoch": 4.678474114441417, + "grad_norm": 9.375571250915527, + "learning_rate": 1.9985227682870054e-05, + "loss": 1.5361, + "step": 1717 + }, + { + "epoch": 4.6811989100817435, + "grad_norm": 19.648733139038086, + "learning_rate": 1.9985179693731204e-05, + "loss": 1.8423, + "step": 1718 + }, + { + "epoch": 4.683923705722071, + "grad_norm": 10.109658241271973, + "learning_rate": 1.9985131626828092e-05, + "loss": 1.6052, + "step": 1719 + }, + { + "epoch": 4.686648501362398, + "grad_norm": 12.355353355407715, + "learning_rate": 1.9985083482161098e-05, + "loss": 1.6052, + "step": 1720 + }, + { + "epoch": 4.689373297002724, + "grad_norm": 10.802824020385742, + "learning_rate": 1.9985035259730593e-05, + "loss": 1.8369, + "step": 1721 + }, + { + "epoch": 4.692098092643052, + "grad_norm": 11.200514793395996, + "learning_rate": 1.998498695953696e-05, + "loss": 1.8716, + "step": 1722 + }, + { + "epoch": 4.694822888283379, + "grad_norm": 11.038694381713867, + "learning_rate": 1.9984938581580566e-05, + "loss": 1.7036, + "step": 1723 + }, + { + "epoch": 4.697547683923705, + "grad_norm": 12.441304206848145, + "learning_rate": 1.998489012586179e-05, + "loss": 2.0435, + "step": 1724 + }, + { + "epoch": 4.700272479564033, + "grad_norm": 13.135621070861816, + "learning_rate": 1.9984841592381014e-05, + "loss": 1.6655, + "step": 1725 + }, + { + "epoch": 4.70299727520436, + "grad_norm": 11.036510467529297, + "learning_rate": 1.9984792981138616e-05, + "loss": 1.7988, + "step": 1726 + }, + { + "epoch": 4.705722070844686, + "grad_norm": 15.357640266418457, + "learning_rate": 1.9984744292134964e-05, + "loss": 1.8721, + "step": 1727 + }, + { + "epoch": 4.708446866485014, + "grad_norm": 11.371448516845703, + "learning_rate": 1.998469552537045e-05, + "loss": 1.8281, + "step": 1728 + }, + { + "epoch": 4.7111716621253406, + "grad_norm": 9.8068208694458, + "learning_rate": 1.9984646680845446e-05, + "loss": 1.5767, + "step": 1729 + }, + { + "epoch": 4.713896457765667, + "grad_norm": 13.548954010009766, + "learning_rate": 1.998459775856034e-05, + "loss": 2.1074, + "step": 1730 + }, + { + "epoch": 4.716621253405995, + "grad_norm": 10.1837158203125, + "learning_rate": 1.9984548758515503e-05, + "loss": 1.5684, + "step": 1731 + }, + { + "epoch": 4.7193460490463215, + "grad_norm": 8.237529754638672, + "learning_rate": 1.9984499680711322e-05, + "loss": 1.6902, + "step": 1732 + }, + { + "epoch": 4.722070844686648, + "grad_norm": 14.443774223327637, + "learning_rate": 1.9984450525148184e-05, + "loss": 1.7354, + "step": 1733 + }, + { + "epoch": 4.724795640326976, + "grad_norm": 13.338621139526367, + "learning_rate": 1.998440129182646e-05, + "loss": 1.791, + "step": 1734 + }, + { + "epoch": 4.727520435967302, + "grad_norm": 11.367993354797363, + "learning_rate": 1.9984351980746545e-05, + "loss": 1.7681, + "step": 1735 + }, + { + "epoch": 4.730245231607629, + "grad_norm": 8.49145221710205, + "learning_rate": 1.9984302591908812e-05, + "loss": 1.9062, + "step": 1736 + }, + { + "epoch": 4.732970027247957, + "grad_norm": 13.06961441040039, + "learning_rate": 1.998425312531366e-05, + "loss": 1.7966, + "step": 1737 + }, + { + "epoch": 4.735694822888283, + "grad_norm": 10.855565071105957, + "learning_rate": 1.998420358096146e-05, + "loss": 1.9082, + "step": 1738 + }, + { + "epoch": 4.73841961852861, + "grad_norm": 11.271066665649414, + "learning_rate": 1.9984153958852605e-05, + "loss": 1.8032, + "step": 1739 + }, + { + "epoch": 4.741144414168938, + "grad_norm": 10.016924858093262, + "learning_rate": 1.998410425898748e-05, + "loss": 1.6357, + "step": 1740 + }, + { + "epoch": 4.743869209809264, + "grad_norm": 13.83434772491455, + "learning_rate": 1.9984054481366474e-05, + "loss": 1.8184, + "step": 1741 + }, + { + "epoch": 4.746594005449591, + "grad_norm": 11.466126441955566, + "learning_rate": 1.9984004625989974e-05, + "loss": 1.7693, + "step": 1742 + }, + { + "epoch": 4.7493188010899186, + "grad_norm": 10.852738380432129, + "learning_rate": 1.9983954692858363e-05, + "loss": 1.5586, + "step": 1743 + }, + { + "epoch": 4.752043596730245, + "grad_norm": 11.944601058959961, + "learning_rate": 1.9983904681972034e-05, + "loss": 1.7754, + "step": 1744 + }, + { + "epoch": 4.754768392370572, + "grad_norm": 12.560547828674316, + "learning_rate": 1.998385459333138e-05, + "loss": 1.6797, + "step": 1745 + }, + { + "epoch": 4.7574931880108995, + "grad_norm": 12.880969047546387, + "learning_rate": 1.9983804426936787e-05, + "loss": 2.043, + "step": 1746 + }, + { + "epoch": 4.760217983651226, + "grad_norm": 10.755345344543457, + "learning_rate": 1.9983754182788647e-05, + "loss": 1.8086, + "step": 1747 + }, + { + "epoch": 4.762942779291553, + "grad_norm": 11.871491432189941, + "learning_rate": 1.9983703860887355e-05, + "loss": 1.7256, + "step": 1748 + }, + { + "epoch": 4.76566757493188, + "grad_norm": 10.811038970947266, + "learning_rate": 1.998365346123329e-05, + "loss": 1.6748, + "step": 1749 + }, + { + "epoch": 4.768392370572207, + "grad_norm": 12.117204666137695, + "learning_rate": 1.998360298382686e-05, + "loss": 1.9011, + "step": 1750 + }, + { + "epoch": 4.771117166212534, + "grad_norm": 12.1402587890625, + "learning_rate": 1.9983552428668448e-05, + "loss": 1.9209, + "step": 1751 + }, + { + "epoch": 4.773841961852861, + "grad_norm": 14.859792709350586, + "learning_rate": 1.998350179575845e-05, + "loss": 1.9126, + "step": 1752 + }, + { + "epoch": 4.776566757493188, + "grad_norm": 11.106743812561035, + "learning_rate": 1.9983451085097262e-05, + "loss": 1.8184, + "step": 1753 + }, + { + "epoch": 4.779291553133515, + "grad_norm": 16.94355583190918, + "learning_rate": 1.998340029668528e-05, + "loss": 1.6704, + "step": 1754 + }, + { + "epoch": 4.782016348773842, + "grad_norm": 9.108786582946777, + "learning_rate": 1.9983349430522896e-05, + "loss": 1.5703, + "step": 1755 + }, + { + "epoch": 4.784741144414169, + "grad_norm": 14.48527717590332, + "learning_rate": 1.9983298486610508e-05, + "loss": 1.6475, + "step": 1756 + }, + { + "epoch": 4.787465940054496, + "grad_norm": 10.127340316772461, + "learning_rate": 1.9983247464948515e-05, + "loss": 1.6936, + "step": 1757 + }, + { + "epoch": 4.790190735694823, + "grad_norm": 9.771352767944336, + "learning_rate": 1.9983196365537313e-05, + "loss": 1.6338, + "step": 1758 + }, + { + "epoch": 4.79291553133515, + "grad_norm": 11.561280250549316, + "learning_rate": 1.9983145188377297e-05, + "loss": 1.8057, + "step": 1759 + }, + { + "epoch": 4.795640326975477, + "grad_norm": 10.189553260803223, + "learning_rate": 1.9983093933468864e-05, + "loss": 1.5601, + "step": 1760 + }, + { + "epoch": 4.798365122615804, + "grad_norm": 10.330784797668457, + "learning_rate": 1.9983042600812423e-05, + "loss": 1.7271, + "step": 1761 + }, + { + "epoch": 4.801089918256131, + "grad_norm": 9.032349586486816, + "learning_rate": 1.9982991190408362e-05, + "loss": 1.5364, + "step": 1762 + }, + { + "epoch": 4.8038147138964575, + "grad_norm": 9.430227279663086, + "learning_rate": 1.9982939702257088e-05, + "loss": 1.7295, + "step": 1763 + }, + { + "epoch": 4.806539509536785, + "grad_norm": 13.426956176757812, + "learning_rate": 1.9982888136359e-05, + "loss": 2.0376, + "step": 1764 + }, + { + "epoch": 4.809264305177112, + "grad_norm": 9.60643196105957, + "learning_rate": 1.9982836492714505e-05, + "loss": 1.439, + "step": 1765 + }, + { + "epoch": 4.8119891008174385, + "grad_norm": 11.653831481933594, + "learning_rate": 1.9982784771324e-05, + "loss": 1.6733, + "step": 1766 + }, + { + "epoch": 4.814713896457766, + "grad_norm": 9.333499908447266, + "learning_rate": 1.9982732972187884e-05, + "loss": 1.7495, + "step": 1767 + }, + { + "epoch": 4.817438692098093, + "grad_norm": 10.512800216674805, + "learning_rate": 1.998268109530657e-05, + "loss": 1.6362, + "step": 1768 + }, + { + "epoch": 4.820163487738419, + "grad_norm": 11.654182434082031, + "learning_rate": 1.9982629140680453e-05, + "loss": 1.8032, + "step": 1769 + }, + { + "epoch": 4.822888283378747, + "grad_norm": 9.613519668579102, + "learning_rate": 1.9982577108309945e-05, + "loss": 1.7002, + "step": 1770 + }, + { + "epoch": 4.825613079019074, + "grad_norm": 10.996225357055664, + "learning_rate": 1.9982524998195446e-05, + "loss": 1.8635, + "step": 1771 + }, + { + "epoch": 4.8283378746594, + "grad_norm": 10.677639961242676, + "learning_rate": 1.9982472810337363e-05, + "loss": 1.6965, + "step": 1772 + }, + { + "epoch": 4.831062670299728, + "grad_norm": 11.29150104522705, + "learning_rate": 1.9982420544736106e-05, + "loss": 1.9971, + "step": 1773 + }, + { + "epoch": 4.833787465940055, + "grad_norm": 12.019180297851562, + "learning_rate": 1.9982368201392074e-05, + "loss": 1.5317, + "step": 1774 + }, + { + "epoch": 4.836512261580381, + "grad_norm": 11.11221981048584, + "learning_rate": 1.998231578030568e-05, + "loss": 1.6997, + "step": 1775 + }, + { + "epoch": 4.839237057220709, + "grad_norm": 13.890466690063477, + "learning_rate": 1.9982263281477338e-05, + "loss": 1.7688, + "step": 1776 + }, + { + "epoch": 4.8419618528610355, + "grad_norm": 10.007216453552246, + "learning_rate": 1.9982210704907446e-05, + "loss": 1.7949, + "step": 1777 + }, + { + "epoch": 4.844686648501362, + "grad_norm": 11.3532133102417, + "learning_rate": 1.998215805059642e-05, + "loss": 1.624, + "step": 1778 + }, + { + "epoch": 4.84741144414169, + "grad_norm": 12.174700736999512, + "learning_rate": 1.998210531854467e-05, + "loss": 1.8188, + "step": 1779 + }, + { + "epoch": 4.8501362397820165, + "grad_norm": 9.562557220458984, + "learning_rate": 1.9982052508752605e-05, + "loss": 1.7285, + "step": 1780 + }, + { + "epoch": 4.852861035422343, + "grad_norm": 11.95835018157959, + "learning_rate": 1.998199962122063e-05, + "loss": 1.5879, + "step": 1781 + }, + { + "epoch": 4.855585831062671, + "grad_norm": 8.104500770568848, + "learning_rate": 1.998194665594917e-05, + "loss": 1.7051, + "step": 1782 + }, + { + "epoch": 4.858310626702997, + "grad_norm": 10.136801719665527, + "learning_rate": 1.9981893612938624e-05, + "loss": 1.9111, + "step": 1783 + }, + { + "epoch": 4.861035422343324, + "grad_norm": 10.49084186553955, + "learning_rate": 1.998184049218942e-05, + "loss": 1.8105, + "step": 1784 + }, + { + "epoch": 4.863760217983652, + "grad_norm": 8.479459762573242, + "learning_rate": 1.9981787293701956e-05, + "loss": 1.6277, + "step": 1785 + }, + { + "epoch": 4.866485013623978, + "grad_norm": 20.927406311035156, + "learning_rate": 1.998173401747666e-05, + "loss": 1.7363, + "step": 1786 + }, + { + "epoch": 4.869209809264305, + "grad_norm": 10.920572280883789, + "learning_rate": 1.998168066351394e-05, + "loss": 1.8013, + "step": 1787 + }, + { + "epoch": 4.871934604904633, + "grad_norm": 9.645325660705566, + "learning_rate": 1.9981627231814207e-05, + "loss": 1.9629, + "step": 1788 + }, + { + "epoch": 4.874659400544959, + "grad_norm": 10.725105285644531, + "learning_rate": 1.9981573722377888e-05, + "loss": 1.7422, + "step": 1789 + }, + { + "epoch": 4.877384196185286, + "grad_norm": 19.972970962524414, + "learning_rate": 1.998152013520539e-05, + "loss": 1.7646, + "step": 1790 + }, + { + "epoch": 4.8801089918256135, + "grad_norm": 10.030486106872559, + "learning_rate": 1.9981466470297136e-05, + "loss": 1.9072, + "step": 1791 + }, + { + "epoch": 4.88283378746594, + "grad_norm": 11.005029678344727, + "learning_rate": 1.9981412727653544e-05, + "loss": 1.4939, + "step": 1792 + }, + { + "epoch": 4.885558583106267, + "grad_norm": 14.201371192932129, + "learning_rate": 1.998135890727503e-05, + "loss": 1.897, + "step": 1793 + }, + { + "epoch": 4.8882833787465945, + "grad_norm": 15.717061042785645, + "learning_rate": 1.998130500916201e-05, + "loss": 1.7451, + "step": 1794 + }, + { + "epoch": 4.891008174386921, + "grad_norm": 11.440669059753418, + "learning_rate": 1.9981251033314914e-05, + "loss": 1.5527, + "step": 1795 + }, + { + "epoch": 4.893732970027248, + "grad_norm": 10.5989990234375, + "learning_rate": 1.9981196979734157e-05, + "loss": 1.876, + "step": 1796 + }, + { + "epoch": 4.896457765667575, + "grad_norm": 13.592907905578613, + "learning_rate": 1.9981142848420152e-05, + "loss": 1.6316, + "step": 1797 + }, + { + "epoch": 4.899182561307902, + "grad_norm": 20.18497085571289, + "learning_rate": 1.9981088639373335e-05, + "loss": 1.9888, + "step": 1798 + }, + { + "epoch": 4.901907356948229, + "grad_norm": 9.938689231872559, + "learning_rate": 1.9981034352594117e-05, + "loss": 1.6448, + "step": 1799 + }, + { + "epoch": 4.904632152588556, + "grad_norm": 7.556951999664307, + "learning_rate": 1.9980979988082923e-05, + "loss": 1.7573, + "step": 1800 + }, + { + "epoch": 4.907356948228883, + "grad_norm": 9.85840129852295, + "learning_rate": 1.9980925545840183e-05, + "loss": 1.752, + "step": 1801 + }, + { + "epoch": 4.91008174386921, + "grad_norm": 8.957093238830566, + "learning_rate": 1.9980871025866314e-05, + "loss": 1.7471, + "step": 1802 + }, + { + "epoch": 4.912806539509537, + "grad_norm": 12.380105972290039, + "learning_rate": 1.998081642816174e-05, + "loss": 1.6592, + "step": 1803 + }, + { + "epoch": 4.915531335149864, + "grad_norm": 7.244705677032471, + "learning_rate": 1.998076175272689e-05, + "loss": 1.6409, + "step": 1804 + }, + { + "epoch": 4.918256130790191, + "grad_norm": 10.387642860412598, + "learning_rate": 1.998070699956219e-05, + "loss": 1.7148, + "step": 1805 + }, + { + "epoch": 4.920980926430518, + "grad_norm": 9.52930736541748, + "learning_rate": 1.9980652168668063e-05, + "loss": 1.8584, + "step": 1806 + }, + { + "epoch": 4.923705722070845, + "grad_norm": 10.156198501586914, + "learning_rate": 1.9980597260044944e-05, + "loss": 1.7664, + "step": 1807 + }, + { + "epoch": 4.926430517711172, + "grad_norm": 10.294306755065918, + "learning_rate": 1.998054227369325e-05, + "loss": 1.9492, + "step": 1808 + }, + { + "epoch": 4.929155313351498, + "grad_norm": 8.773594856262207, + "learning_rate": 1.998048720961341e-05, + "loss": 1.7065, + "step": 1809 + }, + { + "epoch": 4.931880108991826, + "grad_norm": 10.288111686706543, + "learning_rate": 1.9980432067805865e-05, + "loss": 1.7935, + "step": 1810 + }, + { + "epoch": 4.9346049046321525, + "grad_norm": 9.438074111938477, + "learning_rate": 1.9980376848271032e-05, + "loss": 1.7935, + "step": 1811 + }, + { + "epoch": 4.937329700272479, + "grad_norm": 9.358190536499023, + "learning_rate": 1.998032155100935e-05, + "loss": 1.6648, + "step": 1812 + }, + { + "epoch": 4.940054495912807, + "grad_norm": 14.03318977355957, + "learning_rate": 1.998026617602124e-05, + "loss": 1.8315, + "step": 1813 + }, + { + "epoch": 4.9427792915531334, + "grad_norm": 12.71858024597168, + "learning_rate": 1.998021072330714e-05, + "loss": 1.6411, + "step": 1814 + }, + { + "epoch": 4.94550408719346, + "grad_norm": 9.145251274108887, + "learning_rate": 1.9980155192867477e-05, + "loss": 1.8184, + "step": 1815 + }, + { + "epoch": 4.948228882833788, + "grad_norm": 11.447920799255371, + "learning_rate": 1.998009958470269e-05, + "loss": 1.8403, + "step": 1816 + }, + { + "epoch": 4.950953678474114, + "grad_norm": 12.897775650024414, + "learning_rate": 1.9980043898813206e-05, + "loss": 1.8479, + "step": 1817 + }, + { + "epoch": 4.953678474114441, + "grad_norm": 9.578463554382324, + "learning_rate": 1.9979988135199464e-05, + "loss": 1.7861, + "step": 1818 + }, + { + "epoch": 4.956403269754769, + "grad_norm": 9.109416007995605, + "learning_rate": 1.9979932293861895e-05, + "loss": 1.7188, + "step": 1819 + }, + { + "epoch": 4.959128065395095, + "grad_norm": 10.429159164428711, + "learning_rate": 1.9979876374800935e-05, + "loss": 1.4775, + "step": 1820 + }, + { + "epoch": 4.961852861035422, + "grad_norm": 9.446931838989258, + "learning_rate": 1.9979820378017017e-05, + "loss": 1.5884, + "step": 1821 + }, + { + "epoch": 4.96457765667575, + "grad_norm": 13.700077056884766, + "learning_rate": 1.997976430351058e-05, + "loss": 1.8855, + "step": 1822 + }, + { + "epoch": 4.967302452316076, + "grad_norm": 10.119503021240234, + "learning_rate": 1.997970815128206e-05, + "loss": 1.6887, + "step": 1823 + }, + { + "epoch": 4.970027247956403, + "grad_norm": 12.266241073608398, + "learning_rate": 1.9979651921331893e-05, + "loss": 1.8296, + "step": 1824 + }, + { + "epoch": 4.9727520435967305, + "grad_norm": 10.371781349182129, + "learning_rate": 1.997959561366052e-05, + "loss": 1.8691, + "step": 1825 + }, + { + "epoch": 4.975476839237057, + "grad_norm": 9.75312328338623, + "learning_rate": 1.9979539228268377e-05, + "loss": 1.9424, + "step": 1826 + }, + { + "epoch": 4.978201634877384, + "grad_norm": 9.707611083984375, + "learning_rate": 1.9979482765155905e-05, + "loss": 1.6619, + "step": 1827 + }, + { + "epoch": 4.9809264305177114, + "grad_norm": 12.377727508544922, + "learning_rate": 1.997942622432354e-05, + "loss": 1.6523, + "step": 1828 + }, + { + "epoch": 4.983651226158038, + "grad_norm": 9.129666328430176, + "learning_rate": 1.9979369605771722e-05, + "loss": 1.7437, + "step": 1829 + }, + { + "epoch": 4.986376021798365, + "grad_norm": 10.96391487121582, + "learning_rate": 1.9979312909500902e-05, + "loss": 1.5151, + "step": 1830 + }, + { + "epoch": 4.989100817438692, + "grad_norm": 8.620485305786133, + "learning_rate": 1.997925613551151e-05, + "loss": 1.7695, + "step": 1831 + }, + { + "epoch": 4.991825613079019, + "grad_norm": 9.796248435974121, + "learning_rate": 1.9979199283803994e-05, + "loss": 1.7188, + "step": 1832 + }, + { + "epoch": 4.994550408719346, + "grad_norm": 11.4308443069458, + "learning_rate": 1.9979142354378793e-05, + "loss": 1.7048, + "step": 1833 + }, + { + "epoch": 4.997275204359673, + "grad_norm": 11.859092712402344, + "learning_rate": 1.9979085347236355e-05, + "loss": 1.7302, + "step": 1834 + }, + { + "epoch": 5.0, + "grad_norm": 9.439201354980469, + "learning_rate": 1.997902826237712e-05, + "loss": 1.7229, + "step": 1835 + }, + { + "epoch": 5.002724795640327, + "grad_norm": 9.204095840454102, + "learning_rate": 1.9978971099801532e-05, + "loss": 1.4448, + "step": 1836 + }, + { + "epoch": 5.005449591280654, + "grad_norm": 7.906982421875, + "learning_rate": 1.997891385951004e-05, + "loss": 1.6667, + "step": 1837 + }, + { + "epoch": 5.008174386920981, + "grad_norm": 10.754129409790039, + "learning_rate": 1.997885654150309e-05, + "loss": 1.6953, + "step": 1838 + }, + { + "epoch": 5.010899182561308, + "grad_norm": 10.338284492492676, + "learning_rate": 1.9978799145781123e-05, + "loss": 1.9326, + "step": 1839 + }, + { + "epoch": 5.013623978201635, + "grad_norm": 8.468027114868164, + "learning_rate": 1.9978741672344594e-05, + "loss": 1.4824, + "step": 1840 + }, + { + "epoch": 5.016348773841962, + "grad_norm": 12.986717224121094, + "learning_rate": 1.9978684121193944e-05, + "loss": 1.6636, + "step": 1841 + }, + { + "epoch": 5.0190735694822886, + "grad_norm": 8.562746047973633, + "learning_rate": 1.997862649232962e-05, + "loss": 1.6724, + "step": 1842 + }, + { + "epoch": 5.021798365122616, + "grad_norm": 10.53598690032959, + "learning_rate": 1.9978568785752077e-05, + "loss": 1.6729, + "step": 1843 + }, + { + "epoch": 5.024523160762943, + "grad_norm": 11.25537109375, + "learning_rate": 1.997851100146176e-05, + "loss": 1.6594, + "step": 1844 + }, + { + "epoch": 5.0272479564032695, + "grad_norm": 9.552088737487793, + "learning_rate": 1.9978453139459123e-05, + "loss": 1.5952, + "step": 1845 + }, + { + "epoch": 5.029972752043597, + "grad_norm": 8.246376991271973, + "learning_rate": 1.997839519974461e-05, + "loss": 1.4541, + "step": 1846 + }, + { + "epoch": 5.032697547683924, + "grad_norm": 11.155094146728516, + "learning_rate": 1.9978337182318678e-05, + "loss": 1.5488, + "step": 1847 + }, + { + "epoch": 5.03542234332425, + "grad_norm": 9.724387168884277, + "learning_rate": 1.997827908718178e-05, + "loss": 1.7109, + "step": 1848 + }, + { + "epoch": 5.038147138964578, + "grad_norm": 11.168493270874023, + "learning_rate": 1.9978220914334363e-05, + "loss": 1.7383, + "step": 1849 + }, + { + "epoch": 5.040871934604905, + "grad_norm": 10.093647003173828, + "learning_rate": 1.9978162663776882e-05, + "loss": 1.7061, + "step": 1850 + }, + { + "epoch": 5.043596730245231, + "grad_norm": 9.386709213256836, + "learning_rate": 1.9978104335509796e-05, + "loss": 1.5657, + "step": 1851 + }, + { + "epoch": 5.046321525885559, + "grad_norm": 9.914746284484863, + "learning_rate": 1.997804592953355e-05, + "loss": 1.6787, + "step": 1852 + }, + { + "epoch": 5.049046321525886, + "grad_norm": 9.252211570739746, + "learning_rate": 1.9977987445848604e-05, + "loss": 1.6392, + "step": 1853 + }, + { + "epoch": 5.051771117166212, + "grad_norm": 8.123111724853516, + "learning_rate": 1.9977928884455412e-05, + "loss": 1.3396, + "step": 1854 + }, + { + "epoch": 5.05449591280654, + "grad_norm": 28.510730743408203, + "learning_rate": 1.9977870245354435e-05, + "loss": 1.8601, + "step": 1855 + }, + { + "epoch": 5.0572207084468666, + "grad_norm": 11.948402404785156, + "learning_rate": 1.9977811528546124e-05, + "loss": 1.7791, + "step": 1856 + }, + { + "epoch": 5.059945504087193, + "grad_norm": 8.497076988220215, + "learning_rate": 1.9977752734030935e-05, + "loss": 1.7415, + "step": 1857 + }, + { + "epoch": 5.062670299727521, + "grad_norm": 8.519002914428711, + "learning_rate": 1.9977693861809333e-05, + "loss": 1.5273, + "step": 1858 + }, + { + "epoch": 5.0653950953678475, + "grad_norm": 10.040315628051758, + "learning_rate": 1.997763491188177e-05, + "loss": 1.5908, + "step": 1859 + }, + { + "epoch": 5.068119891008174, + "grad_norm": 8.36683177947998, + "learning_rate": 1.9977575884248707e-05, + "loss": 1.4683, + "step": 1860 + }, + { + "epoch": 5.070844686648502, + "grad_norm": 13.225173950195312, + "learning_rate": 1.9977516778910607e-05, + "loss": 1.7437, + "step": 1861 + }, + { + "epoch": 5.073569482288828, + "grad_norm": 12.044672012329102, + "learning_rate": 1.9977457595867924e-05, + "loss": 1.7295, + "step": 1862 + }, + { + "epoch": 5.076294277929155, + "grad_norm": 11.419569969177246, + "learning_rate": 1.9977398335121126e-05, + "loss": 1.833, + "step": 1863 + }, + { + "epoch": 5.079019073569483, + "grad_norm": 9.895974159240723, + "learning_rate": 1.9977338996670665e-05, + "loss": 1.5835, + "step": 1864 + }, + { + "epoch": 5.081743869209809, + "grad_norm": 9.599562644958496, + "learning_rate": 1.9977279580517014e-05, + "loss": 1.6733, + "step": 1865 + }, + { + "epoch": 5.084468664850136, + "grad_norm": 8.531063079833984, + "learning_rate": 1.997722008666063e-05, + "loss": 1.708, + "step": 1866 + }, + { + "epoch": 5.087193460490464, + "grad_norm": 9.288894653320312, + "learning_rate": 1.9977160515101975e-05, + "loss": 1.5151, + "step": 1867 + }, + { + "epoch": 5.08991825613079, + "grad_norm": 10.671904563903809, + "learning_rate": 1.9977100865841516e-05, + "loss": 1.7759, + "step": 1868 + }, + { + "epoch": 5.092643051771117, + "grad_norm": 12.006613731384277, + "learning_rate": 1.997704113887972e-05, + "loss": 1.8088, + "step": 1869 + }, + { + "epoch": 5.0953678474114446, + "grad_norm": 10.795671463012695, + "learning_rate": 1.9976981334217046e-05, + "loss": 1.7363, + "step": 1870 + }, + { + "epoch": 5.098092643051771, + "grad_norm": 8.825675010681152, + "learning_rate": 1.997692145185396e-05, + "loss": 1.7041, + "step": 1871 + }, + { + "epoch": 5.100817438692098, + "grad_norm": 13.146547317504883, + "learning_rate": 1.9976861491790936e-05, + "loss": 1.7576, + "step": 1872 + }, + { + "epoch": 5.1035422343324255, + "grad_norm": 9.561686515808105, + "learning_rate": 1.997680145402843e-05, + "loss": 1.7068, + "step": 1873 + }, + { + "epoch": 5.106267029972752, + "grad_norm": 10.36915111541748, + "learning_rate": 1.997674133856692e-05, + "loss": 1.7524, + "step": 1874 + }, + { + "epoch": 5.108991825613079, + "grad_norm": 8.635497093200684, + "learning_rate": 1.997668114540687e-05, + "loss": 1.7163, + "step": 1875 + }, + { + "epoch": 5.111716621253406, + "grad_norm": 13.613897323608398, + "learning_rate": 1.997662087454874e-05, + "loss": 1.811, + "step": 1876 + }, + { + "epoch": 5.114441416893733, + "grad_norm": 10.332918167114258, + "learning_rate": 1.9976560525993015e-05, + "loss": 1.4631, + "step": 1877 + }, + { + "epoch": 5.11716621253406, + "grad_norm": 9.466386795043945, + "learning_rate": 1.997650009974016e-05, + "loss": 1.4214, + "step": 1878 + }, + { + "epoch": 5.1198910081743865, + "grad_norm": 9.696146011352539, + "learning_rate": 1.997643959579064e-05, + "loss": 1.4692, + "step": 1879 + }, + { + "epoch": 5.122615803814714, + "grad_norm": 11.486430168151855, + "learning_rate": 1.997637901414493e-05, + "loss": 1.6816, + "step": 1880 + }, + { + "epoch": 5.125340599455041, + "grad_norm": 14.753457069396973, + "learning_rate": 1.99763183548035e-05, + "loss": 1.5132, + "step": 1881 + }, + { + "epoch": 5.128065395095367, + "grad_norm": 11.152593612670898, + "learning_rate": 1.9976257617766824e-05, + "loss": 1.6729, + "step": 1882 + }, + { + "epoch": 5.130790190735695, + "grad_norm": 10.37635612487793, + "learning_rate": 1.9976196803035375e-05, + "loss": 1.575, + "step": 1883 + }, + { + "epoch": 5.133514986376022, + "grad_norm": 10.139860153198242, + "learning_rate": 1.9976135910609627e-05, + "loss": 1.7305, + "step": 1884 + }, + { + "epoch": 5.136239782016348, + "grad_norm": 12.509878158569336, + "learning_rate": 1.9976074940490052e-05, + "loss": 1.6179, + "step": 1885 + }, + { + "epoch": 5.138964577656676, + "grad_norm": 12.507528305053711, + "learning_rate": 1.997601389267713e-05, + "loss": 1.6895, + "step": 1886 + }, + { + "epoch": 5.141689373297003, + "grad_norm": 16.414642333984375, + "learning_rate": 1.997595276717133e-05, + "loss": 1.71, + "step": 1887 + }, + { + "epoch": 5.144414168937329, + "grad_norm": 12.145785331726074, + "learning_rate": 1.9975891563973132e-05, + "loss": 1.6699, + "step": 1888 + }, + { + "epoch": 5.147138964577657, + "grad_norm": 14.2864990234375, + "learning_rate": 1.997583028308301e-05, + "loss": 1.7114, + "step": 1889 + }, + { + "epoch": 5.1498637602179835, + "grad_norm": 16.97840690612793, + "learning_rate": 1.9975768924501444e-05, + "loss": 1.5745, + "step": 1890 + }, + { + "epoch": 5.15258855585831, + "grad_norm": 12.979388236999512, + "learning_rate": 1.997570748822891e-05, + "loss": 1.7158, + "step": 1891 + }, + { + "epoch": 5.155313351498638, + "grad_norm": 15.826199531555176, + "learning_rate": 1.997564597426589e-05, + "loss": 1.7612, + "step": 1892 + }, + { + "epoch": 5.1580381471389645, + "grad_norm": 15.385902404785156, + "learning_rate": 1.9975584382612855e-05, + "loss": 1.6587, + "step": 1893 + }, + { + "epoch": 5.160762942779291, + "grad_norm": 18.13292121887207, + "learning_rate": 1.9975522713270296e-05, + "loss": 1.5845, + "step": 1894 + }, + { + "epoch": 5.163487738419619, + "grad_norm": 11.18834114074707, + "learning_rate": 1.997546096623868e-05, + "loss": 1.6758, + "step": 1895 + }, + { + "epoch": 5.166212534059945, + "grad_norm": 10.812143325805664, + "learning_rate": 1.99753991415185e-05, + "loss": 1.7686, + "step": 1896 + }, + { + "epoch": 5.168937329700272, + "grad_norm": 16.42559814453125, + "learning_rate": 1.997533723911023e-05, + "loss": 1.6782, + "step": 1897 + }, + { + "epoch": 5.1716621253406, + "grad_norm": 13.681118965148926, + "learning_rate": 1.997527525901436e-05, + "loss": 1.8354, + "step": 1898 + }, + { + "epoch": 5.174386920980926, + "grad_norm": 47.688968658447266, + "learning_rate": 1.9975213201231363e-05, + "loss": 1.645, + "step": 1899 + }, + { + "epoch": 5.177111716621253, + "grad_norm": 14.734868049621582, + "learning_rate": 1.9975151065761728e-05, + "loss": 1.7627, + "step": 1900 + }, + { + "epoch": 5.179836512261581, + "grad_norm": 14.048941612243652, + "learning_rate": 1.9975088852605938e-05, + "loss": 1.7166, + "step": 1901 + }, + { + "epoch": 5.182561307901907, + "grad_norm": 10.565567970275879, + "learning_rate": 1.9975026561764474e-05, + "loss": 1.5193, + "step": 1902 + }, + { + "epoch": 5.185286103542234, + "grad_norm": 24.844717025756836, + "learning_rate": 1.9974964193237823e-05, + "loss": 1.8198, + "step": 1903 + }, + { + "epoch": 5.1880108991825615, + "grad_norm": 11.01167106628418, + "learning_rate": 1.9974901747026474e-05, + "loss": 1.5588, + "step": 1904 + }, + { + "epoch": 5.190735694822888, + "grad_norm": 12.473700523376465, + "learning_rate": 1.997483922313092e-05, + "loss": 1.6191, + "step": 1905 + }, + { + "epoch": 5.193460490463215, + "grad_norm": 19.939329147338867, + "learning_rate": 1.997477662155163e-05, + "loss": 1.6272, + "step": 1906 + }, + { + "epoch": 5.1961852861035425, + "grad_norm": 10.474801063537598, + "learning_rate": 1.99747139422891e-05, + "loss": 1.658, + "step": 1907 + }, + { + "epoch": 5.198910081743869, + "grad_norm": 9.368407249450684, + "learning_rate": 1.9974651185343822e-05, + "loss": 1.6333, + "step": 1908 + }, + { + "epoch": 5.201634877384196, + "grad_norm": 11.387381553649902, + "learning_rate": 1.997458835071628e-05, + "loss": 1.6475, + "step": 1909 + }, + { + "epoch": 5.204359673024523, + "grad_norm": 10.220231056213379, + "learning_rate": 1.9974525438406966e-05, + "loss": 1.8, + "step": 1910 + }, + { + "epoch": 5.20708446866485, + "grad_norm": 12.36602783203125, + "learning_rate": 1.9974462448416365e-05, + "loss": 1.686, + "step": 1911 + }, + { + "epoch": 5.209809264305177, + "grad_norm": 8.590251922607422, + "learning_rate": 1.9974399380744976e-05, + "loss": 1.647, + "step": 1912 + }, + { + "epoch": 5.212534059945504, + "grad_norm": 9.52476692199707, + "learning_rate": 1.9974336235393283e-05, + "loss": 1.6436, + "step": 1913 + }, + { + "epoch": 5.215258855585831, + "grad_norm": 13.15280532836914, + "learning_rate": 1.9974273012361784e-05, + "loss": 1.7412, + "step": 1914 + }, + { + "epoch": 5.217983651226158, + "grad_norm": 12.537514686584473, + "learning_rate": 1.9974209711650964e-05, + "loss": 1.7622, + "step": 1915 + }, + { + "epoch": 5.220708446866485, + "grad_norm": 14.053447723388672, + "learning_rate": 1.9974146333261323e-05, + "loss": 1.7861, + "step": 1916 + }, + { + "epoch": 5.223433242506812, + "grad_norm": 8.49190616607666, + "learning_rate": 1.997408287719335e-05, + "loss": 1.7324, + "step": 1917 + }, + { + "epoch": 5.226158038147139, + "grad_norm": 10.375123023986816, + "learning_rate": 1.997401934344754e-05, + "loss": 1.6785, + "step": 1918 + }, + { + "epoch": 5.228882833787466, + "grad_norm": 11.195998191833496, + "learning_rate": 1.997395573202439e-05, + "loss": 1.6948, + "step": 1919 + }, + { + "epoch": 5.231607629427793, + "grad_norm": 13.794561386108398, + "learning_rate": 1.997389204292439e-05, + "loss": 1.6665, + "step": 1920 + }, + { + "epoch": 5.23433242506812, + "grad_norm": 8.96519947052002, + "learning_rate": 1.9973828276148043e-05, + "loss": 1.4685, + "step": 1921 + }, + { + "epoch": 5.237057220708447, + "grad_norm": 9.925034523010254, + "learning_rate": 1.9973764431695844e-05, + "loss": 1.7209, + "step": 1922 + }, + { + "epoch": 5.239782016348774, + "grad_norm": 10.551443099975586, + "learning_rate": 1.9973700509568287e-05, + "loss": 1.8154, + "step": 1923 + }, + { + "epoch": 5.2425068119891005, + "grad_norm": 8.865917205810547, + "learning_rate": 1.997363650976587e-05, + "loss": 1.6018, + "step": 1924 + }, + { + "epoch": 5.245231607629428, + "grad_norm": 10.166401863098145, + "learning_rate": 1.9973572432289094e-05, + "loss": 1.7842, + "step": 1925 + }, + { + "epoch": 5.247956403269755, + "grad_norm": 9.873787879943848, + "learning_rate": 1.9973508277138457e-05, + "loss": 1.6418, + "step": 1926 + }, + { + "epoch": 5.2506811989100814, + "grad_norm": 30.08473777770996, + "learning_rate": 1.9973444044314458e-05, + "loss": 1.6238, + "step": 1927 + }, + { + "epoch": 5.253405994550409, + "grad_norm": 11.543693542480469, + "learning_rate": 1.99733797338176e-05, + "loss": 1.6841, + "step": 1928 + }, + { + "epoch": 5.256130790190736, + "grad_norm": 15.977535247802734, + "learning_rate": 1.9973315345648374e-05, + "loss": 1.8975, + "step": 1929 + }, + { + "epoch": 5.258855585831062, + "grad_norm": 11.794048309326172, + "learning_rate": 1.9973250879807295e-05, + "loss": 1.708, + "step": 1930 + }, + { + "epoch": 5.26158038147139, + "grad_norm": 11.914398193359375, + "learning_rate": 1.9973186336294857e-05, + "loss": 1.9424, + "step": 1931 + }, + { + "epoch": 5.264305177111717, + "grad_norm": 12.993264198303223, + "learning_rate": 1.9973121715111568e-05, + "loss": 1.7119, + "step": 1932 + }, + { + "epoch": 5.267029972752043, + "grad_norm": 8.076578140258789, + "learning_rate": 1.997305701625793e-05, + "loss": 1.5771, + "step": 1933 + }, + { + "epoch": 5.269754768392371, + "grad_norm": 22.118816375732422, + "learning_rate": 1.997299223973444e-05, + "loss": 1.5959, + "step": 1934 + }, + { + "epoch": 5.272479564032698, + "grad_norm": 13.975380897521973, + "learning_rate": 1.997292738554161e-05, + "loss": 1.7395, + "step": 1935 + }, + { + "epoch": 5.275204359673024, + "grad_norm": 28.772640228271484, + "learning_rate": 1.997286245367994e-05, + "loss": 1.792, + "step": 1936 + }, + { + "epoch": 5.277929155313352, + "grad_norm": 12.679280281066895, + "learning_rate": 1.997279744414994e-05, + "loss": 1.6987, + "step": 1937 + }, + { + "epoch": 5.2806539509536785, + "grad_norm": 10.289875984191895, + "learning_rate": 1.9972732356952115e-05, + "loss": 1.8115, + "step": 1938 + }, + { + "epoch": 5.283378746594005, + "grad_norm": 9.017131805419922, + "learning_rate": 1.997266719208697e-05, + "loss": 1.4751, + "step": 1939 + }, + { + "epoch": 5.286103542234333, + "grad_norm": 11.865049362182617, + "learning_rate": 1.9972601949555015e-05, + "loss": 2.021, + "step": 1940 + }, + { + "epoch": 5.2888283378746594, + "grad_norm": 15.10794734954834, + "learning_rate": 1.9972536629356756e-05, + "loss": 1.8965, + "step": 1941 + }, + { + "epoch": 5.291553133514986, + "grad_norm": 11.373397827148438, + "learning_rate": 1.99724712314927e-05, + "loss": 1.8027, + "step": 1942 + }, + { + "epoch": 5.294277929155314, + "grad_norm": 12.007485389709473, + "learning_rate": 1.9972405755963362e-05, + "loss": 1.7007, + "step": 1943 + }, + { + "epoch": 5.29700272479564, + "grad_norm": 11.727828025817871, + "learning_rate": 1.997234020276925e-05, + "loss": 1.6819, + "step": 1944 + }, + { + "epoch": 5.299727520435967, + "grad_norm": 23.94923973083496, + "learning_rate": 1.9972274571910873e-05, + "loss": 1.5952, + "step": 1945 + }, + { + "epoch": 5.302452316076295, + "grad_norm": 15.61506175994873, + "learning_rate": 1.9972208863388744e-05, + "loss": 1.5334, + "step": 1946 + }, + { + "epoch": 5.305177111716621, + "grad_norm": 10.43548583984375, + "learning_rate": 1.997214307720337e-05, + "loss": 1.7183, + "step": 1947 + }, + { + "epoch": 5.307901907356948, + "grad_norm": 15.498167991638184, + "learning_rate": 1.997207721335527e-05, + "loss": 1.7815, + "step": 1948 + }, + { + "epoch": 5.310626702997276, + "grad_norm": 10.394688606262207, + "learning_rate": 1.997201127184495e-05, + "loss": 1.8184, + "step": 1949 + }, + { + "epoch": 5.313351498637602, + "grad_norm": 10.260842323303223, + "learning_rate": 1.9971945252672927e-05, + "loss": 1.7708, + "step": 1950 + }, + { + "epoch": 5.316076294277929, + "grad_norm": 10.0009765625, + "learning_rate": 1.9971879155839717e-05, + "loss": 1.6846, + "step": 1951 + }, + { + "epoch": 5.3188010899182565, + "grad_norm": 11.772761344909668, + "learning_rate": 1.9971812981345834e-05, + "loss": 1.5054, + "step": 1952 + }, + { + "epoch": 5.321525885558583, + "grad_norm": 14.363198280334473, + "learning_rate": 1.9971746729191792e-05, + "loss": 1.8584, + "step": 1953 + }, + { + "epoch": 5.32425068119891, + "grad_norm": 11.569507598876953, + "learning_rate": 1.9971680399378107e-05, + "loss": 1.5986, + "step": 1954 + }, + { + "epoch": 5.3269754768392374, + "grad_norm": 10.486541748046875, + "learning_rate": 1.9971613991905298e-05, + "loss": 1.4114, + "step": 1955 + }, + { + "epoch": 5.329700272479564, + "grad_norm": 9.989212989807129, + "learning_rate": 1.9971547506773875e-05, + "loss": 1.6077, + "step": 1956 + }, + { + "epoch": 5.332425068119891, + "grad_norm": 10.298331260681152, + "learning_rate": 1.9971480943984364e-05, + "loss": 1.7222, + "step": 1957 + }, + { + "epoch": 5.335149863760218, + "grad_norm": 13.963698387145996, + "learning_rate": 1.997141430353728e-05, + "loss": 1.5579, + "step": 1958 + }, + { + "epoch": 5.337874659400545, + "grad_norm": 9.665743827819824, + "learning_rate": 1.9971347585433145e-05, + "loss": 1.6621, + "step": 1959 + }, + { + "epoch": 5.340599455040872, + "grad_norm": 20.565250396728516, + "learning_rate": 1.9971280789672474e-05, + "loss": 1.4971, + "step": 1960 + }, + { + "epoch": 5.343324250681199, + "grad_norm": 9.76312255859375, + "learning_rate": 1.9971213916255788e-05, + "loss": 1.689, + "step": 1961 + }, + { + "epoch": 5.346049046321526, + "grad_norm": 13.125452041625977, + "learning_rate": 1.997114696518361e-05, + "loss": 1.6313, + "step": 1962 + }, + { + "epoch": 5.348773841961853, + "grad_norm": 10.671045303344727, + "learning_rate": 1.997107993645646e-05, + "loss": 1.5195, + "step": 1963 + }, + { + "epoch": 5.35149863760218, + "grad_norm": 12.833518028259277, + "learning_rate": 1.997101283007486e-05, + "loss": 1.8257, + "step": 1964 + }, + { + "epoch": 5.354223433242507, + "grad_norm": 13.581474304199219, + "learning_rate": 1.9970945646039336e-05, + "loss": 1.8911, + "step": 1965 + }, + { + "epoch": 5.356948228882834, + "grad_norm": 8.949580192565918, + "learning_rate": 1.9970878384350404e-05, + "loss": 1.5591, + "step": 1966 + }, + { + "epoch": 5.359673024523161, + "grad_norm": 8.894742965698242, + "learning_rate": 1.9970811045008592e-05, + "loss": 1.5896, + "step": 1967 + }, + { + "epoch": 5.362397820163488, + "grad_norm": 11.158965110778809, + "learning_rate": 1.9970743628014428e-05, + "loss": 1.7842, + "step": 1968 + }, + { + "epoch": 5.3651226158038146, + "grad_norm": 10.686578750610352, + "learning_rate": 1.997067613336843e-05, + "loss": 1.6257, + "step": 1969 + }, + { + "epoch": 5.367847411444142, + "grad_norm": 10.511839866638184, + "learning_rate": 1.997060856107113e-05, + "loss": 1.8301, + "step": 1970 + }, + { + "epoch": 5.370572207084469, + "grad_norm": 8.157552719116211, + "learning_rate": 1.9970540911123052e-05, + "loss": 1.6621, + "step": 1971 + }, + { + "epoch": 5.3732970027247955, + "grad_norm": 14.843273162841797, + "learning_rate": 1.997047318352472e-05, + "loss": 1.5149, + "step": 1972 + }, + { + "epoch": 5.376021798365123, + "grad_norm": 12.004420280456543, + "learning_rate": 1.9970405378276666e-05, + "loss": 1.6685, + "step": 1973 + }, + { + "epoch": 5.37874659400545, + "grad_norm": 11.34261417388916, + "learning_rate": 1.997033749537941e-05, + "loss": 1.8472, + "step": 1974 + }, + { + "epoch": 5.381471389645776, + "grad_norm": 11.158589363098145, + "learning_rate": 1.9970269534833492e-05, + "loss": 1.4712, + "step": 1975 + }, + { + "epoch": 5.384196185286104, + "grad_norm": 8.92293643951416, + "learning_rate": 1.9970201496639436e-05, + "loss": 1.6367, + "step": 1976 + }, + { + "epoch": 5.386920980926431, + "grad_norm": 8.600255966186523, + "learning_rate": 1.997013338079777e-05, + "loss": 1.5042, + "step": 1977 + }, + { + "epoch": 5.389645776566757, + "grad_norm": 9.92839527130127, + "learning_rate": 1.9970065187309025e-05, + "loss": 1.6592, + "step": 1978 + }, + { + "epoch": 5.392370572207085, + "grad_norm": 21.944948196411133, + "learning_rate": 1.9969996916173735e-05, + "loss": 1.9316, + "step": 1979 + }, + { + "epoch": 5.395095367847412, + "grad_norm": 12.78380012512207, + "learning_rate": 1.996992856739243e-05, + "loss": 1.8149, + "step": 1980 + }, + { + "epoch": 5.397820163487738, + "grad_norm": 11.880173683166504, + "learning_rate": 1.9969860140965643e-05, + "loss": 1.6606, + "step": 1981 + }, + { + "epoch": 5.400544959128065, + "grad_norm": 9.758583068847656, + "learning_rate": 1.9969791636893904e-05, + "loss": 1.6963, + "step": 1982 + }, + { + "epoch": 5.4032697547683926, + "grad_norm": 12.348323822021484, + "learning_rate": 1.9969723055177748e-05, + "loss": 1.7661, + "step": 1983 + }, + { + "epoch": 5.405994550408719, + "grad_norm": 18.636323928833008, + "learning_rate": 1.9969654395817714e-05, + "loss": 1.6973, + "step": 1984 + }, + { + "epoch": 5.408719346049046, + "grad_norm": 10.546487808227539, + "learning_rate": 1.9969585658814327e-05, + "loss": 1.8486, + "step": 1985 + }, + { + "epoch": 5.4114441416893735, + "grad_norm": 9.425722122192383, + "learning_rate": 1.9969516844168132e-05, + "loss": 1.5786, + "step": 1986 + }, + { + "epoch": 5.4141689373297, + "grad_norm": 10.106487274169922, + "learning_rate": 1.9969447951879655e-05, + "loss": 1.8281, + "step": 1987 + }, + { + "epoch": 5.416893732970027, + "grad_norm": 9.693245887756348, + "learning_rate": 1.9969378981949445e-05, + "loss": 1.6099, + "step": 1988 + }, + { + "epoch": 5.419618528610354, + "grad_norm": 9.235607147216797, + "learning_rate": 1.996930993437803e-05, + "loss": 1.6379, + "step": 1989 + }, + { + "epoch": 5.422343324250681, + "grad_norm": 11.294902801513672, + "learning_rate": 1.9969240809165948e-05, + "loss": 1.614, + "step": 1990 + }, + { + "epoch": 5.425068119891008, + "grad_norm": 12.546422958374023, + "learning_rate": 1.9969171606313742e-05, + "loss": 1.6875, + "step": 1991 + }, + { + "epoch": 5.427792915531335, + "grad_norm": 10.250531196594238, + "learning_rate": 1.9969102325821947e-05, + "loss": 1.7649, + "step": 1992 + }, + { + "epoch": 5.430517711171662, + "grad_norm": 9.09671688079834, + "learning_rate": 1.9969032967691106e-05, + "loss": 1.7554, + "step": 1993 + }, + { + "epoch": 5.433242506811989, + "grad_norm": 9.852420806884766, + "learning_rate": 1.9968963531921753e-05, + "loss": 1.6787, + "step": 1994 + }, + { + "epoch": 5.435967302452316, + "grad_norm": 9.900439262390137, + "learning_rate": 1.9968894018514434e-05, + "loss": 1.5818, + "step": 1995 + }, + { + "epoch": 5.438692098092643, + "grad_norm": 9.226574897766113, + "learning_rate": 1.996882442746969e-05, + "loss": 1.4751, + "step": 1996 + }, + { + "epoch": 5.44141689373297, + "grad_norm": 9.87454605102539, + "learning_rate": 1.9968754758788064e-05, + "loss": 1.7722, + "step": 1997 + }, + { + "epoch": 5.444141689373297, + "grad_norm": 10.80100154876709, + "learning_rate": 1.9968685012470097e-05, + "loss": 1.6931, + "step": 1998 + }, + { + "epoch": 5.446866485013624, + "grad_norm": 9.997541427612305, + "learning_rate": 1.996861518851633e-05, + "loss": 1.7524, + "step": 1999 + }, + { + "epoch": 5.449591280653951, + "grad_norm": 10.228842735290527, + "learning_rate": 1.996854528692731e-05, + "loss": 1.6123, + "step": 2000 + }, + { + "epoch": 5.452316076294278, + "grad_norm": 10.22179889678955, + "learning_rate": 1.996847530770358e-05, + "loss": 1.4919, + "step": 2001 + }, + { + "epoch": 5.455040871934605, + "grad_norm": 22.50702667236328, + "learning_rate": 1.996840525084568e-05, + "loss": 1.8882, + "step": 2002 + }, + { + "epoch": 5.4577656675749315, + "grad_norm": 9.13119125366211, + "learning_rate": 1.996833511635417e-05, + "loss": 1.4927, + "step": 2003 + }, + { + "epoch": 5.460490463215259, + "grad_norm": 10.396625518798828, + "learning_rate": 1.996826490422958e-05, + "loss": 1.769, + "step": 2004 + }, + { + "epoch": 5.463215258855586, + "grad_norm": 10.584822654724121, + "learning_rate": 1.9968194614472465e-05, + "loss": 1.4788, + "step": 2005 + }, + { + "epoch": 5.4659400544959125, + "grad_norm": 14.889788627624512, + "learning_rate": 1.9968124247083375e-05, + "loss": 1.4604, + "step": 2006 + }, + { + "epoch": 5.46866485013624, + "grad_norm": 8.787952423095703, + "learning_rate": 1.996805380206285e-05, + "loss": 1.6577, + "step": 2007 + }, + { + "epoch": 5.471389645776567, + "grad_norm": 36.39643096923828, + "learning_rate": 1.9967983279411442e-05, + "loss": 1.5061, + "step": 2008 + }, + { + "epoch": 5.474114441416893, + "grad_norm": 10.348734855651855, + "learning_rate": 1.9967912679129708e-05, + "loss": 1.7217, + "step": 2009 + }, + { + "epoch": 5.476839237057221, + "grad_norm": 12.849311828613281, + "learning_rate": 1.9967842001218183e-05, + "loss": 1.6465, + "step": 2010 + }, + { + "epoch": 5.479564032697548, + "grad_norm": 16.13958740234375, + "learning_rate": 1.9967771245677427e-05, + "loss": 1.7622, + "step": 2011 + }, + { + "epoch": 5.482288828337874, + "grad_norm": 14.944127082824707, + "learning_rate": 1.996770041250799e-05, + "loss": 1.854, + "step": 2012 + }, + { + "epoch": 5.485013623978202, + "grad_norm": 9.569435119628906, + "learning_rate": 1.9967629501710423e-05, + "loss": 1.605, + "step": 2013 + }, + { + "epoch": 5.487738419618529, + "grad_norm": 10.095573425292969, + "learning_rate": 1.996755851328528e-05, + "loss": 1.7275, + "step": 2014 + }, + { + "epoch": 5.490463215258855, + "grad_norm": 10.504908561706543, + "learning_rate": 1.9967487447233114e-05, + "loss": 1.7283, + "step": 2015 + }, + { + "epoch": 5.493188010899183, + "grad_norm": 8.080174446105957, + "learning_rate": 1.9967416303554472e-05, + "loss": 1.458, + "step": 2016 + }, + { + "epoch": 5.4959128065395095, + "grad_norm": 11.463164329528809, + "learning_rate": 1.9967345082249912e-05, + "loss": 1.7104, + "step": 2017 + }, + { + "epoch": 5.498637602179836, + "grad_norm": 13.109505653381348, + "learning_rate": 1.9967273783319993e-05, + "loss": 1.5955, + "step": 2018 + }, + { + "epoch": 5.501362397820164, + "grad_norm": 10.553297996520996, + "learning_rate": 1.996720240676527e-05, + "loss": 1.7117, + "step": 2019 + }, + { + "epoch": 5.5040871934604905, + "grad_norm": 9.326204299926758, + "learning_rate": 1.9967130952586286e-05, + "loss": 1.6833, + "step": 2020 + }, + { + "epoch": 5.506811989100817, + "grad_norm": 11.271936416625977, + "learning_rate": 1.9967059420783612e-05, + "loss": 1.7017, + "step": 2021 + }, + { + "epoch": 5.509536784741145, + "grad_norm": 9.598100662231445, + "learning_rate": 1.9966987811357798e-05, + "loss": 1.6323, + "step": 2022 + }, + { + "epoch": 5.512261580381471, + "grad_norm": 8.798504829406738, + "learning_rate": 1.9966916124309404e-05, + "loss": 1.543, + "step": 2023 + }, + { + "epoch": 5.514986376021798, + "grad_norm": 10.221184730529785, + "learning_rate": 1.9966844359638992e-05, + "loss": 1.7039, + "step": 2024 + }, + { + "epoch": 5.517711171662126, + "grad_norm": 9.18807601928711, + "learning_rate": 1.9966772517347114e-05, + "loss": 1.6016, + "step": 2025 + }, + { + "epoch": 5.520435967302452, + "grad_norm": 10.857856750488281, + "learning_rate": 1.9966700597434333e-05, + "loss": 1.6917, + "step": 2026 + }, + { + "epoch": 5.523160762942779, + "grad_norm": 9.961305618286133, + "learning_rate": 1.9966628599901208e-05, + "loss": 1.5222, + "step": 2027 + }, + { + "epoch": 5.525885558583107, + "grad_norm": 12.995038032531738, + "learning_rate": 1.99665565247483e-05, + "loss": 1.72, + "step": 2028 + }, + { + "epoch": 5.528610354223433, + "grad_norm": 11.066896438598633, + "learning_rate": 1.9966484371976168e-05, + "loss": 1.9131, + "step": 2029 + }, + { + "epoch": 5.53133514986376, + "grad_norm": 9.92104721069336, + "learning_rate": 1.996641214158538e-05, + "loss": 1.8105, + "step": 2030 + }, + { + "epoch": 5.5340599455040875, + "grad_norm": 11.066975593566895, + "learning_rate": 1.9966339833576496e-05, + "loss": 1.6252, + "step": 2031 + }, + { + "epoch": 5.536784741144414, + "grad_norm": 10.61975383758545, + "learning_rate": 1.9966267447950076e-05, + "loss": 1.8926, + "step": 2032 + }, + { + "epoch": 5.539509536784741, + "grad_norm": 11.257098197937012, + "learning_rate": 1.9966194984706686e-05, + "loss": 1.707, + "step": 2033 + }, + { + "epoch": 5.5422343324250685, + "grad_norm": 9.231466293334961, + "learning_rate": 1.996612244384689e-05, + "loss": 1.7954, + "step": 2034 + }, + { + "epoch": 5.544959128065395, + "grad_norm": 12.137299537658691, + "learning_rate": 1.9966049825371254e-05, + "loss": 1.8252, + "step": 2035 + }, + { + "epoch": 5.547683923705722, + "grad_norm": 9.002218246459961, + "learning_rate": 1.9965977129280344e-05, + "loss": 1.6177, + "step": 2036 + }, + { + "epoch": 5.550408719346049, + "grad_norm": 11.364861488342285, + "learning_rate": 1.9965904355574723e-05, + "loss": 1.7212, + "step": 2037 + }, + { + "epoch": 5.553133514986376, + "grad_norm": 13.221735000610352, + "learning_rate": 1.996583150425496e-05, + "loss": 1.9946, + "step": 2038 + }, + { + "epoch": 5.555858310626703, + "grad_norm": 10.66685962677002, + "learning_rate": 1.996575857532162e-05, + "loss": 1.6626, + "step": 2039 + }, + { + "epoch": 5.55858310626703, + "grad_norm": 8.7399320602417, + "learning_rate": 1.996568556877528e-05, + "loss": 1.6018, + "step": 2040 + }, + { + "epoch": 5.561307901907357, + "grad_norm": 10.089179039001465, + "learning_rate": 1.996561248461649e-05, + "loss": 1.6326, + "step": 2041 + }, + { + "epoch": 5.564032697547684, + "grad_norm": 9.229874610900879, + "learning_rate": 1.996553932284584e-05, + "loss": 1.6128, + "step": 2042 + }, + { + "epoch": 5.566757493188011, + "grad_norm": 10.963753700256348, + "learning_rate": 1.9965466083463886e-05, + "loss": 1.4976, + "step": 2043 + }, + { + "epoch": 5.569482288828338, + "grad_norm": 11.130434036254883, + "learning_rate": 1.9965392766471205e-05, + "loss": 1.915, + "step": 2044 + }, + { + "epoch": 5.572207084468665, + "grad_norm": 8.809657096862793, + "learning_rate": 1.9965319371868367e-05, + "loss": 1.4905, + "step": 2045 + }, + { + "epoch": 5.574931880108992, + "grad_norm": 10.36462116241455, + "learning_rate": 1.996524589965594e-05, + "loss": 1.7361, + "step": 2046 + }, + { + "epoch": 5.577656675749319, + "grad_norm": 41.264801025390625, + "learning_rate": 1.99651723498345e-05, + "loss": 1.623, + "step": 2047 + }, + { + "epoch": 5.580381471389646, + "grad_norm": 8.902155876159668, + "learning_rate": 1.9965098722404617e-05, + "loss": 1.551, + "step": 2048 + }, + { + "epoch": 5.583106267029972, + "grad_norm": 11.729252815246582, + "learning_rate": 1.9965025017366867e-05, + "loss": 1.8154, + "step": 2049 + }, + { + "epoch": 5.5858310626703, + "grad_norm": 9.16838264465332, + "learning_rate": 1.9964951234721824e-05, + "loss": 1.7109, + "step": 2050 + }, + { + "epoch": 5.5885558583106265, + "grad_norm": 9.499626159667969, + "learning_rate": 1.996487737447006e-05, + "loss": 1.5315, + "step": 2051 + }, + { + "epoch": 5.591280653950953, + "grad_norm": 11.185776710510254, + "learning_rate": 1.9964803436612152e-05, + "loss": 1.7524, + "step": 2052 + }, + { + "epoch": 5.594005449591281, + "grad_norm": 14.046220779418945, + "learning_rate": 1.9964729421148676e-05, + "loss": 1.6965, + "step": 2053 + }, + { + "epoch": 5.5967302452316074, + "grad_norm": 10.339086532592773, + "learning_rate": 1.9964655328080207e-05, + "loss": 1.5032, + "step": 2054 + }, + { + "epoch": 5.599455040871934, + "grad_norm": 9.257699012756348, + "learning_rate": 1.9964581157407324e-05, + "loss": 1.4612, + "step": 2055 + }, + { + "epoch": 5.602179836512262, + "grad_norm": 8.680740356445312, + "learning_rate": 1.99645069091306e-05, + "loss": 1.4697, + "step": 2056 + }, + { + "epoch": 5.604904632152588, + "grad_norm": 15.50500202178955, + "learning_rate": 1.996443258325062e-05, + "loss": 1.7192, + "step": 2057 + }, + { + "epoch": 5.607629427792915, + "grad_norm": 10.124307632446289, + "learning_rate": 1.996435817976796e-05, + "loss": 1.6511, + "step": 2058 + }, + { + "epoch": 5.610354223433243, + "grad_norm": 18.231836318969727, + "learning_rate": 1.99642836986832e-05, + "loss": 1.7922, + "step": 2059 + }, + { + "epoch": 5.613079019073569, + "grad_norm": 10.452853202819824, + "learning_rate": 1.9964209139996917e-05, + "loss": 1.5552, + "step": 2060 + }, + { + "epoch": 5.615803814713896, + "grad_norm": 10.715081214904785, + "learning_rate": 1.9964134503709695e-05, + "loss": 1.5347, + "step": 2061 + }, + { + "epoch": 5.618528610354224, + "grad_norm": 9.665472030639648, + "learning_rate": 1.9964059789822118e-05, + "loss": 1.9624, + "step": 2062 + }, + { + "epoch": 5.62125340599455, + "grad_norm": 10.516495704650879, + "learning_rate": 1.9963984998334757e-05, + "loss": 1.6941, + "step": 2063 + }, + { + "epoch": 5.623978201634877, + "grad_norm": 10.411148071289062, + "learning_rate": 1.9963910129248206e-05, + "loss": 1.6367, + "step": 2064 + }, + { + "epoch": 5.6267029972752045, + "grad_norm": 10.789862632751465, + "learning_rate": 1.9963835182563043e-05, + "loss": 1.8081, + "step": 2065 + }, + { + "epoch": 5.629427792915531, + "grad_norm": 10.961912155151367, + "learning_rate": 1.996376015827985e-05, + "loss": 1.4958, + "step": 2066 + }, + { + "epoch": 5.632152588555858, + "grad_norm": 9.865840911865234, + "learning_rate": 1.9963685056399217e-05, + "loss": 1.5815, + "step": 2067 + }, + { + "epoch": 5.6348773841961854, + "grad_norm": 12.462875366210938, + "learning_rate": 1.9963609876921722e-05, + "loss": 1.7671, + "step": 2068 + }, + { + "epoch": 5.637602179836512, + "grad_norm": 11.314741134643555, + "learning_rate": 1.9963534619847956e-05, + "loss": 1.8618, + "step": 2069 + }, + { + "epoch": 5.640326975476839, + "grad_norm": 86.43844604492188, + "learning_rate": 1.9963459285178505e-05, + "loss": 1.699, + "step": 2070 + }, + { + "epoch": 5.643051771117166, + "grad_norm": 10.88832950592041, + "learning_rate": 1.996338387291395e-05, + "loss": 1.5166, + "step": 2071 + }, + { + "epoch": 5.645776566757493, + "grad_norm": 13.507354736328125, + "learning_rate": 1.9963308383054883e-05, + "loss": 1.5952, + "step": 2072 + }, + { + "epoch": 5.64850136239782, + "grad_norm": 9.790104866027832, + "learning_rate": 1.9963232815601896e-05, + "loss": 1.696, + "step": 2073 + }, + { + "epoch": 5.651226158038147, + "grad_norm": 10.6688814163208, + "learning_rate": 1.9963157170555564e-05, + "loss": 1.6699, + "step": 2074 + }, + { + "epoch": 5.653950953678474, + "grad_norm": 10.911157608032227, + "learning_rate": 1.996308144791649e-05, + "loss": 1.7339, + "step": 2075 + }, + { + "epoch": 5.656675749318801, + "grad_norm": 16.183406829833984, + "learning_rate": 1.9963005647685256e-05, + "loss": 1.4517, + "step": 2076 + }, + { + "epoch": 5.659400544959128, + "grad_norm": 11.098819732666016, + "learning_rate": 1.9962929769862456e-05, + "loss": 1.73, + "step": 2077 + }, + { + "epoch": 5.662125340599455, + "grad_norm": 13.996894836425781, + "learning_rate": 1.996285381444868e-05, + "loss": 1.6396, + "step": 2078 + }, + { + "epoch": 5.664850136239782, + "grad_norm": 15.200331687927246, + "learning_rate": 1.9962777781444518e-05, + "loss": 1.7942, + "step": 2079 + }, + { + "epoch": 5.667574931880109, + "grad_norm": 26.82591438293457, + "learning_rate": 1.9962701670850566e-05, + "loss": 1.8101, + "step": 2080 + }, + { + "epoch": 5.670299727520436, + "grad_norm": 9.281715393066406, + "learning_rate": 1.996262548266741e-05, + "loss": 1.55, + "step": 2081 + }, + { + "epoch": 5.6730245231607626, + "grad_norm": 14.311118125915527, + "learning_rate": 1.996254921689565e-05, + "loss": 1.7439, + "step": 2082 + }, + { + "epoch": 5.67574931880109, + "grad_norm": 15.628812789916992, + "learning_rate": 1.9962472873535877e-05, + "loss": 1.8042, + "step": 2083 + }, + { + "epoch": 5.678474114441417, + "grad_norm": 12.210664749145508, + "learning_rate": 1.9962396452588684e-05, + "loss": 1.7661, + "step": 2084 + }, + { + "epoch": 5.6811989100817435, + "grad_norm": 12.074110984802246, + "learning_rate": 1.996231995405467e-05, + "loss": 1.551, + "step": 2085 + }, + { + "epoch": 5.683923705722071, + "grad_norm": 8.891280174255371, + "learning_rate": 1.996224337793443e-05, + "loss": 1.3794, + "step": 2086 + }, + { + "epoch": 5.686648501362398, + "grad_norm": 12.006574630737305, + "learning_rate": 1.996216672422856e-05, + "loss": 1.7454, + "step": 2087 + }, + { + "epoch": 5.689373297002724, + "grad_norm": 12.251750946044922, + "learning_rate": 1.996208999293765e-05, + "loss": 1.6145, + "step": 2088 + }, + { + "epoch": 5.692098092643052, + "grad_norm": 12.137250900268555, + "learning_rate": 1.9962013184062308e-05, + "loss": 1.595, + "step": 2089 + }, + { + "epoch": 5.694822888283379, + "grad_norm": 16.92084312438965, + "learning_rate": 1.996193629760313e-05, + "loss": 1.4574, + "step": 2090 + }, + { + "epoch": 5.697547683923705, + "grad_norm": 15.800286293029785, + "learning_rate": 1.9961859333560708e-05, + "loss": 1.8149, + "step": 2091 + }, + { + "epoch": 5.700272479564033, + "grad_norm": 17.070358276367188, + "learning_rate": 1.9961782291935648e-05, + "loss": 1.7407, + "step": 2092 + }, + { + "epoch": 5.70299727520436, + "grad_norm": 11.122482299804688, + "learning_rate": 1.9961705172728547e-05, + "loss": 1.7949, + "step": 2093 + }, + { + "epoch": 5.705722070844686, + "grad_norm": 13.73668384552002, + "learning_rate": 1.996162797594001e-05, + "loss": 1.7913, + "step": 2094 + }, + { + "epoch": 5.708446866485014, + "grad_norm": 10.459869384765625, + "learning_rate": 1.9961550701570633e-05, + "loss": 1.3384, + "step": 2095 + }, + { + "epoch": 5.7111716621253406, + "grad_norm": 10.803874015808105, + "learning_rate": 1.996147334962102e-05, + "loss": 1.8022, + "step": 2096 + }, + { + "epoch": 5.713896457765667, + "grad_norm": 10.83578872680664, + "learning_rate": 1.9961395920091773e-05, + "loss": 1.6157, + "step": 2097 + }, + { + "epoch": 5.716621253405995, + "grad_norm": 15.397379875183105, + "learning_rate": 1.9961318412983494e-05, + "loss": 1.7383, + "step": 2098 + }, + { + "epoch": 5.7193460490463215, + "grad_norm": 15.053755760192871, + "learning_rate": 1.996124082829679e-05, + "loss": 1.7429, + "step": 2099 + }, + { + "epoch": 5.722070844686648, + "grad_norm": 14.341357231140137, + "learning_rate": 1.996116316603226e-05, + "loss": 2.02, + "step": 2100 + }, + { + "epoch": 5.724795640326976, + "grad_norm": 20.855138778686523, + "learning_rate": 1.9961085426190516e-05, + "loss": 1.9399, + "step": 2101 + }, + { + "epoch": 5.727520435967302, + "grad_norm": 11.542928695678711, + "learning_rate": 1.9961007608772157e-05, + "loss": 1.7102, + "step": 2102 + }, + { + "epoch": 5.730245231607629, + "grad_norm": 11.331934928894043, + "learning_rate": 1.996092971377779e-05, + "loss": 1.8606, + "step": 2103 + }, + { + "epoch": 5.732970027247957, + "grad_norm": 10.98530387878418, + "learning_rate": 1.996085174120803e-05, + "loss": 1.7747, + "step": 2104 + }, + { + "epoch": 5.735694822888283, + "grad_norm": 11.881148338317871, + "learning_rate": 1.9960773691063468e-05, + "loss": 1.7354, + "step": 2105 + }, + { + "epoch": 5.73841961852861, + "grad_norm": 13.253885269165039, + "learning_rate": 1.9960695563344727e-05, + "loss": 1.8047, + "step": 2106 + }, + { + "epoch": 5.741144414168938, + "grad_norm": 14.778120040893555, + "learning_rate": 1.9960617358052404e-05, + "loss": 1.7551, + "step": 2107 + }, + { + "epoch": 5.743869209809264, + "grad_norm": 10.513572692871094, + "learning_rate": 1.9960539075187116e-05, + "loss": 1.5071, + "step": 2108 + }, + { + "epoch": 5.746594005449591, + "grad_norm": 13.157445907592773, + "learning_rate": 1.996046071474947e-05, + "loss": 1.8066, + "step": 2109 + }, + { + "epoch": 5.7493188010899186, + "grad_norm": 9.51871395111084, + "learning_rate": 1.996038227674008e-05, + "loss": 1.5996, + "step": 2110 + }, + { + "epoch": 5.752043596730245, + "grad_norm": 16.539831161499023, + "learning_rate": 1.9960303761159552e-05, + "loss": 1.6382, + "step": 2111 + }, + { + "epoch": 5.754768392370572, + "grad_norm": 11.248241424560547, + "learning_rate": 1.9960225168008498e-05, + "loss": 1.4172, + "step": 2112 + }, + { + "epoch": 5.7574931880108995, + "grad_norm": 11.98831558227539, + "learning_rate": 1.9960146497287532e-05, + "loss": 1.7786, + "step": 2113 + }, + { + "epoch": 5.760217983651226, + "grad_norm": 12.180619239807129, + "learning_rate": 1.9960067748997264e-05, + "loss": 1.8003, + "step": 2114 + }, + { + "epoch": 5.762942779291553, + "grad_norm": 10.6093168258667, + "learning_rate": 1.995998892313831e-05, + "loss": 1.5938, + "step": 2115 + }, + { + "epoch": 5.76566757493188, + "grad_norm": 9.59289836883545, + "learning_rate": 1.9959910019711282e-05, + "loss": 1.646, + "step": 2116 + }, + { + "epoch": 5.768392370572207, + "grad_norm": 24.2403564453125, + "learning_rate": 1.9959831038716798e-05, + "loss": 1.6519, + "step": 2117 + }, + { + "epoch": 5.771117166212534, + "grad_norm": 21.29315185546875, + "learning_rate": 1.9959751980155465e-05, + "loss": 1.7158, + "step": 2118 + }, + { + "epoch": 5.773841961852861, + "grad_norm": 11.449963569641113, + "learning_rate": 1.995967284402791e-05, + "loss": 1.7832, + "step": 2119 + }, + { + "epoch": 5.776566757493188, + "grad_norm": 11.538114547729492, + "learning_rate": 1.995959363033474e-05, + "loss": 1.5942, + "step": 2120 + }, + { + "epoch": 5.779291553133515, + "grad_norm": 13.878122329711914, + "learning_rate": 1.9959514339076575e-05, + "loss": 1.7637, + "step": 2121 + }, + { + "epoch": 5.782016348773842, + "grad_norm": 19.71577262878418, + "learning_rate": 1.9959434970254036e-05, + "loss": 1.7839, + "step": 2122 + }, + { + "epoch": 5.784741144414169, + "grad_norm": 14.786399841308594, + "learning_rate": 1.9959355523867734e-05, + "loss": 1.7043, + "step": 2123 + }, + { + "epoch": 5.787465940054496, + "grad_norm": 11.029261589050293, + "learning_rate": 1.9959275999918293e-05, + "loss": 1.7603, + "step": 2124 + }, + { + "epoch": 5.790190735694823, + "grad_norm": 9.883845329284668, + "learning_rate": 1.9959196398406334e-05, + "loss": 1.5271, + "step": 2125 + }, + { + "epoch": 5.79291553133515, + "grad_norm": 14.708576202392578, + "learning_rate": 1.9959116719332468e-05, + "loss": 1.5571, + "step": 2126 + }, + { + "epoch": 5.795640326975477, + "grad_norm": 11.166234970092773, + "learning_rate": 1.9959036962697327e-05, + "loss": 1.7852, + "step": 2127 + }, + { + "epoch": 5.798365122615804, + "grad_norm": 11.428666114807129, + "learning_rate": 1.9958957128501528e-05, + "loss": 1.5862, + "step": 2128 + }, + { + "epoch": 5.801089918256131, + "grad_norm": 21.812938690185547, + "learning_rate": 1.9958877216745685e-05, + "loss": 1.6514, + "step": 2129 + }, + { + "epoch": 5.8038147138964575, + "grad_norm": 10.75883674621582, + "learning_rate": 1.995879722743043e-05, + "loss": 1.7747, + "step": 2130 + }, + { + "epoch": 5.806539509536785, + "grad_norm": 9.681130409240723, + "learning_rate": 1.9958717160556385e-05, + "loss": 1.5186, + "step": 2131 + }, + { + "epoch": 5.809264305177112, + "grad_norm": 12.587305068969727, + "learning_rate": 1.9958637016124167e-05, + "loss": 1.5547, + "step": 2132 + }, + { + "epoch": 5.8119891008174385, + "grad_norm": 9.57124137878418, + "learning_rate": 1.9958556794134407e-05, + "loss": 1.8291, + "step": 2133 + }, + { + "epoch": 5.814713896457766, + "grad_norm": 9.282252311706543, + "learning_rate": 1.9958476494587725e-05, + "loss": 1.9062, + "step": 2134 + }, + { + "epoch": 5.817438692098093, + "grad_norm": 19.19476890563965, + "learning_rate": 1.995839611748475e-05, + "loss": 1.6582, + "step": 2135 + }, + { + "epoch": 5.820163487738419, + "grad_norm": 10.15176010131836, + "learning_rate": 1.995831566282611e-05, + "loss": 1.6479, + "step": 2136 + }, + { + "epoch": 5.822888283378747, + "grad_norm": 11.221248626708984, + "learning_rate": 1.9958235130612423e-05, + "loss": 1.7581, + "step": 2137 + }, + { + "epoch": 5.825613079019074, + "grad_norm": 14.83688735961914, + "learning_rate": 1.9958154520844326e-05, + "loss": 1.8569, + "step": 2138 + }, + { + "epoch": 5.8283378746594, + "grad_norm": 10.33976936340332, + "learning_rate": 1.9958073833522437e-05, + "loss": 1.7148, + "step": 2139 + }, + { + "epoch": 5.831062670299728, + "grad_norm": 12.592178344726562, + "learning_rate": 1.9957993068647394e-05, + "loss": 1.5762, + "step": 2140 + }, + { + "epoch": 5.833787465940055, + "grad_norm": 12.909204483032227, + "learning_rate": 1.9957912226219817e-05, + "loss": 1.7793, + "step": 2141 + }, + { + "epoch": 5.836512261580381, + "grad_norm": 10.267101287841797, + "learning_rate": 1.9957831306240343e-05, + "loss": 1.8643, + "step": 2142 + }, + { + "epoch": 5.839237057220709, + "grad_norm": 8.997322082519531, + "learning_rate": 1.9957750308709598e-05, + "loss": 1.728, + "step": 2143 + }, + { + "epoch": 5.8419618528610355, + "grad_norm": 10.750346183776855, + "learning_rate": 1.9957669233628216e-05, + "loss": 1.7119, + "step": 2144 + }, + { + "epoch": 5.844686648501362, + "grad_norm": 10.793237686157227, + "learning_rate": 1.9957588080996825e-05, + "loss": 1.7256, + "step": 2145 + }, + { + "epoch": 5.84741144414169, + "grad_norm": 7.666360855102539, + "learning_rate": 1.995750685081606e-05, + "loss": 1.5859, + "step": 2146 + }, + { + "epoch": 5.8501362397820165, + "grad_norm": 8.329882621765137, + "learning_rate": 1.995742554308655e-05, + "loss": 1.7261, + "step": 2147 + }, + { + "epoch": 5.852861035422343, + "grad_norm": 11.187580108642578, + "learning_rate": 1.995734415780893e-05, + "loss": 1.9126, + "step": 2148 + }, + { + "epoch": 5.855585831062671, + "grad_norm": 9.039776802062988, + "learning_rate": 1.9957262694983837e-05, + "loss": 1.7249, + "step": 2149 + }, + { + "epoch": 5.858310626702997, + "grad_norm": 11.114256858825684, + "learning_rate": 1.9957181154611903e-05, + "loss": 1.6907, + "step": 2150 + }, + { + "epoch": 5.861035422343324, + "grad_norm": 11.95982551574707, + "learning_rate": 1.995709953669376e-05, + "loss": 1.5112, + "step": 2151 + }, + { + "epoch": 5.863760217983652, + "grad_norm": 11.137290000915527, + "learning_rate": 1.9957017841230045e-05, + "loss": 1.7397, + "step": 2152 + }, + { + "epoch": 5.866485013623978, + "grad_norm": 11.245691299438477, + "learning_rate": 1.9956936068221396e-05, + "loss": 1.4753, + "step": 2153 + }, + { + "epoch": 5.869209809264305, + "grad_norm": 10.877267837524414, + "learning_rate": 1.995685421766845e-05, + "loss": 1.8682, + "step": 2154 + }, + { + "epoch": 5.871934604904633, + "grad_norm": 16.539710998535156, + "learning_rate": 1.9956772289571845e-05, + "loss": 1.5327, + "step": 2155 + }, + { + "epoch": 5.874659400544959, + "grad_norm": 10.097494125366211, + "learning_rate": 1.995669028393222e-05, + "loss": 1.6814, + "step": 2156 + }, + { + "epoch": 5.877384196185286, + "grad_norm": 8.638931274414062, + "learning_rate": 1.995660820075021e-05, + "loss": 1.8547, + "step": 2157 + }, + { + "epoch": 5.8801089918256135, + "grad_norm": 18.214252471923828, + "learning_rate": 1.9956526040026453e-05, + "loss": 1.5378, + "step": 2158 + }, + { + "epoch": 5.88283378746594, + "grad_norm": 8.704755783081055, + "learning_rate": 1.9956443801761593e-05, + "loss": 1.4504, + "step": 2159 + }, + { + "epoch": 5.885558583106267, + "grad_norm": 7.709156513214111, + "learning_rate": 1.995636148595627e-05, + "loss": 1.6738, + "step": 2160 + }, + { + "epoch": 5.8882833787465945, + "grad_norm": 10.272282600402832, + "learning_rate": 1.9956279092611123e-05, + "loss": 1.8521, + "step": 2161 + }, + { + "epoch": 5.891008174386921, + "grad_norm": 8.876688957214355, + "learning_rate": 1.9956196621726794e-05, + "loss": 1.665, + "step": 2162 + }, + { + "epoch": 5.893732970027248, + "grad_norm": 12.127043724060059, + "learning_rate": 1.995611407330393e-05, + "loss": 1.5745, + "step": 2163 + }, + { + "epoch": 5.896457765667575, + "grad_norm": 9.917612075805664, + "learning_rate": 1.9956031447343166e-05, + "loss": 1.7146, + "step": 2164 + }, + { + "epoch": 5.899182561307902, + "grad_norm": 8.613646507263184, + "learning_rate": 1.9955948743845152e-05, + "loss": 1.418, + "step": 2165 + }, + { + "epoch": 5.901907356948229, + "grad_norm": 14.007044792175293, + "learning_rate": 1.995586596281053e-05, + "loss": 1.6123, + "step": 2166 + }, + { + "epoch": 5.904632152588556, + "grad_norm": 10.300485610961914, + "learning_rate": 1.9955783104239943e-05, + "loss": 1.708, + "step": 2167 + }, + { + "epoch": 5.907356948228883, + "grad_norm": 9.43236255645752, + "learning_rate": 1.995570016813404e-05, + "loss": 1.6816, + "step": 2168 + }, + { + "epoch": 5.91008174386921, + "grad_norm": 8.837135314941406, + "learning_rate": 1.9955617154493462e-05, + "loss": 1.6973, + "step": 2169 + }, + { + "epoch": 5.912806539509537, + "grad_norm": 8.825847625732422, + "learning_rate": 1.995553406331886e-05, + "loss": 1.5781, + "step": 2170 + }, + { + "epoch": 5.915531335149864, + "grad_norm": 13.152094841003418, + "learning_rate": 1.9955450894610875e-05, + "loss": 1.6084, + "step": 2171 + }, + { + "epoch": 5.918256130790191, + "grad_norm": 9.993326187133789, + "learning_rate": 1.995536764837016e-05, + "loss": 1.5632, + "step": 2172 + }, + { + "epoch": 5.920980926430518, + "grad_norm": 10.549430847167969, + "learning_rate": 1.9955284324597365e-05, + "loss": 1.8931, + "step": 2173 + }, + { + "epoch": 5.923705722070845, + "grad_norm": 11.248650550842285, + "learning_rate": 1.9955200923293134e-05, + "loss": 1.52, + "step": 2174 + }, + { + "epoch": 5.926430517711172, + "grad_norm": 10.428131103515625, + "learning_rate": 1.9955117444458118e-05, + "loss": 1.8013, + "step": 2175 + }, + { + "epoch": 5.929155313351498, + "grad_norm": 10.206390380859375, + "learning_rate": 1.9955033888092973e-05, + "loss": 1.623, + "step": 2176 + }, + { + "epoch": 5.931880108991826, + "grad_norm": 12.52747917175293, + "learning_rate": 1.995495025419834e-05, + "loss": 1.6709, + "step": 2177 + }, + { + "epoch": 5.9346049046321525, + "grad_norm": 12.243200302124023, + "learning_rate": 1.9954866542774872e-05, + "loss": 1.7246, + "step": 2178 + }, + { + "epoch": 5.937329700272479, + "grad_norm": 8.610759735107422, + "learning_rate": 1.9954782753823227e-05, + "loss": 1.5435, + "step": 2179 + }, + { + "epoch": 5.940054495912807, + "grad_norm": 8.388009071350098, + "learning_rate": 1.9954698887344057e-05, + "loss": 1.6885, + "step": 2180 + }, + { + "epoch": 5.9427792915531334, + "grad_norm": 8.853168487548828, + "learning_rate": 1.995461494333801e-05, + "loss": 1.8015, + "step": 2181 + }, + { + "epoch": 5.94550408719346, + "grad_norm": 8.397902488708496, + "learning_rate": 1.995453092180574e-05, + "loss": 1.6548, + "step": 2182 + }, + { + "epoch": 5.948228882833788, + "grad_norm": 10.568078994750977, + "learning_rate": 1.9954446822747905e-05, + "loss": 1.7788, + "step": 2183 + }, + { + "epoch": 5.950953678474114, + "grad_norm": 12.230669021606445, + "learning_rate": 1.995436264616516e-05, + "loss": 1.6689, + "step": 2184 + }, + { + "epoch": 5.953678474114441, + "grad_norm": 9.328551292419434, + "learning_rate": 1.995427839205816e-05, + "loss": 1.71, + "step": 2185 + }, + { + "epoch": 5.956403269754769, + "grad_norm": 10.6898193359375, + "learning_rate": 1.9954194060427557e-05, + "loss": 1.8257, + "step": 2186 + }, + { + "epoch": 5.959128065395095, + "grad_norm": 11.12633991241455, + "learning_rate": 1.9954109651274015e-05, + "loss": 1.6909, + "step": 2187 + }, + { + "epoch": 5.961852861035422, + "grad_norm": 8.994038581848145, + "learning_rate": 1.9954025164598184e-05, + "loss": 1.5422, + "step": 2188 + }, + { + "epoch": 5.96457765667575, + "grad_norm": 14.928201675415039, + "learning_rate": 1.9953940600400726e-05, + "loss": 1.6475, + "step": 2189 + }, + { + "epoch": 5.967302452316076, + "grad_norm": 13.77098274230957, + "learning_rate": 1.9953855958682297e-05, + "loss": 1.6206, + "step": 2190 + }, + { + "epoch": 5.970027247956403, + "grad_norm": 8.098898887634277, + "learning_rate": 1.9953771239443562e-05, + "loss": 1.5703, + "step": 2191 + }, + { + "epoch": 5.9727520435967305, + "grad_norm": 7.796526908874512, + "learning_rate": 1.9953686442685175e-05, + "loss": 1.5212, + "step": 2192 + }, + { + "epoch": 5.975476839237057, + "grad_norm": 9.103816986083984, + "learning_rate": 1.99536015684078e-05, + "loss": 1.6255, + "step": 2193 + }, + { + "epoch": 5.978201634877384, + "grad_norm": 8.29758071899414, + "learning_rate": 1.9953516616612093e-05, + "loss": 1.4558, + "step": 2194 + }, + { + "epoch": 5.9809264305177114, + "grad_norm": 11.29628849029541, + "learning_rate": 1.9953431587298723e-05, + "loss": 1.8486, + "step": 2195 + }, + { + "epoch": 5.983651226158038, + "grad_norm": 9.009011268615723, + "learning_rate": 1.9953346480468347e-05, + "loss": 1.6904, + "step": 2196 + }, + { + "epoch": 5.986376021798365, + "grad_norm": 12.899435997009277, + "learning_rate": 1.9953261296121625e-05, + "loss": 1.8438, + "step": 2197 + }, + { + "epoch": 5.989100817438692, + "grad_norm": 9.92809009552002, + "learning_rate": 1.995317603425923e-05, + "loss": 1.8542, + "step": 2198 + }, + { + "epoch": 5.991825613079019, + "grad_norm": 9.189982414245605, + "learning_rate": 1.9953090694881815e-05, + "loss": 1.73, + "step": 2199 + }, + { + "epoch": 5.994550408719346, + "grad_norm": 12.12692642211914, + "learning_rate": 1.9953005277990054e-05, + "loss": 1.7061, + "step": 2200 + }, + { + "epoch": 5.997275204359673, + "grad_norm": 10.086868286132812, + "learning_rate": 1.9952919783584608e-05, + "loss": 1.7578, + "step": 2201 + }, + { + "epoch": 6.0, + "grad_norm": 11.160868644714355, + "learning_rate": 1.995283421166614e-05, + "loss": 1.5291, + "step": 2202 + }, + { + "epoch": 6.002724795640327, + "grad_norm": 10.200235366821289, + "learning_rate": 1.9952748562235325e-05, + "loss": 1.4353, + "step": 2203 + }, + { + "epoch": 6.005449591280654, + "grad_norm": 13.496068954467773, + "learning_rate": 1.995266283529282e-05, + "loss": 1.5662, + "step": 2204 + }, + { + "epoch": 6.008174386920981, + "grad_norm": 7.2131242752075195, + "learning_rate": 1.9952577030839297e-05, + "loss": 1.3428, + "step": 2205 + }, + { + "epoch": 6.010899182561308, + "grad_norm": 9.206995964050293, + "learning_rate": 1.9952491148875427e-05, + "loss": 1.3918, + "step": 2206 + }, + { + "epoch": 6.013623978201635, + "grad_norm": 8.290966033935547, + "learning_rate": 1.9952405189401872e-05, + "loss": 1.5034, + "step": 2207 + }, + { + "epoch": 6.016348773841962, + "grad_norm": 10.639963150024414, + "learning_rate": 1.9952319152419314e-05, + "loss": 1.5547, + "step": 2208 + }, + { + "epoch": 6.0190735694822886, + "grad_norm": 11.235346794128418, + "learning_rate": 1.9952233037928406e-05, + "loss": 1.5151, + "step": 2209 + }, + { + "epoch": 6.021798365122616, + "grad_norm": 7.436095714569092, + "learning_rate": 1.9952146845929833e-05, + "loss": 1.4702, + "step": 2210 + }, + { + "epoch": 6.024523160762943, + "grad_norm": 10.257650375366211, + "learning_rate": 1.9952060576424256e-05, + "loss": 1.501, + "step": 2211 + }, + { + "epoch": 6.0272479564032695, + "grad_norm": 10.27843952178955, + "learning_rate": 1.9951974229412355e-05, + "loss": 1.5029, + "step": 2212 + }, + { + "epoch": 6.029972752043597, + "grad_norm": 11.819791793823242, + "learning_rate": 1.99518878048948e-05, + "loss": 1.4094, + "step": 2213 + }, + { + "epoch": 6.032697547683924, + "grad_norm": 11.006246566772461, + "learning_rate": 1.995180130287226e-05, + "loss": 1.6929, + "step": 2214 + }, + { + "epoch": 6.03542234332425, + "grad_norm": 9.352935791015625, + "learning_rate": 1.995171472334541e-05, + "loss": 1.7075, + "step": 2215 + }, + { + "epoch": 6.038147138964578, + "grad_norm": 9.678173065185547, + "learning_rate": 1.9951628066314928e-05, + "loss": 1.4509, + "step": 2216 + }, + { + "epoch": 6.040871934604905, + "grad_norm": 11.307157516479492, + "learning_rate": 1.995154133178149e-05, + "loss": 1.6777, + "step": 2217 + }, + { + "epoch": 6.043596730245231, + "grad_norm": 8.42729377746582, + "learning_rate": 1.9951454519745767e-05, + "loss": 1.4922, + "step": 2218 + }, + { + "epoch": 6.046321525885559, + "grad_norm": 8.440991401672363, + "learning_rate": 1.9951367630208437e-05, + "loss": 1.5571, + "step": 2219 + }, + { + "epoch": 6.049046321525886, + "grad_norm": 8.879366874694824, + "learning_rate": 1.9951280663170174e-05, + "loss": 1.5613, + "step": 2220 + }, + { + "epoch": 6.051771117166212, + "grad_norm": 8.939628601074219, + "learning_rate": 1.9951193618631655e-05, + "loss": 1.563, + "step": 2221 + }, + { + "epoch": 6.05449591280654, + "grad_norm": 10.681466102600098, + "learning_rate": 1.9951106496593566e-05, + "loss": 1.7241, + "step": 2222 + }, + { + "epoch": 6.0572207084468666, + "grad_norm": 8.742968559265137, + "learning_rate": 1.995101929705658e-05, + "loss": 1.5901, + "step": 2223 + }, + { + "epoch": 6.059945504087193, + "grad_norm": 9.580309867858887, + "learning_rate": 1.9950932020021372e-05, + "loss": 1.6521, + "step": 2224 + }, + { + "epoch": 6.062670299727521, + "grad_norm": 10.331524848937988, + "learning_rate": 1.9950844665488626e-05, + "loss": 1.8003, + "step": 2225 + }, + { + "epoch": 6.0653950953678475, + "grad_norm": 10.002351760864258, + "learning_rate": 1.9950757233459022e-05, + "loss": 1.6375, + "step": 2226 + }, + { + "epoch": 6.068119891008174, + "grad_norm": 8.716421127319336, + "learning_rate": 1.9950669723933246e-05, + "loss": 1.5286, + "step": 2227 + }, + { + "epoch": 6.070844686648502, + "grad_norm": 10.600811958312988, + "learning_rate": 1.9950582136911972e-05, + "loss": 1.7808, + "step": 2228 + }, + { + "epoch": 6.073569482288828, + "grad_norm": 8.420156478881836, + "learning_rate": 1.995049447239588e-05, + "loss": 1.3865, + "step": 2229 + }, + { + "epoch": 6.076294277929155, + "grad_norm": 11.201637268066406, + "learning_rate": 1.9950406730385663e-05, + "loss": 1.5684, + "step": 2230 + }, + { + "epoch": 6.079019073569483, + "grad_norm": 8.961545944213867, + "learning_rate": 1.9950318910881993e-05, + "loss": 1.4878, + "step": 2231 + }, + { + "epoch": 6.081743869209809, + "grad_norm": 7.664729118347168, + "learning_rate": 1.9950231013885566e-05, + "loss": 1.5403, + "step": 2232 + }, + { + "epoch": 6.084468664850136, + "grad_norm": 8.747848510742188, + "learning_rate": 1.9950143039397056e-05, + "loss": 1.5457, + "step": 2233 + }, + { + "epoch": 6.087193460490464, + "grad_norm": 10.3059663772583, + "learning_rate": 1.995005498741715e-05, + "loss": 1.4146, + "step": 2234 + }, + { + "epoch": 6.08991825613079, + "grad_norm": 10.38664722442627, + "learning_rate": 1.994996685794654e-05, + "loss": 1.6313, + "step": 2235 + }, + { + "epoch": 6.092643051771117, + "grad_norm": 9.838129997253418, + "learning_rate": 1.994987865098591e-05, + "loss": 1.5403, + "step": 2236 + }, + { + "epoch": 6.0953678474114446, + "grad_norm": 10.536702156066895, + "learning_rate": 1.9949790366535943e-05, + "loss": 1.5447, + "step": 2237 + }, + { + "epoch": 6.098092643051771, + "grad_norm": 11.688711166381836, + "learning_rate": 1.9949702004597327e-05, + "loss": 1.5115, + "step": 2238 + }, + { + "epoch": 6.100817438692098, + "grad_norm": 9.537701606750488, + "learning_rate": 1.9949613565170755e-05, + "loss": 1.584, + "step": 2239 + }, + { + "epoch": 6.1035422343324255, + "grad_norm": 10.0718355178833, + "learning_rate": 1.994952504825691e-05, + "loss": 1.478, + "step": 2240 + }, + { + "epoch": 6.106267029972752, + "grad_norm": 12.579290390014648, + "learning_rate": 1.9949436453856487e-05, + "loss": 1.5327, + "step": 2241 + }, + { + "epoch": 6.108991825613079, + "grad_norm": 14.01674747467041, + "learning_rate": 1.9949347781970172e-05, + "loss": 1.7759, + "step": 2242 + }, + { + "epoch": 6.111716621253406, + "grad_norm": 15.666253089904785, + "learning_rate": 1.9949259032598656e-05, + "loss": 1.3484, + "step": 2243 + }, + { + "epoch": 6.114441416893733, + "grad_norm": 10.228379249572754, + "learning_rate": 1.994917020574263e-05, + "loss": 1.6025, + "step": 2244 + }, + { + "epoch": 6.11716621253406, + "grad_norm": 9.948064804077148, + "learning_rate": 1.994908130140279e-05, + "loss": 1.4221, + "step": 2245 + }, + { + "epoch": 6.1198910081743865, + "grad_norm": 14.202163696289062, + "learning_rate": 1.9948992319579822e-05, + "loss": 1.4207, + "step": 2246 + }, + { + "epoch": 6.122615803814714, + "grad_norm": 8.870183944702148, + "learning_rate": 1.9948903260274424e-05, + "loss": 1.4668, + "step": 2247 + }, + { + "epoch": 6.125340599455041, + "grad_norm": 12.374833106994629, + "learning_rate": 1.9948814123487286e-05, + "loss": 1.6436, + "step": 2248 + }, + { + "epoch": 6.128065395095367, + "grad_norm": 11.639524459838867, + "learning_rate": 1.9948724909219104e-05, + "loss": 1.7617, + "step": 2249 + }, + { + "epoch": 6.130790190735695, + "grad_norm": 10.247749328613281, + "learning_rate": 1.9948635617470572e-05, + "loss": 1.3259, + "step": 2250 + }, + { + "epoch": 6.133514986376022, + "grad_norm": 10.985930442810059, + "learning_rate": 1.994854624824239e-05, + "loss": 1.5647, + "step": 2251 + }, + { + "epoch": 6.136239782016348, + "grad_norm": 12.321182250976562, + "learning_rate": 1.9948456801535247e-05, + "loss": 1.5081, + "step": 2252 + }, + { + "epoch": 6.138964577656676, + "grad_norm": 22.540081024169922, + "learning_rate": 1.994836727734984e-05, + "loss": 1.6118, + "step": 2253 + }, + { + "epoch": 6.141689373297003, + "grad_norm": 14.029481887817383, + "learning_rate": 1.9948277675686873e-05, + "loss": 1.5061, + "step": 2254 + }, + { + "epoch": 6.144414168937329, + "grad_norm": 11.365158081054688, + "learning_rate": 1.9948187996547037e-05, + "loss": 1.6843, + "step": 2255 + }, + { + "epoch": 6.147138964577657, + "grad_norm": 12.896124839782715, + "learning_rate": 1.9948098239931035e-05, + "loss": 1.7524, + "step": 2256 + }, + { + "epoch": 6.1498637602179835, + "grad_norm": 11.004476547241211, + "learning_rate": 1.994800840583956e-05, + "loss": 1.6116, + "step": 2257 + }, + { + "epoch": 6.15258855585831, + "grad_norm": 14.635592460632324, + "learning_rate": 1.9947918494273322e-05, + "loss": 1.5481, + "step": 2258 + }, + { + "epoch": 6.155313351498638, + "grad_norm": 10.547788619995117, + "learning_rate": 1.994782850523301e-05, + "loss": 1.6958, + "step": 2259 + }, + { + "epoch": 6.1580381471389645, + "grad_norm": 12.902785301208496, + "learning_rate": 1.9947738438719332e-05, + "loss": 1.7449, + "step": 2260 + }, + { + "epoch": 6.160762942779291, + "grad_norm": 11.040125846862793, + "learning_rate": 1.9947648294732988e-05, + "loss": 1.74, + "step": 2261 + }, + { + "epoch": 6.163487738419619, + "grad_norm": 39.967002868652344, + "learning_rate": 1.994755807327468e-05, + "loss": 1.5569, + "step": 2262 + }, + { + "epoch": 6.166212534059945, + "grad_norm": 8.66330623626709, + "learning_rate": 1.9947467774345108e-05, + "loss": 1.564, + "step": 2263 + }, + { + "epoch": 6.168937329700272, + "grad_norm": 9.942988395690918, + "learning_rate": 1.9947377397944974e-05, + "loss": 1.5427, + "step": 2264 + }, + { + "epoch": 6.1716621253406, + "grad_norm": 11.946412086486816, + "learning_rate": 1.994728694407499e-05, + "loss": 1.4629, + "step": 2265 + }, + { + "epoch": 6.174386920980926, + "grad_norm": 14.022274017333984, + "learning_rate": 1.9947196412735855e-05, + "loss": 1.9458, + "step": 2266 + }, + { + "epoch": 6.177111716621253, + "grad_norm": 11.036538124084473, + "learning_rate": 1.9947105803928272e-05, + "loss": 1.5564, + "step": 2267 + }, + { + "epoch": 6.179836512261581, + "grad_norm": 12.539093971252441, + "learning_rate": 1.994701511765295e-05, + "loss": 1.4727, + "step": 2268 + }, + { + "epoch": 6.182561307901907, + "grad_norm": 15.075506210327148, + "learning_rate": 1.9946924353910595e-05, + "loss": 1.5957, + "step": 2269 + }, + { + "epoch": 6.185286103542234, + "grad_norm": 11.200881958007812, + "learning_rate": 1.994683351270191e-05, + "loss": 1.6321, + "step": 2270 + }, + { + "epoch": 6.1880108991825615, + "grad_norm": 9.643436431884766, + "learning_rate": 1.994674259402761e-05, + "loss": 1.7334, + "step": 2271 + }, + { + "epoch": 6.190735694822888, + "grad_norm": 10.168499946594238, + "learning_rate": 1.99466515978884e-05, + "loss": 1.5505, + "step": 2272 + }, + { + "epoch": 6.193460490463215, + "grad_norm": 13.098001480102539, + "learning_rate": 1.9946560524284985e-05, + "loss": 1.6384, + "step": 2273 + }, + { + "epoch": 6.1961852861035425, + "grad_norm": 13.747922897338867, + "learning_rate": 1.9946469373218076e-05, + "loss": 1.4556, + "step": 2274 + }, + { + "epoch": 6.198910081743869, + "grad_norm": 12.153290748596191, + "learning_rate": 1.994637814468838e-05, + "loss": 1.6526, + "step": 2275 + }, + { + "epoch": 6.201634877384196, + "grad_norm": 10.517086029052734, + "learning_rate": 1.994628683869662e-05, + "loss": 1.4062, + "step": 2276 + }, + { + "epoch": 6.204359673024523, + "grad_norm": 19.21754264831543, + "learning_rate": 1.9946195455243494e-05, + "loss": 1.5022, + "step": 2277 + }, + { + "epoch": 6.20708446866485, + "grad_norm": 12.603913307189941, + "learning_rate": 1.9946103994329714e-05, + "loss": 1.6313, + "step": 2278 + }, + { + "epoch": 6.209809264305177, + "grad_norm": 17.378110885620117, + "learning_rate": 1.9946012455956004e-05, + "loss": 1.7715, + "step": 2279 + }, + { + "epoch": 6.212534059945504, + "grad_norm": 11.949447631835938, + "learning_rate": 1.9945920840123062e-05, + "loss": 1.583, + "step": 2280 + }, + { + "epoch": 6.215258855585831, + "grad_norm": 8.07461929321289, + "learning_rate": 1.9945829146831614e-05, + "loss": 1.4766, + "step": 2281 + }, + { + "epoch": 6.217983651226158, + "grad_norm": 9.490711212158203, + "learning_rate": 1.9945737376082363e-05, + "loss": 1.7275, + "step": 2282 + }, + { + "epoch": 6.220708446866485, + "grad_norm": 9.92374324798584, + "learning_rate": 1.9945645527876033e-05, + "loss": 1.6096, + "step": 2283 + }, + { + "epoch": 6.223433242506812, + "grad_norm": 15.487894058227539, + "learning_rate": 1.9945553602213336e-05, + "loss": 1.6487, + "step": 2284 + }, + { + "epoch": 6.226158038147139, + "grad_norm": 9.092809677124023, + "learning_rate": 1.994546159909499e-05, + "loss": 1.3423, + "step": 2285 + }, + { + "epoch": 6.228882833787466, + "grad_norm": 11.397137641906738, + "learning_rate": 1.9945369518521704e-05, + "loss": 1.7844, + "step": 2286 + }, + { + "epoch": 6.231607629427793, + "grad_norm": 10.459543228149414, + "learning_rate": 1.9945277360494204e-05, + "loss": 1.4954, + "step": 2287 + }, + { + "epoch": 6.23433242506812, + "grad_norm": 10.375653266906738, + "learning_rate": 1.99451851250132e-05, + "loss": 1.7891, + "step": 2288 + }, + { + "epoch": 6.237057220708447, + "grad_norm": 11.958422660827637, + "learning_rate": 1.994509281207942e-05, + "loss": 1.6511, + "step": 2289 + }, + { + "epoch": 6.239782016348774, + "grad_norm": 10.102315902709961, + "learning_rate": 1.9945000421693574e-05, + "loss": 1.6758, + "step": 2290 + }, + { + "epoch": 6.2425068119891005, + "grad_norm": 9.557490348815918, + "learning_rate": 1.9944907953856384e-05, + "loss": 1.5181, + "step": 2291 + }, + { + "epoch": 6.245231607629428, + "grad_norm": 11.85209846496582, + "learning_rate": 1.9944815408568572e-05, + "loss": 1.5681, + "step": 2292 + }, + { + "epoch": 6.247956403269755, + "grad_norm": 11.734000205993652, + "learning_rate": 1.9944722785830855e-05, + "loss": 1.7017, + "step": 2293 + }, + { + "epoch": 6.2506811989100814, + "grad_norm": 9.606616973876953, + "learning_rate": 1.994463008564396e-05, + "loss": 1.6003, + "step": 2294 + }, + { + "epoch": 6.253405994550409, + "grad_norm": 9.383480072021484, + "learning_rate": 1.9944537308008606e-05, + "loss": 1.4241, + "step": 2295 + }, + { + "epoch": 6.256130790190736, + "grad_norm": 9.445914268493652, + "learning_rate": 1.9944444452925514e-05, + "loss": 1.3701, + "step": 2296 + }, + { + "epoch": 6.258855585831062, + "grad_norm": 10.938509941101074, + "learning_rate": 1.994435152039541e-05, + "loss": 1.6641, + "step": 2297 + }, + { + "epoch": 6.26158038147139, + "grad_norm": 9.327269554138184, + "learning_rate": 1.9944258510419018e-05, + "loss": 1.6255, + "step": 2298 + }, + { + "epoch": 6.264305177111717, + "grad_norm": 21.856826782226562, + "learning_rate": 1.9944165422997058e-05, + "loss": 1.6892, + "step": 2299 + }, + { + "epoch": 6.267029972752043, + "grad_norm": 10.677403450012207, + "learning_rate": 1.994407225813026e-05, + "loss": 1.6177, + "step": 2300 + }, + { + "epoch": 6.269754768392371, + "grad_norm": 9.786881446838379, + "learning_rate": 1.9943979015819343e-05, + "loss": 1.6742, + "step": 2301 + }, + { + "epoch": 6.272479564032698, + "grad_norm": 10.130830764770508, + "learning_rate": 1.994388569606504e-05, + "loss": 1.6331, + "step": 2302 + }, + { + "epoch": 6.275204359673024, + "grad_norm": 10.384533882141113, + "learning_rate": 1.9943792298868076e-05, + "loss": 1.7134, + "step": 2303 + }, + { + "epoch": 6.277929155313352, + "grad_norm": 11.189226150512695, + "learning_rate": 1.994369882422918e-05, + "loss": 1.696, + "step": 2304 + }, + { + "epoch": 6.2806539509536785, + "grad_norm": 8.195403099060059, + "learning_rate": 1.9943605272149074e-05, + "loss": 1.4683, + "step": 2305 + }, + { + "epoch": 6.283378746594005, + "grad_norm": 10.447251319885254, + "learning_rate": 1.9943511642628488e-05, + "loss": 1.3259, + "step": 2306 + }, + { + "epoch": 6.286103542234333, + "grad_norm": 28.25797462463379, + "learning_rate": 1.9943417935668158e-05, + "loss": 1.6973, + "step": 2307 + }, + { + "epoch": 6.2888283378746594, + "grad_norm": 9.958805084228516, + "learning_rate": 1.9943324151268807e-05, + "loss": 1.7207, + "step": 2308 + }, + { + "epoch": 6.291553133514986, + "grad_norm": 10.296317100524902, + "learning_rate": 1.994323028943117e-05, + "loss": 1.5947, + "step": 2309 + }, + { + "epoch": 6.294277929155314, + "grad_norm": 13.088888168334961, + "learning_rate": 1.994313635015597e-05, + "loss": 1.6792, + "step": 2310 + }, + { + "epoch": 6.29700272479564, + "grad_norm": 10.405101776123047, + "learning_rate": 1.994304233344395e-05, + "loss": 1.6931, + "step": 2311 + }, + { + "epoch": 6.299727520435967, + "grad_norm": 10.78155517578125, + "learning_rate": 1.9942948239295833e-05, + "loss": 1.6045, + "step": 2312 + }, + { + "epoch": 6.302452316076295, + "grad_norm": 14.911649703979492, + "learning_rate": 1.9942854067712355e-05, + "loss": 1.4097, + "step": 2313 + }, + { + "epoch": 6.305177111716621, + "grad_norm": 11.39924430847168, + "learning_rate": 1.994275981869425e-05, + "loss": 1.6233, + "step": 2314 + }, + { + "epoch": 6.307901907356948, + "grad_norm": 13.633781433105469, + "learning_rate": 1.9942665492242256e-05, + "loss": 1.6016, + "step": 2315 + }, + { + "epoch": 6.310626702997276, + "grad_norm": 13.581009864807129, + "learning_rate": 1.9942571088357095e-05, + "loss": 1.4766, + "step": 2316 + }, + { + "epoch": 6.313351498637602, + "grad_norm": 11.985243797302246, + "learning_rate": 1.994247660703952e-05, + "loss": 1.5881, + "step": 2317 + }, + { + "epoch": 6.316076294277929, + "grad_norm": 14.857428550720215, + "learning_rate": 1.9942382048290248e-05, + "loss": 1.603, + "step": 2318 + }, + { + "epoch": 6.3188010899182565, + "grad_norm": 13.543075561523438, + "learning_rate": 1.994228741211003e-05, + "loss": 1.4346, + "step": 2319 + }, + { + "epoch": 6.321525885558583, + "grad_norm": 11.29600715637207, + "learning_rate": 1.9942192698499596e-05, + "loss": 1.6895, + "step": 2320 + }, + { + "epoch": 6.32425068119891, + "grad_norm": 10.868379592895508, + "learning_rate": 1.9942097907459687e-05, + "loss": 1.6465, + "step": 2321 + }, + { + "epoch": 6.3269754768392374, + "grad_norm": 25.268985748291016, + "learning_rate": 1.9942003038991035e-05, + "loss": 1.5962, + "step": 2322 + }, + { + "epoch": 6.329700272479564, + "grad_norm": 26.629039764404297, + "learning_rate": 1.9941908093094387e-05, + "loss": 1.4805, + "step": 2323 + }, + { + "epoch": 6.332425068119891, + "grad_norm": 12.916640281677246, + "learning_rate": 1.9941813069770478e-05, + "loss": 1.3672, + "step": 2324 + }, + { + "epoch": 6.335149863760218, + "grad_norm": 11.686497688293457, + "learning_rate": 1.9941717969020046e-05, + "loss": 1.6721, + "step": 2325 + }, + { + "epoch": 6.337874659400545, + "grad_norm": 10.163697242736816, + "learning_rate": 1.994162279084384e-05, + "loss": 1.4741, + "step": 2326 + }, + { + "epoch": 6.340599455040872, + "grad_norm": 10.932123184204102, + "learning_rate": 1.9941527535242592e-05, + "loss": 1.7891, + "step": 2327 + }, + { + "epoch": 6.343324250681199, + "grad_norm": 9.418354988098145, + "learning_rate": 1.9941432202217047e-05, + "loss": 1.5466, + "step": 2328 + }, + { + "epoch": 6.346049046321526, + "grad_norm": 11.555414199829102, + "learning_rate": 1.994133679176795e-05, + "loss": 1.6089, + "step": 2329 + }, + { + "epoch": 6.348773841961853, + "grad_norm": 12.213624000549316, + "learning_rate": 1.994124130389604e-05, + "loss": 1.5686, + "step": 2330 + }, + { + "epoch": 6.35149863760218, + "grad_norm": 13.881996154785156, + "learning_rate": 1.9941145738602065e-05, + "loss": 1.4187, + "step": 2331 + }, + { + "epoch": 6.354223433242507, + "grad_norm": 10.478837966918945, + "learning_rate": 1.9941050095886763e-05, + "loss": 1.7446, + "step": 2332 + }, + { + "epoch": 6.356948228882834, + "grad_norm": 12.292433738708496, + "learning_rate": 1.9940954375750888e-05, + "loss": 1.6624, + "step": 2333 + }, + { + "epoch": 6.359673024523161, + "grad_norm": 21.07522201538086, + "learning_rate": 1.994085857819518e-05, + "loss": 1.8042, + "step": 2334 + }, + { + "epoch": 6.362397820163488, + "grad_norm": 9.90341567993164, + "learning_rate": 1.9940762703220383e-05, + "loss": 1.4639, + "step": 2335 + }, + { + "epoch": 6.3651226158038146, + "grad_norm": 10.5038423538208, + "learning_rate": 1.9940666750827247e-05, + "loss": 1.7549, + "step": 2336 + }, + { + "epoch": 6.367847411444142, + "grad_norm": 13.10082721710205, + "learning_rate": 1.9940570721016516e-05, + "loss": 1.4827, + "step": 2337 + }, + { + "epoch": 6.370572207084469, + "grad_norm": 9.728696823120117, + "learning_rate": 1.994047461378894e-05, + "loss": 1.4875, + "step": 2338 + }, + { + "epoch": 6.3732970027247955, + "grad_norm": 10.2384614944458, + "learning_rate": 1.994037842914527e-05, + "loss": 1.7046, + "step": 2339 + }, + { + "epoch": 6.376021798365123, + "grad_norm": 23.558156967163086, + "learning_rate": 1.9940282167086255e-05, + "loss": 1.5261, + "step": 2340 + }, + { + "epoch": 6.37874659400545, + "grad_norm": 12.822075843811035, + "learning_rate": 1.9940185827612638e-05, + "loss": 1.5405, + "step": 2341 + }, + { + "epoch": 6.381471389645776, + "grad_norm": 12.047752380371094, + "learning_rate": 1.9940089410725174e-05, + "loss": 1.5564, + "step": 2342 + }, + { + "epoch": 6.384196185286104, + "grad_norm": 33.5240364074707, + "learning_rate": 1.9939992916424614e-05, + "loss": 1.4438, + "step": 2343 + }, + { + "epoch": 6.386920980926431, + "grad_norm": 10.042675018310547, + "learning_rate": 1.9939896344711714e-05, + "loss": 1.6416, + "step": 2344 + }, + { + "epoch": 6.389645776566757, + "grad_norm": 11.133225440979004, + "learning_rate": 1.9939799695587213e-05, + "loss": 1.6123, + "step": 2345 + }, + { + "epoch": 6.392370572207085, + "grad_norm": 19.349576950073242, + "learning_rate": 1.9939702969051876e-05, + "loss": 1.5417, + "step": 2346 + }, + { + "epoch": 6.395095367847412, + "grad_norm": 15.16633415222168, + "learning_rate": 1.993960616510645e-05, + "loss": 1.5361, + "step": 2347 + }, + { + "epoch": 6.397820163487738, + "grad_norm": 10.151996612548828, + "learning_rate": 1.9939509283751696e-05, + "loss": 1.4199, + "step": 2348 + }, + { + "epoch": 6.400544959128065, + "grad_norm": 12.841211318969727, + "learning_rate": 1.993941232498836e-05, + "loss": 1.4395, + "step": 2349 + }, + { + "epoch": 6.4032697547683926, + "grad_norm": 14.988808631896973, + "learning_rate": 1.9939315288817203e-05, + "loss": 1.6819, + "step": 2350 + }, + { + "epoch": 6.405994550408719, + "grad_norm": 10.59081745147705, + "learning_rate": 1.993921817523898e-05, + "loss": 1.5515, + "step": 2351 + }, + { + "epoch": 6.408719346049046, + "grad_norm": 10.21403694152832, + "learning_rate": 1.993912098425444e-05, + "loss": 1.3684, + "step": 2352 + }, + { + "epoch": 6.4114441416893735, + "grad_norm": 16.891313552856445, + "learning_rate": 1.993902371586435e-05, + "loss": 1.6753, + "step": 2353 + }, + { + "epoch": 6.4141689373297, + "grad_norm": 12.440431594848633, + "learning_rate": 1.993892637006946e-05, + "loss": 1.7651, + "step": 2354 + }, + { + "epoch": 6.416893732970027, + "grad_norm": 11.252609252929688, + "learning_rate": 1.993882894687053e-05, + "loss": 1.739, + "step": 2355 + }, + { + "epoch": 6.419618528610354, + "grad_norm": 8.985031127929688, + "learning_rate": 1.993873144626833e-05, + "loss": 1.5359, + "step": 2356 + }, + { + "epoch": 6.422343324250681, + "grad_norm": 10.893987655639648, + "learning_rate": 1.9938633868263597e-05, + "loss": 1.7124, + "step": 2357 + }, + { + "epoch": 6.425068119891008, + "grad_norm": 9.890556335449219, + "learning_rate": 1.993853621285711e-05, + "loss": 1.3611, + "step": 2358 + }, + { + "epoch": 6.427792915531335, + "grad_norm": 9.026385307312012, + "learning_rate": 1.993843848004962e-05, + "loss": 1.677, + "step": 2359 + }, + { + "epoch": 6.430517711171662, + "grad_norm": 9.886550903320312, + "learning_rate": 1.9938340669841893e-05, + "loss": 1.4731, + "step": 2360 + }, + { + "epoch": 6.433242506811989, + "grad_norm": 9.005744934082031, + "learning_rate": 1.993824278223469e-05, + "loss": 1.6106, + "step": 2361 + }, + { + "epoch": 6.435967302452316, + "grad_norm": 13.120516777038574, + "learning_rate": 1.993814481722877e-05, + "loss": 1.626, + "step": 2362 + }, + { + "epoch": 6.438692098092643, + "grad_norm": 12.961750984191895, + "learning_rate": 1.9938046774824897e-05, + "loss": 1.6194, + "step": 2363 + }, + { + "epoch": 6.44141689373297, + "grad_norm": 11.148823738098145, + "learning_rate": 1.9937948655023838e-05, + "loss": 1.6655, + "step": 2364 + }, + { + "epoch": 6.444141689373297, + "grad_norm": 8.781012535095215, + "learning_rate": 1.9937850457826354e-05, + "loss": 1.5259, + "step": 2365 + }, + { + "epoch": 6.446866485013624, + "grad_norm": 11.232917785644531, + "learning_rate": 1.993775218323321e-05, + "loss": 1.6318, + "step": 2366 + }, + { + "epoch": 6.449591280653951, + "grad_norm": 13.188098907470703, + "learning_rate": 1.993765383124517e-05, + "loss": 1.7705, + "step": 2367 + }, + { + "epoch": 6.452316076294278, + "grad_norm": 17.013540267944336, + "learning_rate": 1.9937555401863005e-05, + "loss": 1.583, + "step": 2368 + }, + { + "epoch": 6.455040871934605, + "grad_norm": 10.890372276306152, + "learning_rate": 1.9937456895087477e-05, + "loss": 1.616, + "step": 2369 + }, + { + "epoch": 6.4577656675749315, + "grad_norm": 10.225186347961426, + "learning_rate": 1.9937358310919356e-05, + "loss": 1.6235, + "step": 2370 + }, + { + "epoch": 6.460490463215259, + "grad_norm": 12.753676414489746, + "learning_rate": 1.9937259649359406e-05, + "loss": 1.6106, + "step": 2371 + }, + { + "epoch": 6.463215258855586, + "grad_norm": 10.8523530960083, + "learning_rate": 1.9937160910408396e-05, + "loss": 1.7925, + "step": 2372 + }, + { + "epoch": 6.4659400544959125, + "grad_norm": 10.743764877319336, + "learning_rate": 1.99370620940671e-05, + "loss": 1.5129, + "step": 2373 + }, + { + "epoch": 6.46866485013624, + "grad_norm": 8.791482925415039, + "learning_rate": 1.9936963200336287e-05, + "loss": 1.4031, + "step": 2374 + }, + { + "epoch": 6.471389645776567, + "grad_norm": 8.918050765991211, + "learning_rate": 1.9936864229216718e-05, + "loss": 1.3892, + "step": 2375 + }, + { + "epoch": 6.474114441416893, + "grad_norm": 9.868968963623047, + "learning_rate": 1.9936765180709173e-05, + "loss": 1.4968, + "step": 2376 + }, + { + "epoch": 6.476839237057221, + "grad_norm": 12.836007118225098, + "learning_rate": 1.993666605481442e-05, + "loss": 1.4861, + "step": 2377 + }, + { + "epoch": 6.479564032697548, + "grad_norm": 10.597851753234863, + "learning_rate": 1.9936566851533232e-05, + "loss": 1.4966, + "step": 2378 + }, + { + "epoch": 6.482288828337874, + "grad_norm": 8.851969718933105, + "learning_rate": 1.9936467570866384e-05, + "loss": 1.2188, + "step": 2379 + }, + { + "epoch": 6.485013623978202, + "grad_norm": 11.105555534362793, + "learning_rate": 1.9936368212814643e-05, + "loss": 1.7676, + "step": 2380 + }, + { + "epoch": 6.487738419618529, + "grad_norm": 10.325815200805664, + "learning_rate": 1.9936268777378785e-05, + "loss": 1.4563, + "step": 2381 + }, + { + "epoch": 6.490463215258855, + "grad_norm": 9.311816215515137, + "learning_rate": 1.993616926455959e-05, + "loss": 1.4685, + "step": 2382 + }, + { + "epoch": 6.493188010899183, + "grad_norm": 9.058845520019531, + "learning_rate": 1.9936069674357826e-05, + "loss": 1.5105, + "step": 2383 + }, + { + "epoch": 6.4959128065395095, + "grad_norm": 24.743215560913086, + "learning_rate": 1.993597000677427e-05, + "loss": 1.5391, + "step": 2384 + }, + { + "epoch": 6.498637602179836, + "grad_norm": 10.185152053833008, + "learning_rate": 1.9935870261809703e-05, + "loss": 1.6858, + "step": 2385 + }, + { + "epoch": 6.501362397820164, + "grad_norm": 9.319504737854004, + "learning_rate": 1.9935770439464896e-05, + "loss": 1.5894, + "step": 2386 + }, + { + "epoch": 6.5040871934604905, + "grad_norm": 9.412171363830566, + "learning_rate": 1.9935670539740626e-05, + "loss": 1.5222, + "step": 2387 + }, + { + "epoch": 6.506811989100817, + "grad_norm": 16.216398239135742, + "learning_rate": 1.9935570562637675e-05, + "loss": 1.5078, + "step": 2388 + }, + { + "epoch": 6.509536784741145, + "grad_norm": 11.490829467773438, + "learning_rate": 1.993547050815682e-05, + "loss": 1.6562, + "step": 2389 + }, + { + "epoch": 6.512261580381471, + "grad_norm": 10.294737815856934, + "learning_rate": 1.9935370376298842e-05, + "loss": 1.4717, + "step": 2390 + }, + { + "epoch": 6.514986376021798, + "grad_norm": 31.39698028564453, + "learning_rate": 1.9935270167064523e-05, + "loss": 1.4307, + "step": 2391 + }, + { + "epoch": 6.517711171662126, + "grad_norm": 11.936128616333008, + "learning_rate": 1.9935169880454635e-05, + "loss": 1.5737, + "step": 2392 + }, + { + "epoch": 6.520435967302452, + "grad_norm": 15.877132415771484, + "learning_rate": 1.9935069516469964e-05, + "loss": 1.562, + "step": 2393 + }, + { + "epoch": 6.523160762942779, + "grad_norm": 10.936116218566895, + "learning_rate": 1.993496907511129e-05, + "loss": 1.6309, + "step": 2394 + }, + { + "epoch": 6.525885558583107, + "grad_norm": 8.006392478942871, + "learning_rate": 1.99348685563794e-05, + "loss": 1.4521, + "step": 2395 + }, + { + "epoch": 6.528610354223433, + "grad_norm": 11.510782241821289, + "learning_rate": 1.993476796027507e-05, + "loss": 1.6775, + "step": 2396 + }, + { + "epoch": 6.53133514986376, + "grad_norm": 15.735798835754395, + "learning_rate": 1.993466728679909e-05, + "loss": 1.6934, + "step": 2397 + }, + { + "epoch": 6.5340599455040875, + "grad_norm": 13.140318870544434, + "learning_rate": 1.993456653595224e-05, + "loss": 1.3596, + "step": 2398 + }, + { + "epoch": 6.536784741144414, + "grad_norm": 11.08877944946289, + "learning_rate": 1.9934465707735304e-05, + "loss": 1.6812, + "step": 2399 + }, + { + "epoch": 6.539509536784741, + "grad_norm": 12.190179824829102, + "learning_rate": 1.993436480214907e-05, + "loss": 1.4988, + "step": 2400 + }, + { + "epoch": 6.5422343324250685, + "grad_norm": 20.818950653076172, + "learning_rate": 1.993426381919432e-05, + "loss": 1.4949, + "step": 2401 + }, + { + "epoch": 6.544959128065395, + "grad_norm": 13.064900398254395, + "learning_rate": 1.993416275887185e-05, + "loss": 1.7405, + "step": 2402 + }, + { + "epoch": 6.547683923705722, + "grad_norm": 12.698445320129395, + "learning_rate": 1.9934061621182433e-05, + "loss": 1.5542, + "step": 2403 + }, + { + "epoch": 6.550408719346049, + "grad_norm": 11.332972526550293, + "learning_rate": 1.993396040612687e-05, + "loss": 1.4771, + "step": 2404 + }, + { + "epoch": 6.553133514986376, + "grad_norm": 14.005719184875488, + "learning_rate": 1.9933859113705937e-05, + "loss": 1.5176, + "step": 2405 + }, + { + "epoch": 6.555858310626703, + "grad_norm": 11.294587135314941, + "learning_rate": 1.9933757743920433e-05, + "loss": 1.6316, + "step": 2406 + }, + { + "epoch": 6.55858310626703, + "grad_norm": 10.821269035339355, + "learning_rate": 1.993365629677114e-05, + "loss": 1.6152, + "step": 2407 + }, + { + "epoch": 6.561307901907357, + "grad_norm": 10.606854438781738, + "learning_rate": 1.9933554772258853e-05, + "loss": 1.6602, + "step": 2408 + }, + { + "epoch": 6.564032697547684, + "grad_norm": 13.516182899475098, + "learning_rate": 1.9933453170384363e-05, + "loss": 1.5715, + "step": 2409 + }, + { + "epoch": 6.566757493188011, + "grad_norm": 10.468656539916992, + "learning_rate": 1.993335149114846e-05, + "loss": 1.4802, + "step": 2410 + }, + { + "epoch": 6.569482288828338, + "grad_norm": 11.097125053405762, + "learning_rate": 1.9933249734551934e-05, + "loss": 1.5691, + "step": 2411 + }, + { + "epoch": 6.572207084468665, + "grad_norm": 10.488286972045898, + "learning_rate": 1.9933147900595576e-05, + "loss": 1.6445, + "step": 2412 + }, + { + "epoch": 6.574931880108992, + "grad_norm": 14.706908226013184, + "learning_rate": 1.9933045989280188e-05, + "loss": 1.4363, + "step": 2413 + }, + { + "epoch": 6.577656675749319, + "grad_norm": 10.991456985473633, + "learning_rate": 1.993294400060655e-05, + "loss": 1.6826, + "step": 2414 + }, + { + "epoch": 6.580381471389646, + "grad_norm": 14.5840425491333, + "learning_rate": 1.9932841934575468e-05, + "loss": 1.8613, + "step": 2415 + }, + { + "epoch": 6.583106267029972, + "grad_norm": 13.031789779663086, + "learning_rate": 1.9932739791187733e-05, + "loss": 1.7136, + "step": 2416 + }, + { + "epoch": 6.5858310626703, + "grad_norm": 10.509198188781738, + "learning_rate": 1.9932637570444138e-05, + "loss": 1.4597, + "step": 2417 + }, + { + "epoch": 6.5885558583106265, + "grad_norm": 10.194021224975586, + "learning_rate": 1.9932535272345482e-05, + "loss": 1.6216, + "step": 2418 + }, + { + "epoch": 6.591280653950953, + "grad_norm": 7.701805114746094, + "learning_rate": 1.9932432896892563e-05, + "loss": 1.4561, + "step": 2419 + }, + { + "epoch": 6.594005449591281, + "grad_norm": 10.746231079101562, + "learning_rate": 1.9932330444086175e-05, + "loss": 1.6001, + "step": 2420 + }, + { + "epoch": 6.5967302452316074, + "grad_norm": 15.582562446594238, + "learning_rate": 1.993222791392712e-05, + "loss": 1.3887, + "step": 2421 + }, + { + "epoch": 6.599455040871934, + "grad_norm": 9.70804500579834, + "learning_rate": 1.9932125306416185e-05, + "loss": 1.5044, + "step": 2422 + }, + { + "epoch": 6.602179836512262, + "grad_norm": 10.683446884155273, + "learning_rate": 1.9932022621554185e-05, + "loss": 1.6841, + "step": 2423 + }, + { + "epoch": 6.604904632152588, + "grad_norm": 11.003694534301758, + "learning_rate": 1.993191985934191e-05, + "loss": 1.5566, + "step": 2424 + }, + { + "epoch": 6.607629427792915, + "grad_norm": 20.193443298339844, + "learning_rate": 1.9931817019780165e-05, + "loss": 1.7471, + "step": 2425 + }, + { + "epoch": 6.610354223433243, + "grad_norm": 10.888099670410156, + "learning_rate": 1.993171410286975e-05, + "loss": 1.5444, + "step": 2426 + }, + { + "epoch": 6.613079019073569, + "grad_norm": 9.50598430633545, + "learning_rate": 1.9931611108611458e-05, + "loss": 1.6055, + "step": 2427 + }, + { + "epoch": 6.615803814713896, + "grad_norm": 9.374114990234375, + "learning_rate": 1.9931508037006106e-05, + "loss": 1.6694, + "step": 2428 + }, + { + "epoch": 6.618528610354224, + "grad_norm": 10.345595359802246, + "learning_rate": 1.9931404888054486e-05, + "loss": 1.6248, + "step": 2429 + }, + { + "epoch": 6.62125340599455, + "grad_norm": 12.015646934509277, + "learning_rate": 1.99313016617574e-05, + "loss": 1.3783, + "step": 2430 + }, + { + "epoch": 6.623978201634877, + "grad_norm": 10.096620559692383, + "learning_rate": 1.9931198358115665e-05, + "loss": 1.2698, + "step": 2431 + }, + { + "epoch": 6.6267029972752045, + "grad_norm": 13.323445320129395, + "learning_rate": 1.9931094977130072e-05, + "loss": 1.5256, + "step": 2432 + }, + { + "epoch": 6.629427792915531, + "grad_norm": 10.597187995910645, + "learning_rate": 1.9930991518801434e-05, + "loss": 1.6113, + "step": 2433 + }, + { + "epoch": 6.632152588555858, + "grad_norm": 11.72788143157959, + "learning_rate": 1.993088798313055e-05, + "loss": 1.6721, + "step": 2434 + }, + { + "epoch": 6.6348773841961854, + "grad_norm": 12.03602123260498, + "learning_rate": 1.993078437011823e-05, + "loss": 1.6377, + "step": 2435 + }, + { + "epoch": 6.637602179836512, + "grad_norm": 10.530377388000488, + "learning_rate": 1.9930680679765283e-05, + "loss": 1.6748, + "step": 2436 + }, + { + "epoch": 6.640326975476839, + "grad_norm": 9.889983177185059, + "learning_rate": 1.9930576912072514e-05, + "loss": 1.6863, + "step": 2437 + }, + { + "epoch": 6.643051771117166, + "grad_norm": 16.77570152282715, + "learning_rate": 1.993047306704073e-05, + "loss": 1.4214, + "step": 2438 + }, + { + "epoch": 6.645776566757493, + "grad_norm": 9.434869766235352, + "learning_rate": 1.9930369144670744e-05, + "loss": 1.585, + "step": 2439 + }, + { + "epoch": 6.64850136239782, + "grad_norm": 10.706549644470215, + "learning_rate": 1.993026514496336e-05, + "loss": 1.6279, + "step": 2440 + }, + { + "epoch": 6.651226158038147, + "grad_norm": 10.672386169433594, + "learning_rate": 1.9930161067919392e-05, + "loss": 1.5964, + "step": 2441 + }, + { + "epoch": 6.653950953678474, + "grad_norm": 14.484672546386719, + "learning_rate": 1.9930056913539647e-05, + "loss": 1.6155, + "step": 2442 + }, + { + "epoch": 6.656675749318801, + "grad_norm": 9.874717712402344, + "learning_rate": 1.9929952681824944e-05, + "loss": 1.6836, + "step": 2443 + }, + { + "epoch": 6.659400544959128, + "grad_norm": 10.416218757629395, + "learning_rate": 1.9929848372776085e-05, + "loss": 1.6025, + "step": 2444 + }, + { + "epoch": 6.662125340599455, + "grad_norm": 12.917311668395996, + "learning_rate": 1.9929743986393886e-05, + "loss": 1.6995, + "step": 2445 + }, + { + "epoch": 6.664850136239782, + "grad_norm": 10.260004043579102, + "learning_rate": 1.9929639522679163e-05, + "loss": 1.4712, + "step": 2446 + }, + { + "epoch": 6.667574931880109, + "grad_norm": 8.553717613220215, + "learning_rate": 1.9929534981632726e-05, + "loss": 1.572, + "step": 2447 + }, + { + "epoch": 6.670299727520436, + "grad_norm": 8.03495979309082, + "learning_rate": 1.9929430363255387e-05, + "loss": 1.3491, + "step": 2448 + }, + { + "epoch": 6.6730245231607626, + "grad_norm": 8.828189849853516, + "learning_rate": 1.9929325667547968e-05, + "loss": 1.6265, + "step": 2449 + }, + { + "epoch": 6.67574931880109, + "grad_norm": 10.107748031616211, + "learning_rate": 1.9929220894511275e-05, + "loss": 1.5894, + "step": 2450 + }, + { + "epoch": 6.678474114441417, + "grad_norm": 10.143497467041016, + "learning_rate": 1.9929116044146137e-05, + "loss": 1.6353, + "step": 2451 + }, + { + "epoch": 6.6811989100817435, + "grad_norm": 11.173709869384766, + "learning_rate": 1.9929011116453358e-05, + "loss": 1.6279, + "step": 2452 + }, + { + "epoch": 6.683923705722071, + "grad_norm": 10.3662109375, + "learning_rate": 1.9928906111433762e-05, + "loss": 1.4197, + "step": 2453 + }, + { + "epoch": 6.686648501362398, + "grad_norm": 9.1519775390625, + "learning_rate": 1.9928801029088162e-05, + "loss": 1.4307, + "step": 2454 + }, + { + "epoch": 6.689373297002724, + "grad_norm": 11.98711109161377, + "learning_rate": 1.9928695869417383e-05, + "loss": 1.7588, + "step": 2455 + }, + { + "epoch": 6.692098092643052, + "grad_norm": 12.33102798461914, + "learning_rate": 1.9928590632422236e-05, + "loss": 1.5356, + "step": 2456 + }, + { + "epoch": 6.694822888283379, + "grad_norm": 13.80027961730957, + "learning_rate": 1.9928485318103545e-05, + "loss": 1.5417, + "step": 2457 + }, + { + "epoch": 6.697547683923705, + "grad_norm": 11.349905967712402, + "learning_rate": 1.992837992646213e-05, + "loss": 1.8628, + "step": 2458 + }, + { + "epoch": 6.700272479564033, + "grad_norm": 12.577153205871582, + "learning_rate": 1.9928274457498818e-05, + "loss": 1.5457, + "step": 2459 + }, + { + "epoch": 6.70299727520436, + "grad_norm": 12.215507507324219, + "learning_rate": 1.9928168911214415e-05, + "loss": 1.5699, + "step": 2460 + }, + { + "epoch": 6.705722070844686, + "grad_norm": 11.409568786621094, + "learning_rate": 1.9928063287609758e-05, + "loss": 1.6504, + "step": 2461 + }, + { + "epoch": 6.708446866485014, + "grad_norm": 11.919694900512695, + "learning_rate": 1.9927957586685664e-05, + "loss": 1.5984, + "step": 2462 + }, + { + "epoch": 6.7111716621253406, + "grad_norm": 11.449212074279785, + "learning_rate": 1.992785180844295e-05, + "loss": 1.5847, + "step": 2463 + }, + { + "epoch": 6.713896457765667, + "grad_norm": 9.151398658752441, + "learning_rate": 1.9927745952882452e-05, + "loss": 1.5081, + "step": 2464 + }, + { + "epoch": 6.716621253405995, + "grad_norm": 10.904823303222656, + "learning_rate": 1.9927640020004985e-05, + "loss": 1.5444, + "step": 2465 + }, + { + "epoch": 6.7193460490463215, + "grad_norm": 9.86526870727539, + "learning_rate": 1.9927534009811377e-05, + "loss": 1.6147, + "step": 2466 + }, + { + "epoch": 6.722070844686648, + "grad_norm": 10.476258277893066, + "learning_rate": 1.9927427922302452e-05, + "loss": 1.6111, + "step": 2467 + }, + { + "epoch": 6.724795640326976, + "grad_norm": 9.763236045837402, + "learning_rate": 1.9927321757479043e-05, + "loss": 1.4932, + "step": 2468 + }, + { + "epoch": 6.727520435967302, + "grad_norm": 12.400291442871094, + "learning_rate": 1.992721551534197e-05, + "loss": 1.491, + "step": 2469 + }, + { + "epoch": 6.730245231607629, + "grad_norm": 11.978157043457031, + "learning_rate": 1.9927109195892062e-05, + "loss": 1.4448, + "step": 2470 + }, + { + "epoch": 6.732970027247957, + "grad_norm": 9.739986419677734, + "learning_rate": 1.9927002799130144e-05, + "loss": 1.7478, + "step": 2471 + }, + { + "epoch": 6.735694822888283, + "grad_norm": 10.663016319274902, + "learning_rate": 1.992689632505705e-05, + "loss": 1.5623, + "step": 2472 + }, + { + "epoch": 6.73841961852861, + "grad_norm": 12.673657417297363, + "learning_rate": 1.9926789773673606e-05, + "loss": 1.771, + "step": 2473 + }, + { + "epoch": 6.741144414168938, + "grad_norm": 13.936773300170898, + "learning_rate": 1.9926683144980643e-05, + "loss": 1.7021, + "step": 2474 + }, + { + "epoch": 6.743869209809264, + "grad_norm": 11.60373592376709, + "learning_rate": 1.992657643897899e-05, + "loss": 1.7454, + "step": 2475 + }, + { + "epoch": 6.746594005449591, + "grad_norm": 10.127052307128906, + "learning_rate": 1.992646965566948e-05, + "loss": 1.5261, + "step": 2476 + }, + { + "epoch": 6.7493188010899186, + "grad_norm": 11.759267807006836, + "learning_rate": 1.9926362795052947e-05, + "loss": 1.5005, + "step": 2477 + }, + { + "epoch": 6.752043596730245, + "grad_norm": 13.64344596862793, + "learning_rate": 1.9926255857130216e-05, + "loss": 1.645, + "step": 2478 + }, + { + "epoch": 6.754768392370572, + "grad_norm": 11.076778411865234, + "learning_rate": 1.9926148841902123e-05, + "loss": 1.4646, + "step": 2479 + }, + { + "epoch": 6.7574931880108995, + "grad_norm": 15.128584861755371, + "learning_rate": 1.9926041749369507e-05, + "loss": 1.6904, + "step": 2480 + }, + { + "epoch": 6.760217983651226, + "grad_norm": 11.720351219177246, + "learning_rate": 1.9925934579533195e-05, + "loss": 1.728, + "step": 2481 + }, + { + "epoch": 6.762942779291553, + "grad_norm": 8.59024429321289, + "learning_rate": 1.9925827332394023e-05, + "loss": 1.4097, + "step": 2482 + }, + { + "epoch": 6.76566757493188, + "grad_norm": 13.756746292114258, + "learning_rate": 1.9925720007952826e-05, + "loss": 1.6008, + "step": 2483 + }, + { + "epoch": 6.768392370572207, + "grad_norm": 11.337132453918457, + "learning_rate": 1.9925612606210446e-05, + "loss": 1.4539, + "step": 2484 + }, + { + "epoch": 6.771117166212534, + "grad_norm": 11.355990409851074, + "learning_rate": 1.992550512716771e-05, + "loss": 1.738, + "step": 2485 + }, + { + "epoch": 6.773841961852861, + "grad_norm": 12.595316886901855, + "learning_rate": 1.9925397570825463e-05, + "loss": 1.6526, + "step": 2486 + }, + { + "epoch": 6.776566757493188, + "grad_norm": 10.657020568847656, + "learning_rate": 1.9925289937184534e-05, + "loss": 1.6196, + "step": 2487 + }, + { + "epoch": 6.779291553133515, + "grad_norm": 12.440933227539062, + "learning_rate": 1.992518222624577e-05, + "loss": 1.6235, + "step": 2488 + }, + { + "epoch": 6.782016348773842, + "grad_norm": 9.319437026977539, + "learning_rate": 1.992507443801001e-05, + "loss": 1.6362, + "step": 2489 + }, + { + "epoch": 6.784741144414169, + "grad_norm": 41.49929428100586, + "learning_rate": 1.9924966572478083e-05, + "loss": 1.5034, + "step": 2490 + }, + { + "epoch": 6.787465940054496, + "grad_norm": 15.431757926940918, + "learning_rate": 1.992485862965084e-05, + "loss": 1.4822, + "step": 2491 + }, + { + "epoch": 6.790190735694823, + "grad_norm": 13.493185043334961, + "learning_rate": 1.9924750609529116e-05, + "loss": 1.4744, + "step": 2492 + }, + { + "epoch": 6.79291553133515, + "grad_norm": 18.08843421936035, + "learning_rate": 1.992464251211375e-05, + "loss": 1.6089, + "step": 2493 + }, + { + "epoch": 6.795640326975477, + "grad_norm": 12.009065628051758, + "learning_rate": 1.992453433740559e-05, + "loss": 1.6089, + "step": 2494 + }, + { + "epoch": 6.798365122615804, + "grad_norm": 11.761157989501953, + "learning_rate": 1.9924426085405478e-05, + "loss": 1.5273, + "step": 2495 + }, + { + "epoch": 6.801089918256131, + "grad_norm": 10.267550468444824, + "learning_rate": 1.9924317756114255e-05, + "loss": 1.5486, + "step": 2496 + }, + { + "epoch": 6.8038147138964575, + "grad_norm": 11.865041732788086, + "learning_rate": 1.9924209349532763e-05, + "loss": 1.5554, + "step": 2497 + }, + { + "epoch": 6.806539509536785, + "grad_norm": 9.561129570007324, + "learning_rate": 1.992410086566185e-05, + "loss": 1.4812, + "step": 2498 + }, + { + "epoch": 6.809264305177112, + "grad_norm": 9.084714889526367, + "learning_rate": 1.9923992304502357e-05, + "loss": 1.3855, + "step": 2499 + }, + { + "epoch": 6.8119891008174385, + "grad_norm": 12.381909370422363, + "learning_rate": 1.9923883666055133e-05, + "loss": 1.5867, + "step": 2500 + }, + { + "epoch": 6.814713896457766, + "grad_norm": 15.723135948181152, + "learning_rate": 1.992377495032102e-05, + "loss": 1.6187, + "step": 2501 + }, + { + "epoch": 6.817438692098093, + "grad_norm": 16.490381240844727, + "learning_rate": 1.992366615730087e-05, + "loss": 1.6401, + "step": 2502 + }, + { + "epoch": 6.820163487738419, + "grad_norm": 13.186235427856445, + "learning_rate": 1.9923557286995524e-05, + "loss": 1.4634, + "step": 2503 + }, + { + "epoch": 6.822888283378747, + "grad_norm": 12.261408805847168, + "learning_rate": 1.9923448339405835e-05, + "loss": 1.4092, + "step": 2504 + }, + { + "epoch": 6.825613079019074, + "grad_norm": 21.39244842529297, + "learning_rate": 1.992333931453265e-05, + "loss": 1.6294, + "step": 2505 + }, + { + "epoch": 6.8283378746594, + "grad_norm": 12.436821937561035, + "learning_rate": 1.992323021237682e-05, + "loss": 1.5833, + "step": 2506 + }, + { + "epoch": 6.831062670299728, + "grad_norm": 13.260921478271484, + "learning_rate": 1.992312103293919e-05, + "loss": 1.5767, + "step": 2507 + }, + { + "epoch": 6.833787465940055, + "grad_norm": 15.177225112915039, + "learning_rate": 1.9923011776220612e-05, + "loss": 1.5896, + "step": 2508 + }, + { + "epoch": 6.836512261580381, + "grad_norm": 15.003098487854004, + "learning_rate": 1.992290244222194e-05, + "loss": 1.8267, + "step": 2509 + }, + { + "epoch": 6.839237057220709, + "grad_norm": 11.336455345153809, + "learning_rate": 1.992279303094402e-05, + "loss": 1.5039, + "step": 2510 + }, + { + "epoch": 6.8419618528610355, + "grad_norm": 11.886491775512695, + "learning_rate": 1.9922683542387707e-05, + "loss": 1.6057, + "step": 2511 + }, + { + "epoch": 6.844686648501362, + "grad_norm": 14.85074234008789, + "learning_rate": 1.9922573976553857e-05, + "loss": 1.7595, + "step": 2512 + }, + { + "epoch": 6.84741144414169, + "grad_norm": 11.935297966003418, + "learning_rate": 1.9922464333443318e-05, + "loss": 1.4692, + "step": 2513 + }, + { + "epoch": 6.8501362397820165, + "grad_norm": 12.974621772766113, + "learning_rate": 1.9922354613056946e-05, + "loss": 1.5085, + "step": 2514 + }, + { + "epoch": 6.852861035422343, + "grad_norm": 10.358409881591797, + "learning_rate": 1.9922244815395597e-05, + "loss": 1.4092, + "step": 2515 + }, + { + "epoch": 6.855585831062671, + "grad_norm": 29.964595794677734, + "learning_rate": 1.9922134940460126e-05, + "loss": 1.5103, + "step": 2516 + }, + { + "epoch": 6.858310626702997, + "grad_norm": 12.04236125946045, + "learning_rate": 1.9922024988251384e-05, + "loss": 1.4392, + "step": 2517 + }, + { + "epoch": 6.861035422343324, + "grad_norm": 10.837052345275879, + "learning_rate": 1.9921914958770235e-05, + "loss": 1.5547, + "step": 2518 + }, + { + "epoch": 6.863760217983652, + "grad_norm": 12.022932052612305, + "learning_rate": 1.992180485201753e-05, + "loss": 1.5935, + "step": 2519 + }, + { + "epoch": 6.866485013623978, + "grad_norm": 13.637711524963379, + "learning_rate": 1.9921694667994126e-05, + "loss": 1.749, + "step": 2520 + }, + { + "epoch": 6.869209809264305, + "grad_norm": 10.001995086669922, + "learning_rate": 1.9921584406700883e-05, + "loss": 1.918, + "step": 2521 + }, + { + "epoch": 6.871934604904633, + "grad_norm": 29.265378952026367, + "learning_rate": 1.9921474068138665e-05, + "loss": 1.5459, + "step": 2522 + }, + { + "epoch": 6.874659400544959, + "grad_norm": 12.276293754577637, + "learning_rate": 1.9921363652308324e-05, + "loss": 1.4941, + "step": 2523 + }, + { + "epoch": 6.877384196185286, + "grad_norm": 11.9083251953125, + "learning_rate": 1.9921253159210718e-05, + "loss": 1.6221, + "step": 2524 + }, + { + "epoch": 6.8801089918256135, + "grad_norm": 11.969018936157227, + "learning_rate": 1.9921142588846717e-05, + "loss": 1.5964, + "step": 2525 + }, + { + "epoch": 6.88283378746594, + "grad_norm": 9.593964576721191, + "learning_rate": 1.9921031941217173e-05, + "loss": 1.458, + "step": 2526 + }, + { + "epoch": 6.885558583106267, + "grad_norm": 9.690338134765625, + "learning_rate": 1.9920921216322953e-05, + "loss": 1.3936, + "step": 2527 + }, + { + "epoch": 6.8882833787465945, + "grad_norm": 10.085105895996094, + "learning_rate": 1.992081041416492e-05, + "loss": 1.5444, + "step": 2528 + }, + { + "epoch": 6.891008174386921, + "grad_norm": 14.536722183227539, + "learning_rate": 1.9920699534743932e-05, + "loss": 1.7988, + "step": 2529 + }, + { + "epoch": 6.893732970027248, + "grad_norm": 10.853922843933105, + "learning_rate": 1.9920588578060854e-05, + "loss": 1.6394, + "step": 2530 + }, + { + "epoch": 6.896457765667575, + "grad_norm": 12.865930557250977, + "learning_rate": 1.9920477544116554e-05, + "loss": 1.481, + "step": 2531 + }, + { + "epoch": 6.899182561307902, + "grad_norm": 9.311355590820312, + "learning_rate": 1.9920366432911895e-05, + "loss": 1.7463, + "step": 2532 + }, + { + "epoch": 6.901907356948229, + "grad_norm": 13.008605003356934, + "learning_rate": 1.992025524444774e-05, + "loss": 1.6851, + "step": 2533 + }, + { + "epoch": 6.904632152588556, + "grad_norm": 17.339941024780273, + "learning_rate": 1.9920143978724958e-05, + "loss": 1.6743, + "step": 2534 + }, + { + "epoch": 6.907356948228883, + "grad_norm": 11.650899887084961, + "learning_rate": 1.992003263574441e-05, + "loss": 1.675, + "step": 2535 + }, + { + "epoch": 6.91008174386921, + "grad_norm": 9.174309730529785, + "learning_rate": 1.991992121550697e-05, + "loss": 1.5598, + "step": 2536 + }, + { + "epoch": 6.912806539509537, + "grad_norm": 9.838683128356934, + "learning_rate": 1.9919809718013505e-05, + "loss": 1.48, + "step": 2537 + }, + { + "epoch": 6.915531335149864, + "grad_norm": 8.482483863830566, + "learning_rate": 1.991969814326488e-05, + "loss": 1.5427, + "step": 2538 + }, + { + "epoch": 6.918256130790191, + "grad_norm": 11.64597225189209, + "learning_rate": 1.9919586491261962e-05, + "loss": 1.6533, + "step": 2539 + }, + { + "epoch": 6.920980926430518, + "grad_norm": 11.544082641601562, + "learning_rate": 1.9919474762005625e-05, + "loss": 1.8208, + "step": 2540 + }, + { + "epoch": 6.923705722070845, + "grad_norm": 12.081391334533691, + "learning_rate": 1.991936295549674e-05, + "loss": 1.7241, + "step": 2541 + }, + { + "epoch": 6.926430517711172, + "grad_norm": 12.315491676330566, + "learning_rate": 1.9919251071736176e-05, + "loss": 1.6943, + "step": 2542 + }, + { + "epoch": 6.929155313351498, + "grad_norm": 8.521120071411133, + "learning_rate": 1.9919139110724798e-05, + "loss": 1.6357, + "step": 2543 + }, + { + "epoch": 6.931880108991826, + "grad_norm": 9.169511795043945, + "learning_rate": 1.991902707246349e-05, + "loss": 1.5173, + "step": 2544 + }, + { + "epoch": 6.9346049046321525, + "grad_norm": 9.596213340759277, + "learning_rate": 1.9918914956953116e-05, + "loss": 1.5217, + "step": 2545 + }, + { + "epoch": 6.937329700272479, + "grad_norm": 8.34455394744873, + "learning_rate": 1.991880276419455e-05, + "loss": 1.5686, + "step": 2546 + }, + { + "epoch": 6.940054495912807, + "grad_norm": 9.147504806518555, + "learning_rate": 1.991869049418867e-05, + "loss": 1.4917, + "step": 2547 + }, + { + "epoch": 6.9427792915531334, + "grad_norm": 11.00312614440918, + "learning_rate": 1.9918578146936346e-05, + "loss": 1.8115, + "step": 2548 + }, + { + "epoch": 6.94550408719346, + "grad_norm": 11.378459930419922, + "learning_rate": 1.9918465722438456e-05, + "loss": 1.6875, + "step": 2549 + }, + { + "epoch": 6.948228882833788, + "grad_norm": 9.615368843078613, + "learning_rate": 1.9918353220695875e-05, + "loss": 1.6191, + "step": 2550 + }, + { + "epoch": 6.950953678474114, + "grad_norm": 8.775830268859863, + "learning_rate": 1.9918240641709475e-05, + "loss": 1.5447, + "step": 2551 + }, + { + "epoch": 6.953678474114441, + "grad_norm": 9.215841293334961, + "learning_rate": 1.991812798548014e-05, + "loss": 1.7075, + "step": 2552 + }, + { + "epoch": 6.956403269754769, + "grad_norm": 11.271383285522461, + "learning_rate": 1.991801525200874e-05, + "loss": 1.5977, + "step": 2553 + }, + { + "epoch": 6.959128065395095, + "grad_norm": 9.250890731811523, + "learning_rate": 1.9917902441296156e-05, + "loss": 1.6226, + "step": 2554 + }, + { + "epoch": 6.961852861035422, + "grad_norm": 8.830961227416992, + "learning_rate": 1.991778955334327e-05, + "loss": 1.5269, + "step": 2555 + }, + { + "epoch": 6.96457765667575, + "grad_norm": 11.751460075378418, + "learning_rate": 1.991767658815096e-05, + "loss": 1.7437, + "step": 2556 + }, + { + "epoch": 6.967302452316076, + "grad_norm": 12.019865036010742, + "learning_rate": 1.9917563545720098e-05, + "loss": 1.7788, + "step": 2557 + }, + { + "epoch": 6.970027247956403, + "grad_norm": 9.664366722106934, + "learning_rate": 1.9917450426051572e-05, + "loss": 1.595, + "step": 2558 + }, + { + "epoch": 6.9727520435967305, + "grad_norm": 10.568838119506836, + "learning_rate": 1.9917337229146266e-05, + "loss": 1.5591, + "step": 2559 + }, + { + "epoch": 6.975476839237057, + "grad_norm": 7.393206596374512, + "learning_rate": 1.9917223955005053e-05, + "loss": 1.4487, + "step": 2560 + }, + { + "epoch": 6.978201634877384, + "grad_norm": 9.041869163513184, + "learning_rate": 1.9917110603628818e-05, + "loss": 1.5823, + "step": 2561 + }, + { + "epoch": 6.9809264305177114, + "grad_norm": 8.957469940185547, + "learning_rate": 1.9916997175018445e-05, + "loss": 1.4365, + "step": 2562 + }, + { + "epoch": 6.983651226158038, + "grad_norm": 8.627134323120117, + "learning_rate": 1.9916883669174818e-05, + "loss": 1.5144, + "step": 2563 + }, + { + "epoch": 6.986376021798365, + "grad_norm": 9.489056587219238, + "learning_rate": 1.991677008609882e-05, + "loss": 1.6389, + "step": 2564 + }, + { + "epoch": 6.989100817438692, + "grad_norm": 10.777949333190918, + "learning_rate": 1.9916656425791338e-05, + "loss": 1.3235, + "step": 2565 + }, + { + "epoch": 6.991825613079019, + "grad_norm": 11.10266399383545, + "learning_rate": 1.9916542688253253e-05, + "loss": 1.6667, + "step": 2566 + }, + { + "epoch": 6.994550408719346, + "grad_norm": 16.274316787719727, + "learning_rate": 1.9916428873485452e-05, + "loss": 1.7275, + "step": 2567 + }, + { + "epoch": 6.997275204359673, + "grad_norm": 10.998518943786621, + "learning_rate": 1.9916314981488822e-05, + "loss": 1.5061, + "step": 2568 + }, + { + "epoch": 7.0, + "grad_norm": 13.744210243225098, + "learning_rate": 1.9916201012264255e-05, + "loss": 1.4661, + "step": 2569 + }, + { + "epoch": 7.002724795640327, + "grad_norm": 12.455055236816406, + "learning_rate": 1.9916086965812627e-05, + "loss": 1.5776, + "step": 2570 + }, + { + "epoch": 7.005449591280654, + "grad_norm": 8.5689115524292, + "learning_rate": 1.9915972842134837e-05, + "loss": 1.5989, + "step": 2571 + }, + { + "epoch": 7.008174386920981, + "grad_norm": 9.611258506774902, + "learning_rate": 1.991585864123177e-05, + "loss": 1.5684, + "step": 2572 + }, + { + "epoch": 7.010899182561308, + "grad_norm": 10.000003814697266, + "learning_rate": 1.991574436310431e-05, + "loss": 1.6243, + "step": 2573 + }, + { + "epoch": 7.013623978201635, + "grad_norm": 9.323932647705078, + "learning_rate": 1.991563000775336e-05, + "loss": 1.6792, + "step": 2574 + }, + { + "epoch": 7.016348773841962, + "grad_norm": 13.849161148071289, + "learning_rate": 1.9915515575179793e-05, + "loss": 1.4006, + "step": 2575 + }, + { + "epoch": 7.0190735694822886, + "grad_norm": 12.729543685913086, + "learning_rate": 1.9915401065384518e-05, + "loss": 1.6182, + "step": 2576 + }, + { + "epoch": 7.021798365122616, + "grad_norm": 9.167952537536621, + "learning_rate": 1.9915286478368414e-05, + "loss": 1.5718, + "step": 2577 + }, + { + "epoch": 7.024523160762943, + "grad_norm": 10.326859474182129, + "learning_rate": 1.9915171814132378e-05, + "loss": 1.3718, + "step": 2578 + }, + { + "epoch": 7.0272479564032695, + "grad_norm": 9.17179012298584, + "learning_rate": 1.9915057072677305e-05, + "loss": 1.4885, + "step": 2579 + }, + { + "epoch": 7.029972752043597, + "grad_norm": 10.229643821716309, + "learning_rate": 1.9914942254004086e-05, + "loss": 1.668, + "step": 2580 + }, + { + "epoch": 7.032697547683924, + "grad_norm": 12.10188102722168, + "learning_rate": 1.9914827358113616e-05, + "loss": 1.3757, + "step": 2581 + }, + { + "epoch": 7.03542234332425, + "grad_norm": 8.516680717468262, + "learning_rate": 1.991471238500679e-05, + "loss": 1.5469, + "step": 2582 + }, + { + "epoch": 7.038147138964578, + "grad_norm": 16.977920532226562, + "learning_rate": 1.9914597334684502e-05, + "loss": 1.5964, + "step": 2583 + }, + { + "epoch": 7.040871934604905, + "grad_norm": 10.091428756713867, + "learning_rate": 1.9914482207147648e-05, + "loss": 1.5515, + "step": 2584 + }, + { + "epoch": 7.043596730245231, + "grad_norm": 11.44006061553955, + "learning_rate": 1.9914367002397127e-05, + "loss": 1.5601, + "step": 2585 + }, + { + "epoch": 7.046321525885559, + "grad_norm": 10.585381507873535, + "learning_rate": 1.9914251720433837e-05, + "loss": 1.3669, + "step": 2586 + }, + { + "epoch": 7.049046321525886, + "grad_norm": 12.6299467086792, + "learning_rate": 1.9914136361258673e-05, + "loss": 1.7812, + "step": 2587 + }, + { + "epoch": 7.051771117166212, + "grad_norm": 23.789104461669922, + "learning_rate": 1.991402092487253e-05, + "loss": 1.6086, + "step": 2588 + }, + { + "epoch": 7.05449591280654, + "grad_norm": 10.832141876220703, + "learning_rate": 1.991390541127632e-05, + "loss": 1.5283, + "step": 2589 + }, + { + "epoch": 7.0572207084468666, + "grad_norm": 9.405333518981934, + "learning_rate": 1.9913789820470925e-05, + "loss": 1.6958, + "step": 2590 + }, + { + "epoch": 7.059945504087193, + "grad_norm": 10.257238388061523, + "learning_rate": 1.9913674152457254e-05, + "loss": 1.4604, + "step": 2591 + }, + { + "epoch": 7.062670299727521, + "grad_norm": 9.994807243347168, + "learning_rate": 1.991355840723621e-05, + "loss": 1.5125, + "step": 2592 + }, + { + "epoch": 7.0653950953678475, + "grad_norm": 10.089841842651367, + "learning_rate": 1.9913442584808694e-05, + "loss": 1.4565, + "step": 2593 + }, + { + "epoch": 7.068119891008174, + "grad_norm": 9.78079605102539, + "learning_rate": 1.9913326685175606e-05, + "loss": 1.4182, + "step": 2594 + }, + { + "epoch": 7.070844686648502, + "grad_norm": 15.902073860168457, + "learning_rate": 1.991321070833785e-05, + "loss": 1.3955, + "step": 2595 + }, + { + "epoch": 7.073569482288828, + "grad_norm": 17.8822078704834, + "learning_rate": 1.9913094654296324e-05, + "loss": 1.4043, + "step": 2596 + }, + { + "epoch": 7.076294277929155, + "grad_norm": 13.469987869262695, + "learning_rate": 1.9912978523051936e-05, + "loss": 1.3516, + "step": 2597 + }, + { + "epoch": 7.079019073569483, + "grad_norm": 18.184144973754883, + "learning_rate": 1.9912862314605594e-05, + "loss": 1.4761, + "step": 2598 + }, + { + "epoch": 7.081743869209809, + "grad_norm": 10.457294464111328, + "learning_rate": 1.9912746028958195e-05, + "loss": 1.5325, + "step": 2599 + }, + { + "epoch": 7.084468664850136, + "grad_norm": 13.190240859985352, + "learning_rate": 1.9912629666110656e-05, + "loss": 1.5283, + "step": 2600 + }, + { + "epoch": 7.087193460490464, + "grad_norm": 12.5562105178833, + "learning_rate": 1.9912513226063866e-05, + "loss": 1.3442, + "step": 2601 + }, + { + "epoch": 7.08991825613079, + "grad_norm": 11.620115280151367, + "learning_rate": 1.9912396708818748e-05, + "loss": 1.5303, + "step": 2602 + }, + { + "epoch": 7.092643051771117, + "grad_norm": 16.161975860595703, + "learning_rate": 1.9912280114376205e-05, + "loss": 1.7246, + "step": 2603 + }, + { + "epoch": 7.0953678474114446, + "grad_norm": 12.94520378112793, + "learning_rate": 1.9912163442737143e-05, + "loss": 1.4026, + "step": 2604 + }, + { + "epoch": 7.098092643051771, + "grad_norm": 32.33180236816406, + "learning_rate": 1.9912046693902466e-05, + "loss": 1.6226, + "step": 2605 + }, + { + "epoch": 7.100817438692098, + "grad_norm": 14.084209442138672, + "learning_rate": 1.9911929867873093e-05, + "loss": 1.6404, + "step": 2606 + }, + { + "epoch": 7.1035422343324255, + "grad_norm": 12.616997718811035, + "learning_rate": 1.991181296464993e-05, + "loss": 1.3081, + "step": 2607 + }, + { + "epoch": 7.106267029972752, + "grad_norm": 11.319100379943848, + "learning_rate": 1.9911695984233885e-05, + "loss": 1.3953, + "step": 2608 + }, + { + "epoch": 7.108991825613079, + "grad_norm": 19.24335289001465, + "learning_rate": 1.991157892662587e-05, + "loss": 1.5649, + "step": 2609 + }, + { + "epoch": 7.111716621253406, + "grad_norm": 19.046993255615234, + "learning_rate": 1.99114617918268e-05, + "loss": 1.4734, + "step": 2610 + }, + { + "epoch": 7.114441416893733, + "grad_norm": 35.106143951416016, + "learning_rate": 1.991134457983758e-05, + "loss": 1.6211, + "step": 2611 + }, + { + "epoch": 7.11716621253406, + "grad_norm": 12.001912117004395, + "learning_rate": 1.991122729065913e-05, + "loss": 1.5916, + "step": 2612 + }, + { + "epoch": 7.1198910081743865, + "grad_norm": 14.034006118774414, + "learning_rate": 1.9911109924292362e-05, + "loss": 1.3315, + "step": 2613 + }, + { + "epoch": 7.122615803814714, + "grad_norm": 24.54100799560547, + "learning_rate": 1.991099248073819e-05, + "loss": 1.3369, + "step": 2614 + }, + { + "epoch": 7.125340599455041, + "grad_norm": 18.295448303222656, + "learning_rate": 1.991087495999752e-05, + "loss": 1.4895, + "step": 2615 + }, + { + "epoch": 7.128065395095367, + "grad_norm": 10.534333229064941, + "learning_rate": 1.9910757362071282e-05, + "loss": 1.282, + "step": 2616 + }, + { + "epoch": 7.130790190735695, + "grad_norm": 16.28651237487793, + "learning_rate": 1.9910639686960382e-05, + "loss": 1.387, + "step": 2617 + }, + { + "epoch": 7.133514986376022, + "grad_norm": 17.221111297607422, + "learning_rate": 1.991052193466574e-05, + "loss": 1.5898, + "step": 2618 + }, + { + "epoch": 7.136239782016348, + "grad_norm": 12.247292518615723, + "learning_rate": 1.991040410518827e-05, + "loss": 1.3435, + "step": 2619 + }, + { + "epoch": 7.138964577656676, + "grad_norm": 14.799015998840332, + "learning_rate": 1.9910286198528897e-05, + "loss": 1.5859, + "step": 2620 + }, + { + "epoch": 7.141689373297003, + "grad_norm": 13.674405097961426, + "learning_rate": 1.9910168214688527e-05, + "loss": 1.4153, + "step": 2621 + }, + { + "epoch": 7.144414168937329, + "grad_norm": 54.96337890625, + "learning_rate": 1.991005015366809e-05, + "loss": 1.3645, + "step": 2622 + }, + { + "epoch": 7.147138964577657, + "grad_norm": 19.959274291992188, + "learning_rate": 1.9909932015468504e-05, + "loss": 1.5613, + "step": 2623 + }, + { + "epoch": 7.1498637602179835, + "grad_norm": 15.985265731811523, + "learning_rate": 1.9909813800090682e-05, + "loss": 1.4902, + "step": 2624 + }, + { + "epoch": 7.15258855585831, + "grad_norm": 19.88857650756836, + "learning_rate": 1.9909695507535552e-05, + "loss": 1.5559, + "step": 2625 + }, + { + "epoch": 7.155313351498638, + "grad_norm": 18.16654396057129, + "learning_rate": 1.9909577137804028e-05, + "loss": 1.4475, + "step": 2626 + }, + { + "epoch": 7.1580381471389645, + "grad_norm": 18.870697021484375, + "learning_rate": 1.9909458690897038e-05, + "loss": 1.2856, + "step": 2627 + }, + { + "epoch": 7.160762942779291, + "grad_norm": 35.931060791015625, + "learning_rate": 1.9909340166815504e-05, + "loss": 1.5642, + "step": 2628 + }, + { + "epoch": 7.163487738419619, + "grad_norm": 23.01498794555664, + "learning_rate": 1.9909221565560348e-05, + "loss": 1.4214, + "step": 2629 + }, + { + "epoch": 7.166212534059945, + "grad_norm": 16.723155975341797, + "learning_rate": 1.9909102887132494e-05, + "loss": 1.541, + "step": 2630 + }, + { + "epoch": 7.168937329700272, + "grad_norm": 14.408949851989746, + "learning_rate": 1.9908984131532865e-05, + "loss": 1.4429, + "step": 2631 + }, + { + "epoch": 7.1716621253406, + "grad_norm": 54.55207824707031, + "learning_rate": 1.9908865298762384e-05, + "loss": 1.697, + "step": 2632 + }, + { + "epoch": 7.174386920980926, + "grad_norm": 37.38616943359375, + "learning_rate": 1.990874638882198e-05, + "loss": 1.374, + "step": 2633 + }, + { + "epoch": 7.177111716621253, + "grad_norm": 15.120404243469238, + "learning_rate": 1.990862740171258e-05, + "loss": 1.4287, + "step": 2634 + }, + { + "epoch": 7.179836512261581, + "grad_norm": 16.63327407836914, + "learning_rate": 1.990850833743511e-05, + "loss": 1.5898, + "step": 2635 + }, + { + "epoch": 7.182561307901907, + "grad_norm": 16.18759536743164, + "learning_rate": 1.9908389195990492e-05, + "loss": 1.5266, + "step": 2636 + }, + { + "epoch": 7.185286103542234, + "grad_norm": 19.903820037841797, + "learning_rate": 1.9908269977379658e-05, + "loss": 1.4631, + "step": 2637 + }, + { + "epoch": 7.1880108991825615, + "grad_norm": 20.78038787841797, + "learning_rate": 1.990815068160354e-05, + "loss": 1.4155, + "step": 2638 + }, + { + "epoch": 7.190735694822888, + "grad_norm": 65.83699798583984, + "learning_rate": 1.990803130866306e-05, + "loss": 1.468, + "step": 2639 + }, + { + "epoch": 7.193460490463215, + "grad_norm": 12.93549633026123, + "learning_rate": 1.990791185855915e-05, + "loss": 1.561, + "step": 2640 + }, + { + "epoch": 7.1961852861035425, + "grad_norm": 13.24904727935791, + "learning_rate": 1.9907792331292747e-05, + "loss": 1.4609, + "step": 2641 + }, + { + "epoch": 7.198910081743869, + "grad_norm": 14.132883071899414, + "learning_rate": 1.9907672726864772e-05, + "loss": 1.5366, + "step": 2642 + }, + { + "epoch": 7.201634877384196, + "grad_norm": 21.078025817871094, + "learning_rate": 1.9907553045276158e-05, + "loss": 1.6311, + "step": 2643 + }, + { + "epoch": 7.204359673024523, + "grad_norm": 17.943523406982422, + "learning_rate": 1.9907433286527843e-05, + "loss": 1.5339, + "step": 2644 + }, + { + "epoch": 7.20708446866485, + "grad_norm": 11.418760299682617, + "learning_rate": 1.990731345062076e-05, + "loss": 1.7036, + "step": 2645 + }, + { + "epoch": 7.209809264305177, + "grad_norm": 28.595006942749023, + "learning_rate": 1.9907193537555832e-05, + "loss": 1.5769, + "step": 2646 + }, + { + "epoch": 7.212534059945504, + "grad_norm": 17.612186431884766, + "learning_rate": 1.9907073547334002e-05, + "loss": 1.3901, + "step": 2647 + }, + { + "epoch": 7.215258855585831, + "grad_norm": 13.393107414245605, + "learning_rate": 1.9906953479956206e-05, + "loss": 1.4292, + "step": 2648 + }, + { + "epoch": 7.217983651226158, + "grad_norm": 15.393351554870605, + "learning_rate": 1.990683333542337e-05, + "loss": 1.5747, + "step": 2649 + }, + { + "epoch": 7.220708446866485, + "grad_norm": 11.29178237915039, + "learning_rate": 1.990671311373644e-05, + "loss": 1.5178, + "step": 2650 + }, + { + "epoch": 7.223433242506812, + "grad_norm": 10.266595840454102, + "learning_rate": 1.9906592814896343e-05, + "loss": 1.6135, + "step": 2651 + }, + { + "epoch": 7.226158038147139, + "grad_norm": 13.928282737731934, + "learning_rate": 1.990647243890402e-05, + "loss": 1.5029, + "step": 2652 + }, + { + "epoch": 7.228882833787466, + "grad_norm": 11.35490894317627, + "learning_rate": 1.990635198576041e-05, + "loss": 1.5884, + "step": 2653 + }, + { + "epoch": 7.231607629427793, + "grad_norm": 11.80521011352539, + "learning_rate": 1.990623145546645e-05, + "loss": 1.5706, + "step": 2654 + }, + { + "epoch": 7.23433242506812, + "grad_norm": 16.76881217956543, + "learning_rate": 1.9906110848023074e-05, + "loss": 1.5825, + "step": 2655 + }, + { + "epoch": 7.237057220708447, + "grad_norm": 29.365928649902344, + "learning_rate": 1.990599016343123e-05, + "loss": 1.5627, + "step": 2656 + }, + { + "epoch": 7.239782016348774, + "grad_norm": 16.728803634643555, + "learning_rate": 1.9905869401691854e-05, + "loss": 1.467, + "step": 2657 + }, + { + "epoch": 7.2425068119891005, + "grad_norm": 8.949308395385742, + "learning_rate": 1.990574856280588e-05, + "loss": 1.4473, + "step": 2658 + }, + { + "epoch": 7.245231607629428, + "grad_norm": 14.383991241455078, + "learning_rate": 1.9905627646774262e-05, + "loss": 1.5891, + "step": 2659 + }, + { + "epoch": 7.247956403269755, + "grad_norm": 14.508793830871582, + "learning_rate": 1.990550665359793e-05, + "loss": 1.6321, + "step": 2660 + }, + { + "epoch": 7.2506811989100814, + "grad_norm": 13.771912574768066, + "learning_rate": 1.9905385583277834e-05, + "loss": 1.624, + "step": 2661 + }, + { + "epoch": 7.253405994550409, + "grad_norm": 18.602794647216797, + "learning_rate": 1.9905264435814913e-05, + "loss": 1.4531, + "step": 2662 + }, + { + "epoch": 7.256130790190736, + "grad_norm": 12.330023765563965, + "learning_rate": 1.990514321121011e-05, + "loss": 1.4819, + "step": 2663 + }, + { + "epoch": 7.258855585831062, + "grad_norm": 16.42203712463379, + "learning_rate": 1.9905021909464372e-05, + "loss": 1.5513, + "step": 2664 + }, + { + "epoch": 7.26158038147139, + "grad_norm": 13.549471855163574, + "learning_rate": 1.9904900530578643e-05, + "loss": 1.5002, + "step": 2665 + }, + { + "epoch": 7.264305177111717, + "grad_norm": 10.781227111816406, + "learning_rate": 1.9904779074553864e-05, + "loss": 1.5864, + "step": 2666 + }, + { + "epoch": 7.267029972752043, + "grad_norm": 18.10679054260254, + "learning_rate": 1.990465754139099e-05, + "loss": 1.647, + "step": 2667 + }, + { + "epoch": 7.269754768392371, + "grad_norm": 12.661219596862793, + "learning_rate": 1.9904535931090957e-05, + "loss": 1.6035, + "step": 2668 + }, + { + "epoch": 7.272479564032698, + "grad_norm": 12.699142456054688, + "learning_rate": 1.9904414243654716e-05, + "loss": 1.4862, + "step": 2669 + }, + { + "epoch": 7.275204359673024, + "grad_norm": 12.930998802185059, + "learning_rate": 1.9904292479083217e-05, + "loss": 1.4475, + "step": 2670 + }, + { + "epoch": 7.277929155313352, + "grad_norm": 12.240517616271973, + "learning_rate": 1.9904170637377408e-05, + "loss": 1.6685, + "step": 2671 + }, + { + "epoch": 7.2806539509536785, + "grad_norm": 18.07870864868164, + "learning_rate": 1.9904048718538238e-05, + "loss": 1.4385, + "step": 2672 + }, + { + "epoch": 7.283378746594005, + "grad_norm": 15.409016609191895, + "learning_rate": 1.9903926722566655e-05, + "loss": 1.4524, + "step": 2673 + }, + { + "epoch": 7.286103542234333, + "grad_norm": 10.995656967163086, + "learning_rate": 1.990380464946361e-05, + "loss": 1.4021, + "step": 2674 + }, + { + "epoch": 7.2888283378746594, + "grad_norm": 16.83498764038086, + "learning_rate": 1.990368249923005e-05, + "loss": 1.7432, + "step": 2675 + }, + { + "epoch": 7.291553133514986, + "grad_norm": 11.144207954406738, + "learning_rate": 1.990356027186693e-05, + "loss": 1.4312, + "step": 2676 + }, + { + "epoch": 7.294277929155314, + "grad_norm": 10.032282829284668, + "learning_rate": 1.9903437967375202e-05, + "loss": 1.4509, + "step": 2677 + }, + { + "epoch": 7.29700272479564, + "grad_norm": 11.693425178527832, + "learning_rate": 1.990331558575582e-05, + "loss": 1.5181, + "step": 2678 + }, + { + "epoch": 7.299727520435967, + "grad_norm": 16.339767456054688, + "learning_rate": 1.990319312700973e-05, + "loss": 1.4441, + "step": 2679 + }, + { + "epoch": 7.302452316076295, + "grad_norm": 13.989665985107422, + "learning_rate": 1.9903070591137898e-05, + "loss": 1.2375, + "step": 2680 + }, + { + "epoch": 7.305177111716621, + "grad_norm": 14.806517601013184, + "learning_rate": 1.9902947978141265e-05, + "loss": 1.4504, + "step": 2681 + }, + { + "epoch": 7.307901907356948, + "grad_norm": 15.431193351745605, + "learning_rate": 1.9902825288020794e-05, + "loss": 1.5498, + "step": 2682 + }, + { + "epoch": 7.310626702997276, + "grad_norm": 14.844110488891602, + "learning_rate": 1.990270252077744e-05, + "loss": 1.8154, + "step": 2683 + }, + { + "epoch": 7.313351498637602, + "grad_norm": 12.310922622680664, + "learning_rate": 1.9902579676412154e-05, + "loss": 1.5247, + "step": 2684 + }, + { + "epoch": 7.316076294277929, + "grad_norm": 11.25191593170166, + "learning_rate": 1.9902456754925898e-05, + "loss": 1.4375, + "step": 2685 + }, + { + "epoch": 7.3188010899182565, + "grad_norm": 12.803166389465332, + "learning_rate": 1.990233375631963e-05, + "loss": 1.5872, + "step": 2686 + }, + { + "epoch": 7.321525885558583, + "grad_norm": 11.506999969482422, + "learning_rate": 1.99022106805943e-05, + "loss": 1.469, + "step": 2687 + }, + { + "epoch": 7.32425068119891, + "grad_norm": 11.528977394104004, + "learning_rate": 1.9902087527750876e-05, + "loss": 1.6492, + "step": 2688 + }, + { + "epoch": 7.3269754768392374, + "grad_norm": 15.200810432434082, + "learning_rate": 1.990196429779031e-05, + "loss": 1.6326, + "step": 2689 + }, + { + "epoch": 7.329700272479564, + "grad_norm": 8.964735984802246, + "learning_rate": 1.9901840990713566e-05, + "loss": 1.4773, + "step": 2690 + }, + { + "epoch": 7.332425068119891, + "grad_norm": 13.632256507873535, + "learning_rate": 1.9901717606521607e-05, + "loss": 1.6499, + "step": 2691 + }, + { + "epoch": 7.335149863760218, + "grad_norm": 10.2181396484375, + "learning_rate": 1.9901594145215382e-05, + "loss": 1.6406, + "step": 2692 + }, + { + "epoch": 7.337874659400545, + "grad_norm": 15.948305130004883, + "learning_rate": 1.9901470606795867e-05, + "loss": 1.4795, + "step": 2693 + }, + { + "epoch": 7.340599455040872, + "grad_norm": 10.267861366271973, + "learning_rate": 1.9901346991264018e-05, + "loss": 1.4495, + "step": 2694 + }, + { + "epoch": 7.343324250681199, + "grad_norm": 10.505049705505371, + "learning_rate": 1.9901223298620793e-05, + "loss": 1.4509, + "step": 2695 + }, + { + "epoch": 7.346049046321526, + "grad_norm": 10.342820167541504, + "learning_rate": 1.9901099528867164e-05, + "loss": 1.6152, + "step": 2696 + }, + { + "epoch": 7.348773841961853, + "grad_norm": 12.281599998474121, + "learning_rate": 1.9900975682004088e-05, + "loss": 1.4797, + "step": 2697 + }, + { + "epoch": 7.35149863760218, + "grad_norm": 11.366495132446289, + "learning_rate": 1.990085175803253e-05, + "loss": 1.5854, + "step": 2698 + }, + { + "epoch": 7.354223433242507, + "grad_norm": 10.912250518798828, + "learning_rate": 1.990072775695346e-05, + "loss": 1.5161, + "step": 2699 + }, + { + "epoch": 7.356948228882834, + "grad_norm": 12.146465301513672, + "learning_rate": 1.990060367876784e-05, + "loss": 1.5774, + "step": 2700 + }, + { + "epoch": 7.359673024523161, + "grad_norm": 13.08321762084961, + "learning_rate": 1.9900479523476637e-05, + "loss": 1.5476, + "step": 2701 + }, + { + "epoch": 7.362397820163488, + "grad_norm": 11.220298767089844, + "learning_rate": 1.9900355291080816e-05, + "loss": 1.5044, + "step": 2702 + }, + { + "epoch": 7.3651226158038146, + "grad_norm": 13.201688766479492, + "learning_rate": 1.990023098158135e-05, + "loss": 1.6455, + "step": 2703 + }, + { + "epoch": 7.367847411444142, + "grad_norm": 10.523879051208496, + "learning_rate": 1.9900106594979204e-05, + "loss": 1.5427, + "step": 2704 + }, + { + "epoch": 7.370572207084469, + "grad_norm": 11.078397750854492, + "learning_rate": 1.9899982131275345e-05, + "loss": 1.4673, + "step": 2705 + }, + { + "epoch": 7.3732970027247955, + "grad_norm": 12.766281127929688, + "learning_rate": 1.9899857590470745e-05, + "loss": 1.51, + "step": 2706 + }, + { + "epoch": 7.376021798365123, + "grad_norm": 15.339536666870117, + "learning_rate": 1.989973297256637e-05, + "loss": 1.4934, + "step": 2707 + }, + { + "epoch": 7.37874659400545, + "grad_norm": 10.396599769592285, + "learning_rate": 1.9899608277563197e-05, + "loss": 1.4001, + "step": 2708 + }, + { + "epoch": 7.381471389645776, + "grad_norm": 8.053894996643066, + "learning_rate": 1.989948350546219e-05, + "loss": 1.3518, + "step": 2709 + }, + { + "epoch": 7.384196185286104, + "grad_norm": 10.564316749572754, + "learning_rate": 1.9899358656264325e-05, + "loss": 1.4333, + "step": 2710 + }, + { + "epoch": 7.386920980926431, + "grad_norm": 9.205158233642578, + "learning_rate": 1.9899233729970576e-05, + "loss": 1.2275, + "step": 2711 + }, + { + "epoch": 7.389645776566757, + "grad_norm": 10.553511619567871, + "learning_rate": 1.9899108726581907e-05, + "loss": 1.3894, + "step": 2712 + }, + { + "epoch": 7.392370572207085, + "grad_norm": 8.432306289672852, + "learning_rate": 1.9898983646099304e-05, + "loss": 1.3279, + "step": 2713 + }, + { + "epoch": 7.395095367847412, + "grad_norm": 13.820378303527832, + "learning_rate": 1.989885848852373e-05, + "loss": 1.5513, + "step": 2714 + }, + { + "epoch": 7.397820163487738, + "grad_norm": 13.580961227416992, + "learning_rate": 1.989873325385617e-05, + "loss": 1.4382, + "step": 2715 + }, + { + "epoch": 7.400544959128065, + "grad_norm": 10.945294380187988, + "learning_rate": 1.989860794209759e-05, + "loss": 1.5232, + "step": 2716 + }, + { + "epoch": 7.4032697547683926, + "grad_norm": 10.951699256896973, + "learning_rate": 1.989848255324897e-05, + "loss": 1.564, + "step": 2717 + }, + { + "epoch": 7.405994550408719, + "grad_norm": 10.355441093444824, + "learning_rate": 1.989835708731129e-05, + "loss": 1.3796, + "step": 2718 + }, + { + "epoch": 7.408719346049046, + "grad_norm": 9.621257781982422, + "learning_rate": 1.9898231544285523e-05, + "loss": 1.5391, + "step": 2719 + }, + { + "epoch": 7.4114441416893735, + "grad_norm": 11.549651145935059, + "learning_rate": 1.9898105924172647e-05, + "loss": 1.4773, + "step": 2720 + }, + { + "epoch": 7.4141689373297, + "grad_norm": 10.521002769470215, + "learning_rate": 1.989798022697364e-05, + "loss": 1.2507, + "step": 2721 + }, + { + "epoch": 7.416893732970027, + "grad_norm": 12.156377792358398, + "learning_rate": 1.989785445268948e-05, + "loss": 1.5168, + "step": 2722 + }, + { + "epoch": 7.419618528610354, + "grad_norm": 12.271047592163086, + "learning_rate": 1.9897728601321148e-05, + "loss": 1.6658, + "step": 2723 + }, + { + "epoch": 7.422343324250681, + "grad_norm": 9.159317016601562, + "learning_rate": 1.9897602672869624e-05, + "loss": 1.406, + "step": 2724 + }, + { + "epoch": 7.425068119891008, + "grad_norm": 11.248191833496094, + "learning_rate": 1.989747666733589e-05, + "loss": 1.4246, + "step": 2725 + }, + { + "epoch": 7.427792915531335, + "grad_norm": 11.331597328186035, + "learning_rate": 1.9897350584720928e-05, + "loss": 1.5464, + "step": 2726 + }, + { + "epoch": 7.430517711171662, + "grad_norm": 18.228622436523438, + "learning_rate": 1.9897224425025716e-05, + "loss": 1.4749, + "step": 2727 + }, + { + "epoch": 7.433242506811989, + "grad_norm": 10.95228385925293, + "learning_rate": 1.9897098188251244e-05, + "loss": 1.3252, + "step": 2728 + }, + { + "epoch": 7.435967302452316, + "grad_norm": 11.155035018920898, + "learning_rate": 1.9896971874398485e-05, + "loss": 1.6357, + "step": 2729 + }, + { + "epoch": 7.438692098092643, + "grad_norm": 19.57489776611328, + "learning_rate": 1.9896845483468424e-05, + "loss": 1.5891, + "step": 2730 + }, + { + "epoch": 7.44141689373297, + "grad_norm": 11.665769577026367, + "learning_rate": 1.9896719015462055e-05, + "loss": 1.3945, + "step": 2731 + }, + { + "epoch": 7.444141689373297, + "grad_norm": 11.477259635925293, + "learning_rate": 1.9896592470380354e-05, + "loss": 1.5493, + "step": 2732 + }, + { + "epoch": 7.446866485013624, + "grad_norm": 9.968441009521484, + "learning_rate": 1.9896465848224312e-05, + "loss": 1.5725, + "step": 2733 + }, + { + "epoch": 7.449591280653951, + "grad_norm": 11.057966232299805, + "learning_rate": 1.9896339148994906e-05, + "loss": 1.3958, + "step": 2734 + }, + { + "epoch": 7.452316076294278, + "grad_norm": 23.53868865966797, + "learning_rate": 1.9896212372693135e-05, + "loss": 1.54, + "step": 2735 + }, + { + "epoch": 7.455040871934605, + "grad_norm": 12.037323951721191, + "learning_rate": 1.9896085519319982e-05, + "loss": 1.6038, + "step": 2736 + }, + { + "epoch": 7.4577656675749315, + "grad_norm": 10.729537010192871, + "learning_rate": 1.989595858887643e-05, + "loss": 1.4729, + "step": 2737 + }, + { + "epoch": 7.460490463215259, + "grad_norm": 10.37804126739502, + "learning_rate": 1.989583158136347e-05, + "loss": 1.4558, + "step": 2738 + }, + { + "epoch": 7.463215258855586, + "grad_norm": 11.308197975158691, + "learning_rate": 1.9895704496782097e-05, + "loss": 1.7019, + "step": 2739 + }, + { + "epoch": 7.4659400544959125, + "grad_norm": 12.422118186950684, + "learning_rate": 1.989557733513329e-05, + "loss": 1.4006, + "step": 2740 + }, + { + "epoch": 7.46866485013624, + "grad_norm": 14.516019821166992, + "learning_rate": 1.989545009641805e-05, + "loss": 1.325, + "step": 2741 + }, + { + "epoch": 7.471389645776567, + "grad_norm": 20.607149124145508, + "learning_rate": 1.9895322780637358e-05, + "loss": 1.4851, + "step": 2742 + }, + { + "epoch": 7.474114441416893, + "grad_norm": 10.987537384033203, + "learning_rate": 1.9895195387792214e-05, + "loss": 1.3845, + "step": 2743 + }, + { + "epoch": 7.476839237057221, + "grad_norm": 19.764270782470703, + "learning_rate": 1.989506791788361e-05, + "loss": 1.5945, + "step": 2744 + }, + { + "epoch": 7.479564032697548, + "grad_norm": 11.385480880737305, + "learning_rate": 1.989494037091253e-05, + "loss": 1.5222, + "step": 2745 + }, + { + "epoch": 7.482288828337874, + "grad_norm": 14.623588562011719, + "learning_rate": 1.9894812746879976e-05, + "loss": 1.4697, + "step": 2746 + }, + { + "epoch": 7.485013623978202, + "grad_norm": 13.755199432373047, + "learning_rate": 1.9894685045786935e-05, + "loss": 1.5461, + "step": 2747 + }, + { + "epoch": 7.487738419618529, + "grad_norm": 18.120471954345703, + "learning_rate": 1.989455726763441e-05, + "loss": 1.5591, + "step": 2748 + }, + { + "epoch": 7.490463215258855, + "grad_norm": 11.236099243164062, + "learning_rate": 1.9894429412423388e-05, + "loss": 1.3884, + "step": 2749 + }, + { + "epoch": 7.493188010899183, + "grad_norm": 12.378520011901855, + "learning_rate": 1.9894301480154873e-05, + "loss": 1.522, + "step": 2750 + }, + { + "epoch": 7.4959128065395095, + "grad_norm": 11.089034080505371, + "learning_rate": 1.9894173470829853e-05, + "loss": 1.4741, + "step": 2751 + }, + { + "epoch": 7.498637602179836, + "grad_norm": 8.702698707580566, + "learning_rate": 1.9894045384449328e-05, + "loss": 1.333, + "step": 2752 + }, + { + "epoch": 7.501362397820164, + "grad_norm": 9.997475624084473, + "learning_rate": 1.9893917221014294e-05, + "loss": 1.5024, + "step": 2753 + }, + { + "epoch": 7.5040871934604905, + "grad_norm": 10.9384765625, + "learning_rate": 1.9893788980525756e-05, + "loss": 1.4797, + "step": 2754 + }, + { + "epoch": 7.506811989100817, + "grad_norm": 13.521172523498535, + "learning_rate": 1.9893660662984705e-05, + "loss": 1.4785, + "step": 2755 + }, + { + "epoch": 7.509536784741145, + "grad_norm": 10.863540649414062, + "learning_rate": 1.9893532268392143e-05, + "loss": 1.3005, + "step": 2756 + }, + { + "epoch": 7.512261580381471, + "grad_norm": 24.522600173950195, + "learning_rate": 1.989340379674907e-05, + "loss": 1.6479, + "step": 2757 + }, + { + "epoch": 7.514986376021798, + "grad_norm": 11.219182014465332, + "learning_rate": 1.989327524805649e-05, + "loss": 1.5334, + "step": 2758 + }, + { + "epoch": 7.517711171662126, + "grad_norm": 15.490386009216309, + "learning_rate": 1.9893146622315398e-05, + "loss": 1.6729, + "step": 2759 + }, + { + "epoch": 7.520435967302452, + "grad_norm": 15.81369400024414, + "learning_rate": 1.9893017919526798e-05, + "loss": 1.6035, + "step": 2760 + }, + { + "epoch": 7.523160762942779, + "grad_norm": 10.370918273925781, + "learning_rate": 1.9892889139691695e-05, + "loss": 1.5022, + "step": 2761 + }, + { + "epoch": 7.525885558583107, + "grad_norm": 8.687206268310547, + "learning_rate": 1.9892760282811085e-05, + "loss": 1.7324, + "step": 2762 + }, + { + "epoch": 7.528610354223433, + "grad_norm": 19.682769775390625, + "learning_rate": 1.989263134888598e-05, + "loss": 1.3579, + "step": 2763 + }, + { + "epoch": 7.53133514986376, + "grad_norm": 10.744647026062012, + "learning_rate": 1.9892502337917382e-05, + "loss": 1.5437, + "step": 2764 + }, + { + "epoch": 7.5340599455040875, + "grad_norm": 12.050798416137695, + "learning_rate": 1.9892373249906292e-05, + "loss": 1.418, + "step": 2765 + }, + { + "epoch": 7.536784741144414, + "grad_norm": 20.06696319580078, + "learning_rate": 1.989224408485372e-05, + "loss": 1.7356, + "step": 2766 + }, + { + "epoch": 7.539509536784741, + "grad_norm": 10.467229843139648, + "learning_rate": 1.9892114842760666e-05, + "loss": 1.4651, + "step": 2767 + }, + { + "epoch": 7.5422343324250685, + "grad_norm": 10.829195976257324, + "learning_rate": 1.9891985523628142e-05, + "loss": 1.7073, + "step": 2768 + }, + { + "epoch": 7.544959128065395, + "grad_norm": 16.316389083862305, + "learning_rate": 1.9891856127457152e-05, + "loss": 1.4178, + "step": 2769 + }, + { + "epoch": 7.547683923705722, + "grad_norm": 9.75391674041748, + "learning_rate": 1.9891726654248705e-05, + "loss": 1.4985, + "step": 2770 + }, + { + "epoch": 7.550408719346049, + "grad_norm": 11.315629959106445, + "learning_rate": 1.9891597104003807e-05, + "loss": 1.5781, + "step": 2771 + }, + { + "epoch": 7.553133514986376, + "grad_norm": 12.688879013061523, + "learning_rate": 1.9891467476723472e-05, + "loss": 1.5378, + "step": 2772 + }, + { + "epoch": 7.555858310626703, + "grad_norm": 10.304753303527832, + "learning_rate": 1.9891337772408706e-05, + "loss": 1.4124, + "step": 2773 + }, + { + "epoch": 7.55858310626703, + "grad_norm": 20.072845458984375, + "learning_rate": 1.9891207991060525e-05, + "loss": 1.489, + "step": 2774 + }, + { + "epoch": 7.561307901907357, + "grad_norm": 10.624418258666992, + "learning_rate": 1.989107813267993e-05, + "loss": 1.5132, + "step": 2775 + }, + { + "epoch": 7.564032697547684, + "grad_norm": 11.695839881896973, + "learning_rate": 1.9890948197267933e-05, + "loss": 1.4905, + "step": 2776 + }, + { + "epoch": 7.566757493188011, + "grad_norm": 9.317418098449707, + "learning_rate": 1.9890818184825552e-05, + "loss": 1.3589, + "step": 2777 + }, + { + "epoch": 7.569482288828338, + "grad_norm": 11.279376029968262, + "learning_rate": 1.9890688095353802e-05, + "loss": 1.4741, + "step": 2778 + }, + { + "epoch": 7.572207084468665, + "grad_norm": 12.635177612304688, + "learning_rate": 1.9890557928853685e-05, + "loss": 1.4634, + "step": 2779 + }, + { + "epoch": 7.574931880108992, + "grad_norm": 12.164665222167969, + "learning_rate": 1.9890427685326225e-05, + "loss": 1.7129, + "step": 2780 + }, + { + "epoch": 7.577656675749319, + "grad_norm": 11.033668518066406, + "learning_rate": 1.989029736477243e-05, + "loss": 1.5864, + "step": 2781 + }, + { + "epoch": 7.580381471389646, + "grad_norm": 13.097576141357422, + "learning_rate": 1.989016696719332e-05, + "loss": 1.3496, + "step": 2782 + }, + { + "epoch": 7.583106267029972, + "grad_norm": 12.860251426696777, + "learning_rate": 1.989003649258991e-05, + "loss": 1.5066, + "step": 2783 + }, + { + "epoch": 7.5858310626703, + "grad_norm": 22.703773498535156, + "learning_rate": 1.988990594096321e-05, + "loss": 1.5422, + "step": 2784 + }, + { + "epoch": 7.5885558583106265, + "grad_norm": 10.591668128967285, + "learning_rate": 1.988977531231424e-05, + "loss": 1.3936, + "step": 2785 + }, + { + "epoch": 7.591280653950953, + "grad_norm": 11.378451347351074, + "learning_rate": 1.988964460664402e-05, + "loss": 1.4924, + "step": 2786 + }, + { + "epoch": 7.594005449591281, + "grad_norm": 18.895544052124023, + "learning_rate": 1.9889513823953568e-05, + "loss": 1.5862, + "step": 2787 + }, + { + "epoch": 7.5967302452316074, + "grad_norm": 12.089540481567383, + "learning_rate": 1.9889382964243896e-05, + "loss": 1.5552, + "step": 2788 + }, + { + "epoch": 7.599455040871934, + "grad_norm": 10.115679740905762, + "learning_rate": 1.9889252027516033e-05, + "loss": 1.4866, + "step": 2789 + }, + { + "epoch": 7.602179836512262, + "grad_norm": 10.996835708618164, + "learning_rate": 1.988912101377099e-05, + "loss": 1.4475, + "step": 2790 + }, + { + "epoch": 7.604904632152588, + "grad_norm": 10.201013565063477, + "learning_rate": 1.9888989923009792e-05, + "loss": 1.5649, + "step": 2791 + }, + { + "epoch": 7.607629427792915, + "grad_norm": 12.061447143554688, + "learning_rate": 1.988885875523346e-05, + "loss": 1.6538, + "step": 2792 + }, + { + "epoch": 7.610354223433243, + "grad_norm": 13.327852249145508, + "learning_rate": 1.988872751044301e-05, + "loss": 1.3782, + "step": 2793 + }, + { + "epoch": 7.613079019073569, + "grad_norm": 11.921119689941406, + "learning_rate": 1.9888596188639476e-05, + "loss": 1.5273, + "step": 2794 + }, + { + "epoch": 7.615803814713896, + "grad_norm": 9.655643463134766, + "learning_rate": 1.9888464789823867e-05, + "loss": 1.4753, + "step": 2795 + }, + { + "epoch": 7.618528610354224, + "grad_norm": 13.065455436706543, + "learning_rate": 1.9888333313997212e-05, + "loss": 1.4873, + "step": 2796 + }, + { + "epoch": 7.62125340599455, + "grad_norm": 18.854360580444336, + "learning_rate": 1.988820176116054e-05, + "loss": 1.4998, + "step": 2797 + }, + { + "epoch": 7.623978201634877, + "grad_norm": 12.455496788024902, + "learning_rate": 1.988807013131487e-05, + "loss": 1.5913, + "step": 2798 + }, + { + "epoch": 7.6267029972752045, + "grad_norm": 10.86870288848877, + "learning_rate": 1.9887938424461224e-05, + "loss": 1.2312, + "step": 2799 + }, + { + "epoch": 7.629427792915531, + "grad_norm": 13.03520393371582, + "learning_rate": 1.9887806640600633e-05, + "loss": 1.5659, + "step": 2800 + }, + { + "epoch": 7.632152588555858, + "grad_norm": 13.637677192687988, + "learning_rate": 1.9887674779734125e-05, + "loss": 1.3696, + "step": 2801 + }, + { + "epoch": 7.6348773841961854, + "grad_norm": 18.14453125, + "learning_rate": 1.9887542841862723e-05, + "loss": 1.7529, + "step": 2802 + }, + { + "epoch": 7.637602179836512, + "grad_norm": 11.575101852416992, + "learning_rate": 1.9887410826987455e-05, + "loss": 1.4529, + "step": 2803 + }, + { + "epoch": 7.640326975476839, + "grad_norm": 11.00442123413086, + "learning_rate": 1.988727873510935e-05, + "loss": 1.3838, + "step": 2804 + }, + { + "epoch": 7.643051771117166, + "grad_norm": 12.96632194519043, + "learning_rate": 1.9887146566229437e-05, + "loss": 1.6182, + "step": 2805 + }, + { + "epoch": 7.645776566757493, + "grad_norm": 10.884385108947754, + "learning_rate": 1.988701432034874e-05, + "loss": 1.2805, + "step": 2806 + }, + { + "epoch": 7.64850136239782, + "grad_norm": 10.20749282836914, + "learning_rate": 1.9886881997468298e-05, + "loss": 1.5005, + "step": 2807 + }, + { + "epoch": 7.651226158038147, + "grad_norm": 10.603687286376953, + "learning_rate": 1.988674959758914e-05, + "loss": 1.4885, + "step": 2808 + }, + { + "epoch": 7.653950953678474, + "grad_norm": 13.288247108459473, + "learning_rate": 1.988661712071229e-05, + "loss": 1.5601, + "step": 2809 + }, + { + "epoch": 7.656675749318801, + "grad_norm": 13.069999694824219, + "learning_rate": 1.9886484566838785e-05, + "loss": 1.5508, + "step": 2810 + }, + { + "epoch": 7.659400544959128, + "grad_norm": 10.288311004638672, + "learning_rate": 1.9886351935969658e-05, + "loss": 1.5603, + "step": 2811 + }, + { + "epoch": 7.662125340599455, + "grad_norm": 11.068655014038086, + "learning_rate": 1.9886219228105937e-05, + "loss": 1.6333, + "step": 2812 + }, + { + "epoch": 7.664850136239782, + "grad_norm": 11.532331466674805, + "learning_rate": 1.9886086443248663e-05, + "loss": 1.479, + "step": 2813 + }, + { + "epoch": 7.667574931880109, + "grad_norm": 10.423901557922363, + "learning_rate": 1.9885953581398862e-05, + "loss": 1.511, + "step": 2814 + }, + { + "epoch": 7.670299727520436, + "grad_norm": 15.353683471679688, + "learning_rate": 1.9885820642557574e-05, + "loss": 1.5251, + "step": 2815 + }, + { + "epoch": 7.6730245231607626, + "grad_norm": 24.267702102661133, + "learning_rate": 1.9885687626725833e-05, + "loss": 1.5012, + "step": 2816 + }, + { + "epoch": 7.67574931880109, + "grad_norm": 11.486735343933105, + "learning_rate": 1.9885554533904673e-05, + "loss": 1.5339, + "step": 2817 + }, + { + "epoch": 7.678474114441417, + "grad_norm": 21.975114822387695, + "learning_rate": 1.988542136409514e-05, + "loss": 1.4797, + "step": 2818 + }, + { + "epoch": 7.6811989100817435, + "grad_norm": 17.301342010498047, + "learning_rate": 1.9885288117298256e-05, + "loss": 1.2908, + "step": 2819 + }, + { + "epoch": 7.683923705722071, + "grad_norm": 16.25150489807129, + "learning_rate": 1.9885154793515066e-05, + "loss": 1.5159, + "step": 2820 + }, + { + "epoch": 7.686648501362398, + "grad_norm": 10.66357421875, + "learning_rate": 1.9885021392746614e-05, + "loss": 1.2976, + "step": 2821 + }, + { + "epoch": 7.689373297002724, + "grad_norm": 11.739712715148926, + "learning_rate": 1.9884887914993932e-05, + "loss": 1.5776, + "step": 2822 + }, + { + "epoch": 7.692098092643052, + "grad_norm": 13.113489151000977, + "learning_rate": 1.9884754360258058e-05, + "loss": 1.6941, + "step": 2823 + }, + { + "epoch": 7.694822888283379, + "grad_norm": 12.707517623901367, + "learning_rate": 1.9884620728540035e-05, + "loss": 1.4915, + "step": 2824 + }, + { + "epoch": 7.697547683923705, + "grad_norm": 11.471800804138184, + "learning_rate": 1.9884487019840907e-05, + "loss": 1.5256, + "step": 2825 + }, + { + "epoch": 7.700272479564033, + "grad_norm": 11.221733093261719, + "learning_rate": 1.9884353234161713e-05, + "loss": 1.4993, + "step": 2826 + }, + { + "epoch": 7.70299727520436, + "grad_norm": 11.2644681930542, + "learning_rate": 1.988421937150349e-05, + "loss": 1.3865, + "step": 2827 + }, + { + "epoch": 7.705722070844686, + "grad_norm": 11.004400253295898, + "learning_rate": 1.9884085431867287e-05, + "loss": 1.4805, + "step": 2828 + }, + { + "epoch": 7.708446866485014, + "grad_norm": 11.438688278198242, + "learning_rate": 1.9883951415254146e-05, + "loss": 1.5256, + "step": 2829 + }, + { + "epoch": 7.7111716621253406, + "grad_norm": 10.083905220031738, + "learning_rate": 1.988381732166511e-05, + "loss": 1.3486, + "step": 2830 + }, + { + "epoch": 7.713896457765667, + "grad_norm": 9.939655303955078, + "learning_rate": 1.988368315110122e-05, + "loss": 1.3533, + "step": 2831 + }, + { + "epoch": 7.716621253405995, + "grad_norm": 14.37730884552002, + "learning_rate": 1.9883548903563525e-05, + "loss": 1.5068, + "step": 2832 + }, + { + "epoch": 7.7193460490463215, + "grad_norm": 12.536720275878906, + "learning_rate": 1.988341457905307e-05, + "loss": 1.4836, + "step": 2833 + }, + { + "epoch": 7.722070844686648, + "grad_norm": 13.156996726989746, + "learning_rate": 1.9883280177570898e-05, + "loss": 1.7607, + "step": 2834 + }, + { + "epoch": 7.724795640326976, + "grad_norm": 11.064411163330078, + "learning_rate": 1.988314569911806e-05, + "loss": 1.3481, + "step": 2835 + }, + { + "epoch": 7.727520435967302, + "grad_norm": 15.014034271240234, + "learning_rate": 1.98830111436956e-05, + "loss": 1.4448, + "step": 2836 + }, + { + "epoch": 7.730245231607629, + "grad_norm": 13.946884155273438, + "learning_rate": 1.988287651130457e-05, + "loss": 1.7812, + "step": 2837 + }, + { + "epoch": 7.732970027247957, + "grad_norm": 10.989984512329102, + "learning_rate": 1.9882741801946014e-05, + "loss": 1.4023, + "step": 2838 + }, + { + "epoch": 7.735694822888283, + "grad_norm": 12.584571838378906, + "learning_rate": 1.988260701562098e-05, + "loss": 1.645, + "step": 2839 + }, + { + "epoch": 7.73841961852861, + "grad_norm": 11.218289375305176, + "learning_rate": 1.9882472152330522e-05, + "loss": 1.5212, + "step": 2840 + }, + { + "epoch": 7.741144414168938, + "grad_norm": 10.804743766784668, + "learning_rate": 1.9882337212075693e-05, + "loss": 1.3257, + "step": 2841 + }, + { + "epoch": 7.743869209809264, + "grad_norm": 31.348562240600586, + "learning_rate": 1.9882202194857537e-05, + "loss": 1.5823, + "step": 2842 + }, + { + "epoch": 7.746594005449591, + "grad_norm": 10.572625160217285, + "learning_rate": 1.988206710067711e-05, + "loss": 1.3733, + "step": 2843 + }, + { + "epoch": 7.7493188010899186, + "grad_norm": 10.134716987609863, + "learning_rate": 1.9881931929535462e-05, + "loss": 1.4509, + "step": 2844 + }, + { + "epoch": 7.752043596730245, + "grad_norm": 16.209062576293945, + "learning_rate": 1.988179668143364e-05, + "loss": 1.5938, + "step": 2845 + }, + { + "epoch": 7.754768392370572, + "grad_norm": 9.616616249084473, + "learning_rate": 1.988166135637271e-05, + "loss": 1.5181, + "step": 2846 + }, + { + "epoch": 7.7574931880108995, + "grad_norm": 16.432865142822266, + "learning_rate": 1.988152595435372e-05, + "loss": 1.8037, + "step": 2847 + }, + { + "epoch": 7.760217983651226, + "grad_norm": 11.593768119812012, + "learning_rate": 1.988139047537772e-05, + "loss": 1.4939, + "step": 2848 + }, + { + "epoch": 7.762942779291553, + "grad_norm": 11.875847816467285, + "learning_rate": 1.9881254919445773e-05, + "loss": 1.5664, + "step": 2849 + }, + { + "epoch": 7.76566757493188, + "grad_norm": 12.916208267211914, + "learning_rate": 1.9881119286558927e-05, + "loss": 1.4985, + "step": 2850 + }, + { + "epoch": 7.768392370572207, + "grad_norm": 10.447370529174805, + "learning_rate": 1.9880983576718247e-05, + "loss": 1.5913, + "step": 2851 + }, + { + "epoch": 7.771117166212534, + "grad_norm": 25.152677536010742, + "learning_rate": 1.988084778992478e-05, + "loss": 1.3577, + "step": 2852 + }, + { + "epoch": 7.773841961852861, + "grad_norm": 20.927114486694336, + "learning_rate": 1.988071192617959e-05, + "loss": 1.679, + "step": 2853 + }, + { + "epoch": 7.776566757493188, + "grad_norm": 14.398178100585938, + "learning_rate": 1.9880575985483734e-05, + "loss": 1.73, + "step": 2854 + }, + { + "epoch": 7.779291553133515, + "grad_norm": 12.64029312133789, + "learning_rate": 1.988043996783827e-05, + "loss": 1.3472, + "step": 2855 + }, + { + "epoch": 7.782016348773842, + "grad_norm": 16.54973793029785, + "learning_rate": 1.9880303873244258e-05, + "loss": 1.6577, + "step": 2856 + }, + { + "epoch": 7.784741144414169, + "grad_norm": 13.682854652404785, + "learning_rate": 1.9880167701702757e-05, + "loss": 1.5327, + "step": 2857 + }, + { + "epoch": 7.787465940054496, + "grad_norm": 45.27207946777344, + "learning_rate": 1.988003145321483e-05, + "loss": 1.6543, + "step": 2858 + }, + { + "epoch": 7.790190735694823, + "grad_norm": 11.389158248901367, + "learning_rate": 1.9879895127781533e-05, + "loss": 1.2905, + "step": 2859 + }, + { + "epoch": 7.79291553133515, + "grad_norm": 10.155439376831055, + "learning_rate": 1.987975872540393e-05, + "loss": 1.5613, + "step": 2860 + }, + { + "epoch": 7.795640326975477, + "grad_norm": 19.872411727905273, + "learning_rate": 1.9879622246083087e-05, + "loss": 1.3677, + "step": 2861 + }, + { + "epoch": 7.798365122615804, + "grad_norm": 15.025500297546387, + "learning_rate": 1.987948568982006e-05, + "loss": 1.5881, + "step": 2862 + }, + { + "epoch": 7.801089918256131, + "grad_norm": 11.375299453735352, + "learning_rate": 1.987934905661592e-05, + "loss": 1.4883, + "step": 2863 + }, + { + "epoch": 7.8038147138964575, + "grad_norm": 21.228652954101562, + "learning_rate": 1.9879212346471726e-05, + "loss": 1.6218, + "step": 2864 + }, + { + "epoch": 7.806539509536785, + "grad_norm": 12.07156753540039, + "learning_rate": 1.9879075559388547e-05, + "loss": 1.4431, + "step": 2865 + }, + { + "epoch": 7.809264305177112, + "grad_norm": 11.72398853302002, + "learning_rate": 1.9878938695367444e-05, + "loss": 1.373, + "step": 2866 + }, + { + "epoch": 7.8119891008174385, + "grad_norm": 13.358327865600586, + "learning_rate": 1.987880175440948e-05, + "loss": 1.3994, + "step": 2867 + }, + { + "epoch": 7.814713896457766, + "grad_norm": 13.322922706604004, + "learning_rate": 1.9878664736515732e-05, + "loss": 1.5703, + "step": 2868 + }, + { + "epoch": 7.817438692098093, + "grad_norm": 17.724384307861328, + "learning_rate": 1.9878527641687255e-05, + "loss": 1.376, + "step": 2869 + }, + { + "epoch": 7.820163487738419, + "grad_norm": 10.315452575683594, + "learning_rate": 1.987839046992513e-05, + "loss": 1.4697, + "step": 2870 + }, + { + "epoch": 7.822888283378747, + "grad_norm": 18.188642501831055, + "learning_rate": 1.9878253221230414e-05, + "loss": 1.835, + "step": 2871 + }, + { + "epoch": 7.825613079019074, + "grad_norm": 11.028203964233398, + "learning_rate": 1.9878115895604178e-05, + "loss": 1.4543, + "step": 2872 + }, + { + "epoch": 7.8283378746594, + "grad_norm": 10.556264877319336, + "learning_rate": 1.9877978493047496e-05, + "loss": 1.3467, + "step": 2873 + }, + { + "epoch": 7.831062670299728, + "grad_norm": 11.126514434814453, + "learning_rate": 1.987784101356143e-05, + "loss": 1.4661, + "step": 2874 + }, + { + "epoch": 7.833787465940055, + "grad_norm": 12.39341926574707, + "learning_rate": 1.9877703457147062e-05, + "loss": 1.4817, + "step": 2875 + }, + { + "epoch": 7.836512261580381, + "grad_norm": 15.889671325683594, + "learning_rate": 1.987756582380546e-05, + "loss": 1.5522, + "step": 2876 + }, + { + "epoch": 7.839237057220709, + "grad_norm": 39.488895416259766, + "learning_rate": 1.9877428113537686e-05, + "loss": 1.582, + "step": 2877 + }, + { + "epoch": 7.8419618528610355, + "grad_norm": 24.53476333618164, + "learning_rate": 1.9877290326344826e-05, + "loss": 1.5332, + "step": 2878 + }, + { + "epoch": 7.844686648501362, + "grad_norm": 15.040446281433105, + "learning_rate": 1.987715246222794e-05, + "loss": 1.6968, + "step": 2879 + }, + { + "epoch": 7.84741144414169, + "grad_norm": 18.096458435058594, + "learning_rate": 1.9877014521188115e-05, + "loss": 1.6333, + "step": 2880 + }, + { + "epoch": 7.8501362397820165, + "grad_norm": 12.122450828552246, + "learning_rate": 1.9876876503226418e-05, + "loss": 1.502, + "step": 2881 + }, + { + "epoch": 7.852861035422343, + "grad_norm": 12.410628318786621, + "learning_rate": 1.987673840834392e-05, + "loss": 1.3496, + "step": 2882 + }, + { + "epoch": 7.855585831062671, + "grad_norm": 11.923356056213379, + "learning_rate": 1.9876600236541705e-05, + "loss": 1.4607, + "step": 2883 + }, + { + "epoch": 7.858310626702997, + "grad_norm": 19.3748779296875, + "learning_rate": 1.9876461987820847e-05, + "loss": 1.5439, + "step": 2884 + }, + { + "epoch": 7.861035422343324, + "grad_norm": 17.764400482177734, + "learning_rate": 1.9876323662182417e-05, + "loss": 1.4241, + "step": 2885 + }, + { + "epoch": 7.863760217983652, + "grad_norm": 18.320411682128906, + "learning_rate": 1.9876185259627498e-05, + "loss": 1.6548, + "step": 2886 + }, + { + "epoch": 7.866485013623978, + "grad_norm": 650.7084350585938, + "learning_rate": 1.987604678015716e-05, + "loss": 1.6074, + "step": 2887 + }, + { + "epoch": 7.869209809264305, + "grad_norm": 19.571046829223633, + "learning_rate": 1.9875908223772497e-05, + "loss": 1.6182, + "step": 2888 + }, + { + "epoch": 7.871934604904633, + "grad_norm": 17.87520980834961, + "learning_rate": 1.9875769590474574e-05, + "loss": 1.4395, + "step": 2889 + }, + { + "epoch": 7.874659400544959, + "grad_norm": 38.276268005371094, + "learning_rate": 1.9875630880264474e-05, + "loss": 2.0103, + "step": 2890 + }, + { + "epoch": 7.877384196185286, + "grad_norm": 36.80160903930664, + "learning_rate": 1.987549209314328e-05, + "loss": 1.8755, + "step": 2891 + }, + { + "epoch": 7.8801089918256135, + "grad_norm": 20.255399703979492, + "learning_rate": 1.9875353229112076e-05, + "loss": 1.7363, + "step": 2892 + }, + { + "epoch": 7.88283378746594, + "grad_norm": 18.29572868347168, + "learning_rate": 1.9875214288171932e-05, + "loss": 1.6235, + "step": 2893 + }, + { + "epoch": 7.885558583106267, + "grad_norm": 26.875980377197266, + "learning_rate": 1.9875075270323942e-05, + "loss": 1.978, + "step": 2894 + }, + { + "epoch": 7.8882833787465945, + "grad_norm": 18.455490112304688, + "learning_rate": 1.9874936175569178e-05, + "loss": 1.8594, + "step": 2895 + }, + { + "epoch": 7.891008174386921, + "grad_norm": 22.575532913208008, + "learning_rate": 1.9874797003908735e-05, + "loss": 2.0298, + "step": 2896 + }, + { + "epoch": 7.893732970027248, + "grad_norm": 19.369121551513672, + "learning_rate": 1.9874657755343688e-05, + "loss": 1.7678, + "step": 2897 + }, + { + "epoch": 7.896457765667575, + "grad_norm": 15.469361305236816, + "learning_rate": 1.9874518429875126e-05, + "loss": 1.7583, + "step": 2898 + }, + { + "epoch": 7.899182561307902, + "grad_norm": 19.114458084106445, + "learning_rate": 1.987437902750413e-05, + "loss": 1.7402, + "step": 2899 + }, + { + "epoch": 7.901907356948229, + "grad_norm": 16.01736068725586, + "learning_rate": 1.9874239548231786e-05, + "loss": 1.6477, + "step": 2900 + }, + { + "epoch": 7.904632152588556, + "grad_norm": 12.80774211883545, + "learning_rate": 1.9874099992059185e-05, + "loss": 1.9751, + "step": 2901 + }, + { + "epoch": 7.907356948228883, + "grad_norm": 13.939897537231445, + "learning_rate": 1.9873960358987414e-05, + "loss": 1.7957, + "step": 2902 + }, + { + "epoch": 7.91008174386921, + "grad_norm": 10.73560905456543, + "learning_rate": 1.9873820649017553e-05, + "loss": 1.7783, + "step": 2903 + }, + { + "epoch": 7.912806539509537, + "grad_norm": 11.912135124206543, + "learning_rate": 1.9873680862150694e-05, + "loss": 1.6841, + "step": 2904 + }, + { + "epoch": 7.915531335149864, + "grad_norm": 14.469831466674805, + "learning_rate": 1.9873540998387928e-05, + "loss": 1.7317, + "step": 2905 + }, + { + "epoch": 7.918256130790191, + "grad_norm": 12.055585861206055, + "learning_rate": 1.9873401057730345e-05, + "loss": 1.6538, + "step": 2906 + }, + { + "epoch": 7.920980926430518, + "grad_norm": 17.054702758789062, + "learning_rate": 1.987326104017903e-05, + "loss": 1.843, + "step": 2907 + }, + { + "epoch": 7.923705722070845, + "grad_norm": 10.581183433532715, + "learning_rate": 1.9873120945735073e-05, + "loss": 1.9011, + "step": 2908 + }, + { + "epoch": 7.926430517711172, + "grad_norm": 11.802868843078613, + "learning_rate": 1.9872980774399573e-05, + "loss": 1.6802, + "step": 2909 + }, + { + "epoch": 7.929155313351498, + "grad_norm": 11.520299911499023, + "learning_rate": 1.987284052617361e-05, + "loss": 1.4148, + "step": 2910 + }, + { + "epoch": 7.931880108991826, + "grad_norm": 11.749201774597168, + "learning_rate": 1.9872700201058287e-05, + "loss": 1.7168, + "step": 2911 + }, + { + "epoch": 7.9346049046321525, + "grad_norm": 12.393478393554688, + "learning_rate": 1.9872559799054695e-05, + "loss": 1.7373, + "step": 2912 + }, + { + "epoch": 7.937329700272479, + "grad_norm": 10.606557846069336, + "learning_rate": 1.9872419320163924e-05, + "loss": 1.6995, + "step": 2913 + }, + { + "epoch": 7.940054495912807, + "grad_norm": 13.502483367919922, + "learning_rate": 1.9872278764387064e-05, + "loss": 1.5396, + "step": 2914 + }, + { + "epoch": 7.9427792915531334, + "grad_norm": 10.935478210449219, + "learning_rate": 1.987213813172522e-05, + "loss": 1.5857, + "step": 2915 + }, + { + "epoch": 7.94550408719346, + "grad_norm": 11.298049926757812, + "learning_rate": 1.987199742217948e-05, + "loss": 1.5662, + "step": 2916 + }, + { + "epoch": 7.948228882833788, + "grad_norm": 9.997447967529297, + "learning_rate": 1.987185663575094e-05, + "loss": 1.5146, + "step": 2917 + }, + { + "epoch": 7.950953678474114, + "grad_norm": 14.285991668701172, + "learning_rate": 1.98717157724407e-05, + "loss": 1.5615, + "step": 2918 + }, + { + "epoch": 7.953678474114441, + "grad_norm": 14.525003433227539, + "learning_rate": 1.9871574832249858e-05, + "loss": 1.5081, + "step": 2919 + }, + { + "epoch": 7.956403269754769, + "grad_norm": 13.308977127075195, + "learning_rate": 1.9871433815179505e-05, + "loss": 1.4858, + "step": 2920 + }, + { + "epoch": 7.959128065395095, + "grad_norm": 11.913995742797852, + "learning_rate": 1.9871292721230745e-05, + "loss": 1.439, + "step": 2921 + }, + { + "epoch": 7.961852861035422, + "grad_norm": 15.985111236572266, + "learning_rate": 1.9871151550404675e-05, + "loss": 1.6733, + "step": 2922 + }, + { + "epoch": 7.96457765667575, + "grad_norm": 11.745784759521484, + "learning_rate": 1.9871010302702393e-05, + "loss": 1.7202, + "step": 2923 + }, + { + "epoch": 7.967302452316076, + "grad_norm": 20.185394287109375, + "learning_rate": 1.9870868978125003e-05, + "loss": 1.749, + "step": 2924 + }, + { + "epoch": 7.970027247956403, + "grad_norm": 10.806917190551758, + "learning_rate": 1.98707275766736e-05, + "loss": 1.4927, + "step": 2925 + }, + { + "epoch": 7.9727520435967305, + "grad_norm": 11.449009895324707, + "learning_rate": 1.9870586098349288e-05, + "loss": 1.4761, + "step": 2926 + }, + { + "epoch": 7.975476839237057, + "grad_norm": 9.038079261779785, + "learning_rate": 1.987044454315317e-05, + "loss": 1.688, + "step": 2927 + }, + { + "epoch": 7.978201634877384, + "grad_norm": 14.575750350952148, + "learning_rate": 1.987030291108635e-05, + "loss": 1.6382, + "step": 2928 + }, + { + "epoch": 7.9809264305177114, + "grad_norm": 10.708087921142578, + "learning_rate": 1.987016120214993e-05, + "loss": 1.7874, + "step": 2929 + }, + { + "epoch": 7.983651226158038, + "grad_norm": 14.858932495117188, + "learning_rate": 1.9870019416345008e-05, + "loss": 1.7944, + "step": 2930 + }, + { + "epoch": 7.986376021798365, + "grad_norm": 13.036943435668945, + "learning_rate": 1.9869877553672693e-05, + "loss": 1.5779, + "step": 2931 + }, + { + "epoch": 7.989100817438692, + "grad_norm": 10.370837211608887, + "learning_rate": 1.9869735614134092e-05, + "loss": 1.6997, + "step": 2932 + }, + { + "epoch": 7.991825613079019, + "grad_norm": 18.72672462463379, + "learning_rate": 1.9869593597730305e-05, + "loss": 1.4355, + "step": 2933 + }, + { + "epoch": 7.994550408719346, + "grad_norm": 12.96975040435791, + "learning_rate": 1.986945150446244e-05, + "loss": 1.3271, + "step": 2934 + }, + { + "epoch": 7.997275204359673, + "grad_norm": 16.942413330078125, + "learning_rate": 1.9869309334331606e-05, + "loss": 1.7856, + "step": 2935 + }, + { + "epoch": 8.0, + "grad_norm": 14.696255683898926, + "learning_rate": 1.9869167087338908e-05, + "loss": 1.6475, + "step": 2936 + }, + { + "epoch": 8.002724795640328, + "grad_norm": 10.834300994873047, + "learning_rate": 1.9869024763485454e-05, + "loss": 1.623, + "step": 2937 + }, + { + "epoch": 8.005449591280653, + "grad_norm": 11.849433898925781, + "learning_rate": 1.9868882362772356e-05, + "loss": 1.5503, + "step": 2938 + }, + { + "epoch": 8.008174386920981, + "grad_norm": 9.379240036010742, + "learning_rate": 1.9868739885200718e-05, + "loss": 1.7466, + "step": 2939 + }, + { + "epoch": 8.010899182561309, + "grad_norm": 18.678430557250977, + "learning_rate": 1.9868597330771648e-05, + "loss": 1.7124, + "step": 2940 + }, + { + "epoch": 8.013623978201634, + "grad_norm": 12.0128755569458, + "learning_rate": 1.986845469948626e-05, + "loss": 1.5017, + "step": 2941 + }, + { + "epoch": 8.016348773841962, + "grad_norm": 10.23306655883789, + "learning_rate": 1.986831199134567e-05, + "loss": 1.3601, + "step": 2942 + }, + { + "epoch": 8.01907356948229, + "grad_norm": 10.015888214111328, + "learning_rate": 1.986816920635098e-05, + "loss": 1.5457, + "step": 2943 + }, + { + "epoch": 8.021798365122615, + "grad_norm": 10.267995834350586, + "learning_rate": 1.9868026344503307e-05, + "loss": 1.4854, + "step": 2944 + }, + { + "epoch": 8.024523160762943, + "grad_norm": 9.181854248046875, + "learning_rate": 1.986788340580376e-05, + "loss": 1.239, + "step": 2945 + }, + { + "epoch": 8.02724795640327, + "grad_norm": 11.752165794372559, + "learning_rate": 1.9867740390253458e-05, + "loss": 1.4785, + "step": 2946 + }, + { + "epoch": 8.029972752043596, + "grad_norm": 13.72391414642334, + "learning_rate": 1.986759729785351e-05, + "loss": 1.4178, + "step": 2947 + }, + { + "epoch": 8.032697547683924, + "grad_norm": 11.265132904052734, + "learning_rate": 1.9867454128605033e-05, + "loss": 1.689, + "step": 2948 + }, + { + "epoch": 8.035422343324251, + "grad_norm": 10.6729154586792, + "learning_rate": 1.9867310882509136e-05, + "loss": 1.3896, + "step": 2949 + }, + { + "epoch": 8.038147138964577, + "grad_norm": 14.195324897766113, + "learning_rate": 1.9867167559566944e-05, + "loss": 1.363, + "step": 2950 + }, + { + "epoch": 8.040871934604905, + "grad_norm": 11.9901762008667, + "learning_rate": 1.986702415977957e-05, + "loss": 1.4023, + "step": 2951 + }, + { + "epoch": 8.043596730245232, + "grad_norm": 11.18156909942627, + "learning_rate": 1.9866880683148128e-05, + "loss": 1.4705, + "step": 2952 + }, + { + "epoch": 8.046321525885558, + "grad_norm": 14.364361763000488, + "learning_rate": 1.9866737129673733e-05, + "loss": 1.4668, + "step": 2953 + }, + { + "epoch": 8.049046321525886, + "grad_norm": 36.69050598144531, + "learning_rate": 1.9866593499357508e-05, + "loss": 1.7817, + "step": 2954 + }, + { + "epoch": 8.051771117166213, + "grad_norm": 10.556742668151855, + "learning_rate": 1.9866449792200572e-05, + "loss": 1.5327, + "step": 2955 + }, + { + "epoch": 8.054495912806539, + "grad_norm": 13.603948593139648, + "learning_rate": 1.9866306008204042e-05, + "loss": 1.3187, + "step": 2956 + }, + { + "epoch": 8.057220708446867, + "grad_norm": 11.465261459350586, + "learning_rate": 1.986616214736904e-05, + "loss": 1.7153, + "step": 2957 + }, + { + "epoch": 8.059945504087194, + "grad_norm": 32.16316604614258, + "learning_rate": 1.9866018209696686e-05, + "loss": 1.9456, + "step": 2958 + }, + { + "epoch": 8.06267029972752, + "grad_norm": 13.840081214904785, + "learning_rate": 1.9865874195188095e-05, + "loss": 1.585, + "step": 2959 + }, + { + "epoch": 8.065395095367847, + "grad_norm": 10.292863845825195, + "learning_rate": 1.9865730103844397e-05, + "loss": 1.5513, + "step": 2960 + }, + { + "epoch": 8.068119891008175, + "grad_norm": 10.423396110534668, + "learning_rate": 1.9865585935666706e-05, + "loss": 1.5293, + "step": 2961 + }, + { + "epoch": 8.0708446866485, + "grad_norm": 18.91510772705078, + "learning_rate": 1.9865441690656154e-05, + "loss": 1.2377, + "step": 2962 + }, + { + "epoch": 8.073569482288828, + "grad_norm": 9.956671714782715, + "learning_rate": 1.986529736881386e-05, + "loss": 1.4131, + "step": 2963 + }, + { + "epoch": 8.076294277929156, + "grad_norm": 20.656063079833984, + "learning_rate": 1.9865152970140946e-05, + "loss": 1.6997, + "step": 2964 + }, + { + "epoch": 8.079019073569482, + "grad_norm": 10.994516372680664, + "learning_rate": 1.9865008494638536e-05, + "loss": 1.5242, + "step": 2965 + }, + { + "epoch": 8.08174386920981, + "grad_norm": 12.00313949584961, + "learning_rate": 1.986486394230776e-05, + "loss": 1.4519, + "step": 2966 + }, + { + "epoch": 8.084468664850137, + "grad_norm": 10.38339900970459, + "learning_rate": 1.986471931314974e-05, + "loss": 1.4712, + "step": 2967 + }, + { + "epoch": 8.087193460490463, + "grad_norm": 11.970154762268066, + "learning_rate": 1.9864574607165602e-05, + "loss": 1.5349, + "step": 2968 + }, + { + "epoch": 8.08991825613079, + "grad_norm": 14.663086891174316, + "learning_rate": 1.9864429824356478e-05, + "loss": 1.4507, + "step": 2969 + }, + { + "epoch": 8.092643051771118, + "grad_norm": 11.080653190612793, + "learning_rate": 1.9864284964723488e-05, + "loss": 1.5071, + "step": 2970 + }, + { + "epoch": 8.095367847411444, + "grad_norm": 13.981965065002441, + "learning_rate": 1.9864140028267767e-05, + "loss": 1.7878, + "step": 2971 + }, + { + "epoch": 8.098092643051771, + "grad_norm": 11.915581703186035, + "learning_rate": 1.986399501499044e-05, + "loss": 1.5005, + "step": 2972 + }, + { + "epoch": 8.100817438692099, + "grad_norm": 11.16733455657959, + "learning_rate": 1.986384992489264e-05, + "loss": 1.4048, + "step": 2973 + }, + { + "epoch": 8.103542234332425, + "grad_norm": 11.649931907653809, + "learning_rate": 1.9863704757975492e-05, + "loss": 1.3342, + "step": 2974 + }, + { + "epoch": 8.106267029972752, + "grad_norm": 10.512341499328613, + "learning_rate": 1.9863559514240128e-05, + "loss": 1.4778, + "step": 2975 + }, + { + "epoch": 8.10899182561308, + "grad_norm": 12.347107887268066, + "learning_rate": 1.986341419368768e-05, + "loss": 1.4309, + "step": 2976 + }, + { + "epoch": 8.111716621253406, + "grad_norm": 10.135472297668457, + "learning_rate": 1.9863268796319278e-05, + "loss": 1.4036, + "step": 2977 + }, + { + "epoch": 8.114441416893733, + "grad_norm": 37.992225646972656, + "learning_rate": 1.9863123322136058e-05, + "loss": 1.4419, + "step": 2978 + }, + { + "epoch": 8.11716621253406, + "grad_norm": 9.647393226623535, + "learning_rate": 1.9862977771139154e-05, + "loss": 1.5249, + "step": 2979 + }, + { + "epoch": 8.119891008174386, + "grad_norm": 11.539268493652344, + "learning_rate": 1.9862832143329694e-05, + "loss": 1.4644, + "step": 2980 + }, + { + "epoch": 8.122615803814714, + "grad_norm": 9.759735107421875, + "learning_rate": 1.9862686438708813e-05, + "loss": 1.2756, + "step": 2981 + }, + { + "epoch": 8.125340599455042, + "grad_norm": 11.171850204467773, + "learning_rate": 1.986254065727765e-05, + "loss": 1.3867, + "step": 2982 + }, + { + "epoch": 8.128065395095367, + "grad_norm": 11.682690620422363, + "learning_rate": 1.9862394799037338e-05, + "loss": 1.5037, + "step": 2983 + }, + { + "epoch": 8.130790190735695, + "grad_norm": 10.766770362854004, + "learning_rate": 1.986224886398901e-05, + "loss": 1.5959, + "step": 2984 + }, + { + "epoch": 8.133514986376023, + "grad_norm": 12.399341583251953, + "learning_rate": 1.986210285213381e-05, + "loss": 1.4543, + "step": 2985 + }, + { + "epoch": 8.136239782016348, + "grad_norm": 9.954695701599121, + "learning_rate": 1.9861956763472866e-05, + "loss": 1.4868, + "step": 2986 + }, + { + "epoch": 8.138964577656676, + "grad_norm": 11.342049598693848, + "learning_rate": 1.986181059800732e-05, + "loss": 1.6086, + "step": 2987 + }, + { + "epoch": 8.141689373297003, + "grad_norm": 10.286776542663574, + "learning_rate": 1.986166435573831e-05, + "loss": 1.3677, + "step": 2988 + }, + { + "epoch": 8.14441416893733, + "grad_norm": 9.159870147705078, + "learning_rate": 1.9861518036666978e-05, + "loss": 1.5474, + "step": 2989 + }, + { + "epoch": 8.147138964577657, + "grad_norm": 10.327608108520508, + "learning_rate": 1.986137164079446e-05, + "loss": 1.3647, + "step": 2990 + }, + { + "epoch": 8.149863760217984, + "grad_norm": 12.476815223693848, + "learning_rate": 1.98612251681219e-05, + "loss": 1.4353, + "step": 2991 + }, + { + "epoch": 8.15258855585831, + "grad_norm": 8.87645435333252, + "learning_rate": 1.986107861865043e-05, + "loss": 1.4033, + "step": 2992 + }, + { + "epoch": 8.155313351498638, + "grad_norm": 13.785514831542969, + "learning_rate": 1.9860931992381202e-05, + "loss": 1.4614, + "step": 2993 + }, + { + "epoch": 8.158038147138965, + "grad_norm": 8.921813011169434, + "learning_rate": 1.9860785289315352e-05, + "loss": 1.2593, + "step": 2994 + }, + { + "epoch": 8.160762942779291, + "grad_norm": 10.972900390625, + "learning_rate": 1.986063850945402e-05, + "loss": 1.5112, + "step": 2995 + }, + { + "epoch": 8.163487738419619, + "grad_norm": 11.340409278869629, + "learning_rate": 1.9860491652798358e-05, + "loss": 1.5261, + "step": 2996 + }, + { + "epoch": 8.166212534059946, + "grad_norm": 11.435660362243652, + "learning_rate": 1.98603447193495e-05, + "loss": 1.5381, + "step": 2997 + }, + { + "epoch": 8.168937329700272, + "grad_norm": 10.339703559875488, + "learning_rate": 1.9860197709108596e-05, + "loss": 1.3696, + "step": 2998 + }, + { + "epoch": 8.1716621253406, + "grad_norm": 10.372658729553223, + "learning_rate": 1.986005062207679e-05, + "loss": 1.3369, + "step": 2999 + }, + { + "epoch": 8.174386920980927, + "grad_norm": 12.192550659179688, + "learning_rate": 1.9859903458255227e-05, + "loss": 1.5547, + "step": 3000 + }, + { + "epoch": 8.177111716621253, + "grad_norm": 9.437643051147461, + "learning_rate": 1.9859756217645054e-05, + "loss": 1.4419, + "step": 3001 + }, + { + "epoch": 8.17983651226158, + "grad_norm": 30.47894287109375, + "learning_rate": 1.9859608900247417e-05, + "loss": 1.4702, + "step": 3002 + }, + { + "epoch": 8.182561307901908, + "grad_norm": 9.573280334472656, + "learning_rate": 1.985946150606346e-05, + "loss": 1.542, + "step": 3003 + }, + { + "epoch": 8.185286103542234, + "grad_norm": 8.637099266052246, + "learning_rate": 1.985931403509434e-05, + "loss": 1.4841, + "step": 3004 + }, + { + "epoch": 8.188010899182562, + "grad_norm": 10.783534049987793, + "learning_rate": 1.9859166487341194e-05, + "loss": 1.4346, + "step": 3005 + }, + { + "epoch": 8.190735694822889, + "grad_norm": 9.640056610107422, + "learning_rate": 1.985901886280518e-05, + "loss": 1.3105, + "step": 3006 + }, + { + "epoch": 8.193460490463215, + "grad_norm": 10.957379341125488, + "learning_rate": 1.985887116148744e-05, + "loss": 1.4785, + "step": 3007 + }, + { + "epoch": 8.196185286103542, + "grad_norm": 8.909079551696777, + "learning_rate": 1.9858723383389134e-05, + "loss": 1.2114, + "step": 3008 + }, + { + "epoch": 8.19891008174387, + "grad_norm": 9.386533737182617, + "learning_rate": 1.9858575528511406e-05, + "loss": 1.4482, + "step": 3009 + }, + { + "epoch": 8.201634877384196, + "grad_norm": 23.52212142944336, + "learning_rate": 1.9858427596855407e-05, + "loss": 1.5076, + "step": 3010 + }, + { + "epoch": 8.204359673024523, + "grad_norm": 11.575129508972168, + "learning_rate": 1.9858279588422294e-05, + "loss": 1.4038, + "step": 3011 + }, + { + "epoch": 8.207084468664851, + "grad_norm": 13.577309608459473, + "learning_rate": 1.9858131503213214e-05, + "loss": 1.5769, + "step": 3012 + }, + { + "epoch": 8.209809264305177, + "grad_norm": 11.172263145446777, + "learning_rate": 1.9857983341229326e-05, + "loss": 1.6812, + "step": 3013 + }, + { + "epoch": 8.212534059945504, + "grad_norm": 10.272761344909668, + "learning_rate": 1.985783510247178e-05, + "loss": 1.5347, + "step": 3014 + }, + { + "epoch": 8.215258855585832, + "grad_norm": 10.700855255126953, + "learning_rate": 1.9857686786941733e-05, + "loss": 1.4775, + "step": 3015 + }, + { + "epoch": 8.217983651226158, + "grad_norm": 9.62952995300293, + "learning_rate": 1.9857538394640336e-05, + "loss": 1.3901, + "step": 3016 + }, + { + "epoch": 8.220708446866485, + "grad_norm": 9.708124160766602, + "learning_rate": 1.9857389925568745e-05, + "loss": 1.5703, + "step": 3017 + }, + { + "epoch": 8.223433242506813, + "grad_norm": 17.98137092590332, + "learning_rate": 1.9857241379728122e-05, + "loss": 1.5413, + "step": 3018 + }, + { + "epoch": 8.226158038147139, + "grad_norm": 11.248151779174805, + "learning_rate": 1.9857092757119622e-05, + "loss": 1.5107, + "step": 3019 + }, + { + "epoch": 8.228882833787466, + "grad_norm": 12.324178695678711, + "learning_rate": 1.9856944057744398e-05, + "loss": 1.5288, + "step": 3020 + }, + { + "epoch": 8.231607629427794, + "grad_norm": 10.10075855255127, + "learning_rate": 1.985679528160361e-05, + "loss": 1.4973, + "step": 3021 + }, + { + "epoch": 8.23433242506812, + "grad_norm": 14.341442108154297, + "learning_rate": 1.985664642869842e-05, + "loss": 1.2368, + "step": 3022 + }, + { + "epoch": 8.237057220708447, + "grad_norm": 11.082841873168945, + "learning_rate": 1.9856497499029987e-05, + "loss": 1.3391, + "step": 3023 + }, + { + "epoch": 8.239782016348773, + "grad_norm": 10.736616134643555, + "learning_rate": 1.9856348492599464e-05, + "loss": 1.4377, + "step": 3024 + }, + { + "epoch": 8.2425068119891, + "grad_norm": 9.020471572875977, + "learning_rate": 1.9856199409408017e-05, + "loss": 1.2141, + "step": 3025 + }, + { + "epoch": 8.245231607629428, + "grad_norm": 11.725255012512207, + "learning_rate": 1.9856050249456808e-05, + "loss": 1.3958, + "step": 3026 + }, + { + "epoch": 8.247956403269754, + "grad_norm": 10.40517807006836, + "learning_rate": 1.9855901012746996e-05, + "loss": 1.4919, + "step": 3027 + }, + { + "epoch": 8.250681198910081, + "grad_norm": 11.07318115234375, + "learning_rate": 1.9855751699279745e-05, + "loss": 1.5129, + "step": 3028 + }, + { + "epoch": 8.253405994550409, + "grad_norm": 9.537273406982422, + "learning_rate": 1.9855602309056216e-05, + "loss": 1.4246, + "step": 3029 + }, + { + "epoch": 8.256130790190735, + "grad_norm": 11.27015495300293, + "learning_rate": 1.9855452842077573e-05, + "loss": 1.7637, + "step": 3030 + }, + { + "epoch": 8.258855585831062, + "grad_norm": 11.040712356567383, + "learning_rate": 1.9855303298344985e-05, + "loss": 1.3016, + "step": 3031 + }, + { + "epoch": 8.26158038147139, + "grad_norm": 12.095251083374023, + "learning_rate": 1.9855153677859604e-05, + "loss": 1.5215, + "step": 3032 + }, + { + "epoch": 8.264305177111716, + "grad_norm": 10.048185348510742, + "learning_rate": 1.985500398062261e-05, + "loss": 1.345, + "step": 3033 + }, + { + "epoch": 8.267029972752043, + "grad_norm": 11.623002052307129, + "learning_rate": 1.985485420663516e-05, + "loss": 1.4788, + "step": 3034 + }, + { + "epoch": 8.269754768392371, + "grad_norm": 10.471136093139648, + "learning_rate": 1.985470435589842e-05, + "loss": 1.3445, + "step": 3035 + }, + { + "epoch": 8.272479564032697, + "grad_norm": 26.749555587768555, + "learning_rate": 1.9854554428413563e-05, + "loss": 1.4272, + "step": 3036 + }, + { + "epoch": 8.275204359673024, + "grad_norm": 10.94150447845459, + "learning_rate": 1.9854404424181752e-05, + "loss": 1.3726, + "step": 3037 + }, + { + "epoch": 8.277929155313352, + "grad_norm": 17.83536148071289, + "learning_rate": 1.9854254343204155e-05, + "loss": 1.3127, + "step": 3038 + }, + { + "epoch": 8.280653950953678, + "grad_norm": 10.491273880004883, + "learning_rate": 1.9854104185481944e-05, + "loss": 1.396, + "step": 3039 + }, + { + "epoch": 8.283378746594005, + "grad_norm": 15.343791961669922, + "learning_rate": 1.985395395101629e-05, + "loss": 1.4219, + "step": 3040 + }, + { + "epoch": 8.286103542234333, + "grad_norm": 11.310440063476562, + "learning_rate": 1.9853803639808357e-05, + "loss": 1.3748, + "step": 3041 + }, + { + "epoch": 8.288828337874659, + "grad_norm": 12.330083847045898, + "learning_rate": 1.9853653251859315e-05, + "loss": 1.3645, + "step": 3042 + }, + { + "epoch": 8.291553133514986, + "grad_norm": 16.09228515625, + "learning_rate": 1.9853502787170345e-05, + "loss": 1.4675, + "step": 3043 + }, + { + "epoch": 8.294277929155314, + "grad_norm": 11.356207847595215, + "learning_rate": 1.985335224574261e-05, + "loss": 1.5474, + "step": 3044 + }, + { + "epoch": 8.29700272479564, + "grad_norm": 14.240828514099121, + "learning_rate": 1.9853201627577283e-05, + "loss": 1.4148, + "step": 3045 + }, + { + "epoch": 8.299727520435967, + "grad_norm": 15.836702346801758, + "learning_rate": 1.985305093267554e-05, + "loss": 1.4309, + "step": 3046 + }, + { + "epoch": 8.302452316076295, + "grad_norm": 8.947978019714355, + "learning_rate": 1.9852900161038552e-05, + "loss": 1.3464, + "step": 3047 + }, + { + "epoch": 8.30517711171662, + "grad_norm": 20.330575942993164, + "learning_rate": 1.9852749312667496e-05, + "loss": 1.3528, + "step": 3048 + }, + { + "epoch": 8.307901907356948, + "grad_norm": 12.280182838439941, + "learning_rate": 1.9852598387563545e-05, + "loss": 1.4248, + "step": 3049 + }, + { + "epoch": 8.310626702997276, + "grad_norm": 12.325653076171875, + "learning_rate": 1.9852447385727876e-05, + "loss": 1.3672, + "step": 3050 + }, + { + "epoch": 8.313351498637601, + "grad_norm": 15.524264335632324, + "learning_rate": 1.985229630716166e-05, + "loss": 1.614, + "step": 3051 + }, + { + "epoch": 8.316076294277929, + "grad_norm": 12.32604694366455, + "learning_rate": 1.985214515186608e-05, + "loss": 1.6929, + "step": 3052 + }, + { + "epoch": 8.318801089918257, + "grad_norm": 18.24497413635254, + "learning_rate": 1.9851993919842314e-05, + "loss": 1.3445, + "step": 3053 + }, + { + "epoch": 8.321525885558582, + "grad_norm": 10.476236343383789, + "learning_rate": 1.9851842611091534e-05, + "loss": 1.5415, + "step": 3054 + }, + { + "epoch": 8.32425068119891, + "grad_norm": 13.16490364074707, + "learning_rate": 1.985169122561492e-05, + "loss": 1.4502, + "step": 3055 + }, + { + "epoch": 8.326975476839237, + "grad_norm": 8.830989837646484, + "learning_rate": 1.9851539763413653e-05, + "loss": 1.3802, + "step": 3056 + }, + { + "epoch": 8.329700272479563, + "grad_norm": 14.608965873718262, + "learning_rate": 1.985138822448891e-05, + "loss": 1.436, + "step": 3057 + }, + { + "epoch": 8.33242506811989, + "grad_norm": 9.7664155960083, + "learning_rate": 1.9851236608841874e-05, + "loss": 1.3562, + "step": 3058 + }, + { + "epoch": 8.335149863760218, + "grad_norm": 8.381041526794434, + "learning_rate": 1.985108491647372e-05, + "loss": 1.374, + "step": 3059 + }, + { + "epoch": 8.337874659400544, + "grad_norm": 8.069664001464844, + "learning_rate": 1.9850933147385637e-05, + "loss": 1.3459, + "step": 3060 + }, + { + "epoch": 8.340599455040872, + "grad_norm": 11.313298225402832, + "learning_rate": 1.9850781301578808e-05, + "loss": 1.4307, + "step": 3061 + }, + { + "epoch": 8.3433242506812, + "grad_norm": 16.71454620361328, + "learning_rate": 1.985062937905441e-05, + "loss": 1.4785, + "step": 3062 + }, + { + "epoch": 8.346049046321525, + "grad_norm": 15.24333667755127, + "learning_rate": 1.9850477379813622e-05, + "loss": 1.5354, + "step": 3063 + }, + { + "epoch": 8.348773841961853, + "grad_norm": 8.75456714630127, + "learning_rate": 1.9850325303857634e-05, + "loss": 1.4526, + "step": 3064 + }, + { + "epoch": 8.35149863760218, + "grad_norm": 11.578174591064453, + "learning_rate": 1.9850173151187634e-05, + "loss": 1.4067, + "step": 3065 + }, + { + "epoch": 8.354223433242506, + "grad_norm": 16.258743286132812, + "learning_rate": 1.9850020921804797e-05, + "loss": 1.5942, + "step": 3066 + }, + { + "epoch": 8.356948228882834, + "grad_norm": 9.28243350982666, + "learning_rate": 1.9849868615710316e-05, + "loss": 1.4578, + "step": 3067 + }, + { + "epoch": 8.359673024523161, + "grad_norm": 9.199224472045898, + "learning_rate": 1.9849716232905378e-05, + "loss": 1.3044, + "step": 3068 + }, + { + "epoch": 8.362397820163487, + "grad_norm": 12.875617027282715, + "learning_rate": 1.9849563773391163e-05, + "loss": 1.4543, + "step": 3069 + }, + { + "epoch": 8.365122615803815, + "grad_norm": 10.499556541442871, + "learning_rate": 1.9849411237168866e-05, + "loss": 1.4924, + "step": 3070 + }, + { + "epoch": 8.367847411444142, + "grad_norm": 10.636470794677734, + "learning_rate": 1.9849258624239672e-05, + "loss": 1.5032, + "step": 3071 + }, + { + "epoch": 8.370572207084468, + "grad_norm": 12.64499282836914, + "learning_rate": 1.9849105934604766e-05, + "loss": 1.5383, + "step": 3072 + }, + { + "epoch": 8.373297002724795, + "grad_norm": 11.598895072937012, + "learning_rate": 1.9848953168265342e-05, + "loss": 1.3938, + "step": 3073 + }, + { + "epoch": 8.376021798365123, + "grad_norm": 10.648917198181152, + "learning_rate": 1.9848800325222585e-05, + "loss": 1.5962, + "step": 3074 + }, + { + "epoch": 8.378746594005449, + "grad_norm": 11.883172988891602, + "learning_rate": 1.984864740547769e-05, + "loss": 1.5996, + "step": 3075 + }, + { + "epoch": 8.381471389645776, + "grad_norm": 9.24280834197998, + "learning_rate": 1.9848494409031843e-05, + "loss": 1.1299, + "step": 3076 + }, + { + "epoch": 8.384196185286104, + "grad_norm": 22.34482765197754, + "learning_rate": 1.9848341335886243e-05, + "loss": 1.5037, + "step": 3077 + }, + { + "epoch": 8.38692098092643, + "grad_norm": 9.828432083129883, + "learning_rate": 1.9848188186042077e-05, + "loss": 1.4204, + "step": 3078 + }, + { + "epoch": 8.389645776566757, + "grad_norm": 9.711224555969238, + "learning_rate": 1.9848034959500535e-05, + "loss": 1.3201, + "step": 3079 + }, + { + "epoch": 8.392370572207085, + "grad_norm": 14.278112411499023, + "learning_rate": 1.9847881656262816e-05, + "loss": 1.6392, + "step": 3080 + }, + { + "epoch": 8.39509536784741, + "grad_norm": 10.200750350952148, + "learning_rate": 1.9847728276330113e-05, + "loss": 1.3245, + "step": 3081 + }, + { + "epoch": 8.397820163487738, + "grad_norm": 12.277810096740723, + "learning_rate": 1.9847574819703617e-05, + "loss": 1.4807, + "step": 3082 + }, + { + "epoch": 8.400544959128066, + "grad_norm": 9.278221130371094, + "learning_rate": 1.9847421286384526e-05, + "loss": 1.3394, + "step": 3083 + }, + { + "epoch": 8.403269754768392, + "grad_norm": 13.014542579650879, + "learning_rate": 1.9847267676374035e-05, + "loss": 1.3337, + "step": 3084 + }, + { + "epoch": 8.40599455040872, + "grad_norm": 25.616065979003906, + "learning_rate": 1.984711398967334e-05, + "loss": 1.342, + "step": 3085 + }, + { + "epoch": 8.408719346049047, + "grad_norm": 10.43862533569336, + "learning_rate": 1.9846960226283638e-05, + "loss": 1.5442, + "step": 3086 + }, + { + "epoch": 8.411444141689373, + "grad_norm": 10.15013313293457, + "learning_rate": 1.9846806386206127e-05, + "loss": 1.605, + "step": 3087 + }, + { + "epoch": 8.4141689373297, + "grad_norm": 18.991050720214844, + "learning_rate": 1.9846652469442003e-05, + "loss": 1.6562, + "step": 3088 + }, + { + "epoch": 8.416893732970028, + "grad_norm": 13.327840805053711, + "learning_rate": 1.9846498475992467e-05, + "loss": 1.4358, + "step": 3089 + }, + { + "epoch": 8.419618528610354, + "grad_norm": 13.403010368347168, + "learning_rate": 1.984634440585872e-05, + "loss": 1.4423, + "step": 3090 + }, + { + "epoch": 8.422343324250681, + "grad_norm": 12.706461906433105, + "learning_rate": 1.9846190259041956e-05, + "loss": 1.5865, + "step": 3091 + }, + { + "epoch": 8.425068119891009, + "grad_norm": 10.648401260375977, + "learning_rate": 1.9846036035543384e-05, + "loss": 1.468, + "step": 3092 + }, + { + "epoch": 8.427792915531334, + "grad_norm": 10.862265586853027, + "learning_rate": 1.98458817353642e-05, + "loss": 1.4192, + "step": 3093 + }, + { + "epoch": 8.430517711171662, + "grad_norm": 9.958219528198242, + "learning_rate": 1.9845727358505603e-05, + "loss": 1.3962, + "step": 3094 + }, + { + "epoch": 8.43324250681199, + "grad_norm": 18.21630859375, + "learning_rate": 1.9845572904968797e-05, + "loss": 1.5098, + "step": 3095 + }, + { + "epoch": 8.435967302452315, + "grad_norm": 10.30978775024414, + "learning_rate": 1.984541837475499e-05, + "loss": 1.4932, + "step": 3096 + }, + { + "epoch": 8.438692098092643, + "grad_norm": 10.251604080200195, + "learning_rate": 1.984526376786538e-05, + "loss": 1.5325, + "step": 3097 + }, + { + "epoch": 8.44141689373297, + "grad_norm": 11.313343048095703, + "learning_rate": 1.9845109084301173e-05, + "loss": 1.4907, + "step": 3098 + }, + { + "epoch": 8.444141689373296, + "grad_norm": 11.00373649597168, + "learning_rate": 1.984495432406357e-05, + "loss": 1.4763, + "step": 3099 + }, + { + "epoch": 8.446866485013624, + "grad_norm": 10.753448486328125, + "learning_rate": 1.9844799487153782e-05, + "loss": 1.4187, + "step": 3100 + }, + { + "epoch": 8.449591280653951, + "grad_norm": 9.696673393249512, + "learning_rate": 1.9844644573573016e-05, + "loss": 1.4119, + "step": 3101 + }, + { + "epoch": 8.452316076294277, + "grad_norm": 11.8190336227417, + "learning_rate": 1.984448958332247e-05, + "loss": 1.4204, + "step": 3102 + }, + { + "epoch": 8.455040871934605, + "grad_norm": 10.040216445922852, + "learning_rate": 1.9844334516403356e-05, + "loss": 1.311, + "step": 3103 + }, + { + "epoch": 8.457765667574932, + "grad_norm": 10.194698333740234, + "learning_rate": 1.9844179372816884e-05, + "loss": 1.4722, + "step": 3104 + }, + { + "epoch": 8.460490463215258, + "grad_norm": 12.599777221679688, + "learning_rate": 1.984402415256426e-05, + "loss": 1.708, + "step": 3105 + }, + { + "epoch": 8.463215258855586, + "grad_norm": 10.403139114379883, + "learning_rate": 1.984386885564669e-05, + "loss": 1.3508, + "step": 3106 + }, + { + "epoch": 8.465940054495913, + "grad_norm": 16.842971801757812, + "learning_rate": 1.984371348206539e-05, + "loss": 1.4905, + "step": 3107 + }, + { + "epoch": 8.46866485013624, + "grad_norm": 13.428004264831543, + "learning_rate": 1.9843558031821563e-05, + "loss": 1.6121, + "step": 3108 + }, + { + "epoch": 8.471389645776567, + "grad_norm": 12.502063751220703, + "learning_rate": 1.9843402504916424e-05, + "loss": 1.7378, + "step": 3109 + }, + { + "epoch": 8.474114441416894, + "grad_norm": 8.010069847106934, + "learning_rate": 1.9843246901351184e-05, + "loss": 1.3679, + "step": 3110 + }, + { + "epoch": 8.47683923705722, + "grad_norm": 11.141092300415039, + "learning_rate": 1.9843091221127053e-05, + "loss": 1.5574, + "step": 3111 + }, + { + "epoch": 8.479564032697548, + "grad_norm": 17.215499877929688, + "learning_rate": 1.9842935464245245e-05, + "loss": 1.5002, + "step": 3112 + }, + { + "epoch": 8.482288828337875, + "grad_norm": 10.081450462341309, + "learning_rate": 1.9842779630706972e-05, + "loss": 1.3403, + "step": 3113 + }, + { + "epoch": 8.485013623978201, + "grad_norm": 10.36174488067627, + "learning_rate": 1.9842623720513447e-05, + "loss": 1.4783, + "step": 3114 + }, + { + "epoch": 8.487738419618529, + "grad_norm": 9.917871475219727, + "learning_rate": 1.9842467733665886e-05, + "loss": 1.3081, + "step": 3115 + }, + { + "epoch": 8.490463215258856, + "grad_norm": 13.55300235748291, + "learning_rate": 1.9842311670165503e-05, + "loss": 1.3501, + "step": 3116 + }, + { + "epoch": 8.493188010899182, + "grad_norm": 10.539414405822754, + "learning_rate": 1.9842155530013514e-05, + "loss": 1.4915, + "step": 3117 + }, + { + "epoch": 8.49591280653951, + "grad_norm": 14.190298080444336, + "learning_rate": 1.9841999313211135e-05, + "loss": 1.5364, + "step": 3118 + }, + { + "epoch": 8.498637602179837, + "grad_norm": 11.394745826721191, + "learning_rate": 1.9841843019759583e-05, + "loss": 1.427, + "step": 3119 + }, + { + "epoch": 8.501362397820163, + "grad_norm": 11.221658706665039, + "learning_rate": 1.984168664966007e-05, + "loss": 1.394, + "step": 3120 + }, + { + "epoch": 8.50408719346049, + "grad_norm": 13.456465721130371, + "learning_rate": 1.9841530202913822e-05, + "loss": 1.386, + "step": 3121 + }, + { + "epoch": 8.506811989100818, + "grad_norm": 12.035820960998535, + "learning_rate": 1.984137367952205e-05, + "loss": 1.4299, + "step": 3122 + }, + { + "epoch": 8.509536784741144, + "grad_norm": 12.752290725708008, + "learning_rate": 1.984121707948598e-05, + "loss": 1.5894, + "step": 3123 + }, + { + "epoch": 8.512261580381471, + "grad_norm": 10.289709091186523, + "learning_rate": 1.9841060402806826e-05, + "loss": 1.4592, + "step": 3124 + }, + { + "epoch": 8.514986376021799, + "grad_norm": 12.596096992492676, + "learning_rate": 1.9840903649485812e-05, + "loss": 1.4778, + "step": 3125 + }, + { + "epoch": 8.517711171662125, + "grad_norm": 9.822829246520996, + "learning_rate": 1.9840746819524157e-05, + "loss": 1.3276, + "step": 3126 + }, + { + "epoch": 8.520435967302452, + "grad_norm": 11.025153160095215, + "learning_rate": 1.9840589912923082e-05, + "loss": 1.3391, + "step": 3127 + }, + { + "epoch": 8.52316076294278, + "grad_norm": 14.443016052246094, + "learning_rate": 1.984043292968381e-05, + "loss": 1.3357, + "step": 3128 + }, + { + "epoch": 8.525885558583106, + "grad_norm": 11.228981971740723, + "learning_rate": 1.984027586980756e-05, + "loss": 1.4622, + "step": 3129 + }, + { + "epoch": 8.528610354223433, + "grad_norm": 9.984880447387695, + "learning_rate": 1.984011873329556e-05, + "loss": 1.196, + "step": 3130 + }, + { + "epoch": 8.53133514986376, + "grad_norm": 14.243448257446289, + "learning_rate": 1.9839961520149035e-05, + "loss": 1.4465, + "step": 3131 + }, + { + "epoch": 8.534059945504087, + "grad_norm": 17.242151260375977, + "learning_rate": 1.9839804230369204e-05, + "loss": 1.3835, + "step": 3132 + }, + { + "epoch": 8.536784741144414, + "grad_norm": 10.174351692199707, + "learning_rate": 1.9839646863957294e-05, + "loss": 1.325, + "step": 3133 + }, + { + "epoch": 8.539509536784742, + "grad_norm": 14.6315279006958, + "learning_rate": 1.9839489420914533e-05, + "loss": 1.3896, + "step": 3134 + }, + { + "epoch": 8.542234332425068, + "grad_norm": 10.157470703125, + "learning_rate": 1.9839331901242144e-05, + "loss": 1.4033, + "step": 3135 + }, + { + "epoch": 8.544959128065395, + "grad_norm": 11.893716812133789, + "learning_rate": 1.983917430494135e-05, + "loss": 1.4417, + "step": 3136 + }, + { + "epoch": 8.547683923705723, + "grad_norm": 10.006495475769043, + "learning_rate": 1.9839016632013388e-05, + "loss": 1.48, + "step": 3137 + }, + { + "epoch": 8.550408719346049, + "grad_norm": 9.870905876159668, + "learning_rate": 1.9838858882459483e-05, + "loss": 1.562, + "step": 3138 + }, + { + "epoch": 8.553133514986376, + "grad_norm": 9.79379940032959, + "learning_rate": 1.9838701056280857e-05, + "loss": 1.2852, + "step": 3139 + }, + { + "epoch": 8.555858310626704, + "grad_norm": 14.175224304199219, + "learning_rate": 1.9838543153478746e-05, + "loss": 1.3904, + "step": 3140 + }, + { + "epoch": 8.55858310626703, + "grad_norm": 11.184218406677246, + "learning_rate": 1.9838385174054376e-05, + "loss": 1.4192, + "step": 3141 + }, + { + "epoch": 8.561307901907357, + "grad_norm": 14.325691223144531, + "learning_rate": 1.9838227118008982e-05, + "loss": 1.5825, + "step": 3142 + }, + { + "epoch": 8.564032697547685, + "grad_norm": 10.817137718200684, + "learning_rate": 1.983806898534379e-05, + "loss": 1.3391, + "step": 3143 + }, + { + "epoch": 8.56675749318801, + "grad_norm": 9.145304679870605, + "learning_rate": 1.9837910776060036e-05, + "loss": 1.4397, + "step": 3144 + }, + { + "epoch": 8.569482288828338, + "grad_norm": 8.59023666381836, + "learning_rate": 1.9837752490158946e-05, + "loss": 1.3081, + "step": 3145 + }, + { + "epoch": 8.572207084468666, + "grad_norm": 9.126311302185059, + "learning_rate": 1.9837594127641758e-05, + "loss": 1.4802, + "step": 3146 + }, + { + "epoch": 8.574931880108991, + "grad_norm": 9.468857765197754, + "learning_rate": 1.9837435688509704e-05, + "loss": 1.3608, + "step": 3147 + }, + { + "epoch": 8.577656675749319, + "grad_norm": 10.783597946166992, + "learning_rate": 1.9837277172764016e-05, + "loss": 1.5986, + "step": 3148 + }, + { + "epoch": 8.580381471389646, + "grad_norm": 9.311051368713379, + "learning_rate": 1.9837118580405928e-05, + "loss": 1.3455, + "step": 3149 + }, + { + "epoch": 8.583106267029972, + "grad_norm": 17.301712036132812, + "learning_rate": 1.9836959911436682e-05, + "loss": 1.5852, + "step": 3150 + }, + { + "epoch": 8.5858310626703, + "grad_norm": 9.285280227661133, + "learning_rate": 1.9836801165857507e-05, + "loss": 1.4199, + "step": 3151 + }, + { + "epoch": 8.588555858310627, + "grad_norm": 11.945184707641602, + "learning_rate": 1.983664234366964e-05, + "loss": 1.4299, + "step": 3152 + }, + { + "epoch": 8.591280653950953, + "grad_norm": 10.90672779083252, + "learning_rate": 1.9836483444874317e-05, + "loss": 1.3088, + "step": 3153 + }, + { + "epoch": 8.59400544959128, + "grad_norm": 9.78835678100586, + "learning_rate": 1.9836324469472782e-05, + "loss": 1.447, + "step": 3154 + }, + { + "epoch": 8.596730245231608, + "grad_norm": 11.199138641357422, + "learning_rate": 1.9836165417466266e-05, + "loss": 1.3364, + "step": 3155 + }, + { + "epoch": 8.599455040871934, + "grad_norm": 10.1149320602417, + "learning_rate": 1.983600628885601e-05, + "loss": 1.4536, + "step": 3156 + }, + { + "epoch": 8.602179836512262, + "grad_norm": 15.373045921325684, + "learning_rate": 1.9835847083643256e-05, + "loss": 1.7036, + "step": 3157 + }, + { + "epoch": 8.60490463215259, + "grad_norm": 11.325897216796875, + "learning_rate": 1.983568780182924e-05, + "loss": 1.3481, + "step": 3158 + }, + { + "epoch": 8.607629427792915, + "grad_norm": 10.771793365478516, + "learning_rate": 1.9835528443415205e-05, + "loss": 1.4155, + "step": 3159 + }, + { + "epoch": 8.610354223433243, + "grad_norm": 11.561205863952637, + "learning_rate": 1.983536900840239e-05, + "loss": 1.4573, + "step": 3160 + }, + { + "epoch": 8.61307901907357, + "grad_norm": 15.841632843017578, + "learning_rate": 1.9835209496792038e-05, + "loss": 1.5005, + "step": 3161 + }, + { + "epoch": 8.615803814713896, + "grad_norm": 10.387455940246582, + "learning_rate": 1.9835049908585388e-05, + "loss": 1.2476, + "step": 3162 + }, + { + "epoch": 8.618528610354224, + "grad_norm": 10.735313415527344, + "learning_rate": 1.983489024378369e-05, + "loss": 1.3098, + "step": 3163 + }, + { + "epoch": 8.621253405994551, + "grad_norm": 8.47869873046875, + "learning_rate": 1.983473050238818e-05, + "loss": 1.1816, + "step": 3164 + }, + { + "epoch": 8.623978201634877, + "grad_norm": 12.40446662902832, + "learning_rate": 1.983457068440011e-05, + "loss": 1.2859, + "step": 3165 + }, + { + "epoch": 8.626702997275205, + "grad_norm": 11.339210510253906, + "learning_rate": 1.983441078982072e-05, + "loss": 1.489, + "step": 3166 + }, + { + "epoch": 8.629427792915532, + "grad_norm": 18.086868286132812, + "learning_rate": 1.983425081865125e-05, + "loss": 1.4016, + "step": 3167 + }, + { + "epoch": 8.632152588555858, + "grad_norm": 7.482706069946289, + "learning_rate": 1.9834090770892952e-05, + "loss": 1.5005, + "step": 3168 + }, + { + "epoch": 8.634877384196185, + "grad_norm": 9.909168243408203, + "learning_rate": 1.9833930646547074e-05, + "loss": 1.3108, + "step": 3169 + }, + { + "epoch": 8.637602179836513, + "grad_norm": 14.946528434753418, + "learning_rate": 1.983377044561486e-05, + "loss": 1.592, + "step": 3170 + }, + { + "epoch": 8.640326975476839, + "grad_norm": 11.477744102478027, + "learning_rate": 1.9833610168097558e-05, + "loss": 1.4348, + "step": 3171 + }, + { + "epoch": 8.643051771117166, + "grad_norm": 13.602697372436523, + "learning_rate": 1.9833449813996416e-05, + "loss": 1.6536, + "step": 3172 + }, + { + "epoch": 8.645776566757494, + "grad_norm": 9.349848747253418, + "learning_rate": 1.9833289383312687e-05, + "loss": 1.3394, + "step": 3173 + }, + { + "epoch": 8.64850136239782, + "grad_norm": 11.529946327209473, + "learning_rate": 1.9833128876047612e-05, + "loss": 1.5176, + "step": 3174 + }, + { + "epoch": 8.651226158038147, + "grad_norm": 11.247405052185059, + "learning_rate": 1.9832968292202447e-05, + "loss": 1.4001, + "step": 3175 + }, + { + "epoch": 8.653950953678475, + "grad_norm": 7.817025184631348, + "learning_rate": 1.9832807631778443e-05, + "loss": 1.3018, + "step": 3176 + }, + { + "epoch": 8.6566757493188, + "grad_norm": 11.277419090270996, + "learning_rate": 1.9832646894776847e-05, + "loss": 1.5171, + "step": 3177 + }, + { + "epoch": 8.659400544959128, + "grad_norm": 9.400995254516602, + "learning_rate": 1.9832486081198915e-05, + "loss": 1.3835, + "step": 3178 + }, + { + "epoch": 8.662125340599456, + "grad_norm": 8.203719139099121, + "learning_rate": 1.9832325191045898e-05, + "loss": 1.2866, + "step": 3179 + }, + { + "epoch": 8.664850136239782, + "grad_norm": 10.158937454223633, + "learning_rate": 1.983216422431905e-05, + "loss": 1.4116, + "step": 3180 + }, + { + "epoch": 8.66757493188011, + "grad_norm": 9.965296745300293, + "learning_rate": 1.9832003181019622e-05, + "loss": 1.3708, + "step": 3181 + }, + { + "epoch": 8.670299727520437, + "grad_norm": 11.576178550720215, + "learning_rate": 1.983184206114887e-05, + "loss": 1.3733, + "step": 3182 + }, + { + "epoch": 8.673024523160763, + "grad_norm": 12.1446533203125, + "learning_rate": 1.983168086470805e-05, + "loss": 1.3831, + "step": 3183 + }, + { + "epoch": 8.67574931880109, + "grad_norm": 9.264537811279297, + "learning_rate": 1.9831519591698413e-05, + "loss": 1.4524, + "step": 3184 + }, + { + "epoch": 8.678474114441418, + "grad_norm": 11.140650749206543, + "learning_rate": 1.983135824212122e-05, + "loss": 1.6309, + "step": 3185 + }, + { + "epoch": 8.681198910081743, + "grad_norm": 9.234440803527832, + "learning_rate": 1.9831196815977724e-05, + "loss": 1.5391, + "step": 3186 + }, + { + "epoch": 8.683923705722071, + "grad_norm": 10.074746131896973, + "learning_rate": 1.9831035313269185e-05, + "loss": 1.582, + "step": 3187 + }, + { + "epoch": 8.686648501362399, + "grad_norm": 10.477161407470703, + "learning_rate": 1.9830873733996857e-05, + "loss": 1.5674, + "step": 3188 + }, + { + "epoch": 8.689373297002724, + "grad_norm": 8.84496784210205, + "learning_rate": 1.9830712078162e-05, + "loss": 1.4683, + "step": 3189 + }, + { + "epoch": 8.692098092643052, + "grad_norm": 9.623519897460938, + "learning_rate": 1.983055034576588e-05, + "loss": 1.5715, + "step": 3190 + }, + { + "epoch": 8.69482288828338, + "grad_norm": 27.9208927154541, + "learning_rate": 1.9830388536809746e-05, + "loss": 1.418, + "step": 3191 + }, + { + "epoch": 8.697547683923705, + "grad_norm": 14.704259872436523, + "learning_rate": 1.983022665129486e-05, + "loss": 1.6104, + "step": 3192 + }, + { + "epoch": 8.700272479564033, + "grad_norm": 10.346733093261719, + "learning_rate": 1.983006468922249e-05, + "loss": 1.5295, + "step": 3193 + }, + { + "epoch": 8.70299727520436, + "grad_norm": 7.489201068878174, + "learning_rate": 1.982990265059389e-05, + "loss": 1.408, + "step": 3194 + }, + { + "epoch": 8.705722070844686, + "grad_norm": 9.454360961914062, + "learning_rate": 1.9829740535410326e-05, + "loss": 1.3833, + "step": 3195 + }, + { + "epoch": 8.708446866485014, + "grad_norm": 10.133238792419434, + "learning_rate": 1.9829578343673058e-05, + "loss": 1.439, + "step": 3196 + }, + { + "epoch": 8.711171662125341, + "grad_norm": 10.01593017578125, + "learning_rate": 1.982941607538335e-05, + "loss": 1.623, + "step": 3197 + }, + { + "epoch": 8.713896457765667, + "grad_norm": 9.866012573242188, + "learning_rate": 1.9829253730542466e-05, + "loss": 1.325, + "step": 3198 + }, + { + "epoch": 8.716621253405995, + "grad_norm": 9.05703353881836, + "learning_rate": 1.9829091309151672e-05, + "loss": 1.3975, + "step": 3199 + }, + { + "epoch": 8.719346049046322, + "grad_norm": 8.689501762390137, + "learning_rate": 1.9828928811212228e-05, + "loss": 1.355, + "step": 3200 + }, + { + "epoch": 8.722070844686648, + "grad_norm": 89.05525207519531, + "learning_rate": 1.9828766236725406e-05, + "loss": 1.4399, + "step": 3201 + }, + { + "epoch": 8.724795640326976, + "grad_norm": 8.031493186950684, + "learning_rate": 1.9828603585692468e-05, + "loss": 1.1775, + "step": 3202 + }, + { + "epoch": 8.727520435967303, + "grad_norm": 9.144047737121582, + "learning_rate": 1.982844085811468e-05, + "loss": 1.5012, + "step": 3203 + }, + { + "epoch": 8.730245231607629, + "grad_norm": 8.287677764892578, + "learning_rate": 1.9828278053993313e-05, + "loss": 1.2903, + "step": 3204 + }, + { + "epoch": 8.732970027247957, + "grad_norm": 9.539989471435547, + "learning_rate": 1.982811517332963e-05, + "loss": 1.3569, + "step": 3205 + }, + { + "epoch": 8.735694822888284, + "grad_norm": 10.297660827636719, + "learning_rate": 1.9827952216124908e-05, + "loss": 1.6138, + "step": 3206 + }, + { + "epoch": 8.73841961852861, + "grad_norm": 9.752589225769043, + "learning_rate": 1.9827789182380407e-05, + "loss": 1.2336, + "step": 3207 + }, + { + "epoch": 8.741144414168938, + "grad_norm": 11.144782066345215, + "learning_rate": 1.9827626072097395e-05, + "loss": 1.3674, + "step": 3208 + }, + { + "epoch": 8.743869209809265, + "grad_norm": 11.73814582824707, + "learning_rate": 1.9827462885277155e-05, + "loss": 1.4758, + "step": 3209 + }, + { + "epoch": 8.746594005449591, + "grad_norm": 11.165502548217773, + "learning_rate": 1.9827299621920948e-05, + "loss": 1.5583, + "step": 3210 + }, + { + "epoch": 8.749318801089919, + "grad_norm": 10.431931495666504, + "learning_rate": 1.982713628203005e-05, + "loss": 1.5918, + "step": 3211 + }, + { + "epoch": 8.752043596730246, + "grad_norm": 14.608397483825684, + "learning_rate": 1.9826972865605725e-05, + "loss": 1.5596, + "step": 3212 + }, + { + "epoch": 8.754768392370572, + "grad_norm": 9.00948429107666, + "learning_rate": 1.9826809372649258e-05, + "loss": 1.5117, + "step": 3213 + }, + { + "epoch": 8.7574931880109, + "grad_norm": 11.614974021911621, + "learning_rate": 1.982664580316191e-05, + "loss": 1.5029, + "step": 3214 + }, + { + "epoch": 8.760217983651227, + "grad_norm": 10.131213188171387, + "learning_rate": 1.9826482157144962e-05, + "loss": 1.4861, + "step": 3215 + }, + { + "epoch": 8.762942779291553, + "grad_norm": 12.708951950073242, + "learning_rate": 1.9826318434599693e-05, + "loss": 1.4624, + "step": 3216 + }, + { + "epoch": 8.76566757493188, + "grad_norm": 10.052382469177246, + "learning_rate": 1.9826154635527368e-05, + "loss": 1.5754, + "step": 3217 + }, + { + "epoch": 8.768392370572208, + "grad_norm": 9.058707237243652, + "learning_rate": 1.982599075992927e-05, + "loss": 1.5889, + "step": 3218 + }, + { + "epoch": 8.771117166212534, + "grad_norm": 12.47221851348877, + "learning_rate": 1.9825826807806665e-05, + "loss": 1.3899, + "step": 3219 + }, + { + "epoch": 8.773841961852861, + "grad_norm": 9.93853759765625, + "learning_rate": 1.9825662779160843e-05, + "loss": 1.4197, + "step": 3220 + }, + { + "epoch": 8.776566757493189, + "grad_norm": 12.409202575683594, + "learning_rate": 1.9825498673993074e-05, + "loss": 1.4915, + "step": 3221 + }, + { + "epoch": 8.779291553133515, + "grad_norm": 11.034850120544434, + "learning_rate": 1.9825334492304637e-05, + "loss": 1.3545, + "step": 3222 + }, + { + "epoch": 8.782016348773842, + "grad_norm": 13.478449821472168, + "learning_rate": 1.9825170234096812e-05, + "loss": 1.4248, + "step": 3223 + }, + { + "epoch": 8.78474114441417, + "grad_norm": 9.65610122680664, + "learning_rate": 1.9825005899370877e-05, + "loss": 1.7104, + "step": 3224 + }, + { + "epoch": 8.787465940054496, + "grad_norm": 14.528332710266113, + "learning_rate": 1.982484148812811e-05, + "loss": 1.4719, + "step": 3225 + }, + { + "epoch": 8.790190735694823, + "grad_norm": 21.48270034790039, + "learning_rate": 1.9824677000369798e-05, + "loss": 1.5227, + "step": 3226 + }, + { + "epoch": 8.79291553133515, + "grad_norm": 9.869617462158203, + "learning_rate": 1.9824512436097216e-05, + "loss": 1.5923, + "step": 3227 + }, + { + "epoch": 8.795640326975477, + "grad_norm": 12.607680320739746, + "learning_rate": 1.9824347795311646e-05, + "loss": 1.3701, + "step": 3228 + }, + { + "epoch": 8.798365122615804, + "grad_norm": 9.923628807067871, + "learning_rate": 1.9824183078014373e-05, + "loss": 1.4026, + "step": 3229 + }, + { + "epoch": 8.80108991825613, + "grad_norm": 9.845184326171875, + "learning_rate": 1.9824018284206677e-05, + "loss": 1.3467, + "step": 3230 + }, + { + "epoch": 8.803814713896458, + "grad_norm": 10.393508911132812, + "learning_rate": 1.9823853413889846e-05, + "loss": 1.429, + "step": 3231 + }, + { + "epoch": 8.806539509536785, + "grad_norm": 8.768599510192871, + "learning_rate": 1.982368846706516e-05, + "loss": 1.3774, + "step": 3232 + }, + { + "epoch": 8.809264305177111, + "grad_norm": 10.29957103729248, + "learning_rate": 1.98235234437339e-05, + "loss": 1.5173, + "step": 3233 + }, + { + "epoch": 8.811989100817438, + "grad_norm": 11.418523788452148, + "learning_rate": 1.982335834389736e-05, + "loss": 1.3774, + "step": 3234 + }, + { + "epoch": 8.814713896457766, + "grad_norm": 13.813346862792969, + "learning_rate": 1.982319316755682e-05, + "loss": 1.5896, + "step": 3235 + }, + { + "epoch": 8.817438692098092, + "grad_norm": 13.180110931396484, + "learning_rate": 1.9823027914713567e-05, + "loss": 1.4475, + "step": 3236 + }, + { + "epoch": 8.82016348773842, + "grad_norm": 9.238238334655762, + "learning_rate": 1.982286258536889e-05, + "loss": 1.3816, + "step": 3237 + }, + { + "epoch": 8.822888283378747, + "grad_norm": 15.085087776184082, + "learning_rate": 1.9822697179524074e-05, + "loss": 1.7009, + "step": 3238 + }, + { + "epoch": 8.825613079019073, + "grad_norm": 9.169953346252441, + "learning_rate": 1.9822531697180412e-05, + "loss": 1.4221, + "step": 3239 + }, + { + "epoch": 8.8283378746594, + "grad_norm": 8.766127586364746, + "learning_rate": 1.9822366138339185e-05, + "loss": 1.5503, + "step": 3240 + }, + { + "epoch": 8.831062670299728, + "grad_norm": 8.895727157592773, + "learning_rate": 1.982220050300169e-05, + "loss": 1.5767, + "step": 3241 + }, + { + "epoch": 8.833787465940054, + "grad_norm": 18.501556396484375, + "learning_rate": 1.982203479116921e-05, + "loss": 1.6104, + "step": 3242 + }, + { + "epoch": 8.836512261580381, + "grad_norm": 9.487771987915039, + "learning_rate": 1.982186900284304e-05, + "loss": 1.5347, + "step": 3243 + }, + { + "epoch": 8.839237057220709, + "grad_norm": 8.779281616210938, + "learning_rate": 1.982170313802447e-05, + "loss": 1.5388, + "step": 3244 + }, + { + "epoch": 8.841961852861035, + "grad_norm": 15.55836009979248, + "learning_rate": 1.9821537196714797e-05, + "loss": 1.3896, + "step": 3245 + }, + { + "epoch": 8.844686648501362, + "grad_norm": 22.404815673828125, + "learning_rate": 1.9821371178915307e-05, + "loss": 1.6101, + "step": 3246 + }, + { + "epoch": 8.84741144414169, + "grad_norm": 10.606950759887695, + "learning_rate": 1.9821205084627292e-05, + "loss": 1.4644, + "step": 3247 + }, + { + "epoch": 8.850136239782016, + "grad_norm": 10.240605354309082, + "learning_rate": 1.982103891385205e-05, + "loss": 1.3381, + "step": 3248 + }, + { + "epoch": 8.852861035422343, + "grad_norm": 21.625900268554688, + "learning_rate": 1.982087266659087e-05, + "loss": 1.3345, + "step": 3249 + }, + { + "epoch": 8.85558583106267, + "grad_norm": 9.106072425842285, + "learning_rate": 1.982070634284505e-05, + "loss": 1.2634, + "step": 3250 + }, + { + "epoch": 8.858310626702997, + "grad_norm": 11.157843589782715, + "learning_rate": 1.9820539942615883e-05, + "loss": 1.4194, + "step": 3251 + }, + { + "epoch": 8.861035422343324, + "grad_norm": 11.39349365234375, + "learning_rate": 1.9820373465904672e-05, + "loss": 1.3013, + "step": 3252 + }, + { + "epoch": 8.863760217983652, + "grad_norm": 12.323468208312988, + "learning_rate": 1.982020691271271e-05, + "loss": 1.4363, + "step": 3253 + }, + { + "epoch": 8.866485013623977, + "grad_norm": 9.340956687927246, + "learning_rate": 1.9820040283041287e-05, + "loss": 1.322, + "step": 3254 + }, + { + "epoch": 8.869209809264305, + "grad_norm": 10.117134094238281, + "learning_rate": 1.9819873576891707e-05, + "loss": 1.4644, + "step": 3255 + }, + { + "epoch": 8.871934604904633, + "grad_norm": 11.121735572814941, + "learning_rate": 1.981970679426527e-05, + "loss": 1.4331, + "step": 3256 + }, + { + "epoch": 8.874659400544958, + "grad_norm": 12.51620864868164, + "learning_rate": 1.9819539935163272e-05, + "loss": 1.7354, + "step": 3257 + }, + { + "epoch": 8.877384196185286, + "grad_norm": 14.289231300354004, + "learning_rate": 1.9819372999587015e-05, + "loss": 1.5076, + "step": 3258 + }, + { + "epoch": 8.880108991825614, + "grad_norm": 9.565315246582031, + "learning_rate": 1.9819205987537792e-05, + "loss": 1.468, + "step": 3259 + }, + { + "epoch": 8.88283378746594, + "grad_norm": 34.520606994628906, + "learning_rate": 1.9819038899016913e-05, + "loss": 1.3535, + "step": 3260 + }, + { + "epoch": 8.885558583106267, + "grad_norm": 8.638131141662598, + "learning_rate": 1.9818871734025672e-05, + "loss": 1.188, + "step": 3261 + }, + { + "epoch": 8.888283378746594, + "grad_norm": 9.826519966125488, + "learning_rate": 1.9818704492565378e-05, + "loss": 1.5161, + "step": 3262 + }, + { + "epoch": 8.89100817438692, + "grad_norm": 10.681777954101562, + "learning_rate": 1.9818537174637328e-05, + "loss": 1.2725, + "step": 3263 + }, + { + "epoch": 8.893732970027248, + "grad_norm": 9.70865535736084, + "learning_rate": 1.9818369780242822e-05, + "loss": 1.4285, + "step": 3264 + }, + { + "epoch": 8.896457765667575, + "grad_norm": 9.900568962097168, + "learning_rate": 1.9818202309383173e-05, + "loss": 1.3413, + "step": 3265 + }, + { + "epoch": 8.899182561307901, + "grad_norm": 11.357996940612793, + "learning_rate": 1.9818034762059678e-05, + "loss": 1.6782, + "step": 3266 + }, + { + "epoch": 8.901907356948229, + "grad_norm": 9.975435256958008, + "learning_rate": 1.9817867138273645e-05, + "loss": 1.5435, + "step": 3267 + }, + { + "epoch": 8.904632152588556, + "grad_norm": 7.961818218231201, + "learning_rate": 1.981769943802638e-05, + "loss": 1.2671, + "step": 3268 + }, + { + "epoch": 8.907356948228882, + "grad_norm": 10.005882263183594, + "learning_rate": 1.981753166131919e-05, + "loss": 1.2932, + "step": 3269 + }, + { + "epoch": 8.91008174386921, + "grad_norm": 10.420265197753906, + "learning_rate": 1.9817363808153372e-05, + "loss": 1.5381, + "step": 3270 + }, + { + "epoch": 8.912806539509537, + "grad_norm": 19.911571502685547, + "learning_rate": 1.9817195878530247e-05, + "loss": 1.521, + "step": 3271 + }, + { + "epoch": 8.915531335149863, + "grad_norm": 10.7108736038208, + "learning_rate": 1.9817027872451112e-05, + "loss": 1.334, + "step": 3272 + }, + { + "epoch": 8.91825613079019, + "grad_norm": 10.443603515625, + "learning_rate": 1.9816859789917283e-05, + "loss": 1.604, + "step": 3273 + }, + { + "epoch": 8.920980926430518, + "grad_norm": 14.452402114868164, + "learning_rate": 1.9816691630930067e-05, + "loss": 1.3765, + "step": 3274 + }, + { + "epoch": 8.923705722070844, + "grad_norm": 14.351840019226074, + "learning_rate": 1.981652339549077e-05, + "loss": 1.5569, + "step": 3275 + }, + { + "epoch": 8.926430517711172, + "grad_norm": 11.948895454406738, + "learning_rate": 1.9816355083600704e-05, + "loss": 1.2886, + "step": 3276 + }, + { + "epoch": 8.9291553133515, + "grad_norm": 10.655186653137207, + "learning_rate": 1.9816186695261184e-05, + "loss": 1.5349, + "step": 3277 + }, + { + "epoch": 8.931880108991825, + "grad_norm": 9.585867881774902, + "learning_rate": 1.981601823047352e-05, + "loss": 1.322, + "step": 3278 + }, + { + "epoch": 8.934604904632153, + "grad_norm": 10.423274040222168, + "learning_rate": 1.9815849689239015e-05, + "loss": 1.3765, + "step": 3279 + }, + { + "epoch": 8.93732970027248, + "grad_norm": 8.449317932128906, + "learning_rate": 1.9815681071558992e-05, + "loss": 1.3672, + "step": 3280 + }, + { + "epoch": 8.940054495912806, + "grad_norm": 9.676054954528809, + "learning_rate": 1.9815512377434757e-05, + "loss": 1.4561, + "step": 3281 + }, + { + "epoch": 8.942779291553133, + "grad_norm": 9.170092582702637, + "learning_rate": 1.9815343606867632e-05, + "loss": 1.4819, + "step": 3282 + }, + { + "epoch": 8.945504087193461, + "grad_norm": 10.363265037536621, + "learning_rate": 1.9815174759858927e-05, + "loss": 1.418, + "step": 3283 + }, + { + "epoch": 8.948228882833787, + "grad_norm": 11.943129539489746, + "learning_rate": 1.9815005836409954e-05, + "loss": 1.2542, + "step": 3284 + }, + { + "epoch": 8.950953678474114, + "grad_norm": 14.964985847473145, + "learning_rate": 1.9814836836522035e-05, + "loss": 1.5339, + "step": 3285 + }, + { + "epoch": 8.953678474114442, + "grad_norm": 7.762907981872559, + "learning_rate": 1.981466776019648e-05, + "loss": 1.2019, + "step": 3286 + }, + { + "epoch": 8.956403269754768, + "grad_norm": 9.729695320129395, + "learning_rate": 1.9814498607434607e-05, + "loss": 1.2307, + "step": 3287 + }, + { + "epoch": 8.959128065395095, + "grad_norm": 8.820679664611816, + "learning_rate": 1.9814329378237738e-05, + "loss": 1.2688, + "step": 3288 + }, + { + "epoch": 8.961852861035423, + "grad_norm": 8.336542129516602, + "learning_rate": 1.9814160072607188e-05, + "loss": 1.4619, + "step": 3289 + }, + { + "epoch": 8.964577656675749, + "grad_norm": 8.730629920959473, + "learning_rate": 1.981399069054427e-05, + "loss": 1.5325, + "step": 3290 + }, + { + "epoch": 8.967302452316076, + "grad_norm": 10.467671394348145, + "learning_rate": 1.981382123205031e-05, + "loss": 1.4546, + "step": 3291 + }, + { + "epoch": 8.970027247956404, + "grad_norm": 9.506669998168945, + "learning_rate": 1.981365169712663e-05, + "loss": 1.5806, + "step": 3292 + }, + { + "epoch": 8.97275204359673, + "grad_norm": 9.008421897888184, + "learning_rate": 1.9813482085774548e-05, + "loss": 1.5046, + "step": 3293 + }, + { + "epoch": 8.975476839237057, + "grad_norm": 11.48160171508789, + "learning_rate": 1.9813312397995376e-05, + "loss": 1.574, + "step": 3294 + }, + { + "epoch": 8.978201634877385, + "grad_norm": 8.973231315612793, + "learning_rate": 1.9813142633790448e-05, + "loss": 1.3826, + "step": 3295 + }, + { + "epoch": 8.98092643051771, + "grad_norm": 10.221563339233398, + "learning_rate": 1.9812972793161077e-05, + "loss": 1.3994, + "step": 3296 + }, + { + "epoch": 8.983651226158038, + "grad_norm": 9.588338851928711, + "learning_rate": 1.9812802876108593e-05, + "loss": 1.376, + "step": 3297 + }, + { + "epoch": 8.986376021798366, + "grad_norm": 8.09337329864502, + "learning_rate": 1.9812632882634316e-05, + "loss": 1.1482, + "step": 3298 + }, + { + "epoch": 8.989100817438691, + "grad_norm": 8.78427505493164, + "learning_rate": 1.981246281273957e-05, + "loss": 1.4067, + "step": 3299 + }, + { + "epoch": 8.991825613079019, + "grad_norm": 11.519981384277344, + "learning_rate": 1.981229266642568e-05, + "loss": 1.4851, + "step": 3300 + }, + { + "epoch": 8.994550408719347, + "grad_norm": 9.364227294921875, + "learning_rate": 1.9812122443693967e-05, + "loss": 1.2976, + "step": 3301 + }, + { + "epoch": 8.997275204359672, + "grad_norm": 9.506269454956055, + "learning_rate": 1.9811952144545764e-05, + "loss": 1.6685, + "step": 3302 + }, + { + "epoch": 9.0, + "grad_norm": 10.663548469543457, + "learning_rate": 1.9811781768982392e-05, + "loss": 1.5557, + "step": 3303 + }, + { + "epoch": 9.002724795640328, + "grad_norm": 7.8914361000061035, + "learning_rate": 1.981161131700518e-05, + "loss": 1.4429, + "step": 3304 + }, + { + "epoch": 9.005449591280653, + "grad_norm": 11.845026969909668, + "learning_rate": 1.9811440788615454e-05, + "loss": 1.3181, + "step": 3305 + }, + { + "epoch": 9.008174386920981, + "grad_norm": 8.106034278869629, + "learning_rate": 1.981127018381454e-05, + "loss": 1.3188, + "step": 3306 + }, + { + "epoch": 9.010899182561309, + "grad_norm": 9.699702262878418, + "learning_rate": 1.9811099502603775e-05, + "loss": 1.1958, + "step": 3307 + }, + { + "epoch": 9.013623978201634, + "grad_norm": 9.693281173706055, + "learning_rate": 1.981092874498448e-05, + "loss": 1.4805, + "step": 3308 + }, + { + "epoch": 9.016348773841962, + "grad_norm": 11.448603630065918, + "learning_rate": 1.981075791095799e-05, + "loss": 1.355, + "step": 3309 + }, + { + "epoch": 9.01907356948229, + "grad_norm": 10.993561744689941, + "learning_rate": 1.9810587000525632e-05, + "loss": 1.4246, + "step": 3310 + }, + { + "epoch": 9.021798365122615, + "grad_norm": 12.729100227355957, + "learning_rate": 1.9810416013688737e-05, + "loss": 1.3533, + "step": 3311 + }, + { + "epoch": 9.024523160762943, + "grad_norm": 8.636086463928223, + "learning_rate": 1.9810244950448636e-05, + "loss": 1.1777, + "step": 3312 + }, + { + "epoch": 9.02724795640327, + "grad_norm": 9.697944641113281, + "learning_rate": 1.9810073810806668e-05, + "loss": 1.1409, + "step": 3313 + }, + { + "epoch": 9.029972752043596, + "grad_norm": 9.793436050415039, + "learning_rate": 1.9809902594764157e-05, + "loss": 1.4097, + "step": 3314 + }, + { + "epoch": 9.032697547683924, + "grad_norm": 9.638480186462402, + "learning_rate": 1.9809731302322443e-05, + "loss": 1.3594, + "step": 3315 + }, + { + "epoch": 9.035422343324251, + "grad_norm": 8.224684715270996, + "learning_rate": 1.9809559933482853e-05, + "loss": 1.2893, + "step": 3316 + }, + { + "epoch": 9.038147138964577, + "grad_norm": 8.498680114746094, + "learning_rate": 1.980938848824673e-05, + "loss": 1.2251, + "step": 3317 + }, + { + "epoch": 9.040871934604905, + "grad_norm": 12.3306303024292, + "learning_rate": 1.9809216966615406e-05, + "loss": 1.1919, + "step": 3318 + }, + { + "epoch": 9.043596730245232, + "grad_norm": 10.12957763671875, + "learning_rate": 1.9809045368590215e-05, + "loss": 1.1763, + "step": 3319 + }, + { + "epoch": 9.046321525885558, + "grad_norm": 9.691681861877441, + "learning_rate": 1.980887369417249e-05, + "loss": 1.4958, + "step": 3320 + }, + { + "epoch": 9.049046321525886, + "grad_norm": 9.450521469116211, + "learning_rate": 1.9808701943363577e-05, + "loss": 1.3125, + "step": 3321 + }, + { + "epoch": 9.051771117166213, + "grad_norm": 10.486001968383789, + "learning_rate": 1.980853011616481e-05, + "loss": 1.3318, + "step": 3322 + }, + { + "epoch": 9.054495912806539, + "grad_norm": 9.702750205993652, + "learning_rate": 1.9808358212577524e-05, + "loss": 1.2874, + "step": 3323 + }, + { + "epoch": 9.057220708446867, + "grad_norm": 10.693781852722168, + "learning_rate": 1.980818623260306e-05, + "loss": 1.2964, + "step": 3324 + }, + { + "epoch": 9.059945504087194, + "grad_norm": 9.388365745544434, + "learning_rate": 1.9808014176242754e-05, + "loss": 1.4871, + "step": 3325 + }, + { + "epoch": 9.06267029972752, + "grad_norm": 22.220670700073242, + "learning_rate": 1.9807842043497953e-05, + "loss": 1.1562, + "step": 3326 + }, + { + "epoch": 9.065395095367847, + "grad_norm": 25.023902893066406, + "learning_rate": 1.9807669834369996e-05, + "loss": 1.4326, + "step": 3327 + }, + { + "epoch": 9.068119891008175, + "grad_norm": 8.872845649719238, + "learning_rate": 1.9807497548860218e-05, + "loss": 1.4065, + "step": 3328 + }, + { + "epoch": 9.0708446866485, + "grad_norm": 7.357226848602295, + "learning_rate": 1.9807325186969964e-05, + "loss": 1.0891, + "step": 3329 + }, + { + "epoch": 9.073569482288828, + "grad_norm": 12.355050086975098, + "learning_rate": 1.980715274870058e-05, + "loss": 1.2792, + "step": 3330 + }, + { + "epoch": 9.076294277929156, + "grad_norm": 9.479902267456055, + "learning_rate": 1.9806980234053405e-05, + "loss": 1.614, + "step": 3331 + }, + { + "epoch": 9.079019073569482, + "grad_norm": 12.747612953186035, + "learning_rate": 1.9806807643029786e-05, + "loss": 1.4459, + "step": 3332 + }, + { + "epoch": 9.08174386920981, + "grad_norm": 13.959284782409668, + "learning_rate": 1.9806634975631062e-05, + "loss": 1.1519, + "step": 3333 + }, + { + "epoch": 9.084468664850137, + "grad_norm": 8.461284637451172, + "learning_rate": 1.980646223185858e-05, + "loss": 1.4524, + "step": 3334 + }, + { + "epoch": 9.087193460490463, + "grad_norm": 7.815034866333008, + "learning_rate": 1.9806289411713686e-05, + "loss": 1.3975, + "step": 3335 + }, + { + "epoch": 9.08991825613079, + "grad_norm": 7.936162948608398, + "learning_rate": 1.9806116515197728e-05, + "loss": 1.4258, + "step": 3336 + }, + { + "epoch": 9.092643051771118, + "grad_norm": 10.635171890258789, + "learning_rate": 1.980594354231205e-05, + "loss": 1.2351, + "step": 3337 + }, + { + "epoch": 9.095367847411444, + "grad_norm": 15.045971870422363, + "learning_rate": 1.9805770493057994e-05, + "loss": 1.6394, + "step": 3338 + }, + { + "epoch": 9.098092643051771, + "grad_norm": 9.381028175354004, + "learning_rate": 1.980559736743692e-05, + "loss": 1.3196, + "step": 3339 + }, + { + "epoch": 9.100817438692099, + "grad_norm": 10.05689525604248, + "learning_rate": 1.9805424165450164e-05, + "loss": 1.3442, + "step": 3340 + }, + { + "epoch": 9.103542234332425, + "grad_norm": 8.947305679321289, + "learning_rate": 1.980525088709908e-05, + "loss": 1.2844, + "step": 3341 + }, + { + "epoch": 9.106267029972752, + "grad_norm": 9.874502182006836, + "learning_rate": 1.9805077532385024e-05, + "loss": 1.5862, + "step": 3342 + }, + { + "epoch": 9.10899182561308, + "grad_norm": 13.851561546325684, + "learning_rate": 1.9804904101309333e-05, + "loss": 1.3845, + "step": 3343 + }, + { + "epoch": 9.111716621253406, + "grad_norm": 8.135567665100098, + "learning_rate": 1.980473059387337e-05, + "loss": 1.4084, + "step": 3344 + }, + { + "epoch": 9.114441416893733, + "grad_norm": 9.141457557678223, + "learning_rate": 1.9804557010078475e-05, + "loss": 1.4294, + "step": 3345 + }, + { + "epoch": 9.11716621253406, + "grad_norm": 9.895256042480469, + "learning_rate": 1.9804383349926007e-05, + "loss": 1.2952, + "step": 3346 + }, + { + "epoch": 9.119891008174386, + "grad_norm": 9.32097339630127, + "learning_rate": 1.980420961341732e-05, + "loss": 1.4065, + "step": 3347 + }, + { + "epoch": 9.122615803814714, + "grad_norm": 9.12514591217041, + "learning_rate": 1.9804035800553764e-05, + "loss": 1.4473, + "step": 3348 + }, + { + "epoch": 9.125340599455042, + "grad_norm": 11.255130767822266, + "learning_rate": 1.980386191133669e-05, + "loss": 1.4034, + "step": 3349 + }, + { + "epoch": 9.128065395095367, + "grad_norm": 9.776803016662598, + "learning_rate": 1.9803687945767457e-05, + "loss": 1.1127, + "step": 3350 + }, + { + "epoch": 9.130790190735695, + "grad_norm": 10.613279342651367, + "learning_rate": 1.9803513903847418e-05, + "loss": 1.3342, + "step": 3351 + }, + { + "epoch": 9.133514986376023, + "grad_norm": 9.415681838989258, + "learning_rate": 1.9803339785577926e-05, + "loss": 1.271, + "step": 3352 + }, + { + "epoch": 9.136239782016348, + "grad_norm": 8.960698127746582, + "learning_rate": 1.980316559096034e-05, + "loss": 1.4492, + "step": 3353 + }, + { + "epoch": 9.138964577656676, + "grad_norm": 9.981202125549316, + "learning_rate": 1.9802991319996015e-05, + "loss": 1.5801, + "step": 3354 + }, + { + "epoch": 9.141689373297003, + "grad_norm": 9.422486305236816, + "learning_rate": 1.980281697268631e-05, + "loss": 1.2809, + "step": 3355 + }, + { + "epoch": 9.14441416893733, + "grad_norm": 8.67933464050293, + "learning_rate": 1.9802642549032585e-05, + "loss": 1.1875, + "step": 3356 + }, + { + "epoch": 9.147138964577657, + "grad_norm": 8.95732593536377, + "learning_rate": 1.9802468049036192e-05, + "loss": 1.396, + "step": 3357 + }, + { + "epoch": 9.149863760217984, + "grad_norm": 14.806777000427246, + "learning_rate": 1.9802293472698496e-05, + "loss": 1.2542, + "step": 3358 + }, + { + "epoch": 9.15258855585831, + "grad_norm": 10.63351821899414, + "learning_rate": 1.980211882002085e-05, + "loss": 1.5439, + "step": 3359 + }, + { + "epoch": 9.155313351498638, + "grad_norm": 11.304052352905273, + "learning_rate": 1.980194409100462e-05, + "loss": 1.333, + "step": 3360 + }, + { + "epoch": 9.158038147138965, + "grad_norm": 8.953567504882812, + "learning_rate": 1.9801769285651168e-05, + "loss": 1.4475, + "step": 3361 + }, + { + "epoch": 9.160762942779291, + "grad_norm": 10.894664764404297, + "learning_rate": 1.9801594403961844e-05, + "loss": 1.4678, + "step": 3362 + }, + { + "epoch": 9.163487738419619, + "grad_norm": 8.70775032043457, + "learning_rate": 1.9801419445938027e-05, + "loss": 1.2996, + "step": 3363 + }, + { + "epoch": 9.166212534059946, + "grad_norm": 8.957754135131836, + "learning_rate": 1.9801244411581068e-05, + "loss": 1.4502, + "step": 3364 + }, + { + "epoch": 9.168937329700272, + "grad_norm": 9.401688575744629, + "learning_rate": 1.980106930089233e-05, + "loss": 1.3315, + "step": 3365 + }, + { + "epoch": 9.1716621253406, + "grad_norm": 8.487594604492188, + "learning_rate": 1.980089411387318e-05, + "loss": 1.4373, + "step": 3366 + }, + { + "epoch": 9.174386920980927, + "grad_norm": 9.587615013122559, + "learning_rate": 1.9800718850524987e-05, + "loss": 1.4124, + "step": 3367 + }, + { + "epoch": 9.177111716621253, + "grad_norm": 9.357094764709473, + "learning_rate": 1.9800543510849107e-05, + "loss": 1.4082, + "step": 3368 + }, + { + "epoch": 9.17983651226158, + "grad_norm": 8.491287231445312, + "learning_rate": 1.980036809484691e-05, + "loss": 1.2317, + "step": 3369 + }, + { + "epoch": 9.182561307901908, + "grad_norm": 10.4268159866333, + "learning_rate": 1.9800192602519762e-05, + "loss": 1.5454, + "step": 3370 + }, + { + "epoch": 9.185286103542234, + "grad_norm": 10.99485969543457, + "learning_rate": 1.9800017033869033e-05, + "loss": 1.3677, + "step": 3371 + }, + { + "epoch": 9.188010899182562, + "grad_norm": 7.159212589263916, + "learning_rate": 1.979984138889608e-05, + "loss": 1.27, + "step": 3372 + }, + { + "epoch": 9.190735694822889, + "grad_norm": 10.803590774536133, + "learning_rate": 1.9799665667602282e-05, + "loss": 1.561, + "step": 3373 + }, + { + "epoch": 9.193460490463215, + "grad_norm": 9.76352310180664, + "learning_rate": 1.9799489869989003e-05, + "loss": 1.3806, + "step": 3374 + }, + { + "epoch": 9.196185286103542, + "grad_norm": 15.681282997131348, + "learning_rate": 1.979931399605761e-05, + "loss": 1.3535, + "step": 3375 + }, + { + "epoch": 9.19891008174387, + "grad_norm": 8.559199333190918, + "learning_rate": 1.9799138045809482e-05, + "loss": 1.4304, + "step": 3376 + }, + { + "epoch": 9.201634877384196, + "grad_norm": 8.302059173583984, + "learning_rate": 1.979896201924597e-05, + "loss": 1.3557, + "step": 3377 + }, + { + "epoch": 9.204359673024523, + "grad_norm": 8.677852630615234, + "learning_rate": 1.979878591636847e-05, + "loss": 1.5125, + "step": 3378 + }, + { + "epoch": 9.207084468664851, + "grad_norm": 10.220707893371582, + "learning_rate": 1.9798609737178332e-05, + "loss": 1.3669, + "step": 3379 + }, + { + "epoch": 9.209809264305177, + "grad_norm": 10.292823791503906, + "learning_rate": 1.979843348167694e-05, + "loss": 1.5803, + "step": 3380 + }, + { + "epoch": 9.212534059945504, + "grad_norm": 7.553493499755859, + "learning_rate": 1.9798257149865664e-05, + "loss": 1.3113, + "step": 3381 + }, + { + "epoch": 9.215258855585832, + "grad_norm": 9.349052429199219, + "learning_rate": 1.9798080741745876e-05, + "loss": 1.3796, + "step": 3382 + }, + { + "epoch": 9.217983651226158, + "grad_norm": 11.313785552978516, + "learning_rate": 1.979790425731895e-05, + "loss": 1.5281, + "step": 3383 + }, + { + "epoch": 9.220708446866485, + "grad_norm": 8.335127830505371, + "learning_rate": 1.979772769658626e-05, + "loss": 1.5474, + "step": 3384 + }, + { + "epoch": 9.223433242506813, + "grad_norm": 10.918291091918945, + "learning_rate": 1.9797551059549182e-05, + "loss": 1.2739, + "step": 3385 + }, + { + "epoch": 9.226158038147139, + "grad_norm": 11.712550163269043, + "learning_rate": 1.979737434620909e-05, + "loss": 1.303, + "step": 3386 + }, + { + "epoch": 9.228882833787466, + "grad_norm": 9.832308769226074, + "learning_rate": 1.9797197556567368e-05, + "loss": 1.3599, + "step": 3387 + }, + { + "epoch": 9.231607629427794, + "grad_norm": 14.865618705749512, + "learning_rate": 1.9797020690625385e-05, + "loss": 1.3406, + "step": 3388 + }, + { + "epoch": 9.23433242506812, + "grad_norm": 8.478940963745117, + "learning_rate": 1.9796843748384516e-05, + "loss": 1.4141, + "step": 3389 + }, + { + "epoch": 9.237057220708447, + "grad_norm": 26.075153350830078, + "learning_rate": 1.979666672984615e-05, + "loss": 1.457, + "step": 3390 + }, + { + "epoch": 9.239782016348773, + "grad_norm": 10.764287948608398, + "learning_rate": 1.979648963501165e-05, + "loss": 1.4678, + "step": 3391 + }, + { + "epoch": 9.2425068119891, + "grad_norm": 9.13726806640625, + "learning_rate": 1.9796312463882413e-05, + "loss": 1.2595, + "step": 3392 + }, + { + "epoch": 9.245231607629428, + "grad_norm": 11.239102363586426, + "learning_rate": 1.9796135216459806e-05, + "loss": 1.3137, + "step": 3393 + }, + { + "epoch": 9.247956403269754, + "grad_norm": 10.32160758972168, + "learning_rate": 1.9795957892745212e-05, + "loss": 1.2859, + "step": 3394 + }, + { + "epoch": 9.250681198910081, + "grad_norm": 8.509366035461426, + "learning_rate": 1.9795780492740014e-05, + "loss": 1.4409, + "step": 3395 + }, + { + "epoch": 9.253405994550409, + "grad_norm": 8.588579177856445, + "learning_rate": 1.979560301644559e-05, + "loss": 1.3656, + "step": 3396 + }, + { + "epoch": 9.256130790190735, + "grad_norm": 7.5111308097839355, + "learning_rate": 1.9795425463863328e-05, + "loss": 1.323, + "step": 3397 + }, + { + "epoch": 9.258855585831062, + "grad_norm": 11.245231628417969, + "learning_rate": 1.979524783499461e-05, + "loss": 1.5593, + "step": 3398 + }, + { + "epoch": 9.26158038147139, + "grad_norm": 11.089567184448242, + "learning_rate": 1.9795070129840814e-05, + "loss": 1.2607, + "step": 3399 + }, + { + "epoch": 9.264305177111716, + "grad_norm": 9.891328811645508, + "learning_rate": 1.9794892348403327e-05, + "loss": 1.2742, + "step": 3400 + }, + { + "epoch": 9.267029972752043, + "grad_norm": 9.167067527770996, + "learning_rate": 1.9794714490683534e-05, + "loss": 1.2944, + "step": 3401 + }, + { + "epoch": 9.269754768392371, + "grad_norm": 8.210538864135742, + "learning_rate": 1.979453655668282e-05, + "loss": 1.0919, + "step": 3402 + }, + { + "epoch": 9.272479564032697, + "grad_norm": 10.045794486999512, + "learning_rate": 1.979435854640257e-05, + "loss": 1.2485, + "step": 3403 + }, + { + "epoch": 9.275204359673024, + "grad_norm": 8.798501968383789, + "learning_rate": 1.979418045984417e-05, + "loss": 1.3103, + "step": 3404 + }, + { + "epoch": 9.277929155313352, + "grad_norm": 8.913511276245117, + "learning_rate": 1.9794002297009012e-05, + "loss": 1.4448, + "step": 3405 + }, + { + "epoch": 9.280653950953678, + "grad_norm": 10.16838264465332, + "learning_rate": 1.979382405789848e-05, + "loss": 1.3906, + "step": 3406 + }, + { + "epoch": 9.283378746594005, + "grad_norm": 7.70815896987915, + "learning_rate": 1.9793645742513953e-05, + "loss": 1.3523, + "step": 3407 + }, + { + "epoch": 9.286103542234333, + "grad_norm": 8.3804931640625, + "learning_rate": 1.9793467350856838e-05, + "loss": 1.3953, + "step": 3408 + }, + { + "epoch": 9.288828337874659, + "grad_norm": 10.134687423706055, + "learning_rate": 1.979328888292851e-05, + "loss": 1.5552, + "step": 3409 + }, + { + "epoch": 9.291553133514986, + "grad_norm": 25.563600540161133, + "learning_rate": 1.9793110338730362e-05, + "loss": 1.2976, + "step": 3410 + }, + { + "epoch": 9.294277929155314, + "grad_norm": 7.810992240905762, + "learning_rate": 1.9792931718263786e-05, + "loss": 1.2024, + "step": 3411 + }, + { + "epoch": 9.29700272479564, + "grad_norm": 8.703335762023926, + "learning_rate": 1.9792753021530174e-05, + "loss": 1.2744, + "step": 3412 + }, + { + "epoch": 9.299727520435967, + "grad_norm": 13.916765213012695, + "learning_rate": 1.9792574248530915e-05, + "loss": 1.5369, + "step": 3413 + }, + { + "epoch": 9.302452316076295, + "grad_norm": 14.48161792755127, + "learning_rate": 1.9792395399267404e-05, + "loss": 1.1318, + "step": 3414 + }, + { + "epoch": 9.30517711171662, + "grad_norm": 8.741053581237793, + "learning_rate": 1.9792216473741035e-05, + "loss": 1.321, + "step": 3415 + }, + { + "epoch": 9.307901907356948, + "grad_norm": 9.961328506469727, + "learning_rate": 1.9792037471953196e-05, + "loss": 1.6104, + "step": 3416 + }, + { + "epoch": 9.310626702997276, + "grad_norm": 9.477543830871582, + "learning_rate": 1.9791858393905287e-05, + "loss": 1.6274, + "step": 3417 + }, + { + "epoch": 9.313351498637601, + "grad_norm": 9.631728172302246, + "learning_rate": 1.97916792395987e-05, + "loss": 1.4702, + "step": 3418 + }, + { + "epoch": 9.316076294277929, + "grad_norm": 13.435711860656738, + "learning_rate": 1.979150000903483e-05, + "loss": 1.4302, + "step": 3419 + }, + { + "epoch": 9.318801089918257, + "grad_norm": 16.355337142944336, + "learning_rate": 1.979132070221507e-05, + "loss": 1.1826, + "step": 3420 + }, + { + "epoch": 9.321525885558582, + "grad_norm": 8.597811698913574, + "learning_rate": 1.979114131914082e-05, + "loss": 1.4956, + "step": 3421 + }, + { + "epoch": 9.32425068119891, + "grad_norm": 36.2840690612793, + "learning_rate": 1.979096185981348e-05, + "loss": 1.3014, + "step": 3422 + }, + { + "epoch": 9.326975476839237, + "grad_norm": 7.845273017883301, + "learning_rate": 1.9790782324234442e-05, + "loss": 1.2791, + "step": 3423 + }, + { + "epoch": 9.329700272479563, + "grad_norm": 9.422127723693848, + "learning_rate": 1.9790602712405106e-05, + "loss": 1.2175, + "step": 3424 + }, + { + "epoch": 9.33242506811989, + "grad_norm": 12.685276985168457, + "learning_rate": 1.9790423024326873e-05, + "loss": 1.2817, + "step": 3425 + }, + { + "epoch": 9.335149863760218, + "grad_norm": 8.371520042419434, + "learning_rate": 1.979024326000114e-05, + "loss": 1.3311, + "step": 3426 + }, + { + "epoch": 9.337874659400544, + "grad_norm": 15.884763717651367, + "learning_rate": 1.9790063419429307e-05, + "loss": 1.3364, + "step": 3427 + }, + { + "epoch": 9.340599455040872, + "grad_norm": 9.083556175231934, + "learning_rate": 1.9789883502612778e-05, + "loss": 1.2952, + "step": 3428 + }, + { + "epoch": 9.3433242506812, + "grad_norm": 17.44978141784668, + "learning_rate": 1.9789703509552947e-05, + "loss": 1.4075, + "step": 3429 + }, + { + "epoch": 9.346049046321525, + "grad_norm": 10.517081260681152, + "learning_rate": 1.9789523440251223e-05, + "loss": 1.449, + "step": 3430 + }, + { + "epoch": 9.348773841961853, + "grad_norm": 11.888326644897461, + "learning_rate": 1.9789343294709e-05, + "loss": 1.2737, + "step": 3431 + }, + { + "epoch": 9.35149863760218, + "grad_norm": 9.796870231628418, + "learning_rate": 1.9789163072927696e-05, + "loss": 1.7625, + "step": 3432 + }, + { + "epoch": 9.354223433242506, + "grad_norm": 9.31047248840332, + "learning_rate": 1.9788982774908695e-05, + "loss": 1.333, + "step": 3433 + }, + { + "epoch": 9.356948228882834, + "grad_norm": 10.207380294799805, + "learning_rate": 1.9788802400653416e-05, + "loss": 1.3022, + "step": 3434 + }, + { + "epoch": 9.359673024523161, + "grad_norm": 10.310562133789062, + "learning_rate": 1.9788621950163264e-05, + "loss": 1.386, + "step": 3435 + }, + { + "epoch": 9.362397820163487, + "grad_norm": 10.685137748718262, + "learning_rate": 1.978844142343963e-05, + "loss": 1.4824, + "step": 3436 + }, + { + "epoch": 9.365122615803815, + "grad_norm": 9.386162757873535, + "learning_rate": 1.9788260820483935e-05, + "loss": 1.2722, + "step": 3437 + }, + { + "epoch": 9.367847411444142, + "grad_norm": 11.15714168548584, + "learning_rate": 1.9788080141297577e-05, + "loss": 1.1504, + "step": 3438 + }, + { + "epoch": 9.370572207084468, + "grad_norm": 14.698813438415527, + "learning_rate": 1.978789938588197e-05, + "loss": 1.6157, + "step": 3439 + }, + { + "epoch": 9.373297002724795, + "grad_norm": 12.233861923217773, + "learning_rate": 1.9787718554238516e-05, + "loss": 1.4355, + "step": 3440 + }, + { + "epoch": 9.376021798365123, + "grad_norm": 12.789555549621582, + "learning_rate": 1.978753764636862e-05, + "loss": 1.3352, + "step": 3441 + }, + { + "epoch": 9.378746594005449, + "grad_norm": 11.998162269592285, + "learning_rate": 1.9787356662273702e-05, + "loss": 1.2285, + "step": 3442 + }, + { + "epoch": 9.381471389645776, + "grad_norm": 10.554962158203125, + "learning_rate": 1.9787175601955163e-05, + "loss": 1.3799, + "step": 3443 + }, + { + "epoch": 9.384196185286104, + "grad_norm": 9.63073444366455, + "learning_rate": 1.9786994465414415e-05, + "loss": 1.5298, + "step": 3444 + }, + { + "epoch": 9.38692098092643, + "grad_norm": 7.870802879333496, + "learning_rate": 1.9786813252652866e-05, + "loss": 1.1112, + "step": 3445 + }, + { + "epoch": 9.389645776566757, + "grad_norm": 10.364745140075684, + "learning_rate": 1.9786631963671935e-05, + "loss": 1.5083, + "step": 3446 + }, + { + "epoch": 9.392370572207085, + "grad_norm": 10.149497032165527, + "learning_rate": 1.978645059847303e-05, + "loss": 1.0826, + "step": 3447 + }, + { + "epoch": 9.39509536784741, + "grad_norm": 9.680525779724121, + "learning_rate": 1.978626915705756e-05, + "loss": 1.302, + "step": 3448 + }, + { + "epoch": 9.397820163487738, + "grad_norm": 11.579989433288574, + "learning_rate": 1.9786087639426942e-05, + "loss": 1.6477, + "step": 3449 + }, + { + "epoch": 9.400544959128066, + "grad_norm": 13.586649894714355, + "learning_rate": 1.978590604558259e-05, + "loss": 1.4324, + "step": 3450 + }, + { + "epoch": 9.403269754768392, + "grad_norm": 10.524829864501953, + "learning_rate": 1.9785724375525913e-05, + "loss": 1.3755, + "step": 3451 + }, + { + "epoch": 9.40599455040872, + "grad_norm": 10.216323852539062, + "learning_rate": 1.978554262925833e-05, + "loss": 1.333, + "step": 3452 + }, + { + "epoch": 9.408719346049047, + "grad_norm": 20.44986343383789, + "learning_rate": 1.9785360806781256e-05, + "loss": 1.533, + "step": 3453 + }, + { + "epoch": 9.411444141689373, + "grad_norm": 10.247272491455078, + "learning_rate": 1.978517890809611e-05, + "loss": 1.4092, + "step": 3454 + }, + { + "epoch": 9.4141689373297, + "grad_norm": 10.937572479248047, + "learning_rate": 1.9784996933204303e-05, + "loss": 1.6558, + "step": 3455 + }, + { + "epoch": 9.416893732970028, + "grad_norm": 8.877446174621582, + "learning_rate": 1.9784814882107256e-05, + "loss": 1.3645, + "step": 3456 + }, + { + "epoch": 9.419618528610354, + "grad_norm": 9.013394355773926, + "learning_rate": 1.9784632754806385e-05, + "loss": 1.3066, + "step": 3457 + }, + { + "epoch": 9.422343324250681, + "grad_norm": 10.657892227172852, + "learning_rate": 1.978445055130311e-05, + "loss": 1.3774, + "step": 3458 + }, + { + "epoch": 9.425068119891009, + "grad_norm": 13.270530700683594, + "learning_rate": 1.9784268271598847e-05, + "loss": 1.1091, + "step": 3459 + }, + { + "epoch": 9.427792915531334, + "grad_norm": 10.21103572845459, + "learning_rate": 1.978408591569502e-05, + "loss": 1.4182, + "step": 3460 + }, + { + "epoch": 9.430517711171662, + "grad_norm": 10.06057071685791, + "learning_rate": 1.9783903483593045e-05, + "loss": 1.2573, + "step": 3461 + }, + { + "epoch": 9.43324250681199, + "grad_norm": 9.013784408569336, + "learning_rate": 1.9783720975294345e-05, + "loss": 1.3347, + "step": 3462 + }, + { + "epoch": 9.435967302452315, + "grad_norm": 9.590899467468262, + "learning_rate": 1.978353839080034e-05, + "loss": 1.3755, + "step": 3463 + }, + { + "epoch": 9.438692098092643, + "grad_norm": 10.984482765197754, + "learning_rate": 1.9783355730112454e-05, + "loss": 1.4729, + "step": 3464 + }, + { + "epoch": 9.44141689373297, + "grad_norm": 12.965763092041016, + "learning_rate": 1.978317299323211e-05, + "loss": 1.4124, + "step": 3465 + }, + { + "epoch": 9.444141689373296, + "grad_norm": 10.23265552520752, + "learning_rate": 1.9782990180160726e-05, + "loss": 1.425, + "step": 3466 + }, + { + "epoch": 9.446866485013624, + "grad_norm": 8.932223320007324, + "learning_rate": 1.9782807290899732e-05, + "loss": 1.2876, + "step": 3467 + }, + { + "epoch": 9.449591280653951, + "grad_norm": 9.65361213684082, + "learning_rate": 1.978262432545055e-05, + "loss": 1.2568, + "step": 3468 + }, + { + "epoch": 9.452316076294277, + "grad_norm": 13.760838508605957, + "learning_rate": 1.9782441283814606e-05, + "loss": 1.4006, + "step": 3469 + }, + { + "epoch": 9.455040871934605, + "grad_norm": 10.448901176452637, + "learning_rate": 1.978225816599332e-05, + "loss": 1.4226, + "step": 3470 + }, + { + "epoch": 9.457765667574932, + "grad_norm": 10.120850563049316, + "learning_rate": 1.9782074971988122e-05, + "loss": 1.2434, + "step": 3471 + }, + { + "epoch": 9.460490463215258, + "grad_norm": 11.313949584960938, + "learning_rate": 1.978189170180044e-05, + "loss": 1.3118, + "step": 3472 + }, + { + "epoch": 9.463215258855586, + "grad_norm": 11.893877029418945, + "learning_rate": 1.9781708355431704e-05, + "loss": 1.3831, + "step": 3473 + }, + { + "epoch": 9.465940054495913, + "grad_norm": 11.411081314086914, + "learning_rate": 1.9781524932883334e-05, + "loss": 1.2185, + "step": 3474 + }, + { + "epoch": 9.46866485013624, + "grad_norm": 10.715963363647461, + "learning_rate": 1.978134143415676e-05, + "loss": 1.238, + "step": 3475 + }, + { + "epoch": 9.471389645776567, + "grad_norm": 8.280133247375488, + "learning_rate": 1.9781157859253422e-05, + "loss": 1.1952, + "step": 3476 + }, + { + "epoch": 9.474114441416894, + "grad_norm": 12.157916069030762, + "learning_rate": 1.9780974208174737e-05, + "loss": 1.3921, + "step": 3477 + }, + { + "epoch": 9.47683923705722, + "grad_norm": 11.583842277526855, + "learning_rate": 1.978079048092214e-05, + "loss": 1.3665, + "step": 3478 + }, + { + "epoch": 9.479564032697548, + "grad_norm": 9.636781692504883, + "learning_rate": 1.978060667749706e-05, + "loss": 1.3503, + "step": 3479 + }, + { + "epoch": 9.482288828337875, + "grad_norm": 18.986690521240234, + "learning_rate": 1.9780422797900935e-05, + "loss": 1.3213, + "step": 3480 + }, + { + "epoch": 9.485013623978201, + "grad_norm": 7.71966552734375, + "learning_rate": 1.9780238842135184e-05, + "loss": 1.2432, + "step": 3481 + }, + { + "epoch": 9.487738419618529, + "grad_norm": 16.58133888244629, + "learning_rate": 1.9780054810201252e-05, + "loss": 1.5393, + "step": 3482 + }, + { + "epoch": 9.490463215258856, + "grad_norm": 9.143290519714355, + "learning_rate": 1.9779870702100566e-05, + "loss": 1.3428, + "step": 3483 + }, + { + "epoch": 9.493188010899182, + "grad_norm": 11.136713027954102, + "learning_rate": 1.9779686517834566e-05, + "loss": 1.2627, + "step": 3484 + }, + { + "epoch": 9.49591280653951, + "grad_norm": 8.77470874786377, + "learning_rate": 1.977950225740468e-05, + "loss": 1.1431, + "step": 3485 + }, + { + "epoch": 9.498637602179837, + "grad_norm": 8.194987297058105, + "learning_rate": 1.9779317920812345e-05, + "loss": 1.3933, + "step": 3486 + }, + { + "epoch": 9.501362397820163, + "grad_norm": 7.847334861755371, + "learning_rate": 1.9779133508058997e-05, + "loss": 1.3062, + "step": 3487 + }, + { + "epoch": 9.50408719346049, + "grad_norm": 9.563523292541504, + "learning_rate": 1.977894901914607e-05, + "loss": 1.2954, + "step": 3488 + }, + { + "epoch": 9.506811989100818, + "grad_norm": 11.261819839477539, + "learning_rate": 1.9778764454075006e-05, + "loss": 1.6628, + "step": 3489 + }, + { + "epoch": 9.509536784741144, + "grad_norm": 8.540122985839844, + "learning_rate": 1.9778579812847236e-05, + "loss": 1.4062, + "step": 3490 + }, + { + "epoch": 9.512261580381471, + "grad_norm": 8.151784896850586, + "learning_rate": 1.9778395095464204e-05, + "loss": 1.2568, + "step": 3491 + }, + { + "epoch": 9.514986376021799, + "grad_norm": 15.209368705749512, + "learning_rate": 1.9778210301927344e-05, + "loss": 1.3538, + "step": 3492 + }, + { + "epoch": 9.517711171662125, + "grad_norm": 10.50976848602295, + "learning_rate": 1.97780254322381e-05, + "loss": 1.261, + "step": 3493 + }, + { + "epoch": 9.520435967302452, + "grad_norm": 9.538342475891113, + "learning_rate": 1.9777840486397904e-05, + "loss": 1.3208, + "step": 3494 + }, + { + "epoch": 9.52316076294278, + "grad_norm": 10.738985061645508, + "learning_rate": 1.9777655464408204e-05, + "loss": 1.4824, + "step": 3495 + }, + { + "epoch": 9.525885558583106, + "grad_norm": 10.215317726135254, + "learning_rate": 1.9777470366270436e-05, + "loss": 1.0896, + "step": 3496 + }, + { + "epoch": 9.528610354223433, + "grad_norm": 11.81888198852539, + "learning_rate": 1.9777285191986045e-05, + "loss": 1.5889, + "step": 3497 + }, + { + "epoch": 9.53133514986376, + "grad_norm": 9.270798683166504, + "learning_rate": 1.977709994155647e-05, + "loss": 1.2747, + "step": 3498 + }, + { + "epoch": 9.534059945504087, + "grad_norm": 9.496274948120117, + "learning_rate": 1.9776914614983157e-05, + "loss": 1.4822, + "step": 3499 + }, + { + "epoch": 9.536784741144414, + "grad_norm": 11.32534122467041, + "learning_rate": 1.9776729212267547e-05, + "loss": 1.4426, + "step": 3500 + }, + { + "epoch": 9.539509536784742, + "grad_norm": 11.459961891174316, + "learning_rate": 1.9776543733411084e-05, + "loss": 1.5642, + "step": 3501 + }, + { + "epoch": 9.542234332425068, + "grad_norm": 9.027872085571289, + "learning_rate": 1.9776358178415213e-05, + "loss": 1.459, + "step": 3502 + }, + { + "epoch": 9.544959128065395, + "grad_norm": 11.877817153930664, + "learning_rate": 1.977617254728138e-05, + "loss": 1.2825, + "step": 3503 + }, + { + "epoch": 9.547683923705723, + "grad_norm": 10.362582206726074, + "learning_rate": 1.977598684001103e-05, + "loss": 1.2644, + "step": 3504 + }, + { + "epoch": 9.550408719346049, + "grad_norm": 9.197845458984375, + "learning_rate": 1.977580105660561e-05, + "loss": 1.333, + "step": 3505 + }, + { + "epoch": 9.553133514986376, + "grad_norm": 11.093831062316895, + "learning_rate": 1.977561519706656e-05, + "loss": 1.2373, + "step": 3506 + }, + { + "epoch": 9.555858310626704, + "grad_norm": 9.646479606628418, + "learning_rate": 1.9775429261395343e-05, + "loss": 1.396, + "step": 3507 + }, + { + "epoch": 9.55858310626703, + "grad_norm": 9.306057929992676, + "learning_rate": 1.977524324959339e-05, + "loss": 1.1592, + "step": 3508 + }, + { + "epoch": 9.561307901907357, + "grad_norm": 8.801589012145996, + "learning_rate": 1.9775057161662163e-05, + "loss": 1.437, + "step": 3509 + }, + { + "epoch": 9.564032697547685, + "grad_norm": 10.09241771697998, + "learning_rate": 1.97748709976031e-05, + "loss": 1.5378, + "step": 3510 + }, + { + "epoch": 9.56675749318801, + "grad_norm": 9.766700744628906, + "learning_rate": 1.977468475741766e-05, + "loss": 1.4834, + "step": 3511 + }, + { + "epoch": 9.569482288828338, + "grad_norm": 9.25973892211914, + "learning_rate": 1.9774498441107288e-05, + "loss": 1.5376, + "step": 3512 + }, + { + "epoch": 9.572207084468666, + "grad_norm": 10.928956985473633, + "learning_rate": 1.9774312048673438e-05, + "loss": 1.1404, + "step": 3513 + }, + { + "epoch": 9.574931880108991, + "grad_norm": 8.28603458404541, + "learning_rate": 1.9774125580117557e-05, + "loss": 1.3813, + "step": 3514 + }, + { + "epoch": 9.577656675749319, + "grad_norm": 10.744699478149414, + "learning_rate": 1.9773939035441106e-05, + "loss": 1.3232, + "step": 3515 + }, + { + "epoch": 9.580381471389646, + "grad_norm": 10.062701225280762, + "learning_rate": 1.9773752414645527e-05, + "loss": 1.3611, + "step": 3516 + }, + { + "epoch": 9.583106267029972, + "grad_norm": 8.391669273376465, + "learning_rate": 1.977356571773228e-05, + "loss": 1.4429, + "step": 3517 + }, + { + "epoch": 9.5858310626703, + "grad_norm": 10.7404203414917, + "learning_rate": 1.9773378944702818e-05, + "loss": 1.2729, + "step": 3518 + }, + { + "epoch": 9.588555858310627, + "grad_norm": 9.84868335723877, + "learning_rate": 1.97731920955586e-05, + "loss": 1.2915, + "step": 3519 + }, + { + "epoch": 9.591280653950953, + "grad_norm": 9.618789672851562, + "learning_rate": 1.9773005170301072e-05, + "loss": 1.3093, + "step": 3520 + }, + { + "epoch": 9.59400544959128, + "grad_norm": 8.259662628173828, + "learning_rate": 1.9772818168931693e-05, + "loss": 1.3381, + "step": 3521 + }, + { + "epoch": 9.596730245231608, + "grad_norm": 10.0656156539917, + "learning_rate": 1.9772631091451924e-05, + "loss": 1.3623, + "step": 3522 + }, + { + "epoch": 9.599455040871934, + "grad_norm": 7.326105117797852, + "learning_rate": 1.9772443937863216e-05, + "loss": 1.3213, + "step": 3523 + }, + { + "epoch": 9.602179836512262, + "grad_norm": 11.508100509643555, + "learning_rate": 1.977225670816703e-05, + "loss": 1.4204, + "step": 3524 + }, + { + "epoch": 9.60490463215259, + "grad_norm": 14.950603485107422, + "learning_rate": 1.9772069402364823e-05, + "loss": 1.2897, + "step": 3525 + }, + { + "epoch": 9.607629427792915, + "grad_norm": 11.285598754882812, + "learning_rate": 1.9771882020458055e-05, + "loss": 1.3894, + "step": 3526 + }, + { + "epoch": 9.610354223433243, + "grad_norm": 12.085847854614258, + "learning_rate": 1.9771694562448186e-05, + "loss": 1.6387, + "step": 3527 + }, + { + "epoch": 9.61307901907357, + "grad_norm": 9.760807037353516, + "learning_rate": 1.9771507028336672e-05, + "loss": 1.1934, + "step": 3528 + }, + { + "epoch": 9.615803814713896, + "grad_norm": 9.40585994720459, + "learning_rate": 1.9771319418124974e-05, + "loss": 1.2397, + "step": 3529 + }, + { + "epoch": 9.618528610354224, + "grad_norm": 12.485505104064941, + "learning_rate": 1.9771131731814558e-05, + "loss": 1.3064, + "step": 3530 + }, + { + "epoch": 9.621253405994551, + "grad_norm": 7.9116740226745605, + "learning_rate": 1.9770943969406882e-05, + "loss": 1.3254, + "step": 3531 + }, + { + "epoch": 9.623978201634877, + "grad_norm": 8.666459083557129, + "learning_rate": 1.977075613090341e-05, + "loss": 1.4194, + "step": 3532 + }, + { + "epoch": 9.626702997275205, + "grad_norm": 7.706989288330078, + "learning_rate": 1.97705682163056e-05, + "loss": 1.2048, + "step": 3533 + }, + { + "epoch": 9.629427792915532, + "grad_norm": 9.042607307434082, + "learning_rate": 1.977038022561492e-05, + "loss": 1.3113, + "step": 3534 + }, + { + "epoch": 9.632152588555858, + "grad_norm": 8.763065338134766, + "learning_rate": 1.9770192158832837e-05, + "loss": 1.3235, + "step": 3535 + }, + { + "epoch": 9.634877384196185, + "grad_norm": 7.559271335601807, + "learning_rate": 1.9770004015960808e-05, + "loss": 1.2393, + "step": 3536 + }, + { + "epoch": 9.637602179836513, + "grad_norm": 13.301497459411621, + "learning_rate": 1.9769815797000303e-05, + "loss": 1.0942, + "step": 3537 + }, + { + "epoch": 9.640326975476839, + "grad_norm": 8.295751571655273, + "learning_rate": 1.9769627501952787e-05, + "loss": 1.2432, + "step": 3538 + }, + { + "epoch": 9.643051771117166, + "grad_norm": 12.13232421875, + "learning_rate": 1.9769439130819727e-05, + "loss": 1.3557, + "step": 3539 + }, + { + "epoch": 9.645776566757494, + "grad_norm": 10.783136367797852, + "learning_rate": 1.976925068360259e-05, + "loss": 1.3884, + "step": 3540 + }, + { + "epoch": 9.64850136239782, + "grad_norm": 7.590921878814697, + "learning_rate": 1.976906216030284e-05, + "loss": 1.2324, + "step": 3541 + }, + { + "epoch": 9.651226158038147, + "grad_norm": 12.891176223754883, + "learning_rate": 1.9768873560921954e-05, + "loss": 1.3088, + "step": 3542 + }, + { + "epoch": 9.653950953678475, + "grad_norm": 9.654071807861328, + "learning_rate": 1.9768684885461394e-05, + "loss": 1.4294, + "step": 3543 + }, + { + "epoch": 9.6566757493188, + "grad_norm": 9.73577880859375, + "learning_rate": 1.9768496133922626e-05, + "loss": 1.3999, + "step": 3544 + }, + { + "epoch": 9.659400544959128, + "grad_norm": 12.861915588378906, + "learning_rate": 1.9768307306307125e-05, + "loss": 1.3772, + "step": 3545 + }, + { + "epoch": 9.662125340599456, + "grad_norm": 10.343432426452637, + "learning_rate": 1.9768118402616367e-05, + "loss": 1.4392, + "step": 3546 + }, + { + "epoch": 9.664850136239782, + "grad_norm": 10.485712051391602, + "learning_rate": 1.9767929422851814e-05, + "loss": 1.3408, + "step": 3547 + }, + { + "epoch": 9.66757493188011, + "grad_norm": 13.244621276855469, + "learning_rate": 1.9767740367014937e-05, + "loss": 1.2383, + "step": 3548 + }, + { + "epoch": 9.670299727520437, + "grad_norm": 11.628501892089844, + "learning_rate": 1.9767551235107218e-05, + "loss": 1.3855, + "step": 3549 + }, + { + "epoch": 9.673024523160763, + "grad_norm": 12.488821983337402, + "learning_rate": 1.9767362027130122e-05, + "loss": 1.217, + "step": 3550 + }, + { + "epoch": 9.67574931880109, + "grad_norm": 35.66632080078125, + "learning_rate": 1.9767172743085124e-05, + "loss": 1.4966, + "step": 3551 + }, + { + "epoch": 9.678474114441418, + "grad_norm": 10.492840766906738, + "learning_rate": 1.97669833829737e-05, + "loss": 1.1748, + "step": 3552 + }, + { + "epoch": 9.681198910081743, + "grad_norm": 9.04301643371582, + "learning_rate": 1.9766793946797324e-05, + "loss": 1.2639, + "step": 3553 + }, + { + "epoch": 9.683923705722071, + "grad_norm": 11.102354049682617, + "learning_rate": 1.976660443455747e-05, + "loss": 1.3433, + "step": 3554 + }, + { + "epoch": 9.686648501362399, + "grad_norm": 37.838706970214844, + "learning_rate": 1.9766414846255614e-05, + "loss": 1.3713, + "step": 3555 + }, + { + "epoch": 9.689373297002724, + "grad_norm": 11.290416717529297, + "learning_rate": 1.9766225181893236e-05, + "loss": 1.3698, + "step": 3556 + }, + { + "epoch": 9.692098092643052, + "grad_norm": 29.570707321166992, + "learning_rate": 1.9766035441471813e-05, + "loss": 1.3085, + "step": 3557 + }, + { + "epoch": 9.69482288828338, + "grad_norm": 13.721502304077148, + "learning_rate": 1.9765845624992814e-05, + "loss": 1.3857, + "step": 3558 + }, + { + "epoch": 9.697547683923705, + "grad_norm": 17.07549285888672, + "learning_rate": 1.9765655732457728e-05, + "loss": 1.4221, + "step": 3559 + }, + { + "epoch": 9.700272479564033, + "grad_norm": 10.509212493896484, + "learning_rate": 1.9765465763868027e-05, + "loss": 1.3245, + "step": 3560 + }, + { + "epoch": 9.70299727520436, + "grad_norm": 7.748059272766113, + "learning_rate": 1.9765275719225196e-05, + "loss": 1.283, + "step": 3561 + }, + { + "epoch": 9.705722070844686, + "grad_norm": 13.8661527633667, + "learning_rate": 1.976508559853071e-05, + "loss": 1.4639, + "step": 3562 + }, + { + "epoch": 9.708446866485014, + "grad_norm": 9.865267753601074, + "learning_rate": 1.9764895401786054e-05, + "loss": 1.4209, + "step": 3563 + }, + { + "epoch": 9.711171662125341, + "grad_norm": 12.632296562194824, + "learning_rate": 1.9764705128992704e-05, + "loss": 1.4805, + "step": 3564 + }, + { + "epoch": 9.713896457765667, + "grad_norm": 14.47574234008789, + "learning_rate": 1.9764514780152146e-05, + "loss": 1.5071, + "step": 3565 + }, + { + "epoch": 9.716621253405995, + "grad_norm": 12.230063438415527, + "learning_rate": 1.976432435526586e-05, + "loss": 1.314, + "step": 3566 + }, + { + "epoch": 9.719346049046322, + "grad_norm": 8.775035858154297, + "learning_rate": 1.976413385433533e-05, + "loss": 1.3423, + "step": 3567 + }, + { + "epoch": 9.722070844686648, + "grad_norm": 12.163357734680176, + "learning_rate": 1.976394327736204e-05, + "loss": 1.3538, + "step": 3568 + }, + { + "epoch": 9.724795640326976, + "grad_norm": 10.467511177062988, + "learning_rate": 1.9763752624347475e-05, + "loss": 1.2112, + "step": 3569 + }, + { + "epoch": 9.727520435967303, + "grad_norm": 10.808884620666504, + "learning_rate": 1.976356189529312e-05, + "loss": 1.2449, + "step": 3570 + }, + { + "epoch": 9.730245231607629, + "grad_norm": 9.99303150177002, + "learning_rate": 1.9763371090200456e-05, + "loss": 1.3994, + "step": 3571 + }, + { + "epoch": 9.732970027247957, + "grad_norm": 8.264053344726562, + "learning_rate": 1.9763180209070977e-05, + "loss": 1.2852, + "step": 3572 + }, + { + "epoch": 9.735694822888284, + "grad_norm": 12.849554061889648, + "learning_rate": 1.976298925190616e-05, + "loss": 1.2565, + "step": 3573 + }, + { + "epoch": 9.73841961852861, + "grad_norm": 22.483198165893555, + "learning_rate": 1.9762798218707496e-05, + "loss": 1.2776, + "step": 3574 + }, + { + "epoch": 9.741144414168938, + "grad_norm": 15.177623748779297, + "learning_rate": 1.976260710947648e-05, + "loss": 1.4773, + "step": 3575 + }, + { + "epoch": 9.743869209809265, + "grad_norm": 10.869903564453125, + "learning_rate": 1.976241592421459e-05, + "loss": 1.4231, + "step": 3576 + }, + { + "epoch": 9.746594005449591, + "grad_norm": 10.320539474487305, + "learning_rate": 1.976222466292332e-05, + "loss": 1.3938, + "step": 3577 + }, + { + "epoch": 9.749318801089919, + "grad_norm": 10.482199668884277, + "learning_rate": 1.9762033325604156e-05, + "loss": 1.3408, + "step": 3578 + }, + { + "epoch": 9.752043596730246, + "grad_norm": 9.231746673583984, + "learning_rate": 1.9761841912258594e-05, + "loss": 1.3203, + "step": 3579 + }, + { + "epoch": 9.754768392370572, + "grad_norm": 9.591264724731445, + "learning_rate": 1.9761650422888118e-05, + "loss": 1.2886, + "step": 3580 + }, + { + "epoch": 9.7574931880109, + "grad_norm": 10.6572265625, + "learning_rate": 1.9761458857494223e-05, + "loss": 1.4587, + "step": 3581 + }, + { + "epoch": 9.760217983651227, + "grad_norm": 9.55623722076416, + "learning_rate": 1.9761267216078403e-05, + "loss": 1.3806, + "step": 3582 + }, + { + "epoch": 9.762942779291553, + "grad_norm": 12.238038063049316, + "learning_rate": 1.9761075498642144e-05, + "loss": 1.4348, + "step": 3583 + }, + { + "epoch": 9.76566757493188, + "grad_norm": 9.699817657470703, + "learning_rate": 1.976088370518695e-05, + "loss": 1.3208, + "step": 3584 + }, + { + "epoch": 9.768392370572208, + "grad_norm": 8.047388076782227, + "learning_rate": 1.9760691835714304e-05, + "loss": 1.366, + "step": 3585 + }, + { + "epoch": 9.771117166212534, + "grad_norm": 9.928215980529785, + "learning_rate": 1.9760499890225704e-05, + "loss": 1.1907, + "step": 3586 + }, + { + "epoch": 9.773841961852861, + "grad_norm": 11.434212684631348, + "learning_rate": 1.9760307868722646e-05, + "loss": 1.3413, + "step": 3587 + }, + { + "epoch": 9.776566757493189, + "grad_norm": 9.478497505187988, + "learning_rate": 1.9760115771206624e-05, + "loss": 1.2214, + "step": 3588 + }, + { + "epoch": 9.779291553133515, + "grad_norm": 12.000141143798828, + "learning_rate": 1.9759923597679133e-05, + "loss": 1.3748, + "step": 3589 + }, + { + "epoch": 9.782016348773842, + "grad_norm": 16.21526336669922, + "learning_rate": 1.9759731348141673e-05, + "loss": 1.4045, + "step": 3590 + }, + { + "epoch": 9.78474114441417, + "grad_norm": 12.084442138671875, + "learning_rate": 1.975953902259574e-05, + "loss": 1.3789, + "step": 3591 + }, + { + "epoch": 9.787465940054496, + "grad_norm": 10.21094799041748, + "learning_rate": 1.9759346621042827e-05, + "loss": 1.4468, + "step": 3592 + }, + { + "epoch": 9.790190735694823, + "grad_norm": 14.390522956848145, + "learning_rate": 1.9759154143484443e-05, + "loss": 1.3589, + "step": 3593 + }, + { + "epoch": 9.79291553133515, + "grad_norm": 10.500269889831543, + "learning_rate": 1.9758961589922078e-05, + "loss": 1.2593, + "step": 3594 + }, + { + "epoch": 9.795640326975477, + "grad_norm": 16.458541870117188, + "learning_rate": 1.975876896035723e-05, + "loss": 1.5293, + "step": 3595 + }, + { + "epoch": 9.798365122615804, + "grad_norm": 10.324142456054688, + "learning_rate": 1.975857625479141e-05, + "loss": 1.3386, + "step": 3596 + }, + { + "epoch": 9.80108991825613, + "grad_norm": 17.802846908569336, + "learning_rate": 1.9758383473226107e-05, + "loss": 1.4626, + "step": 3597 + }, + { + "epoch": 9.803814713896458, + "grad_norm": 8.964858055114746, + "learning_rate": 1.9758190615662827e-05, + "loss": 1.2153, + "step": 3598 + }, + { + "epoch": 9.806539509536785, + "grad_norm": 9.028390884399414, + "learning_rate": 1.9757997682103077e-05, + "loss": 1.2297, + "step": 3599 + }, + { + "epoch": 9.809264305177111, + "grad_norm": 9.114471435546875, + "learning_rate": 1.975780467254835e-05, + "loss": 1.3013, + "step": 3600 + }, + { + "epoch": 9.811989100817438, + "grad_norm": 10.367660522460938, + "learning_rate": 1.9757611587000164e-05, + "loss": 1.3669, + "step": 3601 + }, + { + "epoch": 9.814713896457766, + "grad_norm": 9.04752254486084, + "learning_rate": 1.9757418425460005e-05, + "loss": 1.4395, + "step": 3602 + }, + { + "epoch": 9.817438692098092, + "grad_norm": 9.182389259338379, + "learning_rate": 1.9757225187929387e-05, + "loss": 1.5559, + "step": 3603 + }, + { + "epoch": 9.82016348773842, + "grad_norm": 9.73576545715332, + "learning_rate": 1.9757031874409813e-05, + "loss": 1.5352, + "step": 3604 + }, + { + "epoch": 9.822888283378747, + "grad_norm": 9.303825378417969, + "learning_rate": 1.975683848490279e-05, + "loss": 1.5632, + "step": 3605 + }, + { + "epoch": 9.825613079019073, + "grad_norm": 12.194347381591797, + "learning_rate": 1.975664501940982e-05, + "loss": 1.4282, + "step": 3606 + }, + { + "epoch": 9.8283378746594, + "grad_norm": 11.136542320251465, + "learning_rate": 1.9756451477932414e-05, + "loss": 1.2998, + "step": 3607 + }, + { + "epoch": 9.831062670299728, + "grad_norm": 9.804329872131348, + "learning_rate": 1.975625786047208e-05, + "loss": 1.1824, + "step": 3608 + }, + { + "epoch": 9.833787465940054, + "grad_norm": 7.430677890777588, + "learning_rate": 1.9756064167030324e-05, + "loss": 1.2449, + "step": 3609 + }, + { + "epoch": 9.836512261580381, + "grad_norm": 11.333991050720215, + "learning_rate": 1.975587039760865e-05, + "loss": 1.2239, + "step": 3610 + }, + { + "epoch": 9.839237057220709, + "grad_norm": 8.473504066467285, + "learning_rate": 1.9755676552208577e-05, + "loss": 1.2458, + "step": 3611 + }, + { + "epoch": 9.841961852861035, + "grad_norm": 21.26403045654297, + "learning_rate": 1.97554826308316e-05, + "loss": 1.3889, + "step": 3612 + }, + { + "epoch": 9.844686648501362, + "grad_norm": 11.096529006958008, + "learning_rate": 1.9755288633479245e-05, + "loss": 1.4622, + "step": 3613 + }, + { + "epoch": 9.84741144414169, + "grad_norm": 10.732100486755371, + "learning_rate": 1.975509456015302e-05, + "loss": 1.4268, + "step": 3614 + }, + { + "epoch": 9.850136239782016, + "grad_norm": 8.53803539276123, + "learning_rate": 1.9754900410854425e-05, + "loss": 1.1648, + "step": 3615 + }, + { + "epoch": 9.852861035422343, + "grad_norm": 12.325318336486816, + "learning_rate": 1.9754706185584982e-05, + "loss": 1.2351, + "step": 3616 + }, + { + "epoch": 9.85558583106267, + "grad_norm": 10.54158878326416, + "learning_rate": 1.97545118843462e-05, + "loss": 1.5369, + "step": 3617 + }, + { + "epoch": 9.858310626702997, + "grad_norm": 8.079790115356445, + "learning_rate": 1.9754317507139596e-05, + "loss": 1.4783, + "step": 3618 + }, + { + "epoch": 9.861035422343324, + "grad_norm": 10.943889617919922, + "learning_rate": 1.9754123053966682e-05, + "loss": 1.5005, + "step": 3619 + }, + { + "epoch": 9.863760217983652, + "grad_norm": 8.651459693908691, + "learning_rate": 1.9753928524828967e-05, + "loss": 1.3979, + "step": 3620 + }, + { + "epoch": 9.866485013623977, + "grad_norm": 10.205894470214844, + "learning_rate": 1.975373391972797e-05, + "loss": 1.3853, + "step": 3621 + }, + { + "epoch": 9.869209809264305, + "grad_norm": 9.411439895629883, + "learning_rate": 1.9753539238665214e-05, + "loss": 1.1968, + "step": 3622 + }, + { + "epoch": 9.871934604904633, + "grad_norm": 8.494278907775879, + "learning_rate": 1.9753344481642205e-05, + "loss": 1.2158, + "step": 3623 + }, + { + "epoch": 9.874659400544958, + "grad_norm": 9.459856986999512, + "learning_rate": 1.9753149648660463e-05, + "loss": 1.2537, + "step": 3624 + }, + { + "epoch": 9.877384196185286, + "grad_norm": 11.612347602844238, + "learning_rate": 1.9752954739721506e-05, + "loss": 1.281, + "step": 3625 + }, + { + "epoch": 9.880108991825614, + "grad_norm": 11.348382949829102, + "learning_rate": 1.9752759754826848e-05, + "loss": 1.657, + "step": 3626 + }, + { + "epoch": 9.88283378746594, + "grad_norm": 10.99140739440918, + "learning_rate": 1.9752564693978017e-05, + "loss": 1.5684, + "step": 3627 + }, + { + "epoch": 9.885558583106267, + "grad_norm": 8.75643253326416, + "learning_rate": 1.975236955717652e-05, + "loss": 1.228, + "step": 3628 + }, + { + "epoch": 9.888283378746594, + "grad_norm": 8.574169158935547, + "learning_rate": 1.9752174344423887e-05, + "loss": 1.6069, + "step": 3629 + }, + { + "epoch": 9.89100817438692, + "grad_norm": 10.064516067504883, + "learning_rate": 1.975197905572163e-05, + "loss": 1.5732, + "step": 3630 + }, + { + "epoch": 9.893732970027248, + "grad_norm": 10.123259544372559, + "learning_rate": 1.9751783691071278e-05, + "loss": 1.4634, + "step": 3631 + }, + { + "epoch": 9.896457765667575, + "grad_norm": 7.016714572906494, + "learning_rate": 1.9751588250474347e-05, + "loss": 1.085, + "step": 3632 + }, + { + "epoch": 9.899182561307901, + "grad_norm": 7.592134475708008, + "learning_rate": 1.975139273393236e-05, + "loss": 1.3142, + "step": 3633 + }, + { + "epoch": 9.901907356948229, + "grad_norm": 9.733391761779785, + "learning_rate": 1.975119714144684e-05, + "loss": 1.373, + "step": 3634 + }, + { + "epoch": 9.904632152588556, + "grad_norm": 9.23591136932373, + "learning_rate": 1.9751001473019312e-05, + "loss": 1.4934, + "step": 3635 + }, + { + "epoch": 9.907356948228882, + "grad_norm": 12.293094635009766, + "learning_rate": 1.97508057286513e-05, + "loss": 1.1792, + "step": 3636 + }, + { + "epoch": 9.91008174386921, + "grad_norm": 9.169655799865723, + "learning_rate": 1.975060990834432e-05, + "loss": 1.6282, + "step": 3637 + }, + { + "epoch": 9.912806539509537, + "grad_norm": 8.291810035705566, + "learning_rate": 1.975041401209991e-05, + "loss": 1.4124, + "step": 3638 + }, + { + "epoch": 9.915531335149863, + "grad_norm": 9.391378402709961, + "learning_rate": 1.9750218039919587e-05, + "loss": 1.2786, + "step": 3639 + }, + { + "epoch": 9.91825613079019, + "grad_norm": 12.229228019714355, + "learning_rate": 1.975002199180488e-05, + "loss": 1.4749, + "step": 3640 + }, + { + "epoch": 9.920980926430518, + "grad_norm": 9.75719165802002, + "learning_rate": 1.9749825867757316e-05, + "loss": 1.2493, + "step": 3641 + }, + { + "epoch": 9.923705722070844, + "grad_norm": 10.654757499694824, + "learning_rate": 1.974962966777842e-05, + "loss": 1.5508, + "step": 3642 + }, + { + "epoch": 9.926430517711172, + "grad_norm": 9.315423965454102, + "learning_rate": 1.9749433391869725e-05, + "loss": 1.3826, + "step": 3643 + }, + { + "epoch": 9.9291553133515, + "grad_norm": 10.321687698364258, + "learning_rate": 1.9749237040032758e-05, + "loss": 1.2932, + "step": 3644 + }, + { + "epoch": 9.931880108991825, + "grad_norm": 9.969890594482422, + "learning_rate": 1.974904061226904e-05, + "loss": 1.4094, + "step": 3645 + }, + { + "epoch": 9.934604904632153, + "grad_norm": 15.723612785339355, + "learning_rate": 1.9748844108580113e-05, + "loss": 1.4934, + "step": 3646 + }, + { + "epoch": 9.93732970027248, + "grad_norm": 13.158507347106934, + "learning_rate": 1.9748647528967503e-05, + "loss": 1.5178, + "step": 3647 + }, + { + "epoch": 9.940054495912806, + "grad_norm": 8.285064697265625, + "learning_rate": 1.9748450873432737e-05, + "loss": 1.1406, + "step": 3648 + }, + { + "epoch": 9.942779291553133, + "grad_norm": 8.271842002868652, + "learning_rate": 1.974825414197735e-05, + "loss": 1.4692, + "step": 3649 + }, + { + "epoch": 9.945504087193461, + "grad_norm": 7.437000751495361, + "learning_rate": 1.9748057334602873e-05, + "loss": 1.1069, + "step": 3650 + }, + { + "epoch": 9.948228882833787, + "grad_norm": 8.541642189025879, + "learning_rate": 1.9747860451310838e-05, + "loss": 1.3345, + "step": 3651 + }, + { + "epoch": 9.950953678474114, + "grad_norm": 8.020855903625488, + "learning_rate": 1.974766349210278e-05, + "loss": 1.1671, + "step": 3652 + }, + { + "epoch": 9.953678474114442, + "grad_norm": 8.065467834472656, + "learning_rate": 1.9747466456980232e-05, + "loss": 1.2144, + "step": 3653 + }, + { + "epoch": 9.956403269754768, + "grad_norm": 11.647472381591797, + "learning_rate": 1.974726934594473e-05, + "loss": 1.5593, + "step": 3654 + }, + { + "epoch": 9.959128065395095, + "grad_norm": 17.921730041503906, + "learning_rate": 1.9747072158997808e-05, + "loss": 1.4771, + "step": 3655 + }, + { + "epoch": 9.961852861035423, + "grad_norm": 11.619487762451172, + "learning_rate": 1.9746874896141005e-05, + "loss": 1.3782, + "step": 3656 + }, + { + "epoch": 9.964577656675749, + "grad_norm": 21.86222267150879, + "learning_rate": 1.9746677557375847e-05, + "loss": 1.4021, + "step": 3657 + }, + { + "epoch": 9.967302452316076, + "grad_norm": 9.413336753845215, + "learning_rate": 1.9746480142703883e-05, + "loss": 1.3765, + "step": 3658 + }, + { + "epoch": 9.970027247956404, + "grad_norm": 10.448002815246582, + "learning_rate": 1.9746282652126646e-05, + "loss": 1.2358, + "step": 3659 + }, + { + "epoch": 9.97275204359673, + "grad_norm": 7.882084846496582, + "learning_rate": 1.974608508564567e-05, + "loss": 1.2864, + "step": 3660 + }, + { + "epoch": 9.975476839237057, + "grad_norm": 13.244160652160645, + "learning_rate": 1.97458874432625e-05, + "loss": 1.3535, + "step": 3661 + }, + { + "epoch": 9.978201634877385, + "grad_norm": 9.789565086364746, + "learning_rate": 1.974568972497867e-05, + "loss": 1.5103, + "step": 3662 + }, + { + "epoch": 9.98092643051771, + "grad_norm": 10.077621459960938, + "learning_rate": 1.9745491930795725e-05, + "loss": 1.3215, + "step": 3663 + }, + { + "epoch": 9.983651226158038, + "grad_norm": 8.027867317199707, + "learning_rate": 1.97452940607152e-05, + "loss": 1.4524, + "step": 3664 + }, + { + "epoch": 9.986376021798366, + "grad_norm": 12.210448265075684, + "learning_rate": 1.9745096114738637e-05, + "loss": 1.5635, + "step": 3665 + }, + { + "epoch": 9.989100817438691, + "grad_norm": 11.715902328491211, + "learning_rate": 1.9744898092867584e-05, + "loss": 1.4033, + "step": 3666 + }, + { + "epoch": 9.991825613079019, + "grad_norm": 10.559863090515137, + "learning_rate": 1.9744699995103574e-05, + "loss": 1.2605, + "step": 3667 + }, + { + "epoch": 9.994550408719347, + "grad_norm": 11.416446685791016, + "learning_rate": 1.9744501821448154e-05, + "loss": 1.4619, + "step": 3668 + }, + { + "epoch": 9.997275204359672, + "grad_norm": 9.612354278564453, + "learning_rate": 1.974430357190287e-05, + "loss": 1.281, + "step": 3669 + }, + { + "epoch": 10.0, + "grad_norm": 10.122220993041992, + "learning_rate": 1.9744105246469264e-05, + "loss": 1.4553, + "step": 3670 + }, + { + "epoch": 10.002724795640328, + "grad_norm": 8.111466407775879, + "learning_rate": 1.9743906845148877e-05, + "loss": 1.26, + "step": 3671 + }, + { + "epoch": 10.005449591280653, + "grad_norm": 8.482653617858887, + "learning_rate": 1.9743708367943256e-05, + "loss": 1.2026, + "step": 3672 + }, + { + "epoch": 10.008174386920981, + "grad_norm": 8.723862648010254, + "learning_rate": 1.974350981485395e-05, + "loss": 1.3042, + "step": 3673 + }, + { + "epoch": 10.010899182561309, + "grad_norm": 8.500794410705566, + "learning_rate": 1.9743311185882503e-05, + "loss": 1.3416, + "step": 3674 + }, + { + "epoch": 10.013623978201634, + "grad_norm": 7.933543682098389, + "learning_rate": 1.9743112481030465e-05, + "loss": 1.4116, + "step": 3675 + }, + { + "epoch": 10.016348773841962, + "grad_norm": 10.659152030944824, + "learning_rate": 1.974291370029938e-05, + "loss": 1.3218, + "step": 3676 + }, + { + "epoch": 10.01907356948229, + "grad_norm": 8.086297035217285, + "learning_rate": 1.974271484369079e-05, + "loss": 1.2712, + "step": 3677 + }, + { + "epoch": 10.021798365122615, + "grad_norm": 10.596502304077148, + "learning_rate": 1.9742515911206258e-05, + "loss": 1.2361, + "step": 3678 + }, + { + "epoch": 10.024523160762943, + "grad_norm": 8.962627410888672, + "learning_rate": 1.9742316902847322e-05, + "loss": 1.2885, + "step": 3679 + }, + { + "epoch": 10.02724795640327, + "grad_norm": 16.210643768310547, + "learning_rate": 1.9742117818615536e-05, + "loss": 1.2329, + "step": 3680 + }, + { + "epoch": 10.029972752043596, + "grad_norm": 8.1439790725708, + "learning_rate": 1.974191865851245e-05, + "loss": 1.1716, + "step": 3681 + }, + { + "epoch": 10.032697547683924, + "grad_norm": 7.825740337371826, + "learning_rate": 1.9741719422539614e-05, + "loss": 1.1626, + "step": 3682 + }, + { + "epoch": 10.035422343324251, + "grad_norm": 9.390591621398926, + "learning_rate": 1.9741520110698582e-05, + "loss": 1.2278, + "step": 3683 + }, + { + "epoch": 10.038147138964577, + "grad_norm": 10.142020225524902, + "learning_rate": 1.9741320722990903e-05, + "loss": 1.3694, + "step": 3684 + }, + { + "epoch": 10.040871934604905, + "grad_norm": 11.591178894042969, + "learning_rate": 1.9741121259418135e-05, + "loss": 1.3064, + "step": 3685 + }, + { + "epoch": 10.043596730245232, + "grad_norm": 9.16048526763916, + "learning_rate": 1.9740921719981827e-05, + "loss": 1.3254, + "step": 3686 + }, + { + "epoch": 10.046321525885558, + "grad_norm": 10.824785232543945, + "learning_rate": 1.9740722104683534e-05, + "loss": 1.2532, + "step": 3687 + }, + { + "epoch": 10.049046321525886, + "grad_norm": 8.441052436828613, + "learning_rate": 1.974052241352481e-05, + "loss": 1.2732, + "step": 3688 + }, + { + "epoch": 10.051771117166213, + "grad_norm": 7.5722737312316895, + "learning_rate": 1.9740322646507213e-05, + "loss": 1.2148, + "step": 3689 + }, + { + "epoch": 10.054495912806539, + "grad_norm": 9.024096488952637, + "learning_rate": 1.9740122803632295e-05, + "loss": 1.2815, + "step": 3690 + }, + { + "epoch": 10.057220708446867, + "grad_norm": 8.968578338623047, + "learning_rate": 1.9739922884901612e-05, + "loss": 1.2136, + "step": 3691 + }, + { + "epoch": 10.059945504087194, + "grad_norm": 8.43995189666748, + "learning_rate": 1.9739722890316728e-05, + "loss": 1.1365, + "step": 3692 + }, + { + "epoch": 10.06267029972752, + "grad_norm": 8.175556182861328, + "learning_rate": 1.9739522819879192e-05, + "loss": 1.2385, + "step": 3693 + }, + { + "epoch": 10.065395095367847, + "grad_norm": 10.570222854614258, + "learning_rate": 1.9739322673590567e-05, + "loss": 1.2109, + "step": 3694 + }, + { + "epoch": 10.068119891008175, + "grad_norm": 10.841527938842773, + "learning_rate": 1.9739122451452412e-05, + "loss": 1.2881, + "step": 3695 + }, + { + "epoch": 10.0708446866485, + "grad_norm": 10.643328666687012, + "learning_rate": 1.9738922153466282e-05, + "loss": 1.3911, + "step": 3696 + }, + { + "epoch": 10.073569482288828, + "grad_norm": 8.971731185913086, + "learning_rate": 1.973872177963374e-05, + "loss": 1.1599, + "step": 3697 + }, + { + "epoch": 10.076294277929156, + "grad_norm": 11.588750839233398, + "learning_rate": 1.9738521329956347e-05, + "loss": 1.1902, + "step": 3698 + }, + { + "epoch": 10.079019073569482, + "grad_norm": 11.11839485168457, + "learning_rate": 1.9738320804435662e-05, + "loss": 1.3882, + "step": 3699 + }, + { + "epoch": 10.08174386920981, + "grad_norm": 9.18759536743164, + "learning_rate": 1.973812020307325e-05, + "loss": 1.179, + "step": 3700 + }, + { + "epoch": 10.084468664850137, + "grad_norm": 9.8154878616333, + "learning_rate": 1.973791952587067e-05, + "loss": 1.54, + "step": 3701 + }, + { + "epoch": 10.087193460490463, + "grad_norm": 10.527271270751953, + "learning_rate": 1.9737718772829485e-05, + "loss": 1.2053, + "step": 3702 + }, + { + "epoch": 10.08991825613079, + "grad_norm": 13.684199333190918, + "learning_rate": 1.9737517943951262e-05, + "loss": 1.176, + "step": 3703 + }, + { + "epoch": 10.092643051771118, + "grad_norm": 10.439043998718262, + "learning_rate": 1.9737317039237563e-05, + "loss": 1.2402, + "step": 3704 + }, + { + "epoch": 10.095367847411444, + "grad_norm": 17.306127548217773, + "learning_rate": 1.973711605868995e-05, + "loss": 1.2937, + "step": 3705 + }, + { + "epoch": 10.098092643051771, + "grad_norm": 10.449017524719238, + "learning_rate": 1.973691500230999e-05, + "loss": 1.3955, + "step": 3706 + }, + { + "epoch": 10.100817438692099, + "grad_norm": 7.04243803024292, + "learning_rate": 1.9736713870099253e-05, + "loss": 1.0579, + "step": 3707 + }, + { + "epoch": 10.103542234332425, + "grad_norm": 8.271339416503906, + "learning_rate": 1.97365126620593e-05, + "loss": 1.2466, + "step": 3708 + }, + { + "epoch": 10.106267029972752, + "grad_norm": 9.956682205200195, + "learning_rate": 1.97363113781917e-05, + "loss": 1.2231, + "step": 3709 + }, + { + "epoch": 10.10899182561308, + "grad_norm": 11.767767906188965, + "learning_rate": 1.9736110018498017e-05, + "loss": 1.2996, + "step": 3710 + }, + { + "epoch": 10.111716621253406, + "grad_norm": 9.663322448730469, + "learning_rate": 1.973590858297983e-05, + "loss": 1.313, + "step": 3711 + }, + { + "epoch": 10.114441416893733, + "grad_norm": 9.044020652770996, + "learning_rate": 1.9735707071638693e-05, + "loss": 1.163, + "step": 3712 + }, + { + "epoch": 10.11716621253406, + "grad_norm": 11.269691467285156, + "learning_rate": 1.9735505484476186e-05, + "loss": 1.1702, + "step": 3713 + }, + { + "epoch": 10.119891008174386, + "grad_norm": 8.530739784240723, + "learning_rate": 1.9735303821493876e-05, + "loss": 1.1389, + "step": 3714 + }, + { + "epoch": 10.122615803814714, + "grad_norm": 12.510598182678223, + "learning_rate": 1.9735102082693332e-05, + "loss": 1.3535, + "step": 3715 + }, + { + "epoch": 10.125340599455042, + "grad_norm": 8.907414436340332, + "learning_rate": 1.9734900268076126e-05, + "loss": 1.2559, + "step": 3716 + }, + { + "epoch": 10.128065395095367, + "grad_norm": 9.467856407165527, + "learning_rate": 1.973469837764383e-05, + "loss": 1.3218, + "step": 3717 + }, + { + "epoch": 10.130790190735695, + "grad_norm": 9.451179504394531, + "learning_rate": 1.9734496411398015e-05, + "loss": 1.2432, + "step": 3718 + }, + { + "epoch": 10.133514986376023, + "grad_norm": 8.923680305480957, + "learning_rate": 1.973429436934026e-05, + "loss": 1.2878, + "step": 3719 + }, + { + "epoch": 10.136239782016348, + "grad_norm": 9.132368087768555, + "learning_rate": 1.973409225147213e-05, + "loss": 1.0828, + "step": 3720 + }, + { + "epoch": 10.138964577656676, + "grad_norm": 7.689108371734619, + "learning_rate": 1.9733890057795203e-05, + "loss": 1.1726, + "step": 3721 + }, + { + "epoch": 10.141689373297003, + "grad_norm": 8.812626838684082, + "learning_rate": 1.9733687788311055e-05, + "loss": 1.3396, + "step": 3722 + }, + { + "epoch": 10.14441416893733, + "grad_norm": 9.01380729675293, + "learning_rate": 1.973348544302126e-05, + "loss": 1.4514, + "step": 3723 + }, + { + "epoch": 10.147138964577657, + "grad_norm": 9.405804634094238, + "learning_rate": 1.973328302192739e-05, + "loss": 1.4629, + "step": 3724 + }, + { + "epoch": 10.149863760217984, + "grad_norm": 10.039285659790039, + "learning_rate": 1.973308052503103e-05, + "loss": 1.2334, + "step": 3725 + }, + { + "epoch": 10.15258855585831, + "grad_norm": 9.150543212890625, + "learning_rate": 1.9732877952333748e-05, + "loss": 1.4014, + "step": 3726 + }, + { + "epoch": 10.155313351498638, + "grad_norm": 9.5938720703125, + "learning_rate": 1.973267530383713e-05, + "loss": 1.3809, + "step": 3727 + }, + { + "epoch": 10.158038147138965, + "grad_norm": 8.93763542175293, + "learning_rate": 1.9732472579542746e-05, + "loss": 1.4094, + "step": 3728 + }, + { + "epoch": 10.160762942779291, + "grad_norm": 15.509340286254883, + "learning_rate": 1.973226977945218e-05, + "loss": 1.2356, + "step": 3729 + }, + { + "epoch": 10.163487738419619, + "grad_norm": 7.8337321281433105, + "learning_rate": 1.973206690356701e-05, + "loss": 1.2112, + "step": 3730 + }, + { + "epoch": 10.166212534059946, + "grad_norm": 9.732722282409668, + "learning_rate": 1.9731863951888818e-05, + "loss": 1.5032, + "step": 3731 + }, + { + "epoch": 10.168937329700272, + "grad_norm": 10.353492736816406, + "learning_rate": 1.9731660924419182e-05, + "loss": 1.4467, + "step": 3732 + }, + { + "epoch": 10.1716621253406, + "grad_norm": 7.0989556312561035, + "learning_rate": 1.9731457821159684e-05, + "loss": 1.085, + "step": 3733 + }, + { + "epoch": 10.174386920980927, + "grad_norm": 9.056624412536621, + "learning_rate": 1.9731254642111902e-05, + "loss": 1.1536, + "step": 3734 + }, + { + "epoch": 10.177111716621253, + "grad_norm": 8.502835273742676, + "learning_rate": 1.9731051387277427e-05, + "loss": 1.1707, + "step": 3735 + }, + { + "epoch": 10.17983651226158, + "grad_norm": 9.250792503356934, + "learning_rate": 1.9730848056657836e-05, + "loss": 1.3557, + "step": 3736 + }, + { + "epoch": 10.182561307901908, + "grad_norm": 8.868075370788574, + "learning_rate": 1.9730644650254713e-05, + "loss": 1.2949, + "step": 3737 + }, + { + "epoch": 10.185286103542234, + "grad_norm": 8.198171615600586, + "learning_rate": 1.973044116806964e-05, + "loss": 1.1875, + "step": 3738 + }, + { + "epoch": 10.188010899182562, + "grad_norm": 8.920578956604004, + "learning_rate": 1.9730237610104206e-05, + "loss": 1.0823, + "step": 3739 + }, + { + "epoch": 10.190735694822889, + "grad_norm": 7.37108039855957, + "learning_rate": 1.9730033976359997e-05, + "loss": 1.155, + "step": 3740 + }, + { + "epoch": 10.193460490463215, + "grad_norm": 8.776039123535156, + "learning_rate": 1.9729830266838595e-05, + "loss": 1.3577, + "step": 3741 + }, + { + "epoch": 10.196185286103542, + "grad_norm": 7.64220666885376, + "learning_rate": 1.9729626481541588e-05, + "loss": 1.3101, + "step": 3742 + }, + { + "epoch": 10.19891008174387, + "grad_norm": 7.907156467437744, + "learning_rate": 1.9729422620470565e-05, + "loss": 1.4675, + "step": 3743 + }, + { + "epoch": 10.201634877384196, + "grad_norm": 7.8961100578308105, + "learning_rate": 1.972921868362711e-05, + "loss": 1.261, + "step": 3744 + }, + { + "epoch": 10.204359673024523, + "grad_norm": 6.774257183074951, + "learning_rate": 1.972901467101281e-05, + "loss": 1.1376, + "step": 3745 + }, + { + "epoch": 10.207084468664851, + "grad_norm": 9.262910842895508, + "learning_rate": 1.972881058262926e-05, + "loss": 1.2229, + "step": 3746 + }, + { + "epoch": 10.209809264305177, + "grad_norm": 7.917628765106201, + "learning_rate": 1.9728606418478046e-05, + "loss": 1.4253, + "step": 3747 + }, + { + "epoch": 10.212534059945504, + "grad_norm": 7.9029693603515625, + "learning_rate": 1.9728402178560757e-05, + "loss": 1.0979, + "step": 3748 + }, + { + "epoch": 10.215258855585832, + "grad_norm": 10.971442222595215, + "learning_rate": 1.972819786287899e-05, + "loss": 1.1077, + "step": 3749 + }, + { + "epoch": 10.217983651226158, + "grad_norm": 8.34411907196045, + "learning_rate": 1.9727993471434326e-05, + "loss": 1.334, + "step": 3750 + }, + { + "epoch": 10.220708446866485, + "grad_norm": 7.335469722747803, + "learning_rate": 1.9727789004228362e-05, + "loss": 1.2454, + "step": 3751 + }, + { + "epoch": 10.223433242506813, + "grad_norm": 7.210789680480957, + "learning_rate": 1.972758446126269e-05, + "loss": 1.395, + "step": 3752 + }, + { + "epoch": 10.226158038147139, + "grad_norm": 9.126672744750977, + "learning_rate": 1.972737984253891e-05, + "loss": 1.3259, + "step": 3753 + }, + { + "epoch": 10.228882833787466, + "grad_norm": 7.081237316131592, + "learning_rate": 1.9727175148058603e-05, + "loss": 1.1564, + "step": 3754 + }, + { + "epoch": 10.231607629427794, + "grad_norm": 8.507473945617676, + "learning_rate": 1.9726970377823367e-05, + "loss": 1.1432, + "step": 3755 + }, + { + "epoch": 10.23433242506812, + "grad_norm": 14.03199577331543, + "learning_rate": 1.9726765531834803e-05, + "loss": 1.4624, + "step": 3756 + }, + { + "epoch": 10.237057220708447, + "grad_norm": 8.498391151428223, + "learning_rate": 1.9726560610094497e-05, + "loss": 1.1757, + "step": 3757 + }, + { + "epoch": 10.239782016348773, + "grad_norm": 10.178677558898926, + "learning_rate": 1.9726355612604058e-05, + "loss": 1.2178, + "step": 3758 + }, + { + "epoch": 10.2425068119891, + "grad_norm": 8.009960174560547, + "learning_rate": 1.972615053936507e-05, + "loss": 1.311, + "step": 3759 + }, + { + "epoch": 10.245231607629428, + "grad_norm": 8.563240051269531, + "learning_rate": 1.9725945390379135e-05, + "loss": 1.2861, + "step": 3760 + }, + { + "epoch": 10.247956403269754, + "grad_norm": 9.629040718078613, + "learning_rate": 1.972574016564785e-05, + "loss": 1.4379, + "step": 3761 + }, + { + "epoch": 10.250681198910081, + "grad_norm": 9.098408699035645, + "learning_rate": 1.9725534865172814e-05, + "loss": 1.52, + "step": 3762 + }, + { + "epoch": 10.253405994550409, + "grad_norm": 8.469637870788574, + "learning_rate": 1.9725329488955625e-05, + "loss": 1.3036, + "step": 3763 + }, + { + "epoch": 10.256130790190735, + "grad_norm": 8.403144836425781, + "learning_rate": 1.972512403699788e-05, + "loss": 1.1606, + "step": 3764 + }, + { + "epoch": 10.258855585831062, + "grad_norm": 7.526834964752197, + "learning_rate": 1.9724918509301186e-05, + "loss": 1.3171, + "step": 3765 + }, + { + "epoch": 10.26158038147139, + "grad_norm": 9.698179244995117, + "learning_rate": 1.972471290586714e-05, + "loss": 1.4565, + "step": 3766 + }, + { + "epoch": 10.264305177111716, + "grad_norm": 8.261470794677734, + "learning_rate": 1.9724507226697343e-05, + "loss": 1.1653, + "step": 3767 + }, + { + "epoch": 10.267029972752043, + "grad_norm": 7.540979385375977, + "learning_rate": 1.9724301471793394e-05, + "loss": 1.1472, + "step": 3768 + }, + { + "epoch": 10.269754768392371, + "grad_norm": 8.067627906799316, + "learning_rate": 1.9724095641156903e-05, + "loss": 1.083, + "step": 3769 + }, + { + "epoch": 10.272479564032697, + "grad_norm": 9.930658340454102, + "learning_rate": 1.972388973478946e-05, + "loss": 1.3225, + "step": 3770 + }, + { + "epoch": 10.275204359673024, + "grad_norm": 7.763191223144531, + "learning_rate": 1.9723683752692683e-05, + "loss": 1.449, + "step": 3771 + }, + { + "epoch": 10.277929155313352, + "grad_norm": 7.233214855194092, + "learning_rate": 1.9723477694868166e-05, + "loss": 1.1707, + "step": 3772 + }, + { + "epoch": 10.280653950953678, + "grad_norm": 9.923511505126953, + "learning_rate": 1.972327156131752e-05, + "loss": 1.3611, + "step": 3773 + }, + { + "epoch": 10.283378746594005, + "grad_norm": 9.412862777709961, + "learning_rate": 1.972306535204235e-05, + "loss": 1.616, + "step": 3774 + }, + { + "epoch": 10.286103542234333, + "grad_norm": 10.132314682006836, + "learning_rate": 1.972285906704426e-05, + "loss": 1.2781, + "step": 3775 + }, + { + "epoch": 10.288828337874659, + "grad_norm": 10.205955505371094, + "learning_rate": 1.9722652706324853e-05, + "loss": 1.3584, + "step": 3776 + }, + { + "epoch": 10.291553133514986, + "grad_norm": 8.780740737915039, + "learning_rate": 1.972244626988574e-05, + "loss": 1.2617, + "step": 3777 + }, + { + "epoch": 10.294277929155314, + "grad_norm": 8.577252388000488, + "learning_rate": 1.972223975772853e-05, + "loss": 1.3442, + "step": 3778 + }, + { + "epoch": 10.29700272479564, + "grad_norm": 21.673694610595703, + "learning_rate": 1.9722033169854828e-05, + "loss": 1.2632, + "step": 3779 + }, + { + "epoch": 10.299727520435967, + "grad_norm": 10.122228622436523, + "learning_rate": 1.972182650626625e-05, + "loss": 1.3464, + "step": 3780 + }, + { + "epoch": 10.302452316076295, + "grad_norm": 9.061145782470703, + "learning_rate": 1.9721619766964393e-05, + "loss": 1.2012, + "step": 3781 + }, + { + "epoch": 10.30517711171662, + "grad_norm": 10.760348320007324, + "learning_rate": 1.9721412951950876e-05, + "loss": 1.2756, + "step": 3782 + }, + { + "epoch": 10.307901907356948, + "grad_norm": 9.252158164978027, + "learning_rate": 1.9721206061227312e-05, + "loss": 1.1973, + "step": 3783 + }, + { + "epoch": 10.310626702997276, + "grad_norm": 8.771831512451172, + "learning_rate": 1.9720999094795303e-05, + "loss": 1.3455, + "step": 3784 + }, + { + "epoch": 10.313351498637601, + "grad_norm": 42.56612777709961, + "learning_rate": 1.9720792052656468e-05, + "loss": 1.1782, + "step": 3785 + }, + { + "epoch": 10.316076294277929, + "grad_norm": 10.31918716430664, + "learning_rate": 1.9720584934812417e-05, + "loss": 1.3016, + "step": 3786 + }, + { + "epoch": 10.318801089918257, + "grad_norm": 11.992305755615234, + "learning_rate": 1.9720377741264762e-05, + "loss": 1.3696, + "step": 3787 + }, + { + "epoch": 10.321525885558582, + "grad_norm": 9.100144386291504, + "learning_rate": 1.972017047201512e-05, + "loss": 1.4116, + "step": 3788 + }, + { + "epoch": 10.32425068119891, + "grad_norm": 9.619243621826172, + "learning_rate": 1.9719963127065106e-05, + "loss": 1.2756, + "step": 3789 + }, + { + "epoch": 10.326975476839237, + "grad_norm": 9.421488761901855, + "learning_rate": 1.9719755706416327e-05, + "loss": 1.3113, + "step": 3790 + }, + { + "epoch": 10.329700272479563, + "grad_norm": 12.199220657348633, + "learning_rate": 1.9719548210070406e-05, + "loss": 1.0781, + "step": 3791 + }, + { + "epoch": 10.33242506811989, + "grad_norm": 9.928030014038086, + "learning_rate": 1.9719340638028952e-05, + "loss": 1.2095, + "step": 3792 + }, + { + "epoch": 10.335149863760218, + "grad_norm": 9.56116008758545, + "learning_rate": 1.971913299029359e-05, + "loss": 1.1885, + "step": 3793 + }, + { + "epoch": 10.337874659400544, + "grad_norm": 7.255523681640625, + "learning_rate": 1.9718925266865933e-05, + "loss": 1.1289, + "step": 3794 + }, + { + "epoch": 10.340599455040872, + "grad_norm": 9.008003234863281, + "learning_rate": 1.97187174677476e-05, + "loss": 1.291, + "step": 3795 + }, + { + "epoch": 10.3433242506812, + "grad_norm": 9.741546630859375, + "learning_rate": 1.9718509592940206e-05, + "loss": 1.5688, + "step": 3796 + }, + { + "epoch": 10.346049046321525, + "grad_norm": 9.080355644226074, + "learning_rate": 1.971830164244537e-05, + "loss": 1.5061, + "step": 3797 + }, + { + "epoch": 10.348773841961853, + "grad_norm": 10.598738670349121, + "learning_rate": 1.9718093616264717e-05, + "loss": 1.4241, + "step": 3798 + }, + { + "epoch": 10.35149863760218, + "grad_norm": 9.218337059020996, + "learning_rate": 1.9717885514399865e-05, + "loss": 1.3118, + "step": 3799 + }, + { + "epoch": 10.354223433242506, + "grad_norm": 11.137333869934082, + "learning_rate": 1.971767733685243e-05, + "loss": 1.2661, + "step": 3800 + }, + { + "epoch": 10.356948228882834, + "grad_norm": 9.336284637451172, + "learning_rate": 1.9717469083624037e-05, + "loss": 1.1646, + "step": 3801 + }, + { + "epoch": 10.359673024523161, + "grad_norm": 8.485359191894531, + "learning_rate": 1.9717260754716306e-05, + "loss": 1.2327, + "step": 3802 + }, + { + "epoch": 10.362397820163487, + "grad_norm": 10.281926155090332, + "learning_rate": 1.9717052350130864e-05, + "loss": 1.3621, + "step": 3803 + }, + { + "epoch": 10.365122615803815, + "grad_norm": 9.651093482971191, + "learning_rate": 1.971684386986933e-05, + "loss": 1.2651, + "step": 3804 + }, + { + "epoch": 10.367847411444142, + "grad_norm": 7.217008113861084, + "learning_rate": 1.9716635313933334e-05, + "loss": 1.187, + "step": 3805 + }, + { + "epoch": 10.370572207084468, + "grad_norm": 11.755059242248535, + "learning_rate": 1.9716426682324488e-05, + "loss": 1.1824, + "step": 3806 + }, + { + "epoch": 10.373297002724795, + "grad_norm": 9.702676773071289, + "learning_rate": 1.9716217975044426e-05, + "loss": 1.145, + "step": 3807 + }, + { + "epoch": 10.376021798365123, + "grad_norm": 8.324348449707031, + "learning_rate": 1.971600919209477e-05, + "loss": 1.2952, + "step": 3808 + }, + { + "epoch": 10.378746594005449, + "grad_norm": 8.522875785827637, + "learning_rate": 1.9715800333477148e-05, + "loss": 1.2107, + "step": 3809 + }, + { + "epoch": 10.381471389645776, + "grad_norm": 10.177056312561035, + "learning_rate": 1.9715591399193184e-05, + "loss": 1.2394, + "step": 3810 + }, + { + "epoch": 10.384196185286104, + "grad_norm": 8.588276863098145, + "learning_rate": 1.971538238924451e-05, + "loss": 1.4268, + "step": 3811 + }, + { + "epoch": 10.38692098092643, + "grad_norm": 9.623733520507812, + "learning_rate": 1.971517330363275e-05, + "loss": 1.2933, + "step": 3812 + }, + { + "epoch": 10.389645776566757, + "grad_norm": 8.727866172790527, + "learning_rate": 1.971496414235953e-05, + "loss": 1.2993, + "step": 3813 + }, + { + "epoch": 10.392370572207085, + "grad_norm": 7.569778919219971, + "learning_rate": 1.9714754905426484e-05, + "loss": 1.144, + "step": 3814 + }, + { + "epoch": 10.39509536784741, + "grad_norm": 10.021020889282227, + "learning_rate": 1.971454559283524e-05, + "loss": 1.3115, + "step": 3815 + }, + { + "epoch": 10.397820163487738, + "grad_norm": 9.4724702835083, + "learning_rate": 1.971433620458743e-05, + "loss": 1.1936, + "step": 3816 + }, + { + "epoch": 10.400544959128066, + "grad_norm": 8.412431716918945, + "learning_rate": 1.9714126740684677e-05, + "loss": 1.1482, + "step": 3817 + }, + { + "epoch": 10.403269754768392, + "grad_norm": 9.864459991455078, + "learning_rate": 1.971391720112862e-05, + "loss": 1.2603, + "step": 3818 + }, + { + "epoch": 10.40599455040872, + "grad_norm": 10.525559425354004, + "learning_rate": 1.971370758592089e-05, + "loss": 1.3506, + "step": 3819 + }, + { + "epoch": 10.408719346049047, + "grad_norm": 9.138388633728027, + "learning_rate": 1.9713497895063116e-05, + "loss": 1.3379, + "step": 3820 + }, + { + "epoch": 10.411444141689373, + "grad_norm": 25.672163009643555, + "learning_rate": 1.9713288128556932e-05, + "loss": 1.3042, + "step": 3821 + }, + { + "epoch": 10.4141689373297, + "grad_norm": 8.900979995727539, + "learning_rate": 1.9713078286403973e-05, + "loss": 1.3018, + "step": 3822 + }, + { + "epoch": 10.416893732970028, + "grad_norm": 9.162127494812012, + "learning_rate": 1.9712868368605877e-05, + "loss": 1.2988, + "step": 3823 + }, + { + "epoch": 10.419618528610354, + "grad_norm": 9.616890907287598, + "learning_rate": 1.9712658375164272e-05, + "loss": 1.2065, + "step": 3824 + }, + { + "epoch": 10.422343324250681, + "grad_norm": 7.914255142211914, + "learning_rate": 1.9712448306080793e-05, + "loss": 1.2363, + "step": 3825 + }, + { + "epoch": 10.425068119891009, + "grad_norm": 9.041911125183105, + "learning_rate": 1.9712238161357084e-05, + "loss": 1.2035, + "step": 3826 + }, + { + "epoch": 10.427792915531334, + "grad_norm": 9.996464729309082, + "learning_rate": 1.9712027940994777e-05, + "loss": 1.5454, + "step": 3827 + }, + { + "epoch": 10.430517711171662, + "grad_norm": 10.33507251739502, + "learning_rate": 1.9711817644995504e-05, + "loss": 1.3087, + "step": 3828 + }, + { + "epoch": 10.43324250681199, + "grad_norm": 6.783405303955078, + "learning_rate": 1.9711607273360912e-05, + "loss": 1.0486, + "step": 3829 + }, + { + "epoch": 10.435967302452315, + "grad_norm": 9.515064239501953, + "learning_rate": 1.9711396826092634e-05, + "loss": 1.2166, + "step": 3830 + }, + { + "epoch": 10.438692098092643, + "grad_norm": 11.367918014526367, + "learning_rate": 1.971118630319231e-05, + "loss": 1.2151, + "step": 3831 + }, + { + "epoch": 10.44141689373297, + "grad_norm": 11.599645614624023, + "learning_rate": 1.971097570466158e-05, + "loss": 1.4387, + "step": 3832 + }, + { + "epoch": 10.444141689373296, + "grad_norm": 9.678275108337402, + "learning_rate": 1.9710765030502085e-05, + "loss": 1.2834, + "step": 3833 + }, + { + "epoch": 10.446866485013624, + "grad_norm": 9.844661712646484, + "learning_rate": 1.971055428071546e-05, + "loss": 1.3894, + "step": 3834 + }, + { + "epoch": 10.449591280653951, + "grad_norm": 9.34825325012207, + "learning_rate": 1.9710343455303354e-05, + "loss": 1.4243, + "step": 3835 + }, + { + "epoch": 10.452316076294277, + "grad_norm": 9.034146308898926, + "learning_rate": 1.9710132554267404e-05, + "loss": 1.3154, + "step": 3836 + }, + { + "epoch": 10.455040871934605, + "grad_norm": 7.973133087158203, + "learning_rate": 1.9709921577609256e-05, + "loss": 1.2537, + "step": 3837 + }, + { + "epoch": 10.457765667574932, + "grad_norm": 8.211280822753906, + "learning_rate": 1.9709710525330548e-05, + "loss": 1.2642, + "step": 3838 + }, + { + "epoch": 10.460490463215258, + "grad_norm": 7.642856121063232, + "learning_rate": 1.9709499397432933e-05, + "loss": 1.1416, + "step": 3839 + }, + { + "epoch": 10.463215258855586, + "grad_norm": 11.273480415344238, + "learning_rate": 1.9709288193918044e-05, + "loss": 1.4062, + "step": 3840 + }, + { + "epoch": 10.465940054495913, + "grad_norm": 8.373019218444824, + "learning_rate": 1.9709076914787535e-05, + "loss": 1.3447, + "step": 3841 + }, + { + "epoch": 10.46866485013624, + "grad_norm": 6.9242167472839355, + "learning_rate": 1.9708865560043044e-05, + "loss": 1.2529, + "step": 3842 + }, + { + "epoch": 10.471389645776567, + "grad_norm": 10.533818244934082, + "learning_rate": 1.9708654129686224e-05, + "loss": 1.3271, + "step": 3843 + }, + { + "epoch": 10.474114441416894, + "grad_norm": 8.539103507995605, + "learning_rate": 1.9708442623718715e-05, + "loss": 1.3213, + "step": 3844 + }, + { + "epoch": 10.47683923705722, + "grad_norm": 18.204378128051758, + "learning_rate": 1.9708231042142166e-05, + "loss": 1.1941, + "step": 3845 + }, + { + "epoch": 10.479564032697548, + "grad_norm": 7.1978020668029785, + "learning_rate": 1.970801938495823e-05, + "loss": 1.3103, + "step": 3846 + }, + { + "epoch": 10.482288828337875, + "grad_norm": 7.041075706481934, + "learning_rate": 1.970780765216855e-05, + "loss": 1.178, + "step": 3847 + }, + { + "epoch": 10.485013623978201, + "grad_norm": 9.322103500366211, + "learning_rate": 1.9707595843774775e-05, + "loss": 1.4185, + "step": 3848 + }, + { + "epoch": 10.487738419618529, + "grad_norm": 13.164305686950684, + "learning_rate": 1.970738395977856e-05, + "loss": 1.3958, + "step": 3849 + }, + { + "epoch": 10.490463215258856, + "grad_norm": 10.326935768127441, + "learning_rate": 1.9707172000181546e-05, + "loss": 1.1398, + "step": 3850 + }, + { + "epoch": 10.493188010899182, + "grad_norm": 11.156216621398926, + "learning_rate": 1.9706959964985393e-05, + "loss": 1.3259, + "step": 3851 + }, + { + "epoch": 10.49591280653951, + "grad_norm": 8.280145645141602, + "learning_rate": 1.9706747854191745e-05, + "loss": 1.1892, + "step": 3852 + }, + { + "epoch": 10.498637602179837, + "grad_norm": 7.20928430557251, + "learning_rate": 1.970653566780226e-05, + "loss": 1.2397, + "step": 3853 + }, + { + "epoch": 10.501362397820163, + "grad_norm": 8.880866050720215, + "learning_rate": 1.9706323405818585e-05, + "loss": 1.1702, + "step": 3854 + }, + { + "epoch": 10.50408719346049, + "grad_norm": 9.814594268798828, + "learning_rate": 1.970611106824238e-05, + "loss": 1.2422, + "step": 3855 + }, + { + "epoch": 10.506811989100818, + "grad_norm": 9.441638946533203, + "learning_rate": 1.970589865507529e-05, + "loss": 1.4011, + "step": 3856 + }, + { + "epoch": 10.509536784741144, + "grad_norm": 12.693705558776855, + "learning_rate": 1.9705686166318973e-05, + "loss": 1.1509, + "step": 3857 + }, + { + "epoch": 10.512261580381471, + "grad_norm": 8.02194881439209, + "learning_rate": 1.9705473601975086e-05, + "loss": 1.2563, + "step": 3858 + }, + { + "epoch": 10.514986376021799, + "grad_norm": 9.439316749572754, + "learning_rate": 1.9705260962045286e-05, + "loss": 1.0911, + "step": 3859 + }, + { + "epoch": 10.517711171662125, + "grad_norm": 8.744632720947266, + "learning_rate": 1.9705048246531223e-05, + "loss": 1.2751, + "step": 3860 + }, + { + "epoch": 10.520435967302452, + "grad_norm": 9.701316833496094, + "learning_rate": 1.9704835455434556e-05, + "loss": 1.3284, + "step": 3861 + }, + { + "epoch": 10.52316076294278, + "grad_norm": 10.048924446105957, + "learning_rate": 1.9704622588756946e-05, + "loss": 1.1418, + "step": 3862 + }, + { + "epoch": 10.525885558583106, + "grad_norm": 9.116254806518555, + "learning_rate": 1.9704409646500044e-05, + "loss": 1.2899, + "step": 3863 + }, + { + "epoch": 10.528610354223433, + "grad_norm": 8.23773193359375, + "learning_rate": 1.970419662866551e-05, + "loss": 1.3109, + "step": 3864 + }, + { + "epoch": 10.53133514986376, + "grad_norm": 9.133581161499023, + "learning_rate": 1.9703983535255013e-05, + "loss": 1.4475, + "step": 3865 + }, + { + "epoch": 10.534059945504087, + "grad_norm": 8.2056303024292, + "learning_rate": 1.97037703662702e-05, + "loss": 1.3225, + "step": 3866 + }, + { + "epoch": 10.536784741144414, + "grad_norm": 8.202545166015625, + "learning_rate": 1.9703557121712737e-05, + "loss": 1.1953, + "step": 3867 + }, + { + "epoch": 10.539509536784742, + "grad_norm": 11.55584716796875, + "learning_rate": 1.9703343801584282e-05, + "loss": 1.2284, + "step": 3868 + }, + { + "epoch": 10.542234332425068, + "grad_norm": 10.944612503051758, + "learning_rate": 1.9703130405886496e-05, + "loss": 1.2878, + "step": 3869 + }, + { + "epoch": 10.544959128065395, + "grad_norm": 8.7283296585083, + "learning_rate": 1.9702916934621044e-05, + "loss": 1.3218, + "step": 3870 + }, + { + "epoch": 10.547683923705723, + "grad_norm": 9.210609436035156, + "learning_rate": 1.970270338778959e-05, + "loss": 1.3323, + "step": 3871 + }, + { + "epoch": 10.550408719346049, + "grad_norm": 12.175301551818848, + "learning_rate": 1.970248976539379e-05, + "loss": 1.5093, + "step": 3872 + }, + { + "epoch": 10.553133514986376, + "grad_norm": 9.581300735473633, + "learning_rate": 1.9702276067435316e-05, + "loss": 1.2495, + "step": 3873 + }, + { + "epoch": 10.555858310626704, + "grad_norm": 16.556753158569336, + "learning_rate": 1.9702062293915827e-05, + "loss": 1.4321, + "step": 3874 + }, + { + "epoch": 10.55858310626703, + "grad_norm": 10.717095375061035, + "learning_rate": 1.9701848444836987e-05, + "loss": 1.4023, + "step": 3875 + }, + { + "epoch": 10.561307901907357, + "grad_norm": 168.3912353515625, + "learning_rate": 1.9701634520200468e-05, + "loss": 1.4412, + "step": 3876 + }, + { + "epoch": 10.564032697547685, + "grad_norm": 11.4203462600708, + "learning_rate": 1.9701420520007928e-05, + "loss": 1.4312, + "step": 3877 + }, + { + "epoch": 10.56675749318801, + "grad_norm": 13.96320629119873, + "learning_rate": 1.970120644426104e-05, + "loss": 1.2971, + "step": 3878 + }, + { + "epoch": 10.569482288828338, + "grad_norm": 11.062853813171387, + "learning_rate": 1.9700992292961464e-05, + "loss": 1.5339, + "step": 3879 + }, + { + "epoch": 10.572207084468666, + "grad_norm": 21.22389793395996, + "learning_rate": 1.9700778066110873e-05, + "loss": 1.4445, + "step": 3880 + }, + { + "epoch": 10.574931880108991, + "grad_norm": 12.854517936706543, + "learning_rate": 1.9700563763710937e-05, + "loss": 1.498, + "step": 3881 + }, + { + "epoch": 10.577656675749319, + "grad_norm": 12.884160041809082, + "learning_rate": 1.9700349385763323e-05, + "loss": 1.3398, + "step": 3882 + }, + { + "epoch": 10.580381471389646, + "grad_norm": 11.598206520080566, + "learning_rate": 1.9700134932269698e-05, + "loss": 1.0874, + "step": 3883 + }, + { + "epoch": 10.583106267029972, + "grad_norm": 9.25067138671875, + "learning_rate": 1.9699920403231734e-05, + "loss": 1.1362, + "step": 3884 + }, + { + "epoch": 10.5858310626703, + "grad_norm": 14.375128746032715, + "learning_rate": 1.9699705798651104e-05, + "loss": 1.3901, + "step": 3885 + }, + { + "epoch": 10.588555858310627, + "grad_norm": 15.819267272949219, + "learning_rate": 1.9699491118529476e-05, + "loss": 1.2039, + "step": 3886 + }, + { + "epoch": 10.591280653950953, + "grad_norm": 26.65336799621582, + "learning_rate": 1.9699276362868526e-05, + "loss": 1.3782, + "step": 3887 + }, + { + "epoch": 10.59400544959128, + "grad_norm": 9.443343162536621, + "learning_rate": 1.9699061531669922e-05, + "loss": 1.2375, + "step": 3888 + }, + { + "epoch": 10.596730245231608, + "grad_norm": 11.523008346557617, + "learning_rate": 1.969884662493534e-05, + "loss": 1.2773, + "step": 3889 + }, + { + "epoch": 10.599455040871934, + "grad_norm": 13.750526428222656, + "learning_rate": 1.969863164266645e-05, + "loss": 1.1868, + "step": 3890 + }, + { + "epoch": 10.602179836512262, + "grad_norm": 13.709173202514648, + "learning_rate": 1.9698416584864932e-05, + "loss": 1.4307, + "step": 3891 + }, + { + "epoch": 10.60490463215259, + "grad_norm": 16.232471466064453, + "learning_rate": 1.9698201451532458e-05, + "loss": 1.3699, + "step": 3892 + }, + { + "epoch": 10.607629427792915, + "grad_norm": 13.37336254119873, + "learning_rate": 1.9697986242670703e-05, + "loss": 1.2227, + "step": 3893 + }, + { + "epoch": 10.610354223433243, + "grad_norm": 21.085451126098633, + "learning_rate": 1.969777095828134e-05, + "loss": 1.4746, + "step": 3894 + }, + { + "epoch": 10.61307901907357, + "grad_norm": 11.080826759338379, + "learning_rate": 1.969755559836605e-05, + "loss": 1.1066, + "step": 3895 + }, + { + "epoch": 10.615803814713896, + "grad_norm": 21.83421516418457, + "learning_rate": 1.969734016292651e-05, + "loss": 1.3494, + "step": 3896 + }, + { + "epoch": 10.618528610354224, + "grad_norm": 10.210470199584961, + "learning_rate": 1.9697124651964397e-05, + "loss": 1.2649, + "step": 3897 + }, + { + "epoch": 10.621253405994551, + "grad_norm": 11.174847602844238, + "learning_rate": 1.969690906548139e-05, + "loss": 1.4182, + "step": 3898 + }, + { + "epoch": 10.623978201634877, + "grad_norm": 18.439865112304688, + "learning_rate": 1.9696693403479165e-05, + "loss": 1.4883, + "step": 3899 + }, + { + "epoch": 10.626702997275205, + "grad_norm": 13.370489120483398, + "learning_rate": 1.9696477665959405e-05, + "loss": 1.281, + "step": 3900 + }, + { + "epoch": 10.629427792915532, + "grad_norm": 17.80059051513672, + "learning_rate": 1.969626185292379e-05, + "loss": 1.2476, + "step": 3901 + }, + { + "epoch": 10.632152588555858, + "grad_norm": 10.8162841796875, + "learning_rate": 1.9696045964374e-05, + "loss": 1.276, + "step": 3902 + }, + { + "epoch": 10.634877384196185, + "grad_norm": 9.661311149597168, + "learning_rate": 1.9695830000311716e-05, + "loss": 1.1792, + "step": 3903 + }, + { + "epoch": 10.637602179836513, + "grad_norm": 11.938919067382812, + "learning_rate": 1.9695613960738617e-05, + "loss": 1.3979, + "step": 3904 + }, + { + "epoch": 10.640326975476839, + "grad_norm": 11.777043342590332, + "learning_rate": 1.9695397845656393e-05, + "loss": 1.2119, + "step": 3905 + }, + { + "epoch": 10.643051771117166, + "grad_norm": 13.915650367736816, + "learning_rate": 1.9695181655066718e-05, + "loss": 1.3026, + "step": 3906 + }, + { + "epoch": 10.645776566757494, + "grad_norm": 13.268310546875, + "learning_rate": 1.9694965388971283e-05, + "loss": 1.428, + "step": 3907 + }, + { + "epoch": 10.64850136239782, + "grad_norm": 10.28786563873291, + "learning_rate": 1.969474904737177e-05, + "loss": 1.2898, + "step": 3908 + }, + { + "epoch": 10.651226158038147, + "grad_norm": 10.619996070861816, + "learning_rate": 1.9694532630269864e-05, + "loss": 1.1797, + "step": 3909 + }, + { + "epoch": 10.653950953678475, + "grad_norm": 17.510385513305664, + "learning_rate": 1.9694316137667248e-05, + "loss": 1.3794, + "step": 3910 + }, + { + "epoch": 10.6566757493188, + "grad_norm": 12.013043403625488, + "learning_rate": 1.969409956956561e-05, + "loss": 1.3135, + "step": 3911 + }, + { + "epoch": 10.659400544959128, + "grad_norm": 7.912718772888184, + "learning_rate": 1.969388292596664e-05, + "loss": 1.1248, + "step": 3912 + }, + { + "epoch": 10.662125340599456, + "grad_norm": 7.531147003173828, + "learning_rate": 1.9693666206872017e-05, + "loss": 1.1257, + "step": 3913 + }, + { + "epoch": 10.664850136239782, + "grad_norm": 10.835655212402344, + "learning_rate": 1.9693449412283435e-05, + "loss": 1.2842, + "step": 3914 + }, + { + "epoch": 10.66757493188011, + "grad_norm": 13.660799980163574, + "learning_rate": 1.9693232542202582e-05, + "loss": 1.3916, + "step": 3915 + }, + { + "epoch": 10.670299727520437, + "grad_norm": 14.183218955993652, + "learning_rate": 1.9693015596631143e-05, + "loss": 1.3655, + "step": 3916 + }, + { + "epoch": 10.673024523160763, + "grad_norm": 9.423027038574219, + "learning_rate": 1.9692798575570814e-05, + "loss": 1.4351, + "step": 3917 + }, + { + "epoch": 10.67574931880109, + "grad_norm": 9.637275695800781, + "learning_rate": 1.969258147902328e-05, + "loss": 1.448, + "step": 3918 + }, + { + "epoch": 10.678474114441418, + "grad_norm": 19.27906608581543, + "learning_rate": 1.9692364306990235e-05, + "loss": 1.2805, + "step": 3919 + }, + { + "epoch": 10.681198910081743, + "grad_norm": 11.753655433654785, + "learning_rate": 1.9692147059473367e-05, + "loss": 1.2595, + "step": 3920 + }, + { + "epoch": 10.683923705722071, + "grad_norm": 10.566637992858887, + "learning_rate": 1.969192973647437e-05, + "loss": 1.2373, + "step": 3921 + }, + { + "epoch": 10.686648501362399, + "grad_norm": 10.477239608764648, + "learning_rate": 1.9691712337994938e-05, + "loss": 1.4121, + "step": 3922 + }, + { + "epoch": 10.689373297002724, + "grad_norm": 9.499421119689941, + "learning_rate": 1.969149486403676e-05, + "loss": 1.2876, + "step": 3923 + }, + { + "epoch": 10.692098092643052, + "grad_norm": 19.364608764648438, + "learning_rate": 1.9691277314601534e-05, + "loss": 1.3411, + "step": 3924 + }, + { + "epoch": 10.69482288828338, + "grad_norm": 11.257384300231934, + "learning_rate": 1.969105968969095e-05, + "loss": 1.4094, + "step": 3925 + }, + { + "epoch": 10.697547683923705, + "grad_norm": 10.027420043945312, + "learning_rate": 1.9690841989306703e-05, + "loss": 1.3489, + "step": 3926 + }, + { + "epoch": 10.700272479564033, + "grad_norm": 10.581485748291016, + "learning_rate": 1.9690624213450493e-05, + "loss": 1.3269, + "step": 3927 + }, + { + "epoch": 10.70299727520436, + "grad_norm": 8.834001541137695, + "learning_rate": 1.9690406362124014e-05, + "loss": 1.2834, + "step": 3928 + }, + { + "epoch": 10.705722070844686, + "grad_norm": 10.63623332977295, + "learning_rate": 1.9690188435328962e-05, + "loss": 1.5283, + "step": 3929 + }, + { + "epoch": 10.708446866485014, + "grad_norm": 10.122505187988281, + "learning_rate": 1.9689970433067035e-05, + "loss": 1.312, + "step": 3930 + }, + { + "epoch": 10.711171662125341, + "grad_norm": 12.947110176086426, + "learning_rate": 1.9689752355339928e-05, + "loss": 1.5078, + "step": 3931 + }, + { + "epoch": 10.713896457765667, + "grad_norm": 19.704675674438477, + "learning_rate": 1.9689534202149344e-05, + "loss": 1.3325, + "step": 3932 + }, + { + "epoch": 10.716621253405995, + "grad_norm": 8.936685562133789, + "learning_rate": 1.9689315973496978e-05, + "loss": 1.3584, + "step": 3933 + }, + { + "epoch": 10.719346049046322, + "grad_norm": 11.175673484802246, + "learning_rate": 1.9689097669384533e-05, + "loss": 1.2551, + "step": 3934 + }, + { + "epoch": 10.722070844686648, + "grad_norm": 9.431500434875488, + "learning_rate": 1.9688879289813705e-05, + "loss": 1.1538, + "step": 3935 + }, + { + "epoch": 10.724795640326976, + "grad_norm": 10.447210311889648, + "learning_rate": 1.96886608347862e-05, + "loss": 1.3635, + "step": 3936 + }, + { + "epoch": 10.727520435967303, + "grad_norm": 11.345307350158691, + "learning_rate": 1.9688442304303713e-05, + "loss": 1.3945, + "step": 3937 + }, + { + "epoch": 10.730245231607629, + "grad_norm": 11.375175476074219, + "learning_rate": 1.968822369836795e-05, + "loss": 1.2881, + "step": 3938 + }, + { + "epoch": 10.732970027247957, + "grad_norm": 8.946102142333984, + "learning_rate": 1.968800501698061e-05, + "loss": 1.4264, + "step": 3939 + }, + { + "epoch": 10.735694822888284, + "grad_norm": 11.147432327270508, + "learning_rate": 1.96877862601434e-05, + "loss": 1.2141, + "step": 3940 + }, + { + "epoch": 10.73841961852861, + "grad_norm": 10.1541748046875, + "learning_rate": 1.9687567427858026e-05, + "loss": 1.2441, + "step": 3941 + }, + { + "epoch": 10.741144414168938, + "grad_norm": 8.995576858520508, + "learning_rate": 1.9687348520126187e-05, + "loss": 1.3813, + "step": 3942 + }, + { + "epoch": 10.743869209809265, + "grad_norm": 10.57896614074707, + "learning_rate": 1.9687129536949587e-05, + "loss": 1.4097, + "step": 3943 + }, + { + "epoch": 10.746594005449591, + "grad_norm": 9.385448455810547, + "learning_rate": 1.9686910478329938e-05, + "loss": 1.3086, + "step": 3944 + }, + { + "epoch": 10.749318801089919, + "grad_norm": 10.483943939208984, + "learning_rate": 1.968669134426894e-05, + "loss": 1.2358, + "step": 3945 + }, + { + "epoch": 10.752043596730246, + "grad_norm": 20.128450393676758, + "learning_rate": 1.96864721347683e-05, + "loss": 1.4196, + "step": 3946 + }, + { + "epoch": 10.754768392370572, + "grad_norm": 16.337125778198242, + "learning_rate": 1.968625284982973e-05, + "loss": 1.2693, + "step": 3947 + }, + { + "epoch": 10.7574931880109, + "grad_norm": 12.40900707244873, + "learning_rate": 1.9686033489454934e-05, + "loss": 1.5403, + "step": 3948 + }, + { + "epoch": 10.760217983651227, + "grad_norm": 10.881063461303711, + "learning_rate": 1.9685814053645618e-05, + "loss": 1.4182, + "step": 3949 + }, + { + "epoch": 10.762942779291553, + "grad_norm": 11.267525672912598, + "learning_rate": 1.9685594542403494e-05, + "loss": 1.2871, + "step": 3950 + }, + { + "epoch": 10.76566757493188, + "grad_norm": 9.441262245178223, + "learning_rate": 1.9685374955730275e-05, + "loss": 1.2678, + "step": 3951 + }, + { + "epoch": 10.768392370572208, + "grad_norm": 12.279179573059082, + "learning_rate": 1.9685155293627664e-05, + "loss": 1.4314, + "step": 3952 + }, + { + "epoch": 10.771117166212534, + "grad_norm": 9.561209678649902, + "learning_rate": 1.9684935556097378e-05, + "loss": 1.2091, + "step": 3953 + }, + { + "epoch": 10.773841961852861, + "grad_norm": 12.12336540222168, + "learning_rate": 1.9684715743141126e-05, + "loss": 1.3057, + "step": 3954 + }, + { + "epoch": 10.776566757493189, + "grad_norm": 11.090004920959473, + "learning_rate": 1.9684495854760616e-05, + "loss": 1.3801, + "step": 3955 + }, + { + "epoch": 10.779291553133515, + "grad_norm": 10.307674407958984, + "learning_rate": 1.9684275890957564e-05, + "loss": 1.2096, + "step": 3956 + }, + { + "epoch": 10.782016348773842, + "grad_norm": 9.547151565551758, + "learning_rate": 1.968405585173369e-05, + "loss": 1.4956, + "step": 3957 + }, + { + "epoch": 10.78474114441417, + "grad_norm": 11.083027839660645, + "learning_rate": 1.968383573709069e-05, + "loss": 1.2542, + "step": 3958 + }, + { + "epoch": 10.787465940054496, + "grad_norm": 11.283376693725586, + "learning_rate": 1.9683615547030296e-05, + "loss": 1.2568, + "step": 3959 + }, + { + "epoch": 10.790190735694823, + "grad_norm": 17.618133544921875, + "learning_rate": 1.9683395281554217e-05, + "loss": 1.1948, + "step": 3960 + }, + { + "epoch": 10.79291553133515, + "grad_norm": 13.181232452392578, + "learning_rate": 1.9683174940664163e-05, + "loss": 1.2615, + "step": 3961 + }, + { + "epoch": 10.795640326975477, + "grad_norm": 11.228410720825195, + "learning_rate": 1.9682954524361853e-05, + "loss": 1.3403, + "step": 3962 + }, + { + "epoch": 10.798365122615804, + "grad_norm": 14.959089279174805, + "learning_rate": 1.968273403264901e-05, + "loss": 1.1914, + "step": 3963 + }, + { + "epoch": 10.80108991825613, + "grad_norm": 14.117962837219238, + "learning_rate": 1.9682513465527345e-05, + "loss": 1.3884, + "step": 3964 + }, + { + "epoch": 10.803814713896458, + "grad_norm": 10.425492286682129, + "learning_rate": 1.9682292822998575e-05, + "loss": 1.3193, + "step": 3965 + }, + { + "epoch": 10.806539509536785, + "grad_norm": 15.191742897033691, + "learning_rate": 1.968207210506442e-05, + "loss": 1.4309, + "step": 3966 + }, + { + "epoch": 10.809264305177111, + "grad_norm": 12.611985206604004, + "learning_rate": 1.96818513117266e-05, + "loss": 1.3052, + "step": 3967 + }, + { + "epoch": 10.811989100817438, + "grad_norm": 12.097752571105957, + "learning_rate": 1.968163044298683e-05, + "loss": 1.4307, + "step": 3968 + }, + { + "epoch": 10.814713896457766, + "grad_norm": 13.448756217956543, + "learning_rate": 1.968140949884684e-05, + "loss": 1.3792, + "step": 3969 + }, + { + "epoch": 10.817438692098092, + "grad_norm": 10.021312713623047, + "learning_rate": 1.9681188479308343e-05, + "loss": 1.2178, + "step": 3970 + }, + { + "epoch": 10.82016348773842, + "grad_norm": 10.934687614440918, + "learning_rate": 1.9680967384373058e-05, + "loss": 1.3379, + "step": 3971 + }, + { + "epoch": 10.822888283378747, + "grad_norm": 10.070216178894043, + "learning_rate": 1.9680746214042714e-05, + "loss": 1.3088, + "step": 3972 + }, + { + "epoch": 10.825613079019073, + "grad_norm": 11.109722137451172, + "learning_rate": 1.9680524968319027e-05, + "loss": 1.2734, + "step": 3973 + }, + { + "epoch": 10.8283378746594, + "grad_norm": 11.988601684570312, + "learning_rate": 1.9680303647203723e-05, + "loss": 1.3433, + "step": 3974 + }, + { + "epoch": 10.831062670299728, + "grad_norm": 20.463165283203125, + "learning_rate": 1.968008225069853e-05, + "loss": 1.2795, + "step": 3975 + }, + { + "epoch": 10.833787465940054, + "grad_norm": 20.51481819152832, + "learning_rate": 1.9679860778805167e-05, + "loss": 1.4119, + "step": 3976 + }, + { + "epoch": 10.836512261580381, + "grad_norm": 9.952378273010254, + "learning_rate": 1.9679639231525357e-05, + "loss": 1.2629, + "step": 3977 + }, + { + "epoch": 10.839237057220709, + "grad_norm": 10.788759231567383, + "learning_rate": 1.9679417608860828e-05, + "loss": 1.1267, + "step": 3978 + }, + { + "epoch": 10.841961852861035, + "grad_norm": 11.57756233215332, + "learning_rate": 1.9679195910813308e-05, + "loss": 1.2061, + "step": 3979 + }, + { + "epoch": 10.844686648501362, + "grad_norm": 15.758150100708008, + "learning_rate": 1.9678974137384524e-05, + "loss": 1.1931, + "step": 3980 + }, + { + "epoch": 10.84741144414169, + "grad_norm": 13.442411422729492, + "learning_rate": 1.9678752288576198e-05, + "loss": 1.5183, + "step": 3981 + }, + { + "epoch": 10.850136239782016, + "grad_norm": 12.64612865447998, + "learning_rate": 1.967853036439006e-05, + "loss": 1.2146, + "step": 3982 + }, + { + "epoch": 10.852861035422343, + "grad_norm": 11.583940505981445, + "learning_rate": 1.967830836482784e-05, + "loss": 1.2296, + "step": 3983 + }, + { + "epoch": 10.85558583106267, + "grad_norm": 14.167618751525879, + "learning_rate": 1.9678086289891265e-05, + "loss": 1.2363, + "step": 3984 + }, + { + "epoch": 10.858310626702997, + "grad_norm": 11.235509872436523, + "learning_rate": 1.9677864139582066e-05, + "loss": 1.5708, + "step": 3985 + }, + { + "epoch": 10.861035422343324, + "grad_norm": 11.968399047851562, + "learning_rate": 1.9677641913901975e-05, + "loss": 1.255, + "step": 3986 + }, + { + "epoch": 10.863760217983652, + "grad_norm": 11.38996696472168, + "learning_rate": 1.9677419612852716e-05, + "loss": 1.178, + "step": 3987 + }, + { + "epoch": 10.866485013623977, + "grad_norm": 9.439459800720215, + "learning_rate": 1.9677197236436027e-05, + "loss": 1.3945, + "step": 3988 + }, + { + "epoch": 10.869209809264305, + "grad_norm": 51.21841812133789, + "learning_rate": 1.967697478465364e-05, + "loss": 1.2637, + "step": 3989 + }, + { + "epoch": 10.871934604904633, + "grad_norm": 9.610937118530273, + "learning_rate": 1.9676752257507282e-05, + "loss": 1.2288, + "step": 3990 + }, + { + "epoch": 10.874659400544958, + "grad_norm": 13.754937171936035, + "learning_rate": 1.967652965499869e-05, + "loss": 1.3416, + "step": 3991 + }, + { + "epoch": 10.877384196185286, + "grad_norm": 12.980363845825195, + "learning_rate": 1.9676306977129595e-05, + "loss": 1.3398, + "step": 3992 + }, + { + "epoch": 10.880108991825614, + "grad_norm": 13.093537330627441, + "learning_rate": 1.967608422390173e-05, + "loss": 1.1812, + "step": 3993 + }, + { + "epoch": 10.88283378746594, + "grad_norm": 10.763243675231934, + "learning_rate": 1.967586139531684e-05, + "loss": 1.481, + "step": 3994 + }, + { + "epoch": 10.885558583106267, + "grad_norm": 13.629618644714355, + "learning_rate": 1.9675638491376646e-05, + "loss": 1.5605, + "step": 3995 + }, + { + "epoch": 10.888283378746594, + "grad_norm": 14.426143646240234, + "learning_rate": 1.9675415512082895e-05, + "loss": 1.449, + "step": 3996 + }, + { + "epoch": 10.89100817438692, + "grad_norm": 11.355213165283203, + "learning_rate": 1.9675192457437316e-05, + "loss": 1.4153, + "step": 3997 + }, + { + "epoch": 10.893732970027248, + "grad_norm": 16.483633041381836, + "learning_rate": 1.9674969327441652e-05, + "loss": 1.3821, + "step": 3998 + }, + { + "epoch": 10.896457765667575, + "grad_norm": 12.077117919921875, + "learning_rate": 1.9674746122097637e-05, + "loss": 1.4727, + "step": 3999 + }, + { + "epoch": 10.899182561307901, + "grad_norm": 14.361942291259766, + "learning_rate": 1.967452284140701e-05, + "loss": 1.2417, + "step": 4000 + }, + { + "epoch": 10.901907356948229, + "grad_norm": 9.589673042297363, + "learning_rate": 1.967429948537151e-05, + "loss": 1.248, + "step": 4001 + }, + { + "epoch": 10.904632152588556, + "grad_norm": 12.560636520385742, + "learning_rate": 1.967407605399288e-05, + "loss": 1.3608, + "step": 4002 + }, + { + "epoch": 10.907356948228882, + "grad_norm": 13.126648902893066, + "learning_rate": 1.967385254727286e-05, + "loss": 1.3916, + "step": 4003 + }, + { + "epoch": 10.91008174386921, + "grad_norm": 12.25019645690918, + "learning_rate": 1.9673628965213177e-05, + "loss": 1.2607, + "step": 4004 + }, + { + "epoch": 10.912806539509537, + "grad_norm": 14.17881965637207, + "learning_rate": 1.9673405307815592e-05, + "loss": 1.2688, + "step": 4005 + }, + { + "epoch": 10.915531335149863, + "grad_norm": 11.824095726013184, + "learning_rate": 1.9673181575081837e-05, + "loss": 1.2573, + "step": 4006 + }, + { + "epoch": 10.91825613079019, + "grad_norm": 11.577066421508789, + "learning_rate": 1.9672957767013652e-05, + "loss": 1.5425, + "step": 4007 + }, + { + "epoch": 10.920980926430518, + "grad_norm": 10.646503448486328, + "learning_rate": 1.9672733883612786e-05, + "loss": 1.2871, + "step": 4008 + }, + { + "epoch": 10.923705722070844, + "grad_norm": 10.270605087280273, + "learning_rate": 1.9672509924880977e-05, + "loss": 1.2559, + "step": 4009 + }, + { + "epoch": 10.926430517711172, + "grad_norm": 11.509736061096191, + "learning_rate": 1.9672285890819974e-05, + "loss": 1.3875, + "step": 4010 + }, + { + "epoch": 10.9291553133515, + "grad_norm": 12.517537117004395, + "learning_rate": 1.967206178143152e-05, + "loss": 1.2605, + "step": 4011 + }, + { + "epoch": 10.931880108991825, + "grad_norm": 12.90263557434082, + "learning_rate": 1.967183759671736e-05, + "loss": 1.3694, + "step": 4012 + }, + { + "epoch": 10.934604904632153, + "grad_norm": 12.983382225036621, + "learning_rate": 1.9671613336679237e-05, + "loss": 1.2583, + "step": 4013 + }, + { + "epoch": 10.93732970027248, + "grad_norm": 15.22011661529541, + "learning_rate": 1.9671389001318904e-05, + "loss": 1.3909, + "step": 4014 + }, + { + "epoch": 10.940054495912806, + "grad_norm": 12.214634895324707, + "learning_rate": 1.96711645906381e-05, + "loss": 1.2373, + "step": 4015 + }, + { + "epoch": 10.942779291553133, + "grad_norm": 14.635167121887207, + "learning_rate": 1.9670940104638582e-05, + "loss": 1.5059, + "step": 4016 + }, + { + "epoch": 10.945504087193461, + "grad_norm": 8.975303649902344, + "learning_rate": 1.9670715543322093e-05, + "loss": 1.365, + "step": 4017 + }, + { + "epoch": 10.948228882833787, + "grad_norm": 10.037346839904785, + "learning_rate": 1.9670490906690386e-05, + "loss": 1.0637, + "step": 4018 + }, + { + "epoch": 10.950953678474114, + "grad_norm": 10.849924087524414, + "learning_rate": 1.96702661947452e-05, + "loss": 1.2229, + "step": 4019 + }, + { + "epoch": 10.953678474114442, + "grad_norm": 12.21422290802002, + "learning_rate": 1.9670041407488298e-05, + "loss": 1.5168, + "step": 4020 + }, + { + "epoch": 10.956403269754768, + "grad_norm": 10.877645492553711, + "learning_rate": 1.966981654492142e-05, + "loss": 1.2937, + "step": 4021 + }, + { + "epoch": 10.959128065395095, + "grad_norm": 10.834639549255371, + "learning_rate": 1.9669591607046325e-05, + "loss": 1.6199, + "step": 4022 + }, + { + "epoch": 10.961852861035423, + "grad_norm": 7.974213123321533, + "learning_rate": 1.9669366593864763e-05, + "loss": 1.2144, + "step": 4023 + }, + { + "epoch": 10.964577656675749, + "grad_norm": 14.464746475219727, + "learning_rate": 1.966914150537848e-05, + "loss": 1.3779, + "step": 4024 + }, + { + "epoch": 10.967302452316076, + "grad_norm": 8.732192039489746, + "learning_rate": 1.9668916341589242e-05, + "loss": 1.2466, + "step": 4025 + }, + { + "epoch": 10.970027247956404, + "grad_norm": 15.23045539855957, + "learning_rate": 1.966869110249879e-05, + "loss": 1.3286, + "step": 4026 + }, + { + "epoch": 10.97275204359673, + "grad_norm": 10.571854591369629, + "learning_rate": 1.966846578810888e-05, + "loss": 1.3718, + "step": 4027 + }, + { + "epoch": 10.975476839237057, + "grad_norm": 12.137609481811523, + "learning_rate": 1.9668240398421275e-05, + "loss": 1.4802, + "step": 4028 + }, + { + "epoch": 10.978201634877385, + "grad_norm": 9.905146598815918, + "learning_rate": 1.966801493343772e-05, + "loss": 1.1791, + "step": 4029 + }, + { + "epoch": 10.98092643051771, + "grad_norm": 11.161646842956543, + "learning_rate": 1.966778939315998e-05, + "loss": 1.4644, + "step": 4030 + }, + { + "epoch": 10.983651226158038, + "grad_norm": 9.805384635925293, + "learning_rate": 1.9667563777589805e-05, + "loss": 1.2712, + "step": 4031 + }, + { + "epoch": 10.986376021798366, + "grad_norm": 15.272140502929688, + "learning_rate": 1.9667338086728955e-05, + "loss": 1.4487, + "step": 4032 + }, + { + "epoch": 10.989100817438691, + "grad_norm": 9.714131355285645, + "learning_rate": 1.966711232057919e-05, + "loss": 1.3469, + "step": 4033 + }, + { + "epoch": 10.991825613079019, + "grad_norm": 10.3309326171875, + "learning_rate": 1.966688647914226e-05, + "loss": 1.218, + "step": 4034 + }, + { + "epoch": 10.994550408719347, + "grad_norm": 19.648483276367188, + "learning_rate": 1.9666660562419936e-05, + "loss": 1.519, + "step": 4035 + }, + { + "epoch": 10.997275204359672, + "grad_norm": 11.848732948303223, + "learning_rate": 1.9666434570413964e-05, + "loss": 1.3718, + "step": 4036 + }, + { + "epoch": 11.0, + "grad_norm": 10.305585861206055, + "learning_rate": 1.9666208503126115e-05, + "loss": 1.2573, + "step": 4037 + }, + { + "epoch": 11.002724795640328, + "grad_norm": 7.629805088043213, + "learning_rate": 1.9665982360558143e-05, + "loss": 1.3308, + "step": 4038 + }, + { + "epoch": 11.005449591280653, + "grad_norm": 11.943351745605469, + "learning_rate": 1.966575614271181e-05, + "loss": 1.2527, + "step": 4039 + }, + { + "epoch": 11.008174386920981, + "grad_norm": 8.443275451660156, + "learning_rate": 1.9665529849588882e-05, + "loss": 1.2517, + "step": 4040 + }, + { + "epoch": 11.010899182561309, + "grad_norm": 10.50875473022461, + "learning_rate": 1.966530348119112e-05, + "loss": 1.0623, + "step": 4041 + }, + { + "epoch": 11.013623978201634, + "grad_norm": 10.328377723693848, + "learning_rate": 1.9665077037520283e-05, + "loss": 1.1433, + "step": 4042 + }, + { + "epoch": 11.016348773841962, + "grad_norm": 15.970246315002441, + "learning_rate": 1.966485051857814e-05, + "loss": 1.2085, + "step": 4043 + }, + { + "epoch": 11.01907356948229, + "grad_norm": 9.247635841369629, + "learning_rate": 1.9664623924366446e-05, + "loss": 1.3401, + "step": 4044 + }, + { + "epoch": 11.021798365122615, + "grad_norm": 8.929620742797852, + "learning_rate": 1.9664397254886975e-05, + "loss": 1.3857, + "step": 4045 + }, + { + "epoch": 11.024523160762943, + "grad_norm": 8.579508781433105, + "learning_rate": 1.9664170510141495e-05, + "loss": 1.2671, + "step": 4046 + }, + { + "epoch": 11.02724795640327, + "grad_norm": 8.783073425292969, + "learning_rate": 1.966394369013176e-05, + "loss": 1.2777, + "step": 4047 + }, + { + "epoch": 11.029972752043596, + "grad_norm": 9.716208457946777, + "learning_rate": 1.9663716794859543e-05, + "loss": 1.2649, + "step": 4048 + }, + { + "epoch": 11.032697547683924, + "grad_norm": 8.254244804382324, + "learning_rate": 1.9663489824326612e-05, + "loss": 1.137, + "step": 4049 + }, + { + "epoch": 11.035422343324251, + "grad_norm": 16.232574462890625, + "learning_rate": 1.966326277853473e-05, + "loss": 1.3208, + "step": 4050 + }, + { + "epoch": 11.038147138964577, + "grad_norm": 9.67200756072998, + "learning_rate": 1.9663035657485673e-05, + "loss": 1.1733, + "step": 4051 + }, + { + "epoch": 11.040871934604905, + "grad_norm": 8.065556526184082, + "learning_rate": 1.9662808461181206e-05, + "loss": 1.1406, + "step": 4052 + }, + { + "epoch": 11.043596730245232, + "grad_norm": 21.56169891357422, + "learning_rate": 1.9662581189623093e-05, + "loss": 1.158, + "step": 4053 + }, + { + "epoch": 11.046321525885558, + "grad_norm": 13.468238830566406, + "learning_rate": 1.9662353842813112e-05, + "loss": 1.3716, + "step": 4054 + }, + { + "epoch": 11.049046321525886, + "grad_norm": 20.729324340820312, + "learning_rate": 1.9662126420753026e-05, + "loss": 1.3013, + "step": 4055 + }, + { + "epoch": 11.051771117166213, + "grad_norm": 10.317609786987305, + "learning_rate": 1.9661898923444616e-05, + "loss": 1.094, + "step": 4056 + }, + { + "epoch": 11.054495912806539, + "grad_norm": 9.526543617248535, + "learning_rate": 1.9661671350889645e-05, + "loss": 1.0095, + "step": 4057 + }, + { + "epoch": 11.057220708446867, + "grad_norm": 9.82815170288086, + "learning_rate": 1.9661443703089888e-05, + "loss": 1.0662, + "step": 4058 + }, + { + "epoch": 11.059945504087194, + "grad_norm": 11.4994478225708, + "learning_rate": 1.966121598004712e-05, + "loss": 1.3569, + "step": 4059 + }, + { + "epoch": 11.06267029972752, + "grad_norm": 11.084864616394043, + "learning_rate": 1.9660988181763114e-05, + "loss": 1.2798, + "step": 4060 + }, + { + "epoch": 11.065395095367847, + "grad_norm": 9.071287155151367, + "learning_rate": 1.966076030823964e-05, + "loss": 1.093, + "step": 4061 + }, + { + "epoch": 11.068119891008175, + "grad_norm": 14.715372085571289, + "learning_rate": 1.9660532359478476e-05, + "loss": 1.2085, + "step": 4062 + }, + { + "epoch": 11.0708446866485, + "grad_norm": 11.17330551147461, + "learning_rate": 1.9660304335481398e-05, + "loss": 1.1809, + "step": 4063 + }, + { + "epoch": 11.073569482288828, + "grad_norm": 17.41897201538086, + "learning_rate": 1.966007623625018e-05, + "loss": 1.1323, + "step": 4064 + }, + { + "epoch": 11.076294277929156, + "grad_norm": 10.150404930114746, + "learning_rate": 1.96598480617866e-05, + "loss": 1.2778, + "step": 4065 + }, + { + "epoch": 11.079019073569482, + "grad_norm": 10.516081809997559, + "learning_rate": 1.9659619812092434e-05, + "loss": 1.2273, + "step": 4066 + }, + { + "epoch": 11.08174386920981, + "grad_norm": 9.161614418029785, + "learning_rate": 1.965939148716946e-05, + "loss": 1.0337, + "step": 4067 + }, + { + "epoch": 11.084468664850137, + "grad_norm": 10.477733612060547, + "learning_rate": 1.9659163087019454e-05, + "loss": 1.1277, + "step": 4068 + }, + { + "epoch": 11.087193460490463, + "grad_norm": 7.671123027801514, + "learning_rate": 1.96589346116442e-05, + "loss": 1.043, + "step": 4069 + }, + { + "epoch": 11.08991825613079, + "grad_norm": 9.864495277404785, + "learning_rate": 1.9658706061045473e-05, + "loss": 1.2415, + "step": 4070 + }, + { + "epoch": 11.092643051771118, + "grad_norm": 9.38493537902832, + "learning_rate": 1.9658477435225053e-05, + "loss": 1.2493, + "step": 4071 + }, + { + "epoch": 11.095367847411444, + "grad_norm": 10.206192016601562, + "learning_rate": 1.9658248734184725e-05, + "loss": 1.1704, + "step": 4072 + }, + { + "epoch": 11.098092643051771, + "grad_norm": 8.365642547607422, + "learning_rate": 1.9658019957926263e-05, + "loss": 1.0044, + "step": 4073 + }, + { + "epoch": 11.100817438692099, + "grad_norm": 8.866310119628906, + "learning_rate": 1.9657791106451454e-05, + "loss": 1.3228, + "step": 4074 + }, + { + "epoch": 11.103542234332425, + "grad_norm": 43.499473571777344, + "learning_rate": 1.9657562179762078e-05, + "loss": 1.3042, + "step": 4075 + }, + { + "epoch": 11.106267029972752, + "grad_norm": 13.006279945373535, + "learning_rate": 1.965733317785992e-05, + "loss": 1.5593, + "step": 4076 + }, + { + "epoch": 11.10899182561308, + "grad_norm": 13.291231155395508, + "learning_rate": 1.965710410074676e-05, + "loss": 1.3572, + "step": 4077 + }, + { + "epoch": 11.111716621253406, + "grad_norm": 9.592552185058594, + "learning_rate": 1.9656874948424384e-05, + "loss": 1.1603, + "step": 4078 + }, + { + "epoch": 11.114441416893733, + "grad_norm": 11.061075210571289, + "learning_rate": 1.9656645720894577e-05, + "loss": 1.209, + "step": 4079 + }, + { + "epoch": 11.11716621253406, + "grad_norm": 8.441675186157227, + "learning_rate": 1.9656416418159127e-05, + "loss": 1.0714, + "step": 4080 + }, + { + "epoch": 11.119891008174386, + "grad_norm": 11.681937217712402, + "learning_rate": 1.9656187040219812e-05, + "loss": 1.3994, + "step": 4081 + }, + { + "epoch": 11.122615803814714, + "grad_norm": 11.914758682250977, + "learning_rate": 1.9655957587078426e-05, + "loss": 1.2463, + "step": 4082 + }, + { + "epoch": 11.125340599455042, + "grad_norm": 8.07807445526123, + "learning_rate": 1.9655728058736753e-05, + "loss": 1.2039, + "step": 4083 + }, + { + "epoch": 11.128065395095367, + "grad_norm": 8.954924583435059, + "learning_rate": 1.9655498455196576e-05, + "loss": 1.1509, + "step": 4084 + }, + { + "epoch": 11.130790190735695, + "grad_norm": 10.02565860748291, + "learning_rate": 1.9655268776459694e-05, + "loss": 1.2639, + "step": 4085 + }, + { + "epoch": 11.133514986376023, + "grad_norm": 9.384295463562012, + "learning_rate": 1.965503902252789e-05, + "loss": 1.1588, + "step": 4086 + }, + { + "epoch": 11.136239782016348, + "grad_norm": 9.927639961242676, + "learning_rate": 1.965480919340295e-05, + "loss": 1.1903, + "step": 4087 + }, + { + "epoch": 11.138964577656676, + "grad_norm": 7.977211952209473, + "learning_rate": 1.9654579289086665e-05, + "loss": 1.1218, + "step": 4088 + }, + { + "epoch": 11.141689373297003, + "grad_norm": 13.479766845703125, + "learning_rate": 1.965434930958083e-05, + "loss": 1.0947, + "step": 4089 + }, + { + "epoch": 11.14441416893733, + "grad_norm": 10.667736053466797, + "learning_rate": 1.965411925488723e-05, + "loss": 1.2054, + "step": 4090 + }, + { + "epoch": 11.147138964577657, + "grad_norm": 16.211450576782227, + "learning_rate": 1.9653889125007665e-05, + "loss": 1.158, + "step": 4091 + }, + { + "epoch": 11.149863760217984, + "grad_norm": 9.036359786987305, + "learning_rate": 1.965365891994392e-05, + "loss": 0.9523, + "step": 4092 + }, + { + "epoch": 11.15258855585831, + "grad_norm": 9.005630493164062, + "learning_rate": 1.9653428639697788e-05, + "loss": 1.2079, + "step": 4093 + }, + { + "epoch": 11.155313351498638, + "grad_norm": 9.042786598205566, + "learning_rate": 1.9653198284271065e-05, + "loss": 1.3333, + "step": 4094 + }, + { + "epoch": 11.158038147138965, + "grad_norm": 9.039999008178711, + "learning_rate": 1.9652967853665547e-05, + "loss": 0.9956, + "step": 4095 + }, + { + "epoch": 11.160762942779291, + "grad_norm": 14.095746040344238, + "learning_rate": 1.9652737347883025e-05, + "loss": 1.147, + "step": 4096 + }, + { + "epoch": 11.163487738419619, + "grad_norm": 8.9838228225708, + "learning_rate": 1.9652506766925296e-05, + "loss": 1.1233, + "step": 4097 + }, + { + "epoch": 11.166212534059946, + "grad_norm": 9.379589080810547, + "learning_rate": 1.965227611079415e-05, + "loss": 1.0171, + "step": 4098 + }, + { + "epoch": 11.168937329700272, + "grad_norm": 13.760157585144043, + "learning_rate": 1.9652045379491395e-05, + "loss": 1.3872, + "step": 4099 + }, + { + "epoch": 11.1716621253406, + "grad_norm": 13.840320587158203, + "learning_rate": 1.9651814573018818e-05, + "loss": 1.2776, + "step": 4100 + }, + { + "epoch": 11.174386920980927, + "grad_norm": 11.532063484191895, + "learning_rate": 1.965158369137822e-05, + "loss": 1.4041, + "step": 4101 + }, + { + "epoch": 11.177111716621253, + "grad_norm": 11.299899101257324, + "learning_rate": 1.96513527345714e-05, + "loss": 1.3455, + "step": 4102 + }, + { + "epoch": 11.17983651226158, + "grad_norm": 9.078874588012695, + "learning_rate": 1.9651121702600155e-05, + "loss": 1.1794, + "step": 4103 + }, + { + "epoch": 11.182561307901908, + "grad_norm": 11.858445167541504, + "learning_rate": 1.9650890595466284e-05, + "loss": 1.0796, + "step": 4104 + }, + { + "epoch": 11.185286103542234, + "grad_norm": 10.78423023223877, + "learning_rate": 1.965065941317159e-05, + "loss": 1.2229, + "step": 4105 + }, + { + "epoch": 11.188010899182562, + "grad_norm": 11.808480262756348, + "learning_rate": 1.9650428155717867e-05, + "loss": 1.2874, + "step": 4106 + }, + { + "epoch": 11.190735694822889, + "grad_norm": 14.424799919128418, + "learning_rate": 1.965019682310692e-05, + "loss": 1.4639, + "step": 4107 + }, + { + "epoch": 11.193460490463215, + "grad_norm": 10.045002937316895, + "learning_rate": 1.9649965415340553e-05, + "loss": 1.1688, + "step": 4108 + }, + { + "epoch": 11.196185286103542, + "grad_norm": 11.161811828613281, + "learning_rate": 1.9649733932420566e-05, + "loss": 1.3177, + "step": 4109 + }, + { + "epoch": 11.19891008174387, + "grad_norm": 9.272212982177734, + "learning_rate": 1.9649502374348763e-05, + "loss": 1.0918, + "step": 4110 + }, + { + "epoch": 11.201634877384196, + "grad_norm": 10.659878730773926, + "learning_rate": 1.9649270741126944e-05, + "loss": 1.3677, + "step": 4111 + }, + { + "epoch": 11.204359673024523, + "grad_norm": 9.117798805236816, + "learning_rate": 1.9649039032756913e-05, + "loss": 1.2502, + "step": 4112 + }, + { + "epoch": 11.207084468664851, + "grad_norm": 12.927522659301758, + "learning_rate": 1.964880724924048e-05, + "loss": 1.2788, + "step": 4113 + }, + { + "epoch": 11.209809264305177, + "grad_norm": 11.339554786682129, + "learning_rate": 1.9648575390579447e-05, + "loss": 1.4341, + "step": 4114 + }, + { + "epoch": 11.212534059945504, + "grad_norm": 12.668943405151367, + "learning_rate": 1.964834345677562e-05, + "loss": 1.4468, + "step": 4115 + }, + { + "epoch": 11.215258855585832, + "grad_norm": 17.67973518371582, + "learning_rate": 1.96481114478308e-05, + "loss": 1.1472, + "step": 4116 + }, + { + "epoch": 11.217983651226158, + "grad_norm": 16.11754035949707, + "learning_rate": 1.96478793637468e-05, + "loss": 1.3931, + "step": 4117 + }, + { + "epoch": 11.220708446866485, + "grad_norm": 11.04246711730957, + "learning_rate": 1.964764720452543e-05, + "loss": 1.1917, + "step": 4118 + }, + { + "epoch": 11.223433242506813, + "grad_norm": 18.711198806762695, + "learning_rate": 1.964741497016849e-05, + "loss": 1.2371, + "step": 4119 + }, + { + "epoch": 11.226158038147139, + "grad_norm": 10.438543319702148, + "learning_rate": 1.9647182660677796e-05, + "loss": 1.0435, + "step": 4120 + }, + { + "epoch": 11.228882833787466, + "grad_norm": 15.964482307434082, + "learning_rate": 1.9646950276055153e-05, + "loss": 1.1743, + "step": 4121 + }, + { + "epoch": 11.231607629427794, + "grad_norm": 13.605895042419434, + "learning_rate": 1.964671781630237e-05, + "loss": 1.2588, + "step": 4122 + }, + { + "epoch": 11.23433242506812, + "grad_norm": 22.46067237854004, + "learning_rate": 1.964648528142126e-05, + "loss": 1.282, + "step": 4123 + }, + { + "epoch": 11.237057220708447, + "grad_norm": 10.966947555541992, + "learning_rate": 1.9646252671413633e-05, + "loss": 1.0828, + "step": 4124 + }, + { + "epoch": 11.239782016348773, + "grad_norm": 11.58065414428711, + "learning_rate": 1.96460199862813e-05, + "loss": 1.1797, + "step": 4125 + }, + { + "epoch": 11.2425068119891, + "grad_norm": 12.301233291625977, + "learning_rate": 1.9645787226026075e-05, + "loss": 1.2278, + "step": 4126 + }, + { + "epoch": 11.245231607629428, + "grad_norm": 16.46876335144043, + "learning_rate": 1.964555439064977e-05, + "loss": 1.1877, + "step": 4127 + }, + { + "epoch": 11.247956403269754, + "grad_norm": 12.894742965698242, + "learning_rate": 1.96453214801542e-05, + "loss": 1.2786, + "step": 4128 + }, + { + "epoch": 11.250681198910081, + "grad_norm": 14.421160697937012, + "learning_rate": 1.9645088494541172e-05, + "loss": 1.3118, + "step": 4129 + }, + { + "epoch": 11.253405994550409, + "grad_norm": 14.483222007751465, + "learning_rate": 1.9644855433812507e-05, + "loss": 1.4663, + "step": 4130 + }, + { + "epoch": 11.256130790190735, + "grad_norm": 31.697895050048828, + "learning_rate": 1.9644622297970018e-05, + "loss": 1.1819, + "step": 4131 + }, + { + "epoch": 11.258855585831062, + "grad_norm": 12.084939002990723, + "learning_rate": 1.964438908701552e-05, + "loss": 1.3225, + "step": 4132 + }, + { + "epoch": 11.26158038147139, + "grad_norm": 12.784135818481445, + "learning_rate": 1.9644155800950832e-05, + "loss": 1.3584, + "step": 4133 + }, + { + "epoch": 11.264305177111716, + "grad_norm": 8.929036140441895, + "learning_rate": 1.964392243977777e-05, + "loss": 1.2412, + "step": 4134 + }, + { + "epoch": 11.267029972752043, + "grad_norm": 12.572015762329102, + "learning_rate": 1.9643689003498147e-05, + "loss": 1.3308, + "step": 4135 + }, + { + "epoch": 11.269754768392371, + "grad_norm": 12.465352058410645, + "learning_rate": 1.964345549211379e-05, + "loss": 1.2808, + "step": 4136 + }, + { + "epoch": 11.272479564032697, + "grad_norm": 9.7542724609375, + "learning_rate": 1.9643221905626505e-05, + "loss": 1.0579, + "step": 4137 + }, + { + "epoch": 11.275204359673024, + "grad_norm": 18.65604591369629, + "learning_rate": 1.9642988244038122e-05, + "loss": 1.2966, + "step": 4138 + }, + { + "epoch": 11.277929155313352, + "grad_norm": 11.757242202758789, + "learning_rate": 1.9642754507350457e-05, + "loss": 1.2561, + "step": 4139 + }, + { + "epoch": 11.280653950953678, + "grad_norm": 8.50538444519043, + "learning_rate": 1.9642520695565328e-05, + "loss": 1.1646, + "step": 4140 + }, + { + "epoch": 11.283378746594005, + "grad_norm": 9.911194801330566, + "learning_rate": 1.9642286808684562e-05, + "loss": 1.4351, + "step": 4141 + }, + { + "epoch": 11.286103542234333, + "grad_norm": 10.260211944580078, + "learning_rate": 1.9642052846709975e-05, + "loss": 1.1672, + "step": 4142 + }, + { + "epoch": 11.288828337874659, + "grad_norm": 12.260438919067383, + "learning_rate": 1.964181880964339e-05, + "loss": 1.449, + "step": 4143 + }, + { + "epoch": 11.291553133514986, + "grad_norm": 14.704292297363281, + "learning_rate": 1.9641584697486632e-05, + "loss": 1.1729, + "step": 4144 + }, + { + "epoch": 11.294277929155314, + "grad_norm": 10.67501163482666, + "learning_rate": 1.964135051024152e-05, + "loss": 1.3525, + "step": 4145 + }, + { + "epoch": 11.29700272479564, + "grad_norm": 10.726551055908203, + "learning_rate": 1.964111624790988e-05, + "loss": 1.3108, + "step": 4146 + }, + { + "epoch": 11.299727520435967, + "grad_norm": 14.48544979095459, + "learning_rate": 1.964088191049354e-05, + "loss": 1.3015, + "step": 4147 + }, + { + "epoch": 11.302452316076295, + "grad_norm": 10.027518272399902, + "learning_rate": 1.964064749799432e-05, + "loss": 1.1862, + "step": 4148 + }, + { + "epoch": 11.30517711171662, + "grad_norm": 40.34449005126953, + "learning_rate": 1.9640413010414048e-05, + "loss": 1.1127, + "step": 4149 + }, + { + "epoch": 11.307901907356948, + "grad_norm": 9.3348970413208, + "learning_rate": 1.9640178447754554e-05, + "loss": 1.0125, + "step": 4150 + }, + { + "epoch": 11.310626702997276, + "grad_norm": 11.324419021606445, + "learning_rate": 1.9639943810017654e-05, + "loss": 1.2837, + "step": 4151 + }, + { + "epoch": 11.313351498637601, + "grad_norm": 12.872102737426758, + "learning_rate": 1.9639709097205185e-05, + "loss": 1.3274, + "step": 4152 + }, + { + "epoch": 11.316076294277929, + "grad_norm": 9.504002571105957, + "learning_rate": 1.963947430931897e-05, + "loss": 1.4272, + "step": 4153 + }, + { + "epoch": 11.318801089918257, + "grad_norm": 81.22502136230469, + "learning_rate": 1.963923944636084e-05, + "loss": 1.2947, + "step": 4154 + }, + { + "epoch": 11.321525885558582, + "grad_norm": 10.916065216064453, + "learning_rate": 1.9639004508332627e-05, + "loss": 1.1638, + "step": 4155 + }, + { + "epoch": 11.32425068119891, + "grad_norm": 10.57822322845459, + "learning_rate": 1.9638769495236154e-05, + "loss": 1.3083, + "step": 4156 + }, + { + "epoch": 11.326975476839237, + "grad_norm": 12.542110443115234, + "learning_rate": 1.963853440707325e-05, + "loss": 1.3452, + "step": 4157 + }, + { + "epoch": 11.329700272479563, + "grad_norm": 9.83530044555664, + "learning_rate": 1.9638299243845758e-05, + "loss": 1.2844, + "step": 4158 + }, + { + "epoch": 11.33242506811989, + "grad_norm": 11.479257583618164, + "learning_rate": 1.96380640055555e-05, + "loss": 1.1814, + "step": 4159 + }, + { + "epoch": 11.335149863760218, + "grad_norm": 10.582036018371582, + "learning_rate": 1.9637828692204307e-05, + "loss": 1.1533, + "step": 4160 + }, + { + "epoch": 11.337874659400544, + "grad_norm": 15.099767684936523, + "learning_rate": 1.9637593303794015e-05, + "loss": 1.3831, + "step": 4161 + }, + { + "epoch": 11.340599455040872, + "grad_norm": 10.092370986938477, + "learning_rate": 1.9637357840326457e-05, + "loss": 1.1663, + "step": 4162 + }, + { + "epoch": 11.3433242506812, + "grad_norm": 11.402278900146484, + "learning_rate": 1.9637122301803466e-05, + "loss": 1.1959, + "step": 4163 + }, + { + "epoch": 11.346049046321525, + "grad_norm": 9.97726058959961, + "learning_rate": 1.963688668822688e-05, + "loss": 1.1047, + "step": 4164 + }, + { + "epoch": 11.348773841961853, + "grad_norm": 9.727554321289062, + "learning_rate": 1.9636650999598527e-05, + "loss": 1.1803, + "step": 4165 + }, + { + "epoch": 11.35149863760218, + "grad_norm": 9.918126106262207, + "learning_rate": 1.9636415235920246e-05, + "loss": 1.3164, + "step": 4166 + }, + { + "epoch": 11.354223433242506, + "grad_norm": 8.939223289489746, + "learning_rate": 1.9636179397193874e-05, + "loss": 1.4137, + "step": 4167 + }, + { + "epoch": 11.356948228882834, + "grad_norm": 14.461063385009766, + "learning_rate": 1.9635943483421246e-05, + "loss": 1.168, + "step": 4168 + }, + { + "epoch": 11.359673024523161, + "grad_norm": 8.427556037902832, + "learning_rate": 1.9635707494604203e-05, + "loss": 1.0503, + "step": 4169 + }, + { + "epoch": 11.362397820163487, + "grad_norm": 8.970022201538086, + "learning_rate": 1.9635471430744578e-05, + "loss": 1.1821, + "step": 4170 + }, + { + "epoch": 11.365122615803815, + "grad_norm": 7.9704060554504395, + "learning_rate": 1.9635235291844213e-05, + "loss": 1.2388, + "step": 4171 + }, + { + "epoch": 11.367847411444142, + "grad_norm": 10.413139343261719, + "learning_rate": 1.9634999077904945e-05, + "loss": 1.3325, + "step": 4172 + }, + { + "epoch": 11.370572207084468, + "grad_norm": 11.076361656188965, + "learning_rate": 1.9634762788928615e-05, + "loss": 1.3113, + "step": 4173 + }, + { + "epoch": 11.373297002724795, + "grad_norm": 8.550765037536621, + "learning_rate": 1.963452642491706e-05, + "loss": 1.1122, + "step": 4174 + }, + { + "epoch": 11.376021798365123, + "grad_norm": 17.111282348632812, + "learning_rate": 1.9634289985872126e-05, + "loss": 1.1338, + "step": 4175 + }, + { + "epoch": 11.378746594005449, + "grad_norm": 11.5484619140625, + "learning_rate": 1.963405347179565e-05, + "loss": 1.3228, + "step": 4176 + }, + { + "epoch": 11.381471389645776, + "grad_norm": 9.316886901855469, + "learning_rate": 1.963381688268948e-05, + "loss": 1.1422, + "step": 4177 + }, + { + "epoch": 11.384196185286104, + "grad_norm": 12.380435943603516, + "learning_rate": 1.963358021855545e-05, + "loss": 1.3149, + "step": 4178 + }, + { + "epoch": 11.38692098092643, + "grad_norm": 10.483932495117188, + "learning_rate": 1.9633343479395405e-05, + "loss": 1.3203, + "step": 4179 + }, + { + "epoch": 11.389645776566757, + "grad_norm": 9.909773826599121, + "learning_rate": 1.9633106665211196e-05, + "loss": 1.2068, + "step": 4180 + }, + { + "epoch": 11.392370572207085, + "grad_norm": 9.947454452514648, + "learning_rate": 1.963286977600466e-05, + "loss": 1.3235, + "step": 4181 + }, + { + "epoch": 11.39509536784741, + "grad_norm": 9.787384986877441, + "learning_rate": 1.9632632811777644e-05, + "loss": 1.4629, + "step": 4182 + }, + { + "epoch": 11.397820163487738, + "grad_norm": 8.918498992919922, + "learning_rate": 1.9632395772531993e-05, + "loss": 1.3926, + "step": 4183 + }, + { + "epoch": 11.400544959128066, + "grad_norm": 8.588772773742676, + "learning_rate": 1.9632158658269554e-05, + "loss": 1.2854, + "step": 4184 + }, + { + "epoch": 11.403269754768392, + "grad_norm": 10.430420875549316, + "learning_rate": 1.9631921468992173e-05, + "loss": 1.1613, + "step": 4185 + }, + { + "epoch": 11.40599455040872, + "grad_norm": 11.09743881225586, + "learning_rate": 1.96316842047017e-05, + "loss": 1.2173, + "step": 4186 + }, + { + "epoch": 11.408719346049047, + "grad_norm": 9.371150970458984, + "learning_rate": 1.963144686539998e-05, + "loss": 1.0715, + "step": 4187 + }, + { + "epoch": 11.411444141689373, + "grad_norm": 9.642024993896484, + "learning_rate": 1.963120945108886e-05, + "loss": 1.0969, + "step": 4188 + }, + { + "epoch": 11.4141689373297, + "grad_norm": 8.411330223083496, + "learning_rate": 1.9630971961770194e-05, + "loss": 1.2397, + "step": 4189 + }, + { + "epoch": 11.416893732970028, + "grad_norm": 8.898776054382324, + "learning_rate": 1.9630734397445824e-05, + "loss": 1.2456, + "step": 4190 + }, + { + "epoch": 11.419618528610354, + "grad_norm": 10.948317527770996, + "learning_rate": 1.963049675811761e-05, + "loss": 1.2649, + "step": 4191 + }, + { + "epoch": 11.422343324250681, + "grad_norm": 9.487371444702148, + "learning_rate": 1.963025904378739e-05, + "loss": 1.1331, + "step": 4192 + }, + { + "epoch": 11.425068119891009, + "grad_norm": 9.217453002929688, + "learning_rate": 1.9630021254457026e-05, + "loss": 1.297, + "step": 4193 + }, + { + "epoch": 11.427792915531334, + "grad_norm": 7.42936372756958, + "learning_rate": 1.9629783390128366e-05, + "loss": 1.4397, + "step": 4194 + }, + { + "epoch": 11.430517711171662, + "grad_norm": 10.919928550720215, + "learning_rate": 1.9629545450803266e-05, + "loss": 1.3093, + "step": 4195 + }, + { + "epoch": 11.43324250681199, + "grad_norm": 9.25825309753418, + "learning_rate": 1.9629307436483573e-05, + "loss": 1.0737, + "step": 4196 + }, + { + "epoch": 11.435967302452315, + "grad_norm": 10.210301399230957, + "learning_rate": 1.9629069347171144e-05, + "loss": 1.4414, + "step": 4197 + }, + { + "epoch": 11.438692098092643, + "grad_norm": 7.53134822845459, + "learning_rate": 1.9628831182867833e-05, + "loss": 1.3176, + "step": 4198 + }, + { + "epoch": 11.44141689373297, + "grad_norm": 7.884014129638672, + "learning_rate": 1.9628592943575494e-05, + "loss": 1.1528, + "step": 4199 + }, + { + "epoch": 11.444141689373296, + "grad_norm": 11.789016723632812, + "learning_rate": 1.9628354629295983e-05, + "loss": 1.2783, + "step": 4200 + }, + { + "epoch": 11.446866485013624, + "grad_norm": 12.273369789123535, + "learning_rate": 1.962811624003116e-05, + "loss": 1.2969, + "step": 4201 + }, + { + "epoch": 11.449591280653951, + "grad_norm": 9.086417198181152, + "learning_rate": 1.9627877775782873e-05, + "loss": 1.1382, + "step": 4202 + }, + { + "epoch": 11.452316076294277, + "grad_norm": 7.977797031402588, + "learning_rate": 1.9627639236552983e-05, + "loss": 1.3462, + "step": 4203 + }, + { + "epoch": 11.455040871934605, + "grad_norm": 8.445021629333496, + "learning_rate": 1.9627400622343354e-05, + "loss": 1.2949, + "step": 4204 + }, + { + "epoch": 11.457765667574932, + "grad_norm": 8.467462539672852, + "learning_rate": 1.9627161933155833e-05, + "loss": 1.3215, + "step": 4205 + }, + { + "epoch": 11.460490463215258, + "grad_norm": 9.459888458251953, + "learning_rate": 1.962692316899229e-05, + "loss": 1.1018, + "step": 4206 + }, + { + "epoch": 11.463215258855586, + "grad_norm": 8.615829467773438, + "learning_rate": 1.9626684329854575e-05, + "loss": 1.1511, + "step": 4207 + }, + { + "epoch": 11.465940054495913, + "grad_norm": 9.40342903137207, + "learning_rate": 1.9626445415744552e-05, + "loss": 1.0793, + "step": 4208 + }, + { + "epoch": 11.46866485013624, + "grad_norm": 10.980266571044922, + "learning_rate": 1.9626206426664084e-05, + "loss": 1.1465, + "step": 4209 + }, + { + "epoch": 11.471389645776567, + "grad_norm": 8.530308723449707, + "learning_rate": 1.962596736261503e-05, + "loss": 1.1807, + "step": 4210 + }, + { + "epoch": 11.474114441416894, + "grad_norm": 8.508332252502441, + "learning_rate": 1.9625728223599253e-05, + "loss": 1.2659, + "step": 4211 + }, + { + "epoch": 11.47683923705722, + "grad_norm": 8.210857391357422, + "learning_rate": 1.962548900961861e-05, + "loss": 1.1379, + "step": 4212 + }, + { + "epoch": 11.479564032697548, + "grad_norm": 9.084643363952637, + "learning_rate": 1.9625249720674975e-05, + "loss": 1.377, + "step": 4213 + }, + { + "epoch": 11.482288828337875, + "grad_norm": 11.54325008392334, + "learning_rate": 1.96250103567702e-05, + "loss": 1.4338, + "step": 4214 + }, + { + "epoch": 11.485013623978201, + "grad_norm": 10.700432777404785, + "learning_rate": 1.9624770917906156e-05, + "loss": 1.0547, + "step": 4215 + }, + { + "epoch": 11.487738419618529, + "grad_norm": 8.42674446105957, + "learning_rate": 1.9624531404084704e-05, + "loss": 1.2573, + "step": 4216 + }, + { + "epoch": 11.490463215258856, + "grad_norm": 10.657425880432129, + "learning_rate": 1.962429181530771e-05, + "loss": 1.2754, + "step": 4217 + }, + { + "epoch": 11.493188010899182, + "grad_norm": 7.15110445022583, + "learning_rate": 1.9624052151577047e-05, + "loss": 1.0391, + "step": 4218 + }, + { + "epoch": 11.49591280653951, + "grad_norm": 8.82170295715332, + "learning_rate": 1.962381241289457e-05, + "loss": 1.4329, + "step": 4219 + }, + { + "epoch": 11.498637602179837, + "grad_norm": 10.280640602111816, + "learning_rate": 1.9623572599262156e-05, + "loss": 1.3613, + "step": 4220 + }, + { + "epoch": 11.501362397820163, + "grad_norm": 8.611913681030273, + "learning_rate": 1.9623332710681666e-05, + "loss": 1.1653, + "step": 4221 + }, + { + "epoch": 11.50408719346049, + "grad_norm": 7.79402494430542, + "learning_rate": 1.962309274715497e-05, + "loss": 1.1033, + "step": 4222 + }, + { + "epoch": 11.506811989100818, + "grad_norm": 9.2391939163208, + "learning_rate": 1.962285270868394e-05, + "loss": 1.2617, + "step": 4223 + }, + { + "epoch": 11.509536784741144, + "grad_norm": 8.58356761932373, + "learning_rate": 1.962261259527044e-05, + "loss": 1.2402, + "step": 4224 + }, + { + "epoch": 11.512261580381471, + "grad_norm": 10.11650562286377, + "learning_rate": 1.9622372406916343e-05, + "loss": 1.1157, + "step": 4225 + }, + { + "epoch": 11.514986376021799, + "grad_norm": 10.219006538391113, + "learning_rate": 1.9622132143623524e-05, + "loss": 1.2388, + "step": 4226 + }, + { + "epoch": 11.517711171662125, + "grad_norm": 10.135218620300293, + "learning_rate": 1.9621891805393846e-05, + "loss": 1.2124, + "step": 4227 + }, + { + "epoch": 11.520435967302452, + "grad_norm": 9.944450378417969, + "learning_rate": 1.9621651392229182e-05, + "loss": 1.3591, + "step": 4228 + }, + { + "epoch": 11.52316076294278, + "grad_norm": 8.386174201965332, + "learning_rate": 1.9621410904131407e-05, + "loss": 1.2812, + "step": 4229 + }, + { + "epoch": 11.525885558583106, + "grad_norm": 9.262544631958008, + "learning_rate": 1.9621170341102396e-05, + "loss": 1.436, + "step": 4230 + }, + { + "epoch": 11.528610354223433, + "grad_norm": 10.720914840698242, + "learning_rate": 1.962092970314402e-05, + "loss": 1.3401, + "step": 4231 + }, + { + "epoch": 11.53133514986376, + "grad_norm": 7.582281589508057, + "learning_rate": 1.9620688990258152e-05, + "loss": 1.2751, + "step": 4232 + }, + { + "epoch": 11.534059945504087, + "grad_norm": 9.216172218322754, + "learning_rate": 1.962044820244667e-05, + "loss": 1.1741, + "step": 4233 + }, + { + "epoch": 11.536784741144414, + "grad_norm": 8.738519668579102, + "learning_rate": 1.9620207339711442e-05, + "loss": 1.1365, + "step": 4234 + }, + { + "epoch": 11.539509536784742, + "grad_norm": 9.072188377380371, + "learning_rate": 1.9619966402054355e-05, + "loss": 1.3137, + "step": 4235 + }, + { + "epoch": 11.542234332425068, + "grad_norm": 8.85590648651123, + "learning_rate": 1.9619725389477275e-05, + "loss": 1.2622, + "step": 4236 + }, + { + "epoch": 11.544959128065395, + "grad_norm": 9.035333633422852, + "learning_rate": 1.9619484301982086e-05, + "loss": 1.2571, + "step": 4237 + }, + { + "epoch": 11.547683923705723, + "grad_norm": 7.747833251953125, + "learning_rate": 1.961924313957066e-05, + "loss": 1.323, + "step": 4238 + }, + { + "epoch": 11.550408719346049, + "grad_norm": 7.55806827545166, + "learning_rate": 1.961900190224488e-05, + "loss": 1.4465, + "step": 4239 + }, + { + "epoch": 11.553133514986376, + "grad_norm": 10.450825691223145, + "learning_rate": 1.9618760590006623e-05, + "loss": 1.2168, + "step": 4240 + }, + { + "epoch": 11.555858310626704, + "grad_norm": 9.569533348083496, + "learning_rate": 1.9618519202857768e-05, + "loss": 1.3794, + "step": 4241 + }, + { + "epoch": 11.55858310626703, + "grad_norm": 8.513108253479004, + "learning_rate": 1.9618277740800195e-05, + "loss": 1.082, + "step": 4242 + }, + { + "epoch": 11.561307901907357, + "grad_norm": 11.943915367126465, + "learning_rate": 1.961803620383578e-05, + "loss": 1.261, + "step": 4243 + }, + { + "epoch": 11.564032697547685, + "grad_norm": 8.429560661315918, + "learning_rate": 1.9617794591966418e-05, + "loss": 1.1899, + "step": 4244 + }, + { + "epoch": 11.56675749318801, + "grad_norm": 7.78025484085083, + "learning_rate": 1.9617552905193972e-05, + "loss": 1.2947, + "step": 4245 + }, + { + "epoch": 11.569482288828338, + "grad_norm": 11.231201171875, + "learning_rate": 1.961731114352034e-05, + "loss": 1.3087, + "step": 4246 + }, + { + "epoch": 11.572207084468666, + "grad_norm": 8.603983879089355, + "learning_rate": 1.9617069306947394e-05, + "loss": 1.2297, + "step": 4247 + }, + { + "epoch": 11.574931880108991, + "grad_norm": 9.307816505432129, + "learning_rate": 1.9616827395477026e-05, + "loss": 1.1334, + "step": 4248 + }, + { + "epoch": 11.577656675749319, + "grad_norm": 8.92887020111084, + "learning_rate": 1.961658540911111e-05, + "loss": 1.3169, + "step": 4249 + }, + { + "epoch": 11.580381471389646, + "grad_norm": 8.824298858642578, + "learning_rate": 1.961634334785154e-05, + "loss": 1.2552, + "step": 4250 + }, + { + "epoch": 11.583106267029972, + "grad_norm": 8.4943208694458, + "learning_rate": 1.9616101211700198e-05, + "loss": 1.1731, + "step": 4251 + }, + { + "epoch": 11.5858310626703, + "grad_norm": 11.546370506286621, + "learning_rate": 1.961585900065897e-05, + "loss": 1.259, + "step": 4252 + }, + { + "epoch": 11.588555858310627, + "grad_norm": 11.164836883544922, + "learning_rate": 1.961561671472974e-05, + "loss": 1.3291, + "step": 4253 + }, + { + "epoch": 11.591280653950953, + "grad_norm": 9.311529159545898, + "learning_rate": 1.9615374353914395e-05, + "loss": 1.4153, + "step": 4254 + }, + { + "epoch": 11.59400544959128, + "grad_norm": 10.316414833068848, + "learning_rate": 1.9615131918214824e-05, + "loss": 1.4077, + "step": 4255 + }, + { + "epoch": 11.596730245231608, + "grad_norm": 25.058340072631836, + "learning_rate": 1.961488940763292e-05, + "loss": 1.2662, + "step": 4256 + }, + { + "epoch": 11.599455040871934, + "grad_norm": 14.15247917175293, + "learning_rate": 1.961464682217056e-05, + "loss": 1.3037, + "step": 4257 + }, + { + "epoch": 11.602179836512262, + "grad_norm": 10.92613410949707, + "learning_rate": 1.9614404161829643e-05, + "loss": 1.3882, + "step": 4258 + }, + { + "epoch": 11.60490463215259, + "grad_norm": 8.810829162597656, + "learning_rate": 1.9614161426612056e-05, + "loss": 1.2002, + "step": 4259 + }, + { + "epoch": 11.607629427792915, + "grad_norm": 8.915725708007812, + "learning_rate": 1.9613918616519688e-05, + "loss": 1.2571, + "step": 4260 + }, + { + "epoch": 11.610354223433243, + "grad_norm": 10.085176467895508, + "learning_rate": 1.9613675731554435e-05, + "loss": 1.1372, + "step": 4261 + }, + { + "epoch": 11.61307901907357, + "grad_norm": 9.723475456237793, + "learning_rate": 1.961343277171818e-05, + "loss": 1.2898, + "step": 4262 + }, + { + "epoch": 11.615803814713896, + "grad_norm": 7.391706943511963, + "learning_rate": 1.9613189737012824e-05, + "loss": 1.0732, + "step": 4263 + }, + { + "epoch": 11.618528610354224, + "grad_norm": 8.334680557250977, + "learning_rate": 1.9612946627440254e-05, + "loss": 1.2378, + "step": 4264 + }, + { + "epoch": 11.621253405994551, + "grad_norm": 10.083943367004395, + "learning_rate": 1.9612703443002366e-05, + "loss": 1.4141, + "step": 4265 + }, + { + "epoch": 11.623978201634877, + "grad_norm": 8.957664489746094, + "learning_rate": 1.9612460183701053e-05, + "loss": 1.1027, + "step": 4266 + }, + { + "epoch": 11.626702997275205, + "grad_norm": 9.454508781433105, + "learning_rate": 1.9612216849538205e-05, + "loss": 1.1311, + "step": 4267 + }, + { + "epoch": 11.629427792915532, + "grad_norm": 10.544790267944336, + "learning_rate": 1.9611973440515724e-05, + "loss": 1.3735, + "step": 4268 + }, + { + "epoch": 11.632152588555858, + "grad_norm": 13.891005516052246, + "learning_rate": 1.9611729956635507e-05, + "loss": 1.0608, + "step": 4269 + }, + { + "epoch": 11.634877384196185, + "grad_norm": 12.7100830078125, + "learning_rate": 1.9611486397899445e-05, + "loss": 1.3298, + "step": 4270 + }, + { + "epoch": 11.637602179836513, + "grad_norm": 8.996678352355957, + "learning_rate": 1.9611242764309434e-05, + "loss": 1.4302, + "step": 4271 + }, + { + "epoch": 11.640326975476839, + "grad_norm": 9.974884986877441, + "learning_rate": 1.9610999055867376e-05, + "loss": 1.2512, + "step": 4272 + }, + { + "epoch": 11.643051771117166, + "grad_norm": 10.96886157989502, + "learning_rate": 1.9610755272575167e-05, + "loss": 1.3538, + "step": 4273 + }, + { + "epoch": 11.645776566757494, + "grad_norm": 9.486754417419434, + "learning_rate": 1.96105114144347e-05, + "loss": 1.1885, + "step": 4274 + }, + { + "epoch": 11.64850136239782, + "grad_norm": 9.534106254577637, + "learning_rate": 1.9610267481447883e-05, + "loss": 1.2775, + "step": 4275 + }, + { + "epoch": 11.651226158038147, + "grad_norm": 9.522997856140137, + "learning_rate": 1.9610023473616616e-05, + "loss": 1.1348, + "step": 4276 + }, + { + "epoch": 11.653950953678475, + "grad_norm": 10.608443260192871, + "learning_rate": 1.960977939094279e-05, + "loss": 1.3552, + "step": 4277 + }, + { + "epoch": 11.6566757493188, + "grad_norm": 10.006903648376465, + "learning_rate": 1.9609535233428313e-05, + "loss": 1.2917, + "step": 4278 + }, + { + "epoch": 11.659400544959128, + "grad_norm": 10.470991134643555, + "learning_rate": 1.9609291001075082e-05, + "loss": 1.3833, + "step": 4279 + }, + { + "epoch": 11.662125340599456, + "grad_norm": 9.588545799255371, + "learning_rate": 1.9609046693885007e-05, + "loss": 1.27, + "step": 4280 + }, + { + "epoch": 11.664850136239782, + "grad_norm": 19.973514556884766, + "learning_rate": 1.9608802311859984e-05, + "loss": 1.3926, + "step": 4281 + }, + { + "epoch": 11.66757493188011, + "grad_norm": 20.925952911376953, + "learning_rate": 1.9608557855001918e-05, + "loss": 1.2761, + "step": 4282 + }, + { + "epoch": 11.670299727520437, + "grad_norm": 9.654898643493652, + "learning_rate": 1.9608313323312712e-05, + "loss": 1.3579, + "step": 4283 + }, + { + "epoch": 11.673024523160763, + "grad_norm": 10.667916297912598, + "learning_rate": 1.960806871679427e-05, + "loss": 1.2363, + "step": 4284 + }, + { + "epoch": 11.67574931880109, + "grad_norm": 8.566445350646973, + "learning_rate": 1.96078240354485e-05, + "loss": 1.1454, + "step": 4285 + }, + { + "epoch": 11.678474114441418, + "grad_norm": 8.778693199157715, + "learning_rate": 1.9607579279277304e-05, + "loss": 1.177, + "step": 4286 + }, + { + "epoch": 11.681198910081743, + "grad_norm": 13.553953170776367, + "learning_rate": 1.960733444828259e-05, + "loss": 1.4387, + "step": 4287 + }, + { + "epoch": 11.683923705722071, + "grad_norm": 9.751891136169434, + "learning_rate": 1.9607089542466266e-05, + "loss": 1.2366, + "step": 4288 + }, + { + "epoch": 11.686648501362399, + "grad_norm": 10.268438339233398, + "learning_rate": 1.960684456183024e-05, + "loss": 1.3503, + "step": 4289 + }, + { + "epoch": 11.689373297002724, + "grad_norm": 13.085841178894043, + "learning_rate": 1.9606599506376415e-05, + "loss": 1.1855, + "step": 4290 + }, + { + "epoch": 11.692098092643052, + "grad_norm": 9.935746192932129, + "learning_rate": 1.96063543761067e-05, + "loss": 1.104, + "step": 4291 + }, + { + "epoch": 11.69482288828338, + "grad_norm": 10.535567283630371, + "learning_rate": 1.960610917102301e-05, + "loss": 1.2815, + "step": 4292 + }, + { + "epoch": 11.697547683923705, + "grad_norm": 10.67478084564209, + "learning_rate": 1.9605863891127247e-05, + "loss": 1.1548, + "step": 4293 + }, + { + "epoch": 11.700272479564033, + "grad_norm": 9.28094482421875, + "learning_rate": 1.960561853642133e-05, + "loss": 1.2197, + "step": 4294 + }, + { + "epoch": 11.70299727520436, + "grad_norm": 9.412829399108887, + "learning_rate": 1.960537310690716e-05, + "loss": 1.0266, + "step": 4295 + }, + { + "epoch": 11.705722070844686, + "grad_norm": 14.982603073120117, + "learning_rate": 1.9605127602586656e-05, + "loss": 1.3112, + "step": 4296 + }, + { + "epoch": 11.708446866485014, + "grad_norm": 12.387552261352539, + "learning_rate": 1.9604882023461725e-05, + "loss": 1.4277, + "step": 4297 + }, + { + "epoch": 11.711171662125341, + "grad_norm": 13.129229545593262, + "learning_rate": 1.9604636369534285e-05, + "loss": 1.2236, + "step": 4298 + }, + { + "epoch": 11.713896457765667, + "grad_norm": 11.800368309020996, + "learning_rate": 1.9604390640806246e-05, + "loss": 1.261, + "step": 4299 + }, + { + "epoch": 11.716621253405995, + "grad_norm": 15.784507751464844, + "learning_rate": 1.9604144837279523e-05, + "loss": 1.1934, + "step": 4300 + }, + { + "epoch": 11.719346049046322, + "grad_norm": 8.646052360534668, + "learning_rate": 1.9603898958956024e-05, + "loss": 1.166, + "step": 4301 + }, + { + "epoch": 11.722070844686648, + "grad_norm": 9.307878494262695, + "learning_rate": 1.960365300583767e-05, + "loss": 1.0243, + "step": 4302 + }, + { + "epoch": 11.724795640326976, + "grad_norm": 11.6644926071167, + "learning_rate": 1.960340697792638e-05, + "loss": 1.1243, + "step": 4303 + }, + { + "epoch": 11.727520435967303, + "grad_norm": 10.589908599853516, + "learning_rate": 1.9603160875224067e-05, + "loss": 1.4622, + "step": 4304 + }, + { + "epoch": 11.730245231607629, + "grad_norm": 8.321166038513184, + "learning_rate": 1.960291469773264e-05, + "loss": 1.2344, + "step": 4305 + }, + { + "epoch": 11.732970027247957, + "grad_norm": 11.593385696411133, + "learning_rate": 1.9602668445454024e-05, + "loss": 1.1692, + "step": 4306 + }, + { + "epoch": 11.735694822888284, + "grad_norm": 10.745800971984863, + "learning_rate": 1.9602422118390138e-05, + "loss": 1.3217, + "step": 4307 + }, + { + "epoch": 11.73841961852861, + "grad_norm": 8.608404159545898, + "learning_rate": 1.9602175716542895e-05, + "loss": 1.1926, + "step": 4308 + }, + { + "epoch": 11.741144414168938, + "grad_norm": 9.466004371643066, + "learning_rate": 1.9601929239914217e-05, + "loss": 1.2781, + "step": 4309 + }, + { + "epoch": 11.743869209809265, + "grad_norm": 9.192959785461426, + "learning_rate": 1.960168268850602e-05, + "loss": 1.2083, + "step": 4310 + }, + { + "epoch": 11.746594005449591, + "grad_norm": 17.6987361907959, + "learning_rate": 1.9601436062320232e-05, + "loss": 1.333, + "step": 4311 + }, + { + "epoch": 11.749318801089919, + "grad_norm": 8.098871231079102, + "learning_rate": 1.960118936135877e-05, + "loss": 1.2598, + "step": 4312 + }, + { + "epoch": 11.752043596730246, + "grad_norm": 11.7301607131958, + "learning_rate": 1.960094258562355e-05, + "loss": 1.4526, + "step": 4313 + }, + { + "epoch": 11.754768392370572, + "grad_norm": 9.770210266113281, + "learning_rate": 1.9600695735116503e-05, + "loss": 1.2316, + "step": 4314 + }, + { + "epoch": 11.7574931880109, + "grad_norm": 8.813011169433594, + "learning_rate": 1.9600448809839542e-05, + "loss": 1.3875, + "step": 4315 + }, + { + "epoch": 11.760217983651227, + "grad_norm": 10.773046493530273, + "learning_rate": 1.9600201809794596e-05, + "loss": 1.2832, + "step": 4316 + }, + { + "epoch": 11.762942779291553, + "grad_norm": 8.112799644470215, + "learning_rate": 1.9599954734983586e-05, + "loss": 1.3123, + "step": 4317 + }, + { + "epoch": 11.76566757493188, + "grad_norm": 24.07083511352539, + "learning_rate": 1.9599707585408438e-05, + "loss": 1.3369, + "step": 4318 + }, + { + "epoch": 11.768392370572208, + "grad_norm": 12.28234577178955, + "learning_rate": 1.959946036107108e-05, + "loss": 1.397, + "step": 4319 + }, + { + "epoch": 11.771117166212534, + "grad_norm": 10.630733489990234, + "learning_rate": 1.959921306197343e-05, + "loss": 1.2463, + "step": 4320 + }, + { + "epoch": 11.773841961852861, + "grad_norm": 12.136207580566406, + "learning_rate": 1.959896568811742e-05, + "loss": 1.1973, + "step": 4321 + }, + { + "epoch": 11.776566757493189, + "grad_norm": 12.15300464630127, + "learning_rate": 1.959871823950497e-05, + "loss": 1.1873, + "step": 4322 + }, + { + "epoch": 11.779291553133515, + "grad_norm": 9.693768501281738, + "learning_rate": 1.9598470716138015e-05, + "loss": 1.3191, + "step": 4323 + }, + { + "epoch": 11.782016348773842, + "grad_norm": 10.026284217834473, + "learning_rate": 1.9598223118018477e-05, + "loss": 1.3662, + "step": 4324 + }, + { + "epoch": 11.78474114441417, + "grad_norm": 9.156767845153809, + "learning_rate": 1.959797544514829e-05, + "loss": 1.241, + "step": 4325 + }, + { + "epoch": 11.787465940054496, + "grad_norm": 11.601896286010742, + "learning_rate": 1.9597727697529373e-05, + "loss": 1.281, + "step": 4326 + }, + { + "epoch": 11.790190735694823, + "grad_norm": 9.980677604675293, + "learning_rate": 1.9597479875163666e-05, + "loss": 1.2557, + "step": 4327 + }, + { + "epoch": 11.79291553133515, + "grad_norm": 10.158729553222656, + "learning_rate": 1.9597231978053095e-05, + "loss": 1.1277, + "step": 4328 + }, + { + "epoch": 11.795640326975477, + "grad_norm": 11.920785903930664, + "learning_rate": 1.9596984006199585e-05, + "loss": 1.3772, + "step": 4329 + }, + { + "epoch": 11.798365122615804, + "grad_norm": 12.154458045959473, + "learning_rate": 1.9596735959605077e-05, + "loss": 1.2166, + "step": 4330 + }, + { + "epoch": 11.80108991825613, + "grad_norm": 12.615863800048828, + "learning_rate": 1.95964878382715e-05, + "loss": 1.1858, + "step": 4331 + }, + { + "epoch": 11.803814713896458, + "grad_norm": 9.947614669799805, + "learning_rate": 1.9596239642200784e-05, + "loss": 1.5405, + "step": 4332 + }, + { + "epoch": 11.806539509536785, + "grad_norm": 16.928955078125, + "learning_rate": 1.959599137139486e-05, + "loss": 1.182, + "step": 4333 + }, + { + "epoch": 11.809264305177111, + "grad_norm": 7.814918041229248, + "learning_rate": 1.959574302585566e-05, + "loss": 1.1677, + "step": 4334 + }, + { + "epoch": 11.811989100817438, + "grad_norm": 9.805076599121094, + "learning_rate": 1.9595494605585127e-05, + "loss": 1.2236, + "step": 4335 + }, + { + "epoch": 11.814713896457766, + "grad_norm": 18.602846145629883, + "learning_rate": 1.9595246110585194e-05, + "loss": 1.3203, + "step": 4336 + }, + { + "epoch": 11.817438692098092, + "grad_norm": 9.417820930480957, + "learning_rate": 1.959499754085779e-05, + "loss": 1.2467, + "step": 4337 + }, + { + "epoch": 11.82016348773842, + "grad_norm": 8.117120742797852, + "learning_rate": 1.9594748896404853e-05, + "loss": 1.2739, + "step": 4338 + }, + { + "epoch": 11.822888283378747, + "grad_norm": 10.711532592773438, + "learning_rate": 1.9594500177228322e-05, + "loss": 1.3523, + "step": 4339 + }, + { + "epoch": 11.825613079019073, + "grad_norm": 11.009588241577148, + "learning_rate": 1.959425138333013e-05, + "loss": 1.4854, + "step": 4340 + }, + { + "epoch": 11.8283378746594, + "grad_norm": 13.619063377380371, + "learning_rate": 1.959400251471222e-05, + "loss": 1.3606, + "step": 4341 + }, + { + "epoch": 11.831062670299728, + "grad_norm": 8.956987380981445, + "learning_rate": 1.9593753571376524e-05, + "loss": 1.2725, + "step": 4342 + }, + { + "epoch": 11.833787465940054, + "grad_norm": 10.285244941711426, + "learning_rate": 1.9593504553324987e-05, + "loss": 1.198, + "step": 4343 + }, + { + "epoch": 11.836512261580381, + "grad_norm": 12.4805908203125, + "learning_rate": 1.9593255460559543e-05, + "loss": 1.2314, + "step": 4344 + }, + { + "epoch": 11.839237057220709, + "grad_norm": 33.98967361450195, + "learning_rate": 1.9593006293082134e-05, + "loss": 1.2979, + "step": 4345 + }, + { + "epoch": 11.841961852861035, + "grad_norm": 11.135168075561523, + "learning_rate": 1.9592757050894705e-05, + "loss": 1.2222, + "step": 4346 + }, + { + "epoch": 11.844686648501362, + "grad_norm": 8.834343910217285, + "learning_rate": 1.9592507733999187e-05, + "loss": 1.1731, + "step": 4347 + }, + { + "epoch": 11.84741144414169, + "grad_norm": 10.759552001953125, + "learning_rate": 1.959225834239753e-05, + "loss": 1.2273, + "step": 4348 + }, + { + "epoch": 11.850136239782016, + "grad_norm": 8.94282054901123, + "learning_rate": 1.9592008876091676e-05, + "loss": 1.3877, + "step": 4349 + }, + { + "epoch": 11.852861035422343, + "grad_norm": 8.68305778503418, + "learning_rate": 1.9591759335083563e-05, + "loss": 1.1846, + "step": 4350 + }, + { + "epoch": 11.85558583106267, + "grad_norm": 10.559568405151367, + "learning_rate": 1.9591509719375136e-05, + "loss": 1.2915, + "step": 4351 + }, + { + "epoch": 11.858310626702997, + "grad_norm": 10.871464729309082, + "learning_rate": 1.9591260028968344e-05, + "loss": 1.3989, + "step": 4352 + }, + { + "epoch": 11.861035422343324, + "grad_norm": 9.31416130065918, + "learning_rate": 1.9591010263865125e-05, + "loss": 1.0696, + "step": 4353 + }, + { + "epoch": 11.863760217983652, + "grad_norm": 11.239910125732422, + "learning_rate": 1.9590760424067424e-05, + "loss": 1.3904, + "step": 4354 + }, + { + "epoch": 11.866485013623977, + "grad_norm": 12.502378463745117, + "learning_rate": 1.9590510509577195e-05, + "loss": 1.4033, + "step": 4355 + }, + { + "epoch": 11.869209809264305, + "grad_norm": 13.228873252868652, + "learning_rate": 1.9590260520396377e-05, + "loss": 1.355, + "step": 4356 + }, + { + "epoch": 11.871934604904633, + "grad_norm": 8.481633186340332, + "learning_rate": 1.9590010456526917e-05, + "loss": 1.3428, + "step": 4357 + }, + { + "epoch": 11.874659400544958, + "grad_norm": 11.9637451171875, + "learning_rate": 1.9589760317970765e-05, + "loss": 1.1692, + "step": 4358 + }, + { + "epoch": 11.877384196185286, + "grad_norm": 12.829935073852539, + "learning_rate": 1.958951010472987e-05, + "loss": 1.1487, + "step": 4359 + }, + { + "epoch": 11.880108991825614, + "grad_norm": 8.80949878692627, + "learning_rate": 1.9589259816806177e-05, + "loss": 1.3743, + "step": 4360 + }, + { + "epoch": 11.88283378746594, + "grad_norm": 16.82501983642578, + "learning_rate": 1.9589009454201634e-05, + "loss": 1.3043, + "step": 4361 + }, + { + "epoch": 11.885558583106267, + "grad_norm": 16.30137825012207, + "learning_rate": 1.9588759016918198e-05, + "loss": 1.0549, + "step": 4362 + }, + { + "epoch": 11.888283378746594, + "grad_norm": 11.18465805053711, + "learning_rate": 1.9588508504957816e-05, + "loss": 1.2505, + "step": 4363 + }, + { + "epoch": 11.89100817438692, + "grad_norm": 10.844934463500977, + "learning_rate": 1.958825791832244e-05, + "loss": 1.2908, + "step": 4364 + }, + { + "epoch": 11.893732970027248, + "grad_norm": 8.732866287231445, + "learning_rate": 1.9588007257014013e-05, + "loss": 1.3306, + "step": 4365 + }, + { + "epoch": 11.896457765667575, + "grad_norm": 12.165096282958984, + "learning_rate": 1.95877565210345e-05, + "loss": 1.2432, + "step": 4366 + }, + { + "epoch": 11.899182561307901, + "grad_norm": 11.769744873046875, + "learning_rate": 1.9587505710385847e-05, + "loss": 1.3108, + "step": 4367 + }, + { + "epoch": 11.901907356948229, + "grad_norm": 14.404982566833496, + "learning_rate": 1.958725482507001e-05, + "loss": 1.2993, + "step": 4368 + }, + { + "epoch": 11.904632152588556, + "grad_norm": 10.435540199279785, + "learning_rate": 1.9587003865088937e-05, + "loss": 1.2786, + "step": 4369 + }, + { + "epoch": 11.907356948228882, + "grad_norm": 9.30897331237793, + "learning_rate": 1.9586752830444585e-05, + "loss": 1.3557, + "step": 4370 + }, + { + "epoch": 11.91008174386921, + "grad_norm": 16.349184036254883, + "learning_rate": 1.9586501721138914e-05, + "loss": 1.3054, + "step": 4371 + }, + { + "epoch": 11.912806539509537, + "grad_norm": 11.184679985046387, + "learning_rate": 1.9586250537173878e-05, + "loss": 1.2993, + "step": 4372 + }, + { + "epoch": 11.915531335149863, + "grad_norm": 11.601655006408691, + "learning_rate": 1.9585999278551426e-05, + "loss": 1.3396, + "step": 4373 + }, + { + "epoch": 11.91825613079019, + "grad_norm": 9.532584190368652, + "learning_rate": 1.9585747945273526e-05, + "loss": 1.4148, + "step": 4374 + }, + { + "epoch": 11.920980926430518, + "grad_norm": 13.469198226928711, + "learning_rate": 1.9585496537342123e-05, + "loss": 1.3572, + "step": 4375 + }, + { + "epoch": 11.923705722070844, + "grad_norm": 10.040478706359863, + "learning_rate": 1.958524505475919e-05, + "loss": 1.0967, + "step": 4376 + }, + { + "epoch": 11.926430517711172, + "grad_norm": 28.938920974731445, + "learning_rate": 1.958499349752667e-05, + "loss": 1.2146, + "step": 4377 + }, + { + "epoch": 11.9291553133515, + "grad_norm": 8.300970077514648, + "learning_rate": 1.958474186564653e-05, + "loss": 1.3777, + "step": 4378 + }, + { + "epoch": 11.931880108991825, + "grad_norm": 12.287845611572266, + "learning_rate": 1.958449015912073e-05, + "loss": 1.4329, + "step": 4379 + }, + { + "epoch": 11.934604904632153, + "grad_norm": 10.114580154418945, + "learning_rate": 1.958423837795123e-05, + "loss": 1.2354, + "step": 4380 + }, + { + "epoch": 11.93732970027248, + "grad_norm": 12.478697776794434, + "learning_rate": 1.958398652213999e-05, + "loss": 1.2632, + "step": 4381 + }, + { + "epoch": 11.940054495912806, + "grad_norm": 12.757806777954102, + "learning_rate": 1.9583734591688966e-05, + "loss": 1.2795, + "step": 4382 + }, + { + "epoch": 11.942779291553133, + "grad_norm": 12.535611152648926, + "learning_rate": 1.9583482586600132e-05, + "loss": 1.2043, + "step": 4383 + }, + { + "epoch": 11.945504087193461, + "grad_norm": 13.83928394317627, + "learning_rate": 1.958323050687544e-05, + "loss": 1.3303, + "step": 4384 + }, + { + "epoch": 11.948228882833787, + "grad_norm": 12.60389232635498, + "learning_rate": 1.9582978352516863e-05, + "loss": 1.2756, + "step": 4385 + }, + { + "epoch": 11.950953678474114, + "grad_norm": 13.583793640136719, + "learning_rate": 1.958272612352635e-05, + "loss": 1.2454, + "step": 4386 + }, + { + "epoch": 11.953678474114442, + "grad_norm": 9.803666114807129, + "learning_rate": 1.9582473819905884e-05, + "loss": 1.2583, + "step": 4387 + }, + { + "epoch": 11.956403269754768, + "grad_norm": 9.510045051574707, + "learning_rate": 1.9582221441657413e-05, + "loss": 1.2581, + "step": 4388 + }, + { + "epoch": 11.959128065395095, + "grad_norm": 11.14546012878418, + "learning_rate": 1.9581968988782914e-05, + "loss": 1.3142, + "step": 4389 + }, + { + "epoch": 11.961852861035423, + "grad_norm": 11.336246490478516, + "learning_rate": 1.9581716461284344e-05, + "loss": 1.3818, + "step": 4390 + }, + { + "epoch": 11.964577656675749, + "grad_norm": 9.391512870788574, + "learning_rate": 1.958146385916368e-05, + "loss": 1.2222, + "step": 4391 + }, + { + "epoch": 11.967302452316076, + "grad_norm": 10.746350288391113, + "learning_rate": 1.9581211182422882e-05, + "loss": 1.186, + "step": 4392 + }, + { + "epoch": 11.970027247956404, + "grad_norm": 8.70995044708252, + "learning_rate": 1.958095843106392e-05, + "loss": 1.1543, + "step": 4393 + }, + { + "epoch": 11.97275204359673, + "grad_norm": 10.364996910095215, + "learning_rate": 1.958070560508876e-05, + "loss": 1.196, + "step": 4394 + }, + { + "epoch": 11.975476839237057, + "grad_norm": 11.579974174499512, + "learning_rate": 1.9580452704499375e-05, + "loss": 1.2598, + "step": 4395 + }, + { + "epoch": 11.978201634877385, + "grad_norm": 37.31267166137695, + "learning_rate": 1.9580199729297736e-05, + "loss": 1.2881, + "step": 4396 + }, + { + "epoch": 11.98092643051771, + "grad_norm": 9.780526161193848, + "learning_rate": 1.9579946679485803e-05, + "loss": 1.3279, + "step": 4397 + }, + { + "epoch": 11.983651226158038, + "grad_norm": 8.573712348937988, + "learning_rate": 1.9579693555065558e-05, + "loss": 1.1371, + "step": 4398 + }, + { + "epoch": 11.986376021798366, + "grad_norm": 10.88554859161377, + "learning_rate": 1.9579440356038966e-05, + "loss": 1.5913, + "step": 4399 + }, + { + "epoch": 11.989100817438691, + "grad_norm": 14.26610279083252, + "learning_rate": 1.9579187082408003e-05, + "loss": 1.2529, + "step": 4400 + }, + { + "epoch": 11.991825613079019, + "grad_norm": 10.75584602355957, + "learning_rate": 1.957893373417464e-05, + "loss": 1.4375, + "step": 4401 + }, + { + "epoch": 11.994550408719347, + "grad_norm": 13.039530754089355, + "learning_rate": 1.9578680311340846e-05, + "loss": 1.2537, + "step": 4402 + }, + { + "epoch": 11.997275204359672, + "grad_norm": 9.510915756225586, + "learning_rate": 1.95784268139086e-05, + "loss": 1.2441, + "step": 4403 + }, + { + "epoch": 12.0, + "grad_norm": 11.786630630493164, + "learning_rate": 1.957817324187987e-05, + "loss": 1.1521, + "step": 4404 + }, + { + "epoch": 12.002724795640328, + "grad_norm": 15.739928245544434, + "learning_rate": 1.9577919595256642e-05, + "loss": 1.0649, + "step": 4405 + }, + { + "epoch": 12.005449591280653, + "grad_norm": 8.629070281982422, + "learning_rate": 1.9577665874040882e-05, + "loss": 1.1111, + "step": 4406 + }, + { + "epoch": 12.008174386920981, + "grad_norm": 8.434273719787598, + "learning_rate": 1.9577412078234565e-05, + "loss": 1.0261, + "step": 4407 + }, + { + "epoch": 12.010899182561309, + "grad_norm": 9.693862915039062, + "learning_rate": 1.9577158207839674e-05, + "loss": 1.1152, + "step": 4408 + }, + { + "epoch": 12.013623978201634, + "grad_norm": 6.749441146850586, + "learning_rate": 1.9576904262858183e-05, + "loss": 1.1797, + "step": 4409 + }, + { + "epoch": 12.016348773841962, + "grad_norm": 8.0995454788208, + "learning_rate": 1.957665024329207e-05, + "loss": 1.1367, + "step": 4410 + }, + { + "epoch": 12.01907356948229, + "grad_norm": 9.009051322937012, + "learning_rate": 1.9576396149143312e-05, + "loss": 1.1127, + "step": 4411 + }, + { + "epoch": 12.021798365122615, + "grad_norm": 9.048227310180664, + "learning_rate": 1.9576141980413893e-05, + "loss": 1.2572, + "step": 4412 + }, + { + "epoch": 12.024523160762943, + "grad_norm": 15.703821182250977, + "learning_rate": 1.957588773710578e-05, + "loss": 1.3508, + "step": 4413 + }, + { + "epoch": 12.02724795640327, + "grad_norm": 8.47426700592041, + "learning_rate": 1.957563341922097e-05, + "loss": 1.1946, + "step": 4414 + }, + { + "epoch": 12.029972752043596, + "grad_norm": 10.599610328674316, + "learning_rate": 1.957537902676143e-05, + "loss": 1.2874, + "step": 4415 + }, + { + "epoch": 12.032697547683924, + "grad_norm": 9.831764221191406, + "learning_rate": 1.9575124559729147e-05, + "loss": 1.0459, + "step": 4416 + }, + { + "epoch": 12.035422343324251, + "grad_norm": 8.489566802978516, + "learning_rate": 1.9574870018126108e-05, + "loss": 1.2295, + "step": 4417 + }, + { + "epoch": 12.038147138964577, + "grad_norm": 12.235746383666992, + "learning_rate": 1.9574615401954283e-05, + "loss": 1.2502, + "step": 4418 + }, + { + "epoch": 12.040871934604905, + "grad_norm": 14.411274909973145, + "learning_rate": 1.957436071121566e-05, + "loss": 1.1135, + "step": 4419 + }, + { + "epoch": 12.043596730245232, + "grad_norm": 8.343754768371582, + "learning_rate": 1.957410594591223e-05, + "loss": 1.0618, + "step": 4420 + }, + { + "epoch": 12.046321525885558, + "grad_norm": 8.101775169372559, + "learning_rate": 1.9573851106045965e-05, + "loss": 1.1919, + "step": 4421 + }, + { + "epoch": 12.049046321525886, + "grad_norm": 8.42682933807373, + "learning_rate": 1.957359619161886e-05, + "loss": 1.2458, + "step": 4422 + }, + { + "epoch": 12.051771117166213, + "grad_norm": 10.502134323120117, + "learning_rate": 1.9573341202632897e-05, + "loss": 1.1694, + "step": 4423 + }, + { + "epoch": 12.054495912806539, + "grad_norm": 8.5780611038208, + "learning_rate": 1.9573086139090056e-05, + "loss": 1.1309, + "step": 4424 + }, + { + "epoch": 12.057220708446867, + "grad_norm": 10.66483211517334, + "learning_rate": 1.957283100099233e-05, + "loss": 1.0049, + "step": 4425 + }, + { + "epoch": 12.059945504087194, + "grad_norm": 9.722137451171875, + "learning_rate": 1.9572575788341707e-05, + "loss": 1.2512, + "step": 4426 + }, + { + "epoch": 12.06267029972752, + "grad_norm": 11.696825981140137, + "learning_rate": 1.957232050114017e-05, + "loss": 1.1697, + "step": 4427 + }, + { + "epoch": 12.065395095367847, + "grad_norm": 9.30435848236084, + "learning_rate": 1.957206513938971e-05, + "loss": 1.1656, + "step": 4428 + }, + { + "epoch": 12.068119891008175, + "grad_norm": 7.531614780426025, + "learning_rate": 1.957180970309231e-05, + "loss": 1.1726, + "step": 4429 + }, + { + "epoch": 12.0708446866485, + "grad_norm": 10.614941596984863, + "learning_rate": 1.957155419224997e-05, + "loss": 1.4146, + "step": 4430 + }, + { + "epoch": 12.073569482288828, + "grad_norm": 10.960173606872559, + "learning_rate": 1.957129860686467e-05, + "loss": 1.136, + "step": 4431 + }, + { + "epoch": 12.076294277929156, + "grad_norm": 8.614213943481445, + "learning_rate": 1.9571042946938408e-05, + "loss": 1.1938, + "step": 4432 + }, + { + "epoch": 12.079019073569482, + "grad_norm": 9.550384521484375, + "learning_rate": 1.957078721247317e-05, + "loss": 1.2781, + "step": 4433 + }, + { + "epoch": 12.08174386920981, + "grad_norm": 48.99443054199219, + "learning_rate": 1.957053140347095e-05, + "loss": 0.9927, + "step": 4434 + }, + { + "epoch": 12.084468664850137, + "grad_norm": 10.192533493041992, + "learning_rate": 1.957027551993374e-05, + "loss": 1.1252, + "step": 4435 + }, + { + "epoch": 12.087193460490463, + "grad_norm": 9.485245704650879, + "learning_rate": 1.957001956186353e-05, + "loss": 1.2756, + "step": 4436 + }, + { + "epoch": 12.08991825613079, + "grad_norm": 11.191668510437012, + "learning_rate": 1.9569763529262315e-05, + "loss": 1.1938, + "step": 4437 + }, + { + "epoch": 12.092643051771118, + "grad_norm": 9.03013801574707, + "learning_rate": 1.9569507422132092e-05, + "loss": 1.1267, + "step": 4438 + }, + { + "epoch": 12.095367847411444, + "grad_norm": 11.902277946472168, + "learning_rate": 1.956925124047485e-05, + "loss": 1.2581, + "step": 4439 + }, + { + "epoch": 12.098092643051771, + "grad_norm": 10.63662052154541, + "learning_rate": 1.9568994984292592e-05, + "loss": 1.1394, + "step": 4440 + }, + { + "epoch": 12.100817438692099, + "grad_norm": 7.562166690826416, + "learning_rate": 1.9568738653587304e-05, + "loss": 1.186, + "step": 4441 + }, + { + "epoch": 12.103542234332425, + "grad_norm": 9.163925170898438, + "learning_rate": 1.9568482248360992e-05, + "loss": 1.0581, + "step": 4442 + }, + { + "epoch": 12.106267029972752, + "grad_norm": 10.432324409484863, + "learning_rate": 1.956822576861565e-05, + "loss": 1.1753, + "step": 4443 + }, + { + "epoch": 12.10899182561308, + "grad_norm": 10.020838737487793, + "learning_rate": 1.9567969214353266e-05, + "loss": 1.1882, + "step": 4444 + }, + { + "epoch": 12.111716621253406, + "grad_norm": 10.333386421203613, + "learning_rate": 1.956771258557585e-05, + "loss": 1.1543, + "step": 4445 + }, + { + "epoch": 12.114441416893733, + "grad_norm": 13.603619575500488, + "learning_rate": 1.9567455882285397e-05, + "loss": 1.3115, + "step": 4446 + }, + { + "epoch": 12.11716621253406, + "grad_norm": 8.085104942321777, + "learning_rate": 1.95671991044839e-05, + "loss": 1.0378, + "step": 4447 + }, + { + "epoch": 12.119891008174386, + "grad_norm": 10.977900505065918, + "learning_rate": 1.9566942252173373e-05, + "loss": 1.2616, + "step": 4448 + }, + { + "epoch": 12.122615803814714, + "grad_norm": 11.41482162475586, + "learning_rate": 1.9566685325355803e-05, + "loss": 1.3162, + "step": 4449 + }, + { + "epoch": 12.125340599455042, + "grad_norm": 23.697675704956055, + "learning_rate": 1.9566428324033192e-05, + "loss": 1.0796, + "step": 4450 + }, + { + "epoch": 12.128065395095367, + "grad_norm": 11.825977325439453, + "learning_rate": 1.9566171248207552e-05, + "loss": 1.2524, + "step": 4451 + }, + { + "epoch": 12.130790190735695, + "grad_norm": 9.793973922729492, + "learning_rate": 1.9565914097880874e-05, + "loss": 1.2634, + "step": 4452 + }, + { + "epoch": 12.133514986376023, + "grad_norm": 10.945475578308105, + "learning_rate": 1.956565687305517e-05, + "loss": 1.3218, + "step": 4453 + }, + { + "epoch": 12.136239782016348, + "grad_norm": 7.100282192230225, + "learning_rate": 1.9565399573732432e-05, + "loss": 1.1567, + "step": 4454 + }, + { + "epoch": 12.138964577656676, + "grad_norm": 11.469827651977539, + "learning_rate": 1.956514219991467e-05, + "loss": 1.1404, + "step": 4455 + }, + { + "epoch": 12.141689373297003, + "grad_norm": 8.892791748046875, + "learning_rate": 1.956488475160389e-05, + "loss": 1.2952, + "step": 4456 + }, + { + "epoch": 12.14441416893733, + "grad_norm": 7.216567039489746, + "learning_rate": 1.9564627228802098e-05, + "loss": 1.1753, + "step": 4457 + }, + { + "epoch": 12.147138964577657, + "grad_norm": 7.672146320343018, + "learning_rate": 1.9564369631511296e-05, + "loss": 1.3711, + "step": 4458 + }, + { + "epoch": 12.149863760217984, + "grad_norm": 7.896295547485352, + "learning_rate": 1.956411195973349e-05, + "loss": 1.0814, + "step": 4459 + }, + { + "epoch": 12.15258855585831, + "grad_norm": 9.343679428100586, + "learning_rate": 1.956385421347069e-05, + "loss": 1.1007, + "step": 4460 + }, + { + "epoch": 12.155313351498638, + "grad_norm": 11.700438499450684, + "learning_rate": 1.9563596392724897e-05, + "loss": 1.3137, + "step": 4461 + }, + { + "epoch": 12.158038147138965, + "grad_norm": 10.045361518859863, + "learning_rate": 1.9563338497498127e-05, + "loss": 1.3904, + "step": 4462 + }, + { + "epoch": 12.160762942779291, + "grad_norm": 11.074722290039062, + "learning_rate": 1.9563080527792383e-05, + "loss": 1.197, + "step": 4463 + }, + { + "epoch": 12.163487738419619, + "grad_norm": 15.348587036132812, + "learning_rate": 1.9562822483609675e-05, + "loss": 1.1335, + "step": 4464 + }, + { + "epoch": 12.166212534059946, + "grad_norm": 10.257996559143066, + "learning_rate": 1.9562564364952012e-05, + "loss": 1.2634, + "step": 4465 + }, + { + "epoch": 12.168937329700272, + "grad_norm": 8.52253246307373, + "learning_rate": 1.956230617182141e-05, + "loss": 1.0405, + "step": 4466 + }, + { + "epoch": 12.1716621253406, + "grad_norm": 10.670637130737305, + "learning_rate": 1.956204790421987e-05, + "loss": 1.271, + "step": 4467 + }, + { + "epoch": 12.174386920980927, + "grad_norm": 8.055587768554688, + "learning_rate": 1.956178956214941e-05, + "loss": 1.2493, + "step": 4468 + }, + { + "epoch": 12.177111716621253, + "grad_norm": 8.456838607788086, + "learning_rate": 1.9561531145612042e-05, + "loss": 0.9962, + "step": 4469 + }, + { + "epoch": 12.17983651226158, + "grad_norm": 8.796440124511719, + "learning_rate": 1.956127265460978e-05, + "loss": 1.1199, + "step": 4470 + }, + { + "epoch": 12.182561307901908, + "grad_norm": 8.285974502563477, + "learning_rate": 1.9561014089144634e-05, + "loss": 1.3137, + "step": 4471 + }, + { + "epoch": 12.185286103542234, + "grad_norm": 9.08488941192627, + "learning_rate": 1.9560755449218612e-05, + "loss": 1.0901, + "step": 4472 + }, + { + "epoch": 12.188010899182562, + "grad_norm": 9.358592987060547, + "learning_rate": 1.956049673483374e-05, + "loss": 1.1443, + "step": 4473 + }, + { + "epoch": 12.190735694822889, + "grad_norm": 9.08774471282959, + "learning_rate": 1.956023794599202e-05, + "loss": 1.2371, + "step": 4474 + }, + { + "epoch": 12.193460490463215, + "grad_norm": 16.300308227539062, + "learning_rate": 1.9559979082695483e-05, + "loss": 1.3635, + "step": 4475 + }, + { + "epoch": 12.196185286103542, + "grad_norm": 9.76804256439209, + "learning_rate": 1.955972014494613e-05, + "loss": 1.3032, + "step": 4476 + }, + { + "epoch": 12.19891008174387, + "grad_norm": 8.860701560974121, + "learning_rate": 1.955946113274599e-05, + "loss": 1.1211, + "step": 4477 + }, + { + "epoch": 12.201634877384196, + "grad_norm": 7.7827606201171875, + "learning_rate": 1.955920204609707e-05, + "loss": 1.2136, + "step": 4478 + }, + { + "epoch": 12.204359673024523, + "grad_norm": 9.018577575683594, + "learning_rate": 1.9558942885001394e-05, + "loss": 1.3269, + "step": 4479 + }, + { + "epoch": 12.207084468664851, + "grad_norm": 11.849574089050293, + "learning_rate": 1.9558683649460977e-05, + "loss": 1.2241, + "step": 4480 + }, + { + "epoch": 12.209809264305177, + "grad_norm": 14.160171508789062, + "learning_rate": 1.955842433947784e-05, + "loss": 1.1177, + "step": 4481 + }, + { + "epoch": 12.212534059945504, + "grad_norm": 39.62517547607422, + "learning_rate": 1.9558164955054005e-05, + "loss": 1.1292, + "step": 4482 + }, + { + "epoch": 12.215258855585832, + "grad_norm": 12.130826950073242, + "learning_rate": 1.9557905496191485e-05, + "loss": 1.1411, + "step": 4483 + }, + { + "epoch": 12.217983651226158, + "grad_norm": 9.747757911682129, + "learning_rate": 1.9557645962892306e-05, + "loss": 1.0795, + "step": 4484 + }, + { + "epoch": 12.220708446866485, + "grad_norm": 9.641395568847656, + "learning_rate": 1.9557386355158487e-05, + "loss": 1.0536, + "step": 4485 + }, + { + "epoch": 12.223433242506813, + "grad_norm": 7.763537406921387, + "learning_rate": 1.955712667299205e-05, + "loss": 1.1582, + "step": 4486 + }, + { + "epoch": 12.226158038147139, + "grad_norm": 9.421480178833008, + "learning_rate": 1.9556866916395025e-05, + "loss": 1.292, + "step": 4487 + }, + { + "epoch": 12.228882833787466, + "grad_norm": 19.76326560974121, + "learning_rate": 1.9556607085369423e-05, + "loss": 1.0522, + "step": 4488 + }, + { + "epoch": 12.231607629427794, + "grad_norm": 10.995299339294434, + "learning_rate": 1.955634717991727e-05, + "loss": 1.1641, + "step": 4489 + }, + { + "epoch": 12.23433242506812, + "grad_norm": 8.183566093444824, + "learning_rate": 1.9556087200040595e-05, + "loss": 1.2008, + "step": 4490 + }, + { + "epoch": 12.237057220708447, + "grad_norm": 8.867317199707031, + "learning_rate": 1.9555827145741418e-05, + "loss": 1.0337, + "step": 4491 + }, + { + "epoch": 12.239782016348773, + "grad_norm": 9.299468040466309, + "learning_rate": 1.955556701702177e-05, + "loss": 1.0896, + "step": 4492 + }, + { + "epoch": 12.2425068119891, + "grad_norm": 10.6619873046875, + "learning_rate": 1.955530681388367e-05, + "loss": 1.1201, + "step": 4493 + }, + { + "epoch": 12.245231607629428, + "grad_norm": 8.409582138061523, + "learning_rate": 1.9555046536329154e-05, + "loss": 1.1041, + "step": 4494 + }, + { + "epoch": 12.247956403269754, + "grad_norm": 13.844766616821289, + "learning_rate": 1.955478618436024e-05, + "loss": 1.2786, + "step": 4495 + }, + { + "epoch": 12.250681198910081, + "grad_norm": 9.929696083068848, + "learning_rate": 1.9554525757978958e-05, + "loss": 1.2646, + "step": 4496 + }, + { + "epoch": 12.253405994550409, + "grad_norm": 9.000109672546387, + "learning_rate": 1.9554265257187336e-05, + "loss": 1.1101, + "step": 4497 + }, + { + "epoch": 12.256130790190735, + "grad_norm": 11.595155715942383, + "learning_rate": 1.955400468198741e-05, + "loss": 1.0933, + "step": 4498 + }, + { + "epoch": 12.258855585831062, + "grad_norm": 11.236772537231445, + "learning_rate": 1.9553744032381198e-05, + "loss": 1.231, + "step": 4499 + }, + { + "epoch": 12.26158038147139, + "grad_norm": 9.075350761413574, + "learning_rate": 1.9553483308370732e-05, + "loss": 1.1371, + "step": 4500 + }, + { + "epoch": 12.264305177111716, + "grad_norm": 30.546899795532227, + "learning_rate": 1.955322250995805e-05, + "loss": 1.1213, + "step": 4501 + }, + { + "epoch": 12.267029972752043, + "grad_norm": 12.340591430664062, + "learning_rate": 1.9552961637145177e-05, + "loss": 1.1868, + "step": 4502 + }, + { + "epoch": 12.269754768392371, + "grad_norm": 10.846833229064941, + "learning_rate": 1.9552700689934146e-05, + "loss": 1.2559, + "step": 4503 + }, + { + "epoch": 12.272479564032697, + "grad_norm": 9.99949836730957, + "learning_rate": 1.9552439668326993e-05, + "loss": 1.1394, + "step": 4504 + }, + { + "epoch": 12.275204359673024, + "grad_norm": 10.80855655670166, + "learning_rate": 1.955217857232574e-05, + "loss": 1.2053, + "step": 4505 + }, + { + "epoch": 12.277929155313352, + "grad_norm": 10.59102725982666, + "learning_rate": 1.9551917401932436e-05, + "loss": 1.229, + "step": 4506 + }, + { + "epoch": 12.280653950953678, + "grad_norm": 9.98192310333252, + "learning_rate": 1.95516561571491e-05, + "loss": 1.1077, + "step": 4507 + }, + { + "epoch": 12.283378746594005, + "grad_norm": 10.518499374389648, + "learning_rate": 1.9551394837977776e-05, + "loss": 1.2952, + "step": 4508 + }, + { + "epoch": 12.286103542234333, + "grad_norm": 20.259326934814453, + "learning_rate": 1.9551133444420495e-05, + "loss": 1.1157, + "step": 4509 + }, + { + "epoch": 12.288828337874659, + "grad_norm": 17.111726760864258, + "learning_rate": 1.9550871976479297e-05, + "loss": 1.1477, + "step": 4510 + }, + { + "epoch": 12.291553133514986, + "grad_norm": 18.629878997802734, + "learning_rate": 1.9550610434156213e-05, + "loss": 1.078, + "step": 4511 + }, + { + "epoch": 12.294277929155314, + "grad_norm": 11.988139152526855, + "learning_rate": 1.9550348817453286e-05, + "loss": 1.2703, + "step": 4512 + }, + { + "epoch": 12.29700272479564, + "grad_norm": 10.327305793762207, + "learning_rate": 1.9550087126372544e-05, + "loss": 1.0684, + "step": 4513 + }, + { + "epoch": 12.299727520435967, + "grad_norm": 11.47162914276123, + "learning_rate": 1.9549825360916035e-05, + "loss": 1.0139, + "step": 4514 + }, + { + "epoch": 12.302452316076295, + "grad_norm": 11.214944839477539, + "learning_rate": 1.954956352108579e-05, + "loss": 1.0042, + "step": 4515 + }, + { + "epoch": 12.30517711171662, + "grad_norm": 19.47401237487793, + "learning_rate": 1.9549301606883855e-05, + "loss": 1.1846, + "step": 4516 + }, + { + "epoch": 12.307901907356948, + "grad_norm": 15.151413917541504, + "learning_rate": 1.9549039618312268e-05, + "loss": 1.1472, + "step": 4517 + }, + { + "epoch": 12.310626702997276, + "grad_norm": 16.04181671142578, + "learning_rate": 1.9548777555373065e-05, + "loss": 1.167, + "step": 4518 + }, + { + "epoch": 12.313351498637601, + "grad_norm": 13.755768775939941, + "learning_rate": 1.954851541806829e-05, + "loss": 1.1953, + "step": 4519 + }, + { + "epoch": 12.316076294277929, + "grad_norm": 8.122154235839844, + "learning_rate": 1.9548253206399983e-05, + "loss": 1.1219, + "step": 4520 + }, + { + "epoch": 12.318801089918257, + "grad_norm": 15.348465919494629, + "learning_rate": 1.954799092037019e-05, + "loss": 1.2222, + "step": 4521 + }, + { + "epoch": 12.321525885558582, + "grad_norm": 14.399018287658691, + "learning_rate": 1.9547728559980948e-05, + "loss": 1.2212, + "step": 4522 + }, + { + "epoch": 12.32425068119891, + "grad_norm": 16.025836944580078, + "learning_rate": 1.9547466125234305e-05, + "loss": 1.0447, + "step": 4523 + }, + { + "epoch": 12.326975476839237, + "grad_norm": 16.8812255859375, + "learning_rate": 1.95472036161323e-05, + "loss": 1.2146, + "step": 4524 + }, + { + "epoch": 12.329700272479563, + "grad_norm": 9.85257339477539, + "learning_rate": 1.9546941032676986e-05, + "loss": 1.5183, + "step": 4525 + }, + { + "epoch": 12.33242506811989, + "grad_norm": 9.414003372192383, + "learning_rate": 1.95466783748704e-05, + "loss": 1.3218, + "step": 4526 + }, + { + "epoch": 12.335149863760218, + "grad_norm": 12.69359016418457, + "learning_rate": 1.954641564271459e-05, + "loss": 1.0989, + "step": 4527 + }, + { + "epoch": 12.337874659400544, + "grad_norm": 13.881927490234375, + "learning_rate": 1.95461528362116e-05, + "loss": 1.2754, + "step": 4528 + }, + { + "epoch": 12.340599455040872, + "grad_norm": 20.145729064941406, + "learning_rate": 1.9545889955363483e-05, + "loss": 1.3813, + "step": 4529 + }, + { + "epoch": 12.3433242506812, + "grad_norm": 12.239202499389648, + "learning_rate": 1.954562700017228e-05, + "loss": 1.2983, + "step": 4530 + }, + { + "epoch": 12.346049046321525, + "grad_norm": 12.98681354522705, + "learning_rate": 1.954536397064004e-05, + "loss": 1.3801, + "step": 4531 + }, + { + "epoch": 12.348773841961853, + "grad_norm": 22.513046264648438, + "learning_rate": 1.954510086676882e-05, + "loss": 1.1106, + "step": 4532 + }, + { + "epoch": 12.35149863760218, + "grad_norm": 13.772794723510742, + "learning_rate": 1.9544837688560653e-05, + "loss": 1.0582, + "step": 4533 + }, + { + "epoch": 12.354223433242506, + "grad_norm": 10.135868072509766, + "learning_rate": 1.95445744360176e-05, + "loss": 1.4319, + "step": 4534 + }, + { + "epoch": 12.356948228882834, + "grad_norm": 9.674370765686035, + "learning_rate": 1.954431110914171e-05, + "loss": 1.1812, + "step": 4535 + }, + { + "epoch": 12.359673024523161, + "grad_norm": 11.166690826416016, + "learning_rate": 1.9544047707935026e-05, + "loss": 1.2947, + "step": 4536 + }, + { + "epoch": 12.362397820163487, + "grad_norm": 9.085147857666016, + "learning_rate": 1.954378423239961e-05, + "loss": 1.1365, + "step": 4537 + }, + { + "epoch": 12.365122615803815, + "grad_norm": 15.084121704101562, + "learning_rate": 1.9543520682537514e-05, + "loss": 1.2815, + "step": 4538 + }, + { + "epoch": 12.367847411444142, + "grad_norm": 43.925254821777344, + "learning_rate": 1.954325705835078e-05, + "loss": 1.313, + "step": 4539 + }, + { + "epoch": 12.370572207084468, + "grad_norm": 9.097298622131348, + "learning_rate": 1.954299335984147e-05, + "loss": 1.1218, + "step": 4540 + }, + { + "epoch": 12.373297002724795, + "grad_norm": 7.759567737579346, + "learning_rate": 1.9542729587011635e-05, + "loss": 1.1088, + "step": 4541 + }, + { + "epoch": 12.376021798365123, + "grad_norm": 8.935018539428711, + "learning_rate": 1.954246573986333e-05, + "loss": 1.0938, + "step": 4542 + }, + { + "epoch": 12.378746594005449, + "grad_norm": 12.664612770080566, + "learning_rate": 1.9542201818398606e-05, + "loss": 1.2271, + "step": 4543 + }, + { + "epoch": 12.381471389645776, + "grad_norm": 8.754498481750488, + "learning_rate": 1.9541937822619524e-05, + "loss": 1.1702, + "step": 4544 + }, + { + "epoch": 12.384196185286104, + "grad_norm": 11.0216646194458, + "learning_rate": 1.9541673752528135e-05, + "loss": 1.1772, + "step": 4545 + }, + { + "epoch": 12.38692098092643, + "grad_norm": 14.213191986083984, + "learning_rate": 1.95414096081265e-05, + "loss": 1.2859, + "step": 4546 + }, + { + "epoch": 12.389645776566757, + "grad_norm": 8.516196250915527, + "learning_rate": 1.954114538941667e-05, + "loss": 1.0405, + "step": 4547 + }, + { + "epoch": 12.392370572207085, + "grad_norm": 11.736917495727539, + "learning_rate": 1.954088109640071e-05, + "loss": 1.3147, + "step": 4548 + }, + { + "epoch": 12.39509536784741, + "grad_norm": 11.034043312072754, + "learning_rate": 1.9540616729080676e-05, + "loss": 1.3899, + "step": 4549 + }, + { + "epoch": 12.397820163487738, + "grad_norm": 9.75068187713623, + "learning_rate": 1.9540352287458624e-05, + "loss": 1.281, + "step": 4550 + }, + { + "epoch": 12.400544959128066, + "grad_norm": 12.010876655578613, + "learning_rate": 1.9540087771536617e-05, + "loss": 1.3296, + "step": 4551 + }, + { + "epoch": 12.403269754768392, + "grad_norm": 12.708393096923828, + "learning_rate": 1.953982318131671e-05, + "loss": 1.24, + "step": 4552 + }, + { + "epoch": 12.40599455040872, + "grad_norm": 8.05755615234375, + "learning_rate": 1.9539558516800968e-05, + "loss": 1.1244, + "step": 4553 + }, + { + "epoch": 12.408719346049047, + "grad_norm": 11.966116905212402, + "learning_rate": 1.9539293777991456e-05, + "loss": 1.281, + "step": 4554 + }, + { + "epoch": 12.411444141689373, + "grad_norm": 12.17050552368164, + "learning_rate": 1.9539028964890227e-05, + "loss": 1.2935, + "step": 4555 + }, + { + "epoch": 12.4141689373297, + "grad_norm": 10.085892677307129, + "learning_rate": 1.953876407749935e-05, + "loss": 1.2612, + "step": 4556 + }, + { + "epoch": 12.416893732970028, + "grad_norm": 8.45280647277832, + "learning_rate": 1.9538499115820883e-05, + "loss": 1.1785, + "step": 4557 + }, + { + "epoch": 12.419618528610354, + "grad_norm": 10.129697799682617, + "learning_rate": 1.9538234079856892e-05, + "loss": 1.5048, + "step": 4558 + }, + { + "epoch": 12.422343324250681, + "grad_norm": 6.851092338562012, + "learning_rate": 1.9537968969609444e-05, + "loss": 1.0962, + "step": 4559 + }, + { + "epoch": 12.425068119891009, + "grad_norm": 8.825153350830078, + "learning_rate": 1.9537703785080598e-05, + "loss": 1.0917, + "step": 4560 + }, + { + "epoch": 12.427792915531334, + "grad_norm": 10.525093078613281, + "learning_rate": 1.953743852627242e-05, + "loss": 1.2708, + "step": 4561 + }, + { + "epoch": 12.430517711171662, + "grad_norm": 18.500041961669922, + "learning_rate": 1.953717319318698e-05, + "loss": 1.1589, + "step": 4562 + }, + { + "epoch": 12.43324250681199, + "grad_norm": 9.579687118530273, + "learning_rate": 1.9536907785826345e-05, + "loss": 1.1946, + "step": 4563 + }, + { + "epoch": 12.435967302452315, + "grad_norm": 10.064245223999023, + "learning_rate": 1.9536642304192574e-05, + "loss": 1.4142, + "step": 4564 + }, + { + "epoch": 12.438692098092643, + "grad_norm": 8.188551902770996, + "learning_rate": 1.9536376748287743e-05, + "loss": 1.1736, + "step": 4565 + }, + { + "epoch": 12.44141689373297, + "grad_norm": 6.685877323150635, + "learning_rate": 1.9536111118113917e-05, + "loss": 1.0797, + "step": 4566 + }, + { + "epoch": 12.444141689373296, + "grad_norm": 7.987151622772217, + "learning_rate": 1.953584541367316e-05, + "loss": 1.2999, + "step": 4567 + }, + { + "epoch": 12.446866485013624, + "grad_norm": 9.174522399902344, + "learning_rate": 1.9535579634967548e-05, + "loss": 1.1052, + "step": 4568 + }, + { + "epoch": 12.449591280653951, + "grad_norm": 10.419933319091797, + "learning_rate": 1.9535313781999155e-05, + "loss": 1.1375, + "step": 4569 + }, + { + "epoch": 12.452316076294277, + "grad_norm": 7.917226314544678, + "learning_rate": 1.9535047854770038e-05, + "loss": 1.1587, + "step": 4570 + }, + { + "epoch": 12.455040871934605, + "grad_norm": 11.952027320861816, + "learning_rate": 1.9534781853282278e-05, + "loss": 1.2106, + "step": 4571 + }, + { + "epoch": 12.457765667574932, + "grad_norm": 15.018729209899902, + "learning_rate": 1.953451577753794e-05, + "loss": 1.3325, + "step": 4572 + }, + { + "epoch": 12.460490463215258, + "grad_norm": 10.02099609375, + "learning_rate": 1.9534249627539105e-05, + "loss": 1.0997, + "step": 4573 + }, + { + "epoch": 12.463215258855586, + "grad_norm": 8.177393913269043, + "learning_rate": 1.953398340328784e-05, + "loss": 1.0704, + "step": 4574 + }, + { + "epoch": 12.465940054495913, + "grad_norm": 8.423258781433105, + "learning_rate": 1.9533717104786218e-05, + "loss": 1.1108, + "step": 4575 + }, + { + "epoch": 12.46866485013624, + "grad_norm": 9.97563648223877, + "learning_rate": 1.953345073203631e-05, + "loss": 1.3052, + "step": 4576 + }, + { + "epoch": 12.471389645776567, + "grad_norm": 9.08750057220459, + "learning_rate": 1.95331842850402e-05, + "loss": 1.2687, + "step": 4577 + }, + { + "epoch": 12.474114441416894, + "grad_norm": 11.651878356933594, + "learning_rate": 1.9532917763799957e-05, + "loss": 1.2065, + "step": 4578 + }, + { + "epoch": 12.47683923705722, + "grad_norm": 8.31631088256836, + "learning_rate": 1.9532651168317657e-05, + "loss": 1.115, + "step": 4579 + }, + { + "epoch": 12.479564032697548, + "grad_norm": 8.28477668762207, + "learning_rate": 1.9532384498595376e-05, + "loss": 1.2628, + "step": 4580 + }, + { + "epoch": 12.482288828337875, + "grad_norm": 13.442248344421387, + "learning_rate": 1.953211775463519e-05, + "loss": 1.4312, + "step": 4581 + }, + { + "epoch": 12.485013623978201, + "grad_norm": 8.9275541305542, + "learning_rate": 1.9531850936439177e-05, + "loss": 1.2312, + "step": 4582 + }, + { + "epoch": 12.487738419618529, + "grad_norm": 8.316483497619629, + "learning_rate": 1.953158404400942e-05, + "loss": 1.1727, + "step": 4583 + }, + { + "epoch": 12.490463215258856, + "grad_norm": 8.06887149810791, + "learning_rate": 1.953131707734799e-05, + "loss": 1.144, + "step": 4584 + }, + { + "epoch": 12.493188010899182, + "grad_norm": 8.375883102416992, + "learning_rate": 1.9531050036456972e-05, + "loss": 1.2737, + "step": 4585 + }, + { + "epoch": 12.49591280653951, + "grad_norm": 8.302019119262695, + "learning_rate": 1.9530782921338442e-05, + "loss": 1.1799, + "step": 4586 + }, + { + "epoch": 12.498637602179837, + "grad_norm": 8.256749153137207, + "learning_rate": 1.953051573199448e-05, + "loss": 1.0681, + "step": 4587 + }, + { + "epoch": 12.501362397820163, + "grad_norm": 7.484298229217529, + "learning_rate": 1.9530248468427166e-05, + "loss": 1.2612, + "step": 4588 + }, + { + "epoch": 12.50408719346049, + "grad_norm": 8.9029541015625, + "learning_rate": 1.9529981130638585e-05, + "loss": 1.1285, + "step": 4589 + }, + { + "epoch": 12.506811989100818, + "grad_norm": 11.159380912780762, + "learning_rate": 1.952971371863082e-05, + "loss": 1.3145, + "step": 4590 + }, + { + "epoch": 12.509536784741144, + "grad_norm": 11.16989803314209, + "learning_rate": 1.952944623240595e-05, + "loss": 1.1538, + "step": 4591 + }, + { + "epoch": 12.512261580381471, + "grad_norm": 9.007346153259277, + "learning_rate": 1.952917867196606e-05, + "loss": 1.3169, + "step": 4592 + }, + { + "epoch": 12.514986376021799, + "grad_norm": 8.884353637695312, + "learning_rate": 1.9528911037313233e-05, + "loss": 1.1614, + "step": 4593 + }, + { + "epoch": 12.517711171662125, + "grad_norm": 8.167776107788086, + "learning_rate": 1.9528643328449554e-05, + "loss": 1.1514, + "step": 4594 + }, + { + "epoch": 12.520435967302452, + "grad_norm": 8.666801452636719, + "learning_rate": 1.9528375545377107e-05, + "loss": 1.0505, + "step": 4595 + }, + { + "epoch": 12.52316076294278, + "grad_norm": 6.815107822418213, + "learning_rate": 1.9528107688097978e-05, + "loss": 0.9323, + "step": 4596 + }, + { + "epoch": 12.525885558583106, + "grad_norm": 8.493805885314941, + "learning_rate": 1.9527839756614253e-05, + "loss": 1.1121, + "step": 4597 + }, + { + "epoch": 12.528610354223433, + "grad_norm": 8.735637664794922, + "learning_rate": 1.952757175092802e-05, + "loss": 1.208, + "step": 4598 + }, + { + "epoch": 12.53133514986376, + "grad_norm": 8.221902847290039, + "learning_rate": 1.952730367104136e-05, + "loss": 1.0355, + "step": 4599 + }, + { + "epoch": 12.534059945504087, + "grad_norm": 8.883963584899902, + "learning_rate": 1.9527035516956368e-05, + "loss": 1.3167, + "step": 4600 + }, + { + "epoch": 12.536784741144414, + "grad_norm": 9.42188549041748, + "learning_rate": 1.9526767288675134e-05, + "loss": 1.0435, + "step": 4601 + }, + { + "epoch": 12.539509536784742, + "grad_norm": 8.609175682067871, + "learning_rate": 1.952649898619974e-05, + "loss": 1.2488, + "step": 4602 + }, + { + "epoch": 12.542234332425068, + "grad_norm": 10.529431343078613, + "learning_rate": 1.952623060953228e-05, + "loss": 1.1753, + "step": 4603 + }, + { + "epoch": 12.544959128065395, + "grad_norm": 9.760684967041016, + "learning_rate": 1.952596215867484e-05, + "loss": 1.0697, + "step": 4604 + }, + { + "epoch": 12.547683923705723, + "grad_norm": 15.903693199157715, + "learning_rate": 1.9525693633629514e-05, + "loss": 1.171, + "step": 4605 + }, + { + "epoch": 12.550408719346049, + "grad_norm": 9.444087982177734, + "learning_rate": 1.9525425034398394e-05, + "loss": 1.2163, + "step": 4606 + }, + { + "epoch": 12.553133514986376, + "grad_norm": 9.362471580505371, + "learning_rate": 1.952515636098357e-05, + "loss": 1.0851, + "step": 4607 + }, + { + "epoch": 12.555858310626704, + "grad_norm": 8.800759315490723, + "learning_rate": 1.9524887613387133e-05, + "loss": 1.126, + "step": 4608 + }, + { + "epoch": 12.55858310626703, + "grad_norm": 14.719269752502441, + "learning_rate": 1.9524618791611177e-05, + "loss": 1.1335, + "step": 4609 + }, + { + "epoch": 12.561307901907357, + "grad_norm": 9.89954662322998, + "learning_rate": 1.9524349895657798e-05, + "loss": 1.2173, + "step": 4610 + }, + { + "epoch": 12.564032697547685, + "grad_norm": 7.570556640625, + "learning_rate": 1.9524080925529093e-05, + "loss": 1.283, + "step": 4611 + }, + { + "epoch": 12.56675749318801, + "grad_norm": 11.356952667236328, + "learning_rate": 1.9523811881227147e-05, + "loss": 1.2185, + "step": 4612 + }, + { + "epoch": 12.569482288828338, + "grad_norm": 56.742427825927734, + "learning_rate": 1.952354276275406e-05, + "loss": 1.0366, + "step": 4613 + }, + { + "epoch": 12.572207084468666, + "grad_norm": 9.515989303588867, + "learning_rate": 1.952327357011193e-05, + "loss": 1.184, + "step": 4614 + }, + { + "epoch": 12.574931880108991, + "grad_norm": 16.08742904663086, + "learning_rate": 1.9523004303302854e-05, + "loss": 1.4866, + "step": 4615 + }, + { + "epoch": 12.577656675749319, + "grad_norm": 8.824570655822754, + "learning_rate": 1.9522734962328926e-05, + "loss": 1.3364, + "step": 4616 + }, + { + "epoch": 12.580381471389646, + "grad_norm": 10.563802719116211, + "learning_rate": 1.952246554719224e-05, + "loss": 1.2041, + "step": 4617 + }, + { + "epoch": 12.583106267029972, + "grad_norm": 8.585123062133789, + "learning_rate": 1.9522196057894905e-05, + "loss": 0.9529, + "step": 4618 + }, + { + "epoch": 12.5858310626703, + "grad_norm": 8.832019805908203, + "learning_rate": 1.952192649443901e-05, + "loss": 1.0126, + "step": 4619 + }, + { + "epoch": 12.588555858310627, + "grad_norm": 9.905095100402832, + "learning_rate": 1.952165685682666e-05, + "loss": 1.1479, + "step": 4620 + }, + { + "epoch": 12.591280653950953, + "grad_norm": 8.778387069702148, + "learning_rate": 1.9521387145059952e-05, + "loss": 1.2529, + "step": 4621 + }, + { + "epoch": 12.59400544959128, + "grad_norm": 13.142505645751953, + "learning_rate": 1.9521117359140985e-05, + "loss": 1.2751, + "step": 4622 + }, + { + "epoch": 12.596730245231608, + "grad_norm": 14.675884246826172, + "learning_rate": 1.952084749907187e-05, + "loss": 1.2427, + "step": 4623 + }, + { + "epoch": 12.599455040871934, + "grad_norm": 9.52199649810791, + "learning_rate": 1.9520577564854696e-05, + "loss": 1.2654, + "step": 4624 + }, + { + "epoch": 12.602179836512262, + "grad_norm": 9.89417839050293, + "learning_rate": 1.952030755649157e-05, + "loss": 1.1506, + "step": 4625 + }, + { + "epoch": 12.60490463215259, + "grad_norm": 27.12210464477539, + "learning_rate": 1.952003747398459e-05, + "loss": 1.2183, + "step": 4626 + }, + { + "epoch": 12.607629427792915, + "grad_norm": 10.320030212402344, + "learning_rate": 1.9519767317335875e-05, + "loss": 1.2805, + "step": 4627 + }, + { + "epoch": 12.610354223433243, + "grad_norm": 11.5519380569458, + "learning_rate": 1.951949708654751e-05, + "loss": 1.3403, + "step": 4628 + }, + { + "epoch": 12.61307901907357, + "grad_norm": 12.985690116882324, + "learning_rate": 1.9519226781621613e-05, + "loss": 1.228, + "step": 4629 + }, + { + "epoch": 12.615803814713896, + "grad_norm": 9.530143737792969, + "learning_rate": 1.9518956402560282e-05, + "loss": 1.1143, + "step": 4630 + }, + { + "epoch": 12.618528610354224, + "grad_norm": 10.194968223571777, + "learning_rate": 1.9518685949365626e-05, + "loss": 1.1965, + "step": 4631 + }, + { + "epoch": 12.621253405994551, + "grad_norm": 8.98924446105957, + "learning_rate": 1.951841542203975e-05, + "loss": 1.2051, + "step": 4632 + }, + { + "epoch": 12.623978201634877, + "grad_norm": 8.00615119934082, + "learning_rate": 1.9518144820584763e-05, + "loss": 0.9694, + "step": 4633 + }, + { + "epoch": 12.626702997275205, + "grad_norm": 10.693278312683105, + "learning_rate": 1.9517874145002768e-05, + "loss": 1.1099, + "step": 4634 + }, + { + "epoch": 12.629427792915532, + "grad_norm": 10.002409934997559, + "learning_rate": 1.9517603395295873e-05, + "loss": 1.2314, + "step": 4635 + }, + { + "epoch": 12.632152588555858, + "grad_norm": 11.508398056030273, + "learning_rate": 1.951733257146619e-05, + "loss": 1.2388, + "step": 4636 + }, + { + "epoch": 12.634877384196185, + "grad_norm": 9.302984237670898, + "learning_rate": 1.9517061673515832e-05, + "loss": 1.176, + "step": 4637 + }, + { + "epoch": 12.637602179836513, + "grad_norm": 9.541932106018066, + "learning_rate": 1.95167907014469e-05, + "loss": 1.0867, + "step": 4638 + }, + { + "epoch": 12.640326975476839, + "grad_norm": 8.283167839050293, + "learning_rate": 1.951651965526151e-05, + "loss": 1.0667, + "step": 4639 + }, + { + "epoch": 12.643051771117166, + "grad_norm": 9.077845573425293, + "learning_rate": 1.9516248534961773e-05, + "loss": 1.1912, + "step": 4640 + }, + { + "epoch": 12.645776566757494, + "grad_norm": 8.404955863952637, + "learning_rate": 1.9515977340549794e-05, + "loss": 1.1189, + "step": 4641 + }, + { + "epoch": 12.64850136239782, + "grad_norm": 16.992172241210938, + "learning_rate": 1.9515706072027694e-05, + "loss": 1.3352, + "step": 4642 + }, + { + "epoch": 12.651226158038147, + "grad_norm": 9.835552215576172, + "learning_rate": 1.9515434729397577e-05, + "loss": 1.1182, + "step": 4643 + }, + { + "epoch": 12.653950953678475, + "grad_norm": 16.78769302368164, + "learning_rate": 1.9515163312661563e-05, + "loss": 1.2881, + "step": 4644 + }, + { + "epoch": 12.6566757493188, + "grad_norm": 10.720549583435059, + "learning_rate": 1.9514891821821768e-05, + "loss": 1.1658, + "step": 4645 + }, + { + "epoch": 12.659400544959128, + "grad_norm": 9.843253135681152, + "learning_rate": 1.9514620256880294e-05, + "loss": 1.4648, + "step": 4646 + }, + { + "epoch": 12.662125340599456, + "grad_norm": 10.77347183227539, + "learning_rate": 1.9514348617839268e-05, + "loss": 1.1985, + "step": 4647 + }, + { + "epoch": 12.664850136239782, + "grad_norm": 12.356215476989746, + "learning_rate": 1.95140769047008e-05, + "loss": 1.2772, + "step": 4648 + }, + { + "epoch": 12.66757493188011, + "grad_norm": 9.784097671508789, + "learning_rate": 1.9513805117467007e-05, + "loss": 1.2134, + "step": 4649 + }, + { + "epoch": 12.670299727520437, + "grad_norm": 9.46358871459961, + "learning_rate": 1.9513533256140004e-05, + "loss": 0.9877, + "step": 4650 + }, + { + "epoch": 12.673024523160763, + "grad_norm": 8.930076599121094, + "learning_rate": 1.9513261320721915e-05, + "loss": 1.1536, + "step": 4651 + }, + { + "epoch": 12.67574931880109, + "grad_norm": 13.492873191833496, + "learning_rate": 1.951298931121485e-05, + "loss": 1.1965, + "step": 4652 + }, + { + "epoch": 12.678474114441418, + "grad_norm": 15.724522590637207, + "learning_rate": 1.951271722762093e-05, + "loss": 1.3823, + "step": 4653 + }, + { + "epoch": 12.681198910081743, + "grad_norm": 10.186450004577637, + "learning_rate": 1.9512445069942275e-05, + "loss": 1.2336, + "step": 4654 + }, + { + "epoch": 12.683923705722071, + "grad_norm": 9.98702621459961, + "learning_rate": 1.9512172838181005e-05, + "loss": 1.1196, + "step": 4655 + }, + { + "epoch": 12.686648501362399, + "grad_norm": 11.274605751037598, + "learning_rate": 1.9511900532339237e-05, + "loss": 1.1848, + "step": 4656 + }, + { + "epoch": 12.689373297002724, + "grad_norm": 10.36972427368164, + "learning_rate": 1.9511628152419098e-05, + "loss": 1.0969, + "step": 4657 + }, + { + "epoch": 12.692098092643052, + "grad_norm": 53.64316177368164, + "learning_rate": 1.9511355698422702e-05, + "loss": 1.2065, + "step": 4658 + }, + { + "epoch": 12.69482288828338, + "grad_norm": 8.796631813049316, + "learning_rate": 1.9511083170352173e-05, + "loss": 1.4153, + "step": 4659 + }, + { + "epoch": 12.697547683923705, + "grad_norm": 10.043909072875977, + "learning_rate": 1.9510810568209634e-05, + "loss": 0.9744, + "step": 4660 + }, + { + "epoch": 12.700272479564033, + "grad_norm": 9.707660675048828, + "learning_rate": 1.9510537891997214e-05, + "loss": 1.1343, + "step": 4661 + }, + { + "epoch": 12.70299727520436, + "grad_norm": 15.499692916870117, + "learning_rate": 1.9510265141717024e-05, + "loss": 1.1963, + "step": 4662 + }, + { + "epoch": 12.705722070844686, + "grad_norm": 9.693360328674316, + "learning_rate": 1.9509992317371196e-05, + "loss": 1.2511, + "step": 4663 + }, + { + "epoch": 12.708446866485014, + "grad_norm": 9.773543357849121, + "learning_rate": 1.9509719418961858e-05, + "loss": 1.0464, + "step": 4664 + }, + { + "epoch": 12.711171662125341, + "grad_norm": 9.990696907043457, + "learning_rate": 1.9509446446491127e-05, + "loss": 1.0648, + "step": 4665 + }, + { + "epoch": 12.713896457765667, + "grad_norm": 9.596586227416992, + "learning_rate": 1.9509173399961137e-05, + "loss": 1.2563, + "step": 4666 + }, + { + "epoch": 12.716621253405995, + "grad_norm": 13.25296688079834, + "learning_rate": 1.950890027937401e-05, + "loss": 1.1661, + "step": 4667 + }, + { + "epoch": 12.719346049046322, + "grad_norm": 8.975726127624512, + "learning_rate": 1.9508627084731872e-05, + "loss": 1.1356, + "step": 4668 + }, + { + "epoch": 12.722070844686648, + "grad_norm": 8.937646865844727, + "learning_rate": 1.9508353816036853e-05, + "loss": 1.1023, + "step": 4669 + }, + { + "epoch": 12.724795640326976, + "grad_norm": 10.015127182006836, + "learning_rate": 1.950808047329108e-05, + "loss": 1.2043, + "step": 4670 + }, + { + "epoch": 12.727520435967303, + "grad_norm": 9.980385780334473, + "learning_rate": 1.9507807056496683e-05, + "loss": 1.1761, + "step": 4671 + }, + { + "epoch": 12.730245231607629, + "grad_norm": 11.312211036682129, + "learning_rate": 1.950753356565579e-05, + "loss": 1.2368, + "step": 4672 + }, + { + "epoch": 12.732970027247957, + "grad_norm": 8.812410354614258, + "learning_rate": 1.950726000077053e-05, + "loss": 1.5366, + "step": 4673 + }, + { + "epoch": 12.735694822888284, + "grad_norm": 13.870210647583008, + "learning_rate": 1.950698636184304e-05, + "loss": 1.2469, + "step": 4674 + }, + { + "epoch": 12.73841961852861, + "grad_norm": 11.117531776428223, + "learning_rate": 1.9506712648875444e-05, + "loss": 1.3184, + "step": 4675 + }, + { + "epoch": 12.741144414168938, + "grad_norm": 21.896833419799805, + "learning_rate": 1.9506438861869875e-05, + "loss": 1.2288, + "step": 4676 + }, + { + "epoch": 12.743869209809265, + "grad_norm": 9.635631561279297, + "learning_rate": 1.9506165000828467e-05, + "loss": 1.0354, + "step": 4677 + }, + { + "epoch": 12.746594005449591, + "grad_norm": 17.402633666992188, + "learning_rate": 1.950589106575335e-05, + "loss": 1.29, + "step": 4678 + }, + { + "epoch": 12.749318801089919, + "grad_norm": 8.623910903930664, + "learning_rate": 1.9505617056646658e-05, + "loss": 1.278, + "step": 4679 + }, + { + "epoch": 12.752043596730246, + "grad_norm": 8.760870933532715, + "learning_rate": 1.950534297351053e-05, + "loss": 1.156, + "step": 4680 + }, + { + "epoch": 12.754768392370572, + "grad_norm": 8.295570373535156, + "learning_rate": 1.9505068816347095e-05, + "loss": 1.2488, + "step": 4681 + }, + { + "epoch": 12.7574931880109, + "grad_norm": 8.168697357177734, + "learning_rate": 1.9504794585158492e-05, + "loss": 0.9883, + "step": 4682 + }, + { + "epoch": 12.760217983651227, + "grad_norm": 8.455802917480469, + "learning_rate": 1.9504520279946853e-05, + "loss": 1.1169, + "step": 4683 + }, + { + "epoch": 12.762942779291553, + "grad_norm": 10.661886215209961, + "learning_rate": 1.9504245900714313e-05, + "loss": 1.2681, + "step": 4684 + }, + { + "epoch": 12.76566757493188, + "grad_norm": 7.8510284423828125, + "learning_rate": 1.9503971447463016e-05, + "loss": 1.0563, + "step": 4685 + }, + { + "epoch": 12.768392370572208, + "grad_norm": 9.176054000854492, + "learning_rate": 1.9503696920195096e-05, + "loss": 1.1731, + "step": 4686 + }, + { + "epoch": 12.771117166212534, + "grad_norm": 10.042091369628906, + "learning_rate": 1.950342231891269e-05, + "loss": 1.2781, + "step": 4687 + }, + { + "epoch": 12.773841961852861, + "grad_norm": 8.199237823486328, + "learning_rate": 1.9503147643617932e-05, + "loss": 1.1545, + "step": 4688 + }, + { + "epoch": 12.776566757493189, + "grad_norm": 11.569225311279297, + "learning_rate": 1.950287289431297e-05, + "loss": 1.3064, + "step": 4689 + }, + { + "epoch": 12.779291553133515, + "grad_norm": 10.179621696472168, + "learning_rate": 1.950259807099994e-05, + "loss": 1.0471, + "step": 4690 + }, + { + "epoch": 12.782016348773842, + "grad_norm": 9.003026008605957, + "learning_rate": 1.9502323173680983e-05, + "loss": 1.1021, + "step": 4691 + }, + { + "epoch": 12.78474114441417, + "grad_norm": 11.675942420959473, + "learning_rate": 1.9502048202358236e-05, + "loss": 1.0442, + "step": 4692 + }, + { + "epoch": 12.787465940054496, + "grad_norm": 9.208623886108398, + "learning_rate": 1.9501773157033847e-05, + "loss": 1.0453, + "step": 4693 + }, + { + "epoch": 12.790190735694823, + "grad_norm": 8.950695991516113, + "learning_rate": 1.9501498037709948e-05, + "loss": 0.9741, + "step": 4694 + }, + { + "epoch": 12.79291553133515, + "grad_norm": 10.017278671264648, + "learning_rate": 1.9501222844388696e-05, + "loss": 1.1675, + "step": 4695 + }, + { + "epoch": 12.795640326975477, + "grad_norm": 8.59681510925293, + "learning_rate": 1.950094757707222e-05, + "loss": 1.2896, + "step": 4696 + }, + { + "epoch": 12.798365122615804, + "grad_norm": 12.797869682312012, + "learning_rate": 1.950067223576267e-05, + "loss": 1.2446, + "step": 4697 + }, + { + "epoch": 12.80108991825613, + "grad_norm": 11.969429969787598, + "learning_rate": 1.9500396820462194e-05, + "loss": 1.1785, + "step": 4698 + }, + { + "epoch": 12.803814713896458, + "grad_norm": 8.822981834411621, + "learning_rate": 1.9500121331172936e-05, + "loss": 1.0251, + "step": 4699 + }, + { + "epoch": 12.806539509536785, + "grad_norm": 15.670023918151855, + "learning_rate": 1.9499845767897033e-05, + "loss": 1.4297, + "step": 4700 + }, + { + "epoch": 12.809264305177111, + "grad_norm": 8.35623836517334, + "learning_rate": 1.9499570130636638e-05, + "loss": 1.0447, + "step": 4701 + }, + { + "epoch": 12.811989100817438, + "grad_norm": 9.654727935791016, + "learning_rate": 1.9499294419393898e-05, + "loss": 1.1633, + "step": 4702 + }, + { + "epoch": 12.814713896457766, + "grad_norm": 8.043304443359375, + "learning_rate": 1.949901863417096e-05, + "loss": 1.1345, + "step": 4703 + }, + { + "epoch": 12.817438692098092, + "grad_norm": 9.322258949279785, + "learning_rate": 1.9498742774969968e-05, + "loss": 1.0305, + "step": 4704 + }, + { + "epoch": 12.82016348773842, + "grad_norm": 13.219219207763672, + "learning_rate": 1.9498466841793073e-05, + "loss": 1.3967, + "step": 4705 + }, + { + "epoch": 12.822888283378747, + "grad_norm": 10.525544166564941, + "learning_rate": 1.9498190834642426e-05, + "loss": 1.0349, + "step": 4706 + }, + { + "epoch": 12.825613079019073, + "grad_norm": 9.625303268432617, + "learning_rate": 1.9497914753520175e-05, + "loss": 1.2478, + "step": 4707 + }, + { + "epoch": 12.8283378746594, + "grad_norm": 8.864691734313965, + "learning_rate": 1.9497638598428464e-05, + "loss": 1.0991, + "step": 4708 + }, + { + "epoch": 12.831062670299728, + "grad_norm": 11.785776138305664, + "learning_rate": 1.9497362369369456e-05, + "loss": 1.1125, + "step": 4709 + }, + { + "epoch": 12.833787465940054, + "grad_norm": 9.78260326385498, + "learning_rate": 1.949708606634529e-05, + "loss": 1.4175, + "step": 4710 + }, + { + "epoch": 12.836512261580381, + "grad_norm": 18.374671936035156, + "learning_rate": 1.9496809689358127e-05, + "loss": 1.1838, + "step": 4711 + }, + { + "epoch": 12.839237057220709, + "grad_norm": 10.118465423583984, + "learning_rate": 1.9496533238410117e-05, + "loss": 1.1545, + "step": 4712 + }, + { + "epoch": 12.841961852861035, + "grad_norm": 10.40396785736084, + "learning_rate": 1.949625671350341e-05, + "loss": 1.1724, + "step": 4713 + }, + { + "epoch": 12.844686648501362, + "grad_norm": 11.841177940368652, + "learning_rate": 1.949598011464016e-05, + "loss": 1.2544, + "step": 4714 + }, + { + "epoch": 12.84741144414169, + "grad_norm": 9.664090156555176, + "learning_rate": 1.949570344182252e-05, + "loss": 1.2993, + "step": 4715 + }, + { + "epoch": 12.850136239782016, + "grad_norm": 11.260235786437988, + "learning_rate": 1.9495426695052652e-05, + "loss": 1.2002, + "step": 4716 + }, + { + "epoch": 12.852861035422343, + "grad_norm": 9.741466522216797, + "learning_rate": 1.9495149874332707e-05, + "loss": 1.0798, + "step": 4717 + }, + { + "epoch": 12.85558583106267, + "grad_norm": 12.825498580932617, + "learning_rate": 1.9494872979664838e-05, + "loss": 1.176, + "step": 4718 + }, + { + "epoch": 12.858310626702997, + "grad_norm": 14.039491653442383, + "learning_rate": 1.9494596011051205e-05, + "loss": 1.1194, + "step": 4719 + }, + { + "epoch": 12.861035422343324, + "grad_norm": 8.56617546081543, + "learning_rate": 1.9494318968493965e-05, + "loss": 1.1135, + "step": 4720 + }, + { + "epoch": 12.863760217983652, + "grad_norm": 11.367093086242676, + "learning_rate": 1.949404185199527e-05, + "loss": 1.0955, + "step": 4721 + }, + { + "epoch": 12.866485013623977, + "grad_norm": 8.225251197814941, + "learning_rate": 1.9493764661557287e-05, + "loss": 1.1096, + "step": 4722 + }, + { + "epoch": 12.869209809264305, + "grad_norm": 18.134790420532227, + "learning_rate": 1.949348739718217e-05, + "loss": 1.2549, + "step": 4723 + }, + { + "epoch": 12.871934604904633, + "grad_norm": 14.881370544433594, + "learning_rate": 1.9493210058872075e-05, + "loss": 1.401, + "step": 4724 + }, + { + "epoch": 12.874659400544958, + "grad_norm": 10.585454940795898, + "learning_rate": 1.949293264662917e-05, + "loss": 1.0671, + "step": 4725 + }, + { + "epoch": 12.877384196185286, + "grad_norm": 11.371530532836914, + "learning_rate": 1.9492655160455607e-05, + "loss": 1.0669, + "step": 4726 + }, + { + "epoch": 12.880108991825614, + "grad_norm": 11.10936164855957, + "learning_rate": 1.9492377600353555e-05, + "loss": 1.1472, + "step": 4727 + }, + { + "epoch": 12.88283378746594, + "grad_norm": 10.045562744140625, + "learning_rate": 1.9492099966325168e-05, + "loss": 1.0927, + "step": 4728 + }, + { + "epoch": 12.885558583106267, + "grad_norm": 9.858827590942383, + "learning_rate": 1.9491822258372614e-05, + "loss": 1.1929, + "step": 4729 + }, + { + "epoch": 12.888283378746594, + "grad_norm": 12.741924285888672, + "learning_rate": 1.9491544476498054e-05, + "loss": 1.2134, + "step": 4730 + }, + { + "epoch": 12.89100817438692, + "grad_norm": 9.4379243850708, + "learning_rate": 1.949126662070365e-05, + "loss": 1.0623, + "step": 4731 + }, + { + "epoch": 12.893732970027248, + "grad_norm": 12.204022407531738, + "learning_rate": 1.949098869099157e-05, + "loss": 1.3323, + "step": 4732 + }, + { + "epoch": 12.896457765667575, + "grad_norm": 10.362288475036621, + "learning_rate": 1.949071068736397e-05, + "loss": 1.2102, + "step": 4733 + }, + { + "epoch": 12.899182561307901, + "grad_norm": 22.170654296875, + "learning_rate": 1.9490432609823027e-05, + "loss": 1.1755, + "step": 4734 + }, + { + "epoch": 12.901907356948229, + "grad_norm": 12.023188591003418, + "learning_rate": 1.94901544583709e-05, + "loss": 1.1824, + "step": 4735 + }, + { + "epoch": 12.904632152588556, + "grad_norm": 11.377690315246582, + "learning_rate": 1.9489876233009747e-05, + "loss": 1.4109, + "step": 4736 + }, + { + "epoch": 12.907356948228882, + "grad_norm": 17.193017959594727, + "learning_rate": 1.9489597933741754e-05, + "loss": 1.1846, + "step": 4737 + }, + { + "epoch": 12.91008174386921, + "grad_norm": 17.572160720825195, + "learning_rate": 1.948931956056907e-05, + "loss": 1.2808, + "step": 4738 + }, + { + "epoch": 12.912806539509537, + "grad_norm": 10.966382026672363, + "learning_rate": 1.9489041113493875e-05, + "loss": 1.2979, + "step": 4739 + }, + { + "epoch": 12.915531335149863, + "grad_norm": 12.861130714416504, + "learning_rate": 1.9488762592518332e-05, + "loss": 1.0878, + "step": 4740 + }, + { + "epoch": 12.91825613079019, + "grad_norm": 12.99240493774414, + "learning_rate": 1.9488483997644613e-05, + "loss": 1.1365, + "step": 4741 + }, + { + "epoch": 12.920980926430518, + "grad_norm": 15.539706230163574, + "learning_rate": 1.948820532887488e-05, + "loss": 1.2317, + "step": 4742 + }, + { + "epoch": 12.923705722070844, + "grad_norm": 10.954058647155762, + "learning_rate": 1.9487926586211314e-05, + "loss": 1.1658, + "step": 4743 + }, + { + "epoch": 12.926430517711172, + "grad_norm": 9.134175300598145, + "learning_rate": 1.9487647769656082e-05, + "loss": 1.3232, + "step": 4744 + }, + { + "epoch": 12.9291553133515, + "grad_norm": 10.19599437713623, + "learning_rate": 1.948736887921135e-05, + "loss": 1.1957, + "step": 4745 + }, + { + "epoch": 12.931880108991825, + "grad_norm": 9.151069641113281, + "learning_rate": 1.94870899148793e-05, + "loss": 1.2957, + "step": 4746 + }, + { + "epoch": 12.934604904632153, + "grad_norm": 10.090906143188477, + "learning_rate": 1.9486810876662097e-05, + "loss": 1.1069, + "step": 4747 + }, + { + "epoch": 12.93732970027248, + "grad_norm": 14.232126235961914, + "learning_rate": 1.9486531764561915e-05, + "loss": 1.2755, + "step": 4748 + }, + { + "epoch": 12.940054495912806, + "grad_norm": 12.848154067993164, + "learning_rate": 1.948625257858093e-05, + "loss": 1.1897, + "step": 4749 + }, + { + "epoch": 12.942779291553133, + "grad_norm": 10.731879234313965, + "learning_rate": 1.9485973318721316e-05, + "loss": 1.1263, + "step": 4750 + }, + { + "epoch": 12.945504087193461, + "grad_norm": 8.240216255187988, + "learning_rate": 1.9485693984985246e-05, + "loss": 1.1028, + "step": 4751 + }, + { + "epoch": 12.948228882833787, + "grad_norm": 7.984894752502441, + "learning_rate": 1.9485414577374896e-05, + "loss": 1.0601, + "step": 4752 + }, + { + "epoch": 12.950953678474114, + "grad_norm": 19.504682540893555, + "learning_rate": 1.9485135095892444e-05, + "loss": 1.1667, + "step": 4753 + }, + { + "epoch": 12.953678474114442, + "grad_norm": 12.880973815917969, + "learning_rate": 1.9484855540540063e-05, + "loss": 1.1313, + "step": 4754 + }, + { + "epoch": 12.956403269754768, + "grad_norm": 14.527582168579102, + "learning_rate": 1.9484575911319934e-05, + "loss": 1.2534, + "step": 4755 + }, + { + "epoch": 12.959128065395095, + "grad_norm": 12.558151245117188, + "learning_rate": 1.9484296208234232e-05, + "loss": 1.4653, + "step": 4756 + }, + { + "epoch": 12.961852861035423, + "grad_norm": 16.638273239135742, + "learning_rate": 1.9484016431285137e-05, + "loss": 1.2145, + "step": 4757 + }, + { + "epoch": 12.964577656675749, + "grad_norm": 11.54865550994873, + "learning_rate": 1.948373658047483e-05, + "loss": 1.1606, + "step": 4758 + }, + { + "epoch": 12.967302452316076, + "grad_norm": 28.242734909057617, + "learning_rate": 1.9483456655805485e-05, + "loss": 1.3115, + "step": 4759 + }, + { + "epoch": 12.970027247956404, + "grad_norm": 13.323819160461426, + "learning_rate": 1.9483176657279282e-05, + "loss": 1.4126, + "step": 4760 + }, + { + "epoch": 12.97275204359673, + "grad_norm": 14.263542175292969, + "learning_rate": 1.948289658489841e-05, + "loss": 1.2168, + "step": 4761 + }, + { + "epoch": 12.975476839237057, + "grad_norm": 11.75001335144043, + "learning_rate": 1.9482616438665037e-05, + "loss": 1.4028, + "step": 4762 + }, + { + "epoch": 12.978201634877385, + "grad_norm": 12.625207901000977, + "learning_rate": 1.9482336218581358e-05, + "loss": 1.2711, + "step": 4763 + }, + { + "epoch": 12.98092643051771, + "grad_norm": 12.272146224975586, + "learning_rate": 1.9482055924649552e-05, + "loss": 1.2874, + "step": 4764 + }, + { + "epoch": 12.983651226158038, + "grad_norm": 13.786018371582031, + "learning_rate": 1.9481775556871795e-05, + "loss": 1.2549, + "step": 4765 + }, + { + "epoch": 12.986376021798366, + "grad_norm": 10.136306762695312, + "learning_rate": 1.9481495115250277e-05, + "loss": 1.1978, + "step": 4766 + }, + { + "epoch": 12.989100817438691, + "grad_norm": 10.84641170501709, + "learning_rate": 1.9481214599787178e-05, + "loss": 1.2397, + "step": 4767 + }, + { + "epoch": 12.991825613079019, + "grad_norm": 10.182979583740234, + "learning_rate": 1.948093401048469e-05, + "loss": 1.1631, + "step": 4768 + }, + { + "epoch": 12.994550408719347, + "grad_norm": 9.386366844177246, + "learning_rate": 1.9480653347344992e-05, + "loss": 1.2756, + "step": 4769 + }, + { + "epoch": 12.997275204359672, + "grad_norm": 10.589299201965332, + "learning_rate": 1.9480372610370265e-05, + "loss": 0.9358, + "step": 4770 + }, + { + "epoch": 13.0, + "grad_norm": 9.844215393066406, + "learning_rate": 1.9480091799562706e-05, + "loss": 1.0752, + "step": 4771 + }, + { + "epoch": 13.002724795640328, + "grad_norm": 7.666797637939453, + "learning_rate": 1.9479810914924498e-05, + "loss": 0.9545, + "step": 4772 + }, + { + "epoch": 13.005449591280653, + "grad_norm": 7.6852946281433105, + "learning_rate": 1.9479529956457825e-05, + "loss": 1.082, + "step": 4773 + }, + { + "epoch": 13.008174386920981, + "grad_norm": 12.821184158325195, + "learning_rate": 1.9479248924164878e-05, + "loss": 1.1492, + "step": 4774 + }, + { + "epoch": 13.010899182561309, + "grad_norm": 8.613661766052246, + "learning_rate": 1.9478967818047846e-05, + "loss": 1.1296, + "step": 4775 + }, + { + "epoch": 13.013623978201634, + "grad_norm": 9.4019136428833, + "learning_rate": 1.947868663810892e-05, + "loss": 1.0706, + "step": 4776 + }, + { + "epoch": 13.016348773841962, + "grad_norm": 11.372208595275879, + "learning_rate": 1.9478405384350283e-05, + "loss": 0.9995, + "step": 4777 + }, + { + "epoch": 13.01907356948229, + "grad_norm": 8.624147415161133, + "learning_rate": 1.9478124056774133e-05, + "loss": 1.0875, + "step": 4778 + }, + { + "epoch": 13.021798365122615, + "grad_norm": 10.279169082641602, + "learning_rate": 1.9477842655382656e-05, + "loss": 1.126, + "step": 4779 + }, + { + "epoch": 13.024523160762943, + "grad_norm": 10.575634002685547, + "learning_rate": 1.9477561180178048e-05, + "loss": 1.1987, + "step": 4780 + }, + { + "epoch": 13.02724795640327, + "grad_norm": 11.488377571105957, + "learning_rate": 1.9477279631162494e-05, + "loss": 1.0762, + "step": 4781 + }, + { + "epoch": 13.029972752043596, + "grad_norm": 10.141093254089355, + "learning_rate": 1.9476998008338197e-05, + "loss": 1.0608, + "step": 4782 + }, + { + "epoch": 13.032697547683924, + "grad_norm": 9.139327049255371, + "learning_rate": 1.9476716311707342e-05, + "loss": 1.238, + "step": 4783 + }, + { + "epoch": 13.035422343324251, + "grad_norm": 8.857711791992188, + "learning_rate": 1.9476434541272127e-05, + "loss": 1.1503, + "step": 4784 + }, + { + "epoch": 13.038147138964577, + "grad_norm": 10.265288352966309, + "learning_rate": 1.9476152697034743e-05, + "loss": 1.0933, + "step": 4785 + }, + { + "epoch": 13.040871934604905, + "grad_norm": 9.10065746307373, + "learning_rate": 1.9475870778997386e-05, + "loss": 1.1567, + "step": 4786 + }, + { + "epoch": 13.043596730245232, + "grad_norm": 7.665113925933838, + "learning_rate": 1.947558878716225e-05, + "loss": 1.103, + "step": 4787 + }, + { + "epoch": 13.046321525885558, + "grad_norm": 8.798256874084473, + "learning_rate": 1.947530672153154e-05, + "loss": 1.1296, + "step": 4788 + }, + { + "epoch": 13.049046321525886, + "grad_norm": 8.013124465942383, + "learning_rate": 1.9475024582107443e-05, + "loss": 1.1741, + "step": 4789 + }, + { + "epoch": 13.051771117166213, + "grad_norm": 8.364792823791504, + "learning_rate": 1.9474742368892162e-05, + "loss": 1.1431, + "step": 4790 + }, + { + "epoch": 13.054495912806539, + "grad_norm": 7.662590026855469, + "learning_rate": 1.9474460081887888e-05, + "loss": 1.2012, + "step": 4791 + }, + { + "epoch": 13.057220708446867, + "grad_norm": 9.507669448852539, + "learning_rate": 1.9474177721096825e-05, + "loss": 1.1265, + "step": 4792 + }, + { + "epoch": 13.059945504087194, + "grad_norm": 10.31091594696045, + "learning_rate": 1.9473895286521173e-05, + "loss": 0.9613, + "step": 4793 + }, + { + "epoch": 13.06267029972752, + "grad_norm": 7.168553352355957, + "learning_rate": 1.9473612778163126e-05, + "loss": 0.9987, + "step": 4794 + }, + { + "epoch": 13.065395095367847, + "grad_norm": 9.055052757263184, + "learning_rate": 1.9473330196024892e-05, + "loss": 1.1428, + "step": 4795 + }, + { + "epoch": 13.068119891008175, + "grad_norm": 8.657708168029785, + "learning_rate": 1.947304754010866e-05, + "loss": 1.0333, + "step": 4796 + }, + { + "epoch": 13.0708446866485, + "grad_norm": 8.923104286193848, + "learning_rate": 1.9472764810416647e-05, + "loss": 1.1104, + "step": 4797 + }, + { + "epoch": 13.073569482288828, + "grad_norm": 7.689241886138916, + "learning_rate": 1.9472482006951045e-05, + "loss": 1.0107, + "step": 4798 + }, + { + "epoch": 13.076294277929156, + "grad_norm": 8.09443473815918, + "learning_rate": 1.9472199129714053e-05, + "loss": 0.9927, + "step": 4799 + }, + { + "epoch": 13.079019073569482, + "grad_norm": 9.916367530822754, + "learning_rate": 1.947191617870788e-05, + "loss": 1.1208, + "step": 4800 + }, + { + "epoch": 13.08174386920981, + "grad_norm": 7.7582106590271, + "learning_rate": 1.9471633153934735e-05, + "loss": 1.0, + "step": 4801 + }, + { + "epoch": 13.084468664850137, + "grad_norm": 8.89434814453125, + "learning_rate": 1.9471350055396813e-05, + "loss": 1.0178, + "step": 4802 + }, + { + "epoch": 13.087193460490463, + "grad_norm": 10.418031692504883, + "learning_rate": 1.9471066883096318e-05, + "loss": 1.1067, + "step": 4803 + }, + { + "epoch": 13.08991825613079, + "grad_norm": 8.61137866973877, + "learning_rate": 1.947078363703546e-05, + "loss": 1.058, + "step": 4804 + }, + { + "epoch": 13.092643051771118, + "grad_norm": 8.120413780212402, + "learning_rate": 1.9470500317216447e-05, + "loss": 1.09, + "step": 4805 + }, + { + "epoch": 13.095367847411444, + "grad_norm": 8.580293655395508, + "learning_rate": 1.947021692364148e-05, + "loss": 1.0365, + "step": 4806 + }, + { + "epoch": 13.098092643051771, + "grad_norm": 11.327431678771973, + "learning_rate": 1.9469933456312768e-05, + "loss": 1.1143, + "step": 4807 + }, + { + "epoch": 13.100817438692099, + "grad_norm": 8.277037620544434, + "learning_rate": 1.946964991523252e-05, + "loss": 1.1616, + "step": 4808 + }, + { + "epoch": 13.103542234332425, + "grad_norm": 16.122602462768555, + "learning_rate": 1.9469366300402943e-05, + "loss": 0.9401, + "step": 4809 + }, + { + "epoch": 13.106267029972752, + "grad_norm": 11.935078620910645, + "learning_rate": 1.9469082611826247e-05, + "loss": 1.2131, + "step": 4810 + }, + { + "epoch": 13.10899182561308, + "grad_norm": 9.547844886779785, + "learning_rate": 1.9468798849504637e-05, + "loss": 1.1139, + "step": 4811 + }, + { + "epoch": 13.111716621253406, + "grad_norm": 8.435270309448242, + "learning_rate": 1.946851501344033e-05, + "loss": 1.1428, + "step": 4812 + }, + { + "epoch": 13.114441416893733, + "grad_norm": 11.99997329711914, + "learning_rate": 1.946823110363553e-05, + "loss": 1.0203, + "step": 4813 + }, + { + "epoch": 13.11716621253406, + "grad_norm": 10.833842277526855, + "learning_rate": 1.9467947120092456e-05, + "loss": 1.2686, + "step": 4814 + }, + { + "epoch": 13.119891008174386, + "grad_norm": 10.036761283874512, + "learning_rate": 1.946766306281331e-05, + "loss": 1.2429, + "step": 4815 + }, + { + "epoch": 13.122615803814714, + "grad_norm": 12.2543306350708, + "learning_rate": 1.9467378931800307e-05, + "loss": 1.2078, + "step": 4816 + }, + { + "epoch": 13.125340599455042, + "grad_norm": 11.304621696472168, + "learning_rate": 1.9467094727055666e-05, + "loss": 1.0267, + "step": 4817 + }, + { + "epoch": 13.128065395095367, + "grad_norm": 7.782921314239502, + "learning_rate": 1.9466810448581593e-05, + "loss": 1.2629, + "step": 4818 + }, + { + "epoch": 13.130790190735695, + "grad_norm": 10.114357948303223, + "learning_rate": 1.9466526096380306e-05, + "loss": 1.1245, + "step": 4819 + }, + { + "epoch": 13.133514986376023, + "grad_norm": 12.20517349243164, + "learning_rate": 1.946624167045402e-05, + "loss": 1.1082, + "step": 4820 + }, + { + "epoch": 13.136239782016348, + "grad_norm": 7.676155090332031, + "learning_rate": 1.9465957170804945e-05, + "loss": 0.9092, + "step": 4821 + }, + { + "epoch": 13.138964577656676, + "grad_norm": 17.275049209594727, + "learning_rate": 1.9465672597435305e-05, + "loss": 1.0386, + "step": 4822 + }, + { + "epoch": 13.141689373297003, + "grad_norm": 9.47167682647705, + "learning_rate": 1.946538795034731e-05, + "loss": 1.1665, + "step": 4823 + }, + { + "epoch": 13.14441416893733, + "grad_norm": 10.40883731842041, + "learning_rate": 1.9465103229543177e-05, + "loss": 0.9478, + "step": 4824 + }, + { + "epoch": 13.147138964577657, + "grad_norm": 8.743013381958008, + "learning_rate": 1.9464818435025123e-05, + "loss": 1.0924, + "step": 4825 + }, + { + "epoch": 13.149863760217984, + "grad_norm": 9.411235809326172, + "learning_rate": 1.946453356679537e-05, + "loss": 1.4094, + "step": 4826 + }, + { + "epoch": 13.15258855585831, + "grad_norm": 7.757769584655762, + "learning_rate": 1.946424862485613e-05, + "loss": 1.0376, + "step": 4827 + }, + { + "epoch": 13.155313351498638, + "grad_norm": 11.2542142868042, + "learning_rate": 1.9463963609209634e-05, + "loss": 1.0562, + "step": 4828 + }, + { + "epoch": 13.158038147138965, + "grad_norm": 18.28806495666504, + "learning_rate": 1.946367851985809e-05, + "loss": 1.0532, + "step": 4829 + }, + { + "epoch": 13.160762942779291, + "grad_norm": 10.936038970947266, + "learning_rate": 1.946339335680372e-05, + "loss": 1.187, + "step": 4830 + }, + { + "epoch": 13.163487738419619, + "grad_norm": 9.41383171081543, + "learning_rate": 1.946310812004875e-05, + "loss": 1.1675, + "step": 4831 + }, + { + "epoch": 13.166212534059946, + "grad_norm": 8.845934867858887, + "learning_rate": 1.94628228095954e-05, + "loss": 1.0764, + "step": 4832 + }, + { + "epoch": 13.168937329700272, + "grad_norm": 8.47250747680664, + "learning_rate": 1.9462537425445886e-05, + "loss": 1.2778, + "step": 4833 + }, + { + "epoch": 13.1716621253406, + "grad_norm": 7.736001014709473, + "learning_rate": 1.946225196760244e-05, + "loss": 1.1509, + "step": 4834 + }, + { + "epoch": 13.174386920980927, + "grad_norm": 10.229379653930664, + "learning_rate": 1.9461966436067277e-05, + "loss": 1.1388, + "step": 4835 + }, + { + "epoch": 13.177111716621253, + "grad_norm": 7.262877941131592, + "learning_rate": 1.9461680830842623e-05, + "loss": 1.1038, + "step": 4836 + }, + { + "epoch": 13.17983651226158, + "grad_norm": 12.27935791015625, + "learning_rate": 1.9461395151930707e-05, + "loss": 1.2803, + "step": 4837 + }, + { + "epoch": 13.182561307901908, + "grad_norm": 9.038432121276855, + "learning_rate": 1.9461109399333748e-05, + "loss": 1.2936, + "step": 4838 + }, + { + "epoch": 13.185286103542234, + "grad_norm": 13.52312183380127, + "learning_rate": 1.9460823573053972e-05, + "loss": 1.2933, + "step": 4839 + }, + { + "epoch": 13.188010899182562, + "grad_norm": 10.074718475341797, + "learning_rate": 1.946053767309361e-05, + "loss": 1.0635, + "step": 4840 + }, + { + "epoch": 13.190735694822889, + "grad_norm": 8.525565147399902, + "learning_rate": 1.946025169945488e-05, + "loss": 1.052, + "step": 4841 + }, + { + "epoch": 13.193460490463215, + "grad_norm": 8.379159927368164, + "learning_rate": 1.945996565214002e-05, + "loss": 1.0662, + "step": 4842 + }, + { + "epoch": 13.196185286103542, + "grad_norm": 7.827342987060547, + "learning_rate": 1.9459679531151246e-05, + "loss": 1.02, + "step": 4843 + }, + { + "epoch": 13.19891008174387, + "grad_norm": 9.321455001831055, + "learning_rate": 1.9459393336490797e-05, + "loss": 1.0466, + "step": 4844 + }, + { + "epoch": 13.201634877384196, + "grad_norm": 8.47685432434082, + "learning_rate": 1.9459107068160898e-05, + "loss": 1.0537, + "step": 4845 + }, + { + "epoch": 13.204359673024523, + "grad_norm": 10.115507125854492, + "learning_rate": 1.9458820726163774e-05, + "loss": 1.1064, + "step": 4846 + }, + { + "epoch": 13.207084468664851, + "grad_norm": 9.728424072265625, + "learning_rate": 1.945853431050166e-05, + "loss": 1.0018, + "step": 4847 + }, + { + "epoch": 13.209809264305177, + "grad_norm": 8.614083290100098, + "learning_rate": 1.9458247821176787e-05, + "loss": 0.9924, + "step": 4848 + }, + { + "epoch": 13.212534059945504, + "grad_norm": 10.828216552734375, + "learning_rate": 1.945796125819138e-05, + "loss": 1.1628, + "step": 4849 + }, + { + "epoch": 13.215258855585832, + "grad_norm": 7.806414604187012, + "learning_rate": 1.9457674621547678e-05, + "loss": 1.1448, + "step": 4850 + }, + { + "epoch": 13.217983651226158, + "grad_norm": 10.824487686157227, + "learning_rate": 1.945738791124791e-05, + "loss": 1.1963, + "step": 4851 + }, + { + "epoch": 13.220708446866485, + "grad_norm": 9.565332412719727, + "learning_rate": 1.945710112729431e-05, + "loss": 1.0291, + "step": 4852 + }, + { + "epoch": 13.223433242506813, + "grad_norm": 9.20203685760498, + "learning_rate": 1.9456814269689112e-05, + "loss": 1.2798, + "step": 4853 + }, + { + "epoch": 13.226158038147139, + "grad_norm": 14.028481483459473, + "learning_rate": 1.9456527338434545e-05, + "loss": 1.0686, + "step": 4854 + }, + { + "epoch": 13.228882833787466, + "grad_norm": 8.253077507019043, + "learning_rate": 1.945624033353285e-05, + "loss": 1.2712, + "step": 4855 + }, + { + "epoch": 13.231607629427794, + "grad_norm": 12.524160385131836, + "learning_rate": 1.945595325498626e-05, + "loss": 1.1675, + "step": 4856 + }, + { + "epoch": 13.23433242506812, + "grad_norm": 9.643004417419434, + "learning_rate": 1.9455666102797007e-05, + "loss": 1.1772, + "step": 4857 + }, + { + "epoch": 13.237057220708447, + "grad_norm": 9.738412857055664, + "learning_rate": 1.9455378876967335e-05, + "loss": 1.032, + "step": 4858 + }, + { + "epoch": 13.239782016348773, + "grad_norm": 8.651823043823242, + "learning_rate": 1.9455091577499476e-05, + "loss": 1.1724, + "step": 4859 + }, + { + "epoch": 13.2425068119891, + "grad_norm": 11.075654029846191, + "learning_rate": 1.9454804204395667e-05, + "loss": 1.0635, + "step": 4860 + }, + { + "epoch": 13.245231607629428, + "grad_norm": 12.856353759765625, + "learning_rate": 1.9454516757658142e-05, + "loss": 1.1277, + "step": 4861 + }, + { + "epoch": 13.247956403269754, + "grad_norm": 8.579092979431152, + "learning_rate": 1.9454229237289152e-05, + "loss": 1.0472, + "step": 4862 + }, + { + "epoch": 13.250681198910081, + "grad_norm": 10.595727920532227, + "learning_rate": 1.9453941643290928e-05, + "loss": 1.1139, + "step": 4863 + }, + { + "epoch": 13.253405994550409, + "grad_norm": 11.85381031036377, + "learning_rate": 1.945365397566571e-05, + "loss": 1.0942, + "step": 4864 + }, + { + "epoch": 13.256130790190735, + "grad_norm": 14.746014595031738, + "learning_rate": 1.9453366234415737e-05, + "loss": 1.1694, + "step": 4865 + }, + { + "epoch": 13.258855585831062, + "grad_norm": 8.3314847946167, + "learning_rate": 1.9453078419543257e-05, + "loss": 0.9364, + "step": 4866 + }, + { + "epoch": 13.26158038147139, + "grad_norm": 10.424186706542969, + "learning_rate": 1.9452790531050502e-05, + "loss": 1.1519, + "step": 4867 + }, + { + "epoch": 13.264305177111716, + "grad_norm": 10.4879732131958, + "learning_rate": 1.945250256893972e-05, + "loss": 1.062, + "step": 4868 + }, + { + "epoch": 13.267029972752043, + "grad_norm": 9.179813385009766, + "learning_rate": 1.945221453321315e-05, + "loss": 1.2612, + "step": 4869 + }, + { + "epoch": 13.269754768392371, + "grad_norm": 11.862262725830078, + "learning_rate": 1.945192642387304e-05, + "loss": 1.2861, + "step": 4870 + }, + { + "epoch": 13.272479564032697, + "grad_norm": 15.201726913452148, + "learning_rate": 1.945163824092163e-05, + "loss": 1.2764, + "step": 4871 + }, + { + "epoch": 13.275204359673024, + "grad_norm": 9.373326301574707, + "learning_rate": 1.9451349984361168e-05, + "loss": 1.1027, + "step": 4872 + }, + { + "epoch": 13.277929155313352, + "grad_norm": 9.788365364074707, + "learning_rate": 1.9451061654193893e-05, + "loss": 1.0702, + "step": 4873 + }, + { + "epoch": 13.280653950953678, + "grad_norm": 10.5549955368042, + "learning_rate": 1.9450773250422058e-05, + "loss": 1.0361, + "step": 4874 + }, + { + "epoch": 13.283378746594005, + "grad_norm": 16.18577003479004, + "learning_rate": 1.9450484773047905e-05, + "loss": 0.9915, + "step": 4875 + }, + { + "epoch": 13.286103542234333, + "grad_norm": 9.295065879821777, + "learning_rate": 1.9450196222073676e-05, + "loss": 1.0227, + "step": 4876 + }, + { + "epoch": 13.288828337874659, + "grad_norm": 9.181978225708008, + "learning_rate": 1.9449907597501626e-05, + "loss": 1.218, + "step": 4877 + }, + { + "epoch": 13.291553133514986, + "grad_norm": 8.142616271972656, + "learning_rate": 1.9449618899334e-05, + "loss": 0.8522, + "step": 4878 + }, + { + "epoch": 13.294277929155314, + "grad_norm": 11.572206497192383, + "learning_rate": 1.9449330127573044e-05, + "loss": 1.0811, + "step": 4879 + }, + { + "epoch": 13.29700272479564, + "grad_norm": 9.058589935302734, + "learning_rate": 1.9449041282221012e-05, + "loss": 1.0762, + "step": 4880 + }, + { + "epoch": 13.299727520435967, + "grad_norm": 11.395737648010254, + "learning_rate": 1.9448752363280147e-05, + "loss": 1.343, + "step": 4881 + }, + { + "epoch": 13.302452316076295, + "grad_norm": 10.529814720153809, + "learning_rate": 1.9448463370752705e-05, + "loss": 0.9668, + "step": 4882 + }, + { + "epoch": 13.30517711171662, + "grad_norm": 7.888298034667969, + "learning_rate": 1.9448174304640936e-05, + "loss": 0.9543, + "step": 4883 + }, + { + "epoch": 13.307901907356948, + "grad_norm": 9.759827613830566, + "learning_rate": 1.944788516494709e-05, + "loss": 1.3025, + "step": 4884 + }, + { + "epoch": 13.310626702997276, + "grad_norm": 11.753057479858398, + "learning_rate": 1.9447595951673415e-05, + "loss": 1.0895, + "step": 4885 + }, + { + "epoch": 13.313351498637601, + "grad_norm": 10.756237983703613, + "learning_rate": 1.9447306664822166e-05, + "loss": 1.1907, + "step": 4886 + }, + { + "epoch": 13.316076294277929, + "grad_norm": 9.583301544189453, + "learning_rate": 1.94470173043956e-05, + "loss": 1.1617, + "step": 4887 + }, + { + "epoch": 13.318801089918257, + "grad_norm": 8.751459121704102, + "learning_rate": 1.9446727870395964e-05, + "loss": 0.9995, + "step": 4888 + }, + { + "epoch": 13.321525885558582, + "grad_norm": 12.962774276733398, + "learning_rate": 1.944643836282552e-05, + "loss": 1.1714, + "step": 4889 + }, + { + "epoch": 13.32425068119891, + "grad_norm": 9.904338836669922, + "learning_rate": 1.9446148781686515e-05, + "loss": 1.114, + "step": 4890 + }, + { + "epoch": 13.326975476839237, + "grad_norm": 8.514065742492676, + "learning_rate": 1.9445859126981207e-05, + "loss": 0.9292, + "step": 4891 + }, + { + "epoch": 13.329700272479563, + "grad_norm": 13.031332969665527, + "learning_rate": 1.9445569398711853e-05, + "loss": 1.1843, + "step": 4892 + }, + { + "epoch": 13.33242506811989, + "grad_norm": 8.385294914245605, + "learning_rate": 1.944527959688071e-05, + "loss": 1.3203, + "step": 4893 + }, + { + "epoch": 13.335149863760218, + "grad_norm": 10.21648120880127, + "learning_rate": 1.9444989721490034e-05, + "loss": 1.2075, + "step": 4894 + }, + { + "epoch": 13.337874659400544, + "grad_norm": 9.46163272857666, + "learning_rate": 1.9444699772542076e-05, + "loss": 1.0375, + "step": 4895 + }, + { + "epoch": 13.340599455040872, + "grad_norm": 7.836633205413818, + "learning_rate": 1.9444409750039107e-05, + "loss": 0.8973, + "step": 4896 + }, + { + "epoch": 13.3433242506812, + "grad_norm": 9.458667755126953, + "learning_rate": 1.9444119653983376e-05, + "loss": 1.175, + "step": 4897 + }, + { + "epoch": 13.346049046321525, + "grad_norm": 10.297599792480469, + "learning_rate": 1.9443829484377147e-05, + "loss": 1.1794, + "step": 4898 + }, + { + "epoch": 13.348773841961853, + "grad_norm": 8.998893737792969, + "learning_rate": 1.9443539241222672e-05, + "loss": 1.0908, + "step": 4899 + }, + { + "epoch": 13.35149863760218, + "grad_norm": 9.326870918273926, + "learning_rate": 1.9443248924522223e-05, + "loss": 0.962, + "step": 4900 + }, + { + "epoch": 13.354223433242506, + "grad_norm": 14.722137451171875, + "learning_rate": 1.9442958534278054e-05, + "loss": 1.2463, + "step": 4901 + }, + { + "epoch": 13.356948228882834, + "grad_norm": 11.660216331481934, + "learning_rate": 1.944266807049243e-05, + "loss": 1.0574, + "step": 4902 + }, + { + "epoch": 13.359673024523161, + "grad_norm": 9.365885734558105, + "learning_rate": 1.944237753316761e-05, + "loss": 1.0701, + "step": 4903 + }, + { + "epoch": 13.362397820163487, + "grad_norm": 10.935153007507324, + "learning_rate": 1.944208692230585e-05, + "loss": 1.0439, + "step": 4904 + }, + { + "epoch": 13.365122615803815, + "grad_norm": 8.973504066467285, + "learning_rate": 1.944179623790943e-05, + "loss": 0.9796, + "step": 4905 + }, + { + "epoch": 13.367847411444142, + "grad_norm": 12.400835037231445, + "learning_rate": 1.9441505479980602e-05, + "loss": 1.0642, + "step": 4906 + }, + { + "epoch": 13.370572207084468, + "grad_norm": 16.130796432495117, + "learning_rate": 1.9441214648521633e-05, + "loss": 1.3103, + "step": 4907 + }, + { + "epoch": 13.373297002724795, + "grad_norm": 10.828619003295898, + "learning_rate": 1.944092374353479e-05, + "loss": 1.0986, + "step": 4908 + }, + { + "epoch": 13.376021798365123, + "grad_norm": 10.00255012512207, + "learning_rate": 1.9440632765022332e-05, + "loss": 0.9907, + "step": 4909 + }, + { + "epoch": 13.378746594005449, + "grad_norm": 9.481042861938477, + "learning_rate": 1.9440341712986534e-05, + "loss": 1.1254, + "step": 4910 + }, + { + "epoch": 13.381471389645776, + "grad_norm": 9.945815086364746, + "learning_rate": 1.944005058742966e-05, + "loss": 1.1763, + "step": 4911 + }, + { + "epoch": 13.384196185286104, + "grad_norm": 12.883193969726562, + "learning_rate": 1.9439759388353972e-05, + "loss": 1.0884, + "step": 4912 + }, + { + "epoch": 13.38692098092643, + "grad_norm": 13.921396255493164, + "learning_rate": 1.9439468115761745e-05, + "loss": 1.2479, + "step": 4913 + }, + { + "epoch": 13.389645776566757, + "grad_norm": 8.882813453674316, + "learning_rate": 1.943917676965524e-05, + "loss": 1.1646, + "step": 4914 + }, + { + "epoch": 13.392370572207085, + "grad_norm": 12.870677947998047, + "learning_rate": 1.9438885350036735e-05, + "loss": 1.4008, + "step": 4915 + }, + { + "epoch": 13.39509536784741, + "grad_norm": 8.222795486450195, + "learning_rate": 1.943859385690849e-05, + "loss": 0.9674, + "step": 4916 + }, + { + "epoch": 13.397820163487738, + "grad_norm": 9.917922973632812, + "learning_rate": 1.9438302290272782e-05, + "loss": 1.0837, + "step": 4917 + }, + { + "epoch": 13.400544959128066, + "grad_norm": 13.1954927444458, + "learning_rate": 1.943801065013188e-05, + "loss": 1.3821, + "step": 4918 + }, + { + "epoch": 13.403269754768392, + "grad_norm": 8.951169967651367, + "learning_rate": 1.9437718936488054e-05, + "loss": 1.1001, + "step": 4919 + }, + { + "epoch": 13.40599455040872, + "grad_norm": 14.295671463012695, + "learning_rate": 1.9437427149343576e-05, + "loss": 1.103, + "step": 4920 + }, + { + "epoch": 13.408719346049047, + "grad_norm": 23.772388458251953, + "learning_rate": 1.943713528870072e-05, + "loss": 1.1239, + "step": 4921 + }, + { + "epoch": 13.411444141689373, + "grad_norm": 20.6263484954834, + "learning_rate": 1.943684335456176e-05, + "loss": 1.2134, + "step": 4922 + }, + { + "epoch": 13.4141689373297, + "grad_norm": 12.296714782714844, + "learning_rate": 1.9436551346928963e-05, + "loss": 1.2314, + "step": 4923 + }, + { + "epoch": 13.416893732970028, + "grad_norm": 9.434287071228027, + "learning_rate": 1.943625926580461e-05, + "loss": 1.0848, + "step": 4924 + }, + { + "epoch": 13.419618528610354, + "grad_norm": 8.973977088928223, + "learning_rate": 1.9435967111190975e-05, + "loss": 1.1523, + "step": 4925 + }, + { + "epoch": 13.422343324250681, + "grad_norm": 10.713934898376465, + "learning_rate": 1.9435674883090333e-05, + "loss": 1.241, + "step": 4926 + }, + { + "epoch": 13.425068119891009, + "grad_norm": 12.549975395202637, + "learning_rate": 1.9435382581504955e-05, + "loss": 1.1179, + "step": 4927 + }, + { + "epoch": 13.427792915531334, + "grad_norm": 12.254369735717773, + "learning_rate": 1.9435090206437124e-05, + "loss": 1.0909, + "step": 4928 + }, + { + "epoch": 13.430517711171662, + "grad_norm": 9.583385467529297, + "learning_rate": 1.9434797757889114e-05, + "loss": 0.9912, + "step": 4929 + }, + { + "epoch": 13.43324250681199, + "grad_norm": 12.13889217376709, + "learning_rate": 1.94345052358632e-05, + "loss": 1.3284, + "step": 4930 + }, + { + "epoch": 13.435967302452315, + "grad_norm": 10.6828031539917, + "learning_rate": 1.9434212640361662e-05, + "loss": 1.0371, + "step": 4931 + }, + { + "epoch": 13.438692098092643, + "grad_norm": 8.419368743896484, + "learning_rate": 1.9433919971386785e-05, + "loss": 1.0361, + "step": 4932 + }, + { + "epoch": 13.44141689373297, + "grad_norm": 9.591110229492188, + "learning_rate": 1.943362722894084e-05, + "loss": 1.3, + "step": 4933 + }, + { + "epoch": 13.444141689373296, + "grad_norm": 13.010809898376465, + "learning_rate": 1.943333441302611e-05, + "loss": 1.002, + "step": 4934 + }, + { + "epoch": 13.446866485013624, + "grad_norm": 7.335751056671143, + "learning_rate": 1.9433041523644873e-05, + "loss": 0.9941, + "step": 4935 + }, + { + "epoch": 13.449591280653951, + "grad_norm": 13.550209999084473, + "learning_rate": 1.9432748560799416e-05, + "loss": 1.3273, + "step": 4936 + }, + { + "epoch": 13.452316076294277, + "grad_norm": 10.893725395202637, + "learning_rate": 1.9432455524492014e-05, + "loss": 0.9391, + "step": 4937 + }, + { + "epoch": 13.455040871934605, + "grad_norm": 8.60975170135498, + "learning_rate": 1.9432162414724952e-05, + "loss": 1.0885, + "step": 4938 + }, + { + "epoch": 13.457765667574932, + "grad_norm": 10.962531089782715, + "learning_rate": 1.9431869231500516e-05, + "loss": 1.2214, + "step": 4939 + }, + { + "epoch": 13.460490463215258, + "grad_norm": 10.27914047241211, + "learning_rate": 1.9431575974820983e-05, + "loss": 1.1592, + "step": 4940 + }, + { + "epoch": 13.463215258855586, + "grad_norm": 8.277831077575684, + "learning_rate": 1.943128264468864e-05, + "loss": 1.0098, + "step": 4941 + }, + { + "epoch": 13.465940054495913, + "grad_norm": 8.443522453308105, + "learning_rate": 1.943098924110577e-05, + "loss": 1.1726, + "step": 4942 + }, + { + "epoch": 13.46866485013624, + "grad_norm": 9.645376205444336, + "learning_rate": 1.9430695764074662e-05, + "loss": 1.0812, + "step": 4943 + }, + { + "epoch": 13.471389645776567, + "grad_norm": 11.037893295288086, + "learning_rate": 1.9430402213597598e-05, + "loss": 1.0818, + "step": 4944 + }, + { + "epoch": 13.474114441416894, + "grad_norm": 13.38748836517334, + "learning_rate": 1.9430108589676868e-05, + "loss": 1.2874, + "step": 4945 + }, + { + "epoch": 13.47683923705722, + "grad_norm": 10.455015182495117, + "learning_rate": 1.9429814892314752e-05, + "loss": 1.1831, + "step": 4946 + }, + { + "epoch": 13.479564032697548, + "grad_norm": 11.289458274841309, + "learning_rate": 1.9429521121513542e-05, + "loss": 1.144, + "step": 4947 + }, + { + "epoch": 13.482288828337875, + "grad_norm": 9.35831356048584, + "learning_rate": 1.9429227277275525e-05, + "loss": 1.0409, + "step": 4948 + }, + { + "epoch": 13.485013623978201, + "grad_norm": 18.667573928833008, + "learning_rate": 1.942893335960299e-05, + "loss": 1.0792, + "step": 4949 + }, + { + "epoch": 13.487738419618529, + "grad_norm": 11.403008460998535, + "learning_rate": 1.9428639368498223e-05, + "loss": 1.2703, + "step": 4950 + }, + { + "epoch": 13.490463215258856, + "grad_norm": 9.828926086425781, + "learning_rate": 1.9428345303963517e-05, + "loss": 1.0442, + "step": 4951 + }, + { + "epoch": 13.493188010899182, + "grad_norm": 10.004315376281738, + "learning_rate": 1.9428051166001162e-05, + "loss": 1.1315, + "step": 4952 + }, + { + "epoch": 13.49591280653951, + "grad_norm": 8.655510902404785, + "learning_rate": 1.942775695461345e-05, + "loss": 0.9866, + "step": 4953 + }, + { + "epoch": 13.498637602179837, + "grad_norm": 7.741220951080322, + "learning_rate": 1.942746266980267e-05, + "loss": 1.1243, + "step": 4954 + }, + { + "epoch": 13.501362397820163, + "grad_norm": 7.098425388336182, + "learning_rate": 1.942716831157111e-05, + "loss": 0.8582, + "step": 4955 + }, + { + "epoch": 13.50408719346049, + "grad_norm": 13.48908519744873, + "learning_rate": 1.942687387992107e-05, + "loss": 1.1384, + "step": 4956 + }, + { + "epoch": 13.506811989100818, + "grad_norm": 14.542173385620117, + "learning_rate": 1.9426579374854838e-05, + "loss": 1.1768, + "step": 4957 + }, + { + "epoch": 13.509536784741144, + "grad_norm": 121.65567016601562, + "learning_rate": 1.9426284796374712e-05, + "loss": 1.3164, + "step": 4958 + }, + { + "epoch": 13.512261580381471, + "grad_norm": 11.893477439880371, + "learning_rate": 1.942599014448298e-05, + "loss": 1.2727, + "step": 4959 + }, + { + "epoch": 13.514986376021799, + "grad_norm": 11.721236228942871, + "learning_rate": 1.942569541918194e-05, + "loss": 0.9863, + "step": 4960 + }, + { + "epoch": 13.517711171662125, + "grad_norm": 9.663614273071289, + "learning_rate": 1.9425400620473893e-05, + "loss": 1.1519, + "step": 4961 + }, + { + "epoch": 13.520435967302452, + "grad_norm": 11.535460472106934, + "learning_rate": 1.9425105748361122e-05, + "loss": 1.1575, + "step": 4962 + }, + { + "epoch": 13.52316076294278, + "grad_norm": 15.516406059265137, + "learning_rate": 1.9424810802845937e-05, + "loss": 1.2666, + "step": 4963 + }, + { + "epoch": 13.525885558583106, + "grad_norm": 12.936622619628906, + "learning_rate": 1.9424515783930624e-05, + "loss": 1.2213, + "step": 4964 + }, + { + "epoch": 13.528610354223433, + "grad_norm": 16.40265464782715, + "learning_rate": 1.942422069161749e-05, + "loss": 1.1985, + "step": 4965 + }, + { + "epoch": 13.53133514986376, + "grad_norm": 17.725162506103516, + "learning_rate": 1.9423925525908826e-05, + "loss": 1.2993, + "step": 4966 + }, + { + "epoch": 13.534059945504087, + "grad_norm": 9.422935485839844, + "learning_rate": 1.9423630286806928e-05, + "loss": 1.166, + "step": 4967 + }, + { + "epoch": 13.536784741144414, + "grad_norm": 18.535873413085938, + "learning_rate": 1.942333497431411e-05, + "loss": 1.3313, + "step": 4968 + }, + { + "epoch": 13.539509536784742, + "grad_norm": 10.134592056274414, + "learning_rate": 1.9423039588432657e-05, + "loss": 1.1255, + "step": 4969 + }, + { + "epoch": 13.542234332425068, + "grad_norm": 11.532000541687012, + "learning_rate": 1.9422744129164877e-05, + "loss": 1.2673, + "step": 4970 + }, + { + "epoch": 13.544959128065395, + "grad_norm": 13.674302101135254, + "learning_rate": 1.9422448596513067e-05, + "loss": 1.2104, + "step": 4971 + }, + { + "epoch": 13.547683923705723, + "grad_norm": 9.66440200805664, + "learning_rate": 1.9422152990479533e-05, + "loss": 1.2751, + "step": 4972 + }, + { + "epoch": 13.550408719346049, + "grad_norm": 13.31756591796875, + "learning_rate": 1.9421857311066575e-05, + "loss": 1.3547, + "step": 4973 + }, + { + "epoch": 13.553133514986376, + "grad_norm": 12.21282958984375, + "learning_rate": 1.9421561558276495e-05, + "loss": 1.1848, + "step": 4974 + }, + { + "epoch": 13.555858310626704, + "grad_norm": 11.367598533630371, + "learning_rate": 1.942126573211159e-05, + "loss": 1.1157, + "step": 4975 + }, + { + "epoch": 13.55858310626703, + "grad_norm": 13.134461402893066, + "learning_rate": 1.942096983257418e-05, + "loss": 1.1757, + "step": 4976 + }, + { + "epoch": 13.561307901907357, + "grad_norm": 13.335122108459473, + "learning_rate": 1.9420673859666557e-05, + "loss": 1.3433, + "step": 4977 + }, + { + "epoch": 13.564032697547685, + "grad_norm": 13.226652145385742, + "learning_rate": 1.942037781339103e-05, + "loss": 1.439, + "step": 4978 + }, + { + "epoch": 13.56675749318801, + "grad_norm": 11.82116413116455, + "learning_rate": 1.9420081693749903e-05, + "loss": 0.9768, + "step": 4979 + }, + { + "epoch": 13.569482288828338, + "grad_norm": 10.326279640197754, + "learning_rate": 1.941978550074548e-05, + "loss": 1.1863, + "step": 4980 + }, + { + "epoch": 13.572207084468666, + "grad_norm": 15.456771850585938, + "learning_rate": 1.9419489234380077e-05, + "loss": 1.1077, + "step": 4981 + }, + { + "epoch": 13.574931880108991, + "grad_norm": 22.4259090423584, + "learning_rate": 1.941919289465599e-05, + "loss": 1.1985, + "step": 4982 + }, + { + "epoch": 13.577656675749319, + "grad_norm": 11.79200267791748, + "learning_rate": 1.9418896481575534e-05, + "loss": 1.1946, + "step": 4983 + }, + { + "epoch": 13.580381471389646, + "grad_norm": 12.975360870361328, + "learning_rate": 1.9418599995141013e-05, + "loss": 1.0375, + "step": 4984 + }, + { + "epoch": 13.583106267029972, + "grad_norm": 12.62851333618164, + "learning_rate": 1.941830343535474e-05, + "loss": 1.311, + "step": 4985 + }, + { + "epoch": 13.5858310626703, + "grad_norm": 14.895894050598145, + "learning_rate": 1.9418006802219022e-05, + "loss": 1.3494, + "step": 4986 + }, + { + "epoch": 13.588555858310627, + "grad_norm": 15.663689613342285, + "learning_rate": 1.9417710095736173e-05, + "loss": 1.1829, + "step": 4987 + }, + { + "epoch": 13.591280653950953, + "grad_norm": 8.505025863647461, + "learning_rate": 1.94174133159085e-05, + "loss": 1.0594, + "step": 4988 + }, + { + "epoch": 13.59400544959128, + "grad_norm": 10.836217880249023, + "learning_rate": 1.9417116462738312e-05, + "loss": 1.2996, + "step": 4989 + }, + { + "epoch": 13.596730245231608, + "grad_norm": 12.67309856414795, + "learning_rate": 1.9416819536227928e-05, + "loss": 1.2812, + "step": 4990 + }, + { + "epoch": 13.599455040871934, + "grad_norm": 37.39385223388672, + "learning_rate": 1.9416522536379653e-05, + "loss": 1.1196, + "step": 4991 + }, + { + "epoch": 13.602179836512262, + "grad_norm": 13.147069931030273, + "learning_rate": 1.9416225463195807e-05, + "loss": 1.3328, + "step": 4992 + }, + { + "epoch": 13.60490463215259, + "grad_norm": 14.431489944458008, + "learning_rate": 1.94159283166787e-05, + "loss": 1.074, + "step": 4993 + }, + { + "epoch": 13.607629427792915, + "grad_norm": 40.52897644042969, + "learning_rate": 1.9415631096830644e-05, + "loss": 1.2249, + "step": 4994 + }, + { + "epoch": 13.610354223433243, + "grad_norm": 11.68537425994873, + "learning_rate": 1.9415333803653955e-05, + "loss": 1.0654, + "step": 4995 + }, + { + "epoch": 13.61307901907357, + "grad_norm": 10.335807800292969, + "learning_rate": 1.941503643715095e-05, + "loss": 1.1626, + "step": 4996 + }, + { + "epoch": 13.615803814713896, + "grad_norm": 63.72047805786133, + "learning_rate": 1.9414738997323947e-05, + "loss": 1.1919, + "step": 4997 + }, + { + "epoch": 13.618528610354224, + "grad_norm": 10.672576904296875, + "learning_rate": 1.9414441484175258e-05, + "loss": 1.2578, + "step": 4998 + }, + { + "epoch": 13.621253405994551, + "grad_norm": 12.725996971130371, + "learning_rate": 1.9414143897707204e-05, + "loss": 1.2, + "step": 4999 + }, + { + "epoch": 13.623978201634877, + "grad_norm": 9.036222457885742, + "learning_rate": 1.9413846237922098e-05, + "loss": 1.3495, + "step": 5000 + }, + { + "epoch": 13.626702997275205, + "grad_norm": 20.720375061035156, + "learning_rate": 1.941354850482226e-05, + "loss": 1.2527, + "step": 5001 + }, + { + "epoch": 13.629427792915532, + "grad_norm": 15.53624153137207, + "learning_rate": 1.941325069841001e-05, + "loss": 1.4265, + "step": 5002 + }, + { + "epoch": 13.632152588555858, + "grad_norm": 13.139444351196289, + "learning_rate": 1.9412952818687665e-05, + "loss": 1.3018, + "step": 5003 + }, + { + "epoch": 13.634877384196185, + "grad_norm": 10.584000587463379, + "learning_rate": 1.941265486565755e-05, + "loss": 1.416, + "step": 5004 + }, + { + "epoch": 13.637602179836513, + "grad_norm": 9.378589630126953, + "learning_rate": 1.941235683932198e-05, + "loss": 1.271, + "step": 5005 + }, + { + "epoch": 13.640326975476839, + "grad_norm": 19.38829803466797, + "learning_rate": 1.9412058739683276e-05, + "loss": 1.4248, + "step": 5006 + }, + { + "epoch": 13.643051771117166, + "grad_norm": 11.798781394958496, + "learning_rate": 1.9411760566743765e-05, + "loss": 1.2646, + "step": 5007 + }, + { + "epoch": 13.645776566757494, + "grad_norm": 10.712326049804688, + "learning_rate": 1.941146232050576e-05, + "loss": 1.314, + "step": 5008 + }, + { + "epoch": 13.64850136239782, + "grad_norm": 10.130495071411133, + "learning_rate": 1.9411164000971597e-05, + "loss": 1.2925, + "step": 5009 + }, + { + "epoch": 13.651226158038147, + "grad_norm": 21.946491241455078, + "learning_rate": 1.9410865608143586e-05, + "loss": 1.2432, + "step": 5010 + }, + { + "epoch": 13.653950953678475, + "grad_norm": 9.57172966003418, + "learning_rate": 1.941056714202406e-05, + "loss": 1.2327, + "step": 5011 + }, + { + "epoch": 13.6566757493188, + "grad_norm": 12.476937294006348, + "learning_rate": 1.9410268602615338e-05, + "loss": 1.1344, + "step": 5012 + }, + { + "epoch": 13.659400544959128, + "grad_norm": 14.384178161621094, + "learning_rate": 1.9409969989919746e-05, + "loss": 1.2058, + "step": 5013 + }, + { + "epoch": 13.662125340599456, + "grad_norm": 13.131757736206055, + "learning_rate": 1.940967130393961e-05, + "loss": 1.1837, + "step": 5014 + }, + { + "epoch": 13.664850136239782, + "grad_norm": 13.937726974487305, + "learning_rate": 1.940937254467726e-05, + "loss": 1.2732, + "step": 5015 + }, + { + "epoch": 13.66757493188011, + "grad_norm": 12.27633285522461, + "learning_rate": 1.940907371213502e-05, + "loss": 1.1104, + "step": 5016 + }, + { + "epoch": 13.670299727520437, + "grad_norm": 14.232234001159668, + "learning_rate": 1.9408774806315215e-05, + "loss": 1.2317, + "step": 5017 + }, + { + "epoch": 13.673024523160763, + "grad_norm": 11.793499946594238, + "learning_rate": 1.9408475827220173e-05, + "loss": 1.2783, + "step": 5018 + }, + { + "epoch": 13.67574931880109, + "grad_norm": 14.1796293258667, + "learning_rate": 1.9408176774852224e-05, + "loss": 1.0769, + "step": 5019 + }, + { + "epoch": 13.678474114441418, + "grad_norm": 10.935534477233887, + "learning_rate": 1.9407877649213696e-05, + "loss": 0.9988, + "step": 5020 + }, + { + "epoch": 13.681198910081743, + "grad_norm": 10.10819149017334, + "learning_rate": 1.9407578450306926e-05, + "loss": 1.1537, + "step": 5021 + }, + { + "epoch": 13.683923705722071, + "grad_norm": 12.352477073669434, + "learning_rate": 1.9407279178134233e-05, + "loss": 1.046, + "step": 5022 + }, + { + "epoch": 13.686648501362399, + "grad_norm": 12.96524715423584, + "learning_rate": 1.9406979832697953e-05, + "loss": 1.261, + "step": 5023 + }, + { + "epoch": 13.689373297002724, + "grad_norm": 12.40776538848877, + "learning_rate": 1.9406680414000418e-05, + "loss": 1.2307, + "step": 5024 + }, + { + "epoch": 13.692098092643052, + "grad_norm": 9.899091720581055, + "learning_rate": 1.9406380922043955e-05, + "loss": 1.1104, + "step": 5025 + }, + { + "epoch": 13.69482288828338, + "grad_norm": 9.56047534942627, + "learning_rate": 1.9406081356830906e-05, + "loss": 1.0581, + "step": 5026 + }, + { + "epoch": 13.697547683923705, + "grad_norm": 8.775030136108398, + "learning_rate": 1.9405781718363595e-05, + "loss": 1.0488, + "step": 5027 + }, + { + "epoch": 13.700272479564033, + "grad_norm": 10.675580978393555, + "learning_rate": 1.940548200664436e-05, + "loss": 1.1741, + "step": 5028 + }, + { + "epoch": 13.70299727520436, + "grad_norm": 7.952402114868164, + "learning_rate": 1.9405182221675535e-05, + "loss": 1.1293, + "step": 5029 + }, + { + "epoch": 13.705722070844686, + "grad_norm": 9.325764656066895, + "learning_rate": 1.940488236345945e-05, + "loss": 1.157, + "step": 5030 + }, + { + "epoch": 13.708446866485014, + "grad_norm": 10.313379287719727, + "learning_rate": 1.9404582431998446e-05, + "loss": 1.1921, + "step": 5031 + }, + { + "epoch": 13.711171662125341, + "grad_norm": 10.060182571411133, + "learning_rate": 1.9404282427294854e-05, + "loss": 1.1826, + "step": 5032 + }, + { + "epoch": 13.713896457765667, + "grad_norm": 9.37794303894043, + "learning_rate": 1.9403982349351014e-05, + "loss": 1.1277, + "step": 5033 + }, + { + "epoch": 13.716621253405995, + "grad_norm": 12.922962188720703, + "learning_rate": 1.9403682198169266e-05, + "loss": 1.2212, + "step": 5034 + }, + { + "epoch": 13.719346049046322, + "grad_norm": 10.3358793258667, + "learning_rate": 1.940338197375194e-05, + "loss": 1.1089, + "step": 5035 + }, + { + "epoch": 13.722070844686648, + "grad_norm": 10.662749290466309, + "learning_rate": 1.940308167610138e-05, + "loss": 1.2673, + "step": 5036 + }, + { + "epoch": 13.724795640326976, + "grad_norm": 8.988673210144043, + "learning_rate": 1.940278130521992e-05, + "loss": 1.1497, + "step": 5037 + }, + { + "epoch": 13.727520435967303, + "grad_norm": 10.619245529174805, + "learning_rate": 1.94024808611099e-05, + "loss": 1.1885, + "step": 5038 + }, + { + "epoch": 13.730245231607629, + "grad_norm": 10.40213680267334, + "learning_rate": 1.9402180343773665e-05, + "loss": 1.1804, + "step": 5039 + }, + { + "epoch": 13.732970027247957, + "grad_norm": 8.468010902404785, + "learning_rate": 1.9401879753213556e-05, + "loss": 1.2205, + "step": 5040 + }, + { + "epoch": 13.735694822888284, + "grad_norm": 10.093297958374023, + "learning_rate": 1.9401579089431904e-05, + "loss": 0.8463, + "step": 5041 + }, + { + "epoch": 13.73841961852861, + "grad_norm": 10.707527160644531, + "learning_rate": 1.940127835243106e-05, + "loss": 1.1765, + "step": 5042 + }, + { + "epoch": 13.741144414168938, + "grad_norm": 8.857259750366211, + "learning_rate": 1.940097754221336e-05, + "loss": 1.4438, + "step": 5043 + }, + { + "epoch": 13.743869209809265, + "grad_norm": 11.06920051574707, + "learning_rate": 1.940067665878115e-05, + "loss": 1.3408, + "step": 5044 + }, + { + "epoch": 13.746594005449591, + "grad_norm": 8.317543029785156, + "learning_rate": 1.9400375702136777e-05, + "loss": 0.8645, + "step": 5045 + }, + { + "epoch": 13.749318801089919, + "grad_norm": 7.602947235107422, + "learning_rate": 1.9400074672282576e-05, + "loss": 1.2239, + "step": 5046 + }, + { + "epoch": 13.752043596730246, + "grad_norm": 10.72529411315918, + "learning_rate": 1.9399773569220896e-05, + "loss": 1.2053, + "step": 5047 + }, + { + "epoch": 13.754768392370572, + "grad_norm": 9.096590995788574, + "learning_rate": 1.939947239295408e-05, + "loss": 1.114, + "step": 5048 + }, + { + "epoch": 13.7574931880109, + "grad_norm": 8.262537002563477, + "learning_rate": 1.939917114348448e-05, + "loss": 1.1478, + "step": 5049 + }, + { + "epoch": 13.760217983651227, + "grad_norm": 7.784013271331787, + "learning_rate": 1.939886982081444e-05, + "loss": 1.1875, + "step": 5050 + }, + { + "epoch": 13.762942779291553, + "grad_norm": 8.267370223999023, + "learning_rate": 1.93985684249463e-05, + "loss": 1.0675, + "step": 5051 + }, + { + "epoch": 13.76566757493188, + "grad_norm": 7.184292316436768, + "learning_rate": 1.939826695588241e-05, + "loss": 1.1619, + "step": 5052 + }, + { + "epoch": 13.768392370572208, + "grad_norm": 14.374281883239746, + "learning_rate": 1.939796541362512e-05, + "loss": 1.2981, + "step": 5053 + }, + { + "epoch": 13.771117166212534, + "grad_norm": 11.208491325378418, + "learning_rate": 1.9397663798176783e-05, + "loss": 1.1274, + "step": 5054 + }, + { + "epoch": 13.773841961852861, + "grad_norm": 20.029939651489258, + "learning_rate": 1.939736210953974e-05, + "loss": 1.1852, + "step": 5055 + }, + { + "epoch": 13.776566757493189, + "grad_norm": 8.747542381286621, + "learning_rate": 1.939706034771634e-05, + "loss": 1.1677, + "step": 5056 + }, + { + "epoch": 13.779291553133515, + "grad_norm": 8.436010360717773, + "learning_rate": 1.9396758512708943e-05, + "loss": 1.156, + "step": 5057 + }, + { + "epoch": 13.782016348773842, + "grad_norm": 19.555360794067383, + "learning_rate": 1.9396456604519885e-05, + "loss": 1.2537, + "step": 5058 + }, + { + "epoch": 13.78474114441417, + "grad_norm": 9.587838172912598, + "learning_rate": 1.939615462315153e-05, + "loss": 1.1218, + "step": 5059 + }, + { + "epoch": 13.787465940054496, + "grad_norm": 8.060758590698242, + "learning_rate": 1.9395852568606225e-05, + "loss": 0.8926, + "step": 5060 + }, + { + "epoch": 13.790190735694823, + "grad_norm": 9.282258033752441, + "learning_rate": 1.9395550440886325e-05, + "loss": 1.3179, + "step": 5061 + }, + { + "epoch": 13.79291553133515, + "grad_norm": 9.416927337646484, + "learning_rate": 1.9395248239994177e-05, + "loss": 1.1321, + "step": 5062 + }, + { + "epoch": 13.795640326975477, + "grad_norm": 9.92941665649414, + "learning_rate": 1.939494596593214e-05, + "loss": 1.1082, + "step": 5063 + }, + { + "epoch": 13.798365122615804, + "grad_norm": 12.008455276489258, + "learning_rate": 1.939464361870256e-05, + "loss": 1.0618, + "step": 5064 + }, + { + "epoch": 13.80108991825613, + "grad_norm": 8.59157657623291, + "learning_rate": 1.9394341198307808e-05, + "loss": 0.9966, + "step": 5065 + }, + { + "epoch": 13.803814713896458, + "grad_norm": 10.721652030944824, + "learning_rate": 1.9394038704750225e-05, + "loss": 1.3184, + "step": 5066 + }, + { + "epoch": 13.806539509536785, + "grad_norm": 10.89718246459961, + "learning_rate": 1.939373613803217e-05, + "loss": 1.2522, + "step": 5067 + }, + { + "epoch": 13.809264305177111, + "grad_norm": 11.09522533416748, + "learning_rate": 1.9393433498155997e-05, + "loss": 0.9753, + "step": 5068 + }, + { + "epoch": 13.811989100817438, + "grad_norm": 9.063777923583984, + "learning_rate": 1.9393130785124073e-05, + "loss": 1.3086, + "step": 5069 + }, + { + "epoch": 13.814713896457766, + "grad_norm": 12.276968002319336, + "learning_rate": 1.9392827998938744e-05, + "loss": 1.1953, + "step": 5070 + }, + { + "epoch": 13.817438692098092, + "grad_norm": 11.270060539245605, + "learning_rate": 1.9392525139602373e-05, + "loss": 0.8892, + "step": 5071 + }, + { + "epoch": 13.82016348773842, + "grad_norm": 11.454496383666992, + "learning_rate": 1.939222220711732e-05, + "loss": 1.3066, + "step": 5072 + }, + { + "epoch": 13.822888283378747, + "grad_norm": 8.781437873840332, + "learning_rate": 1.9391919201485945e-05, + "loss": 1.2725, + "step": 5073 + }, + { + "epoch": 13.825613079019073, + "grad_norm": 8.515535354614258, + "learning_rate": 1.93916161227106e-05, + "loss": 0.9761, + "step": 5074 + }, + { + "epoch": 13.8283378746594, + "grad_norm": 8.936002731323242, + "learning_rate": 1.9391312970793654e-05, + "loss": 0.9933, + "step": 5075 + }, + { + "epoch": 13.831062670299728, + "grad_norm": 11.896123886108398, + "learning_rate": 1.9391009745737465e-05, + "loss": 1.0779, + "step": 5076 + }, + { + "epoch": 13.833787465940054, + "grad_norm": 8.316001892089844, + "learning_rate": 1.9390706447544393e-05, + "loss": 1.0015, + "step": 5077 + }, + { + "epoch": 13.836512261580381, + "grad_norm": 9.644735336303711, + "learning_rate": 1.9390403076216805e-05, + "loss": 1.2458, + "step": 5078 + }, + { + "epoch": 13.839237057220709, + "grad_norm": 9.578886032104492, + "learning_rate": 1.9390099631757057e-05, + "loss": 1.3386, + "step": 5079 + }, + { + "epoch": 13.841961852861035, + "grad_norm": 7.128910064697266, + "learning_rate": 1.938979611416752e-05, + "loss": 1.0, + "step": 5080 + }, + { + "epoch": 13.844686648501362, + "grad_norm": 8.676445960998535, + "learning_rate": 1.9389492523450545e-05, + "loss": 1.0251, + "step": 5081 + }, + { + "epoch": 13.84741144414169, + "grad_norm": 9.316558837890625, + "learning_rate": 1.938918885960851e-05, + "loss": 0.9949, + "step": 5082 + }, + { + "epoch": 13.850136239782016, + "grad_norm": 12.280668258666992, + "learning_rate": 1.9388885122643773e-05, + "loss": 1.1279, + "step": 5083 + }, + { + "epoch": 13.852861035422343, + "grad_norm": 9.22166633605957, + "learning_rate": 1.9388581312558702e-05, + "loss": 1.1763, + "step": 5084 + }, + { + "epoch": 13.85558583106267, + "grad_norm": 8.401951789855957, + "learning_rate": 1.938827742935566e-05, + "loss": 1.2942, + "step": 5085 + }, + { + "epoch": 13.858310626702997, + "grad_norm": 11.350404739379883, + "learning_rate": 1.9387973473037016e-05, + "loss": 1.1261, + "step": 5086 + }, + { + "epoch": 13.861035422343324, + "grad_norm": 10.082850456237793, + "learning_rate": 1.9387669443605137e-05, + "loss": 1.0293, + "step": 5087 + }, + { + "epoch": 13.863760217983652, + "grad_norm": 10.138223648071289, + "learning_rate": 1.938736534106239e-05, + "loss": 1.0718, + "step": 5088 + }, + { + "epoch": 13.866485013623977, + "grad_norm": 11.336297988891602, + "learning_rate": 1.938706116541114e-05, + "loss": 1.2708, + "step": 5089 + }, + { + "epoch": 13.869209809264305, + "grad_norm": 10.716597557067871, + "learning_rate": 1.9386756916653765e-05, + "loss": 1.1121, + "step": 5090 + }, + { + "epoch": 13.871934604904633, + "grad_norm": 16.344484329223633, + "learning_rate": 1.938645259479263e-05, + "loss": 1.3132, + "step": 5091 + }, + { + "epoch": 13.874659400544958, + "grad_norm": 11.688093185424805, + "learning_rate": 1.9386148199830104e-05, + "loss": 1.1921, + "step": 5092 + }, + { + "epoch": 13.877384196185286, + "grad_norm": 11.601099014282227, + "learning_rate": 1.9385843731768556e-05, + "loss": 1.0042, + "step": 5093 + }, + { + "epoch": 13.880108991825614, + "grad_norm": 14.272059440612793, + "learning_rate": 1.9385539190610358e-05, + "loss": 1.1868, + "step": 5094 + }, + { + "epoch": 13.88283378746594, + "grad_norm": 32.3015022277832, + "learning_rate": 1.9385234576357885e-05, + "loss": 1.2266, + "step": 5095 + }, + { + "epoch": 13.885558583106267, + "grad_norm": 10.42785358428955, + "learning_rate": 1.9384929889013507e-05, + "loss": 1.1726, + "step": 5096 + }, + { + "epoch": 13.888283378746594, + "grad_norm": 10.774063110351562, + "learning_rate": 1.9384625128579597e-05, + "loss": 1.0793, + "step": 5097 + }, + { + "epoch": 13.89100817438692, + "grad_norm": 13.434088706970215, + "learning_rate": 1.9384320295058528e-05, + "loss": 1.3506, + "step": 5098 + }, + { + "epoch": 13.893732970027248, + "grad_norm": 9.60982608795166, + "learning_rate": 1.9384015388452674e-05, + "loss": 1.2122, + "step": 5099 + }, + { + "epoch": 13.896457765667575, + "grad_norm": 9.065067291259766, + "learning_rate": 1.9383710408764412e-05, + "loss": 1.1741, + "step": 5100 + }, + { + "epoch": 13.899182561307901, + "grad_norm": 8.91007137298584, + "learning_rate": 1.938340535599611e-05, + "loss": 1.0735, + "step": 5101 + }, + { + "epoch": 13.901907356948229, + "grad_norm": 9.0178861618042, + "learning_rate": 1.938310023015016e-05, + "loss": 1.0222, + "step": 5102 + }, + { + "epoch": 13.904632152588556, + "grad_norm": 11.126150131225586, + "learning_rate": 1.9382795031228915e-05, + "loss": 1.3145, + "step": 5103 + }, + { + "epoch": 13.907356948228882, + "grad_norm": 15.351320266723633, + "learning_rate": 1.9382489759234773e-05, + "loss": 1.2039, + "step": 5104 + }, + { + "epoch": 13.91008174386921, + "grad_norm": 10.8551025390625, + "learning_rate": 1.93821844141701e-05, + "loss": 1.2683, + "step": 5105 + }, + { + "epoch": 13.912806539509537, + "grad_norm": 9.00561809539795, + "learning_rate": 1.9381878996037276e-05, + "loss": 1.3562, + "step": 5106 + }, + { + "epoch": 13.915531335149863, + "grad_norm": 9.64782428741455, + "learning_rate": 1.938157350483868e-05, + "loss": 1.0952, + "step": 5107 + }, + { + "epoch": 13.91825613079019, + "grad_norm": 19.437721252441406, + "learning_rate": 1.9381267940576694e-05, + "loss": 1.1235, + "step": 5108 + }, + { + "epoch": 13.920980926430518, + "grad_norm": 8.850643157958984, + "learning_rate": 1.9380962303253695e-05, + "loss": 1.2327, + "step": 5109 + }, + { + "epoch": 13.923705722070844, + "grad_norm": 11.061198234558105, + "learning_rate": 1.938065659287206e-05, + "loss": 1.4087, + "step": 5110 + }, + { + "epoch": 13.926430517711172, + "grad_norm": 8.402247428894043, + "learning_rate": 1.9380350809434176e-05, + "loss": 1.2124, + "step": 5111 + }, + { + "epoch": 13.9291553133515, + "grad_norm": 8.88551139831543, + "learning_rate": 1.938004495294242e-05, + "loss": 1.1362, + "step": 5112 + }, + { + "epoch": 13.931880108991825, + "grad_norm": 9.316143989562988, + "learning_rate": 1.9379739023399177e-05, + "loss": 1.0752, + "step": 5113 + }, + { + "epoch": 13.934604904632153, + "grad_norm": 8.615004539489746, + "learning_rate": 1.937943302080683e-05, + "loss": 1.2195, + "step": 5114 + }, + { + "epoch": 13.93732970027248, + "grad_norm": 14.729580879211426, + "learning_rate": 1.9379126945167755e-05, + "loss": 1.1555, + "step": 5115 + }, + { + "epoch": 13.940054495912806, + "grad_norm": 9.22382640838623, + "learning_rate": 1.9378820796484348e-05, + "loss": 1.0374, + "step": 5116 + }, + { + "epoch": 13.942779291553133, + "grad_norm": 14.224115371704102, + "learning_rate": 1.9378514574758983e-05, + "loss": 1.136, + "step": 5117 + }, + { + "epoch": 13.945504087193461, + "grad_norm": 11.138895034790039, + "learning_rate": 1.937820827999405e-05, + "loss": 0.9072, + "step": 5118 + }, + { + "epoch": 13.948228882833787, + "grad_norm": 12.33624267578125, + "learning_rate": 1.937790191219193e-05, + "loss": 1.3173, + "step": 5119 + }, + { + "epoch": 13.950953678474114, + "grad_norm": 9.658340454101562, + "learning_rate": 1.9377595471355016e-05, + "loss": 1.1707, + "step": 5120 + }, + { + "epoch": 13.953678474114442, + "grad_norm": 16.252883911132812, + "learning_rate": 1.9377288957485687e-05, + "loss": 1.3693, + "step": 5121 + }, + { + "epoch": 13.956403269754768, + "grad_norm": 9.234550476074219, + "learning_rate": 1.9376982370586335e-05, + "loss": 0.9656, + "step": 5122 + }, + { + "epoch": 13.959128065395095, + "grad_norm": 9.315324783325195, + "learning_rate": 1.9376675710659344e-05, + "loss": 1.1426, + "step": 5123 + }, + { + "epoch": 13.961852861035423, + "grad_norm": 10.235756874084473, + "learning_rate": 1.9376368977707107e-05, + "loss": 1.2695, + "step": 5124 + }, + { + "epoch": 13.964577656675749, + "grad_norm": 7.971922397613525, + "learning_rate": 1.9376062171732005e-05, + "loss": 0.9756, + "step": 5125 + }, + { + "epoch": 13.967302452316076, + "grad_norm": 13.746105194091797, + "learning_rate": 1.937575529273644e-05, + "loss": 1.3748, + "step": 5126 + }, + { + "epoch": 13.970027247956404, + "grad_norm": 10.527334213256836, + "learning_rate": 1.937544834072279e-05, + "loss": 1.2439, + "step": 5127 + }, + { + "epoch": 13.97275204359673, + "grad_norm": 10.209712982177734, + "learning_rate": 1.937514131569345e-05, + "loss": 1.0908, + "step": 5128 + }, + { + "epoch": 13.975476839237057, + "grad_norm": 11.231954574584961, + "learning_rate": 1.9374834217650814e-05, + "loss": 1.3093, + "step": 5129 + }, + { + "epoch": 13.978201634877385, + "grad_norm": 8.496438026428223, + "learning_rate": 1.9374527046597267e-05, + "loss": 1.05, + "step": 5130 + }, + { + "epoch": 13.98092643051771, + "grad_norm": 9.906559944152832, + "learning_rate": 1.9374219802535207e-05, + "loss": 1.3284, + "step": 5131 + }, + { + "epoch": 13.983651226158038, + "grad_norm": 9.432076454162598, + "learning_rate": 1.9373912485467027e-05, + "loss": 1.2576, + "step": 5132 + }, + { + "epoch": 13.986376021798366, + "grad_norm": 9.473461151123047, + "learning_rate": 1.9373605095395114e-05, + "loss": 1.0918, + "step": 5133 + }, + { + "epoch": 13.989100817438691, + "grad_norm": 8.349873542785645, + "learning_rate": 1.937329763232187e-05, + "loss": 1.261, + "step": 5134 + }, + { + "epoch": 13.991825613079019, + "grad_norm": 8.589016914367676, + "learning_rate": 1.9372990096249684e-05, + "loss": 1.1616, + "step": 5135 + }, + { + "epoch": 13.994550408719347, + "grad_norm": 9.705038070678711, + "learning_rate": 1.9372682487180953e-05, + "loss": 1.1487, + "step": 5136 + }, + { + "epoch": 13.997275204359672, + "grad_norm": 9.136675834655762, + "learning_rate": 1.937237480511807e-05, + "loss": 1.0737, + "step": 5137 + }, + { + "epoch": 14.0, + "grad_norm": 8.555794715881348, + "learning_rate": 1.937206705006344e-05, + "loss": 1.0691, + "step": 5138 + }, + { + "epoch": 14.002724795640328, + "grad_norm": 10.775039672851562, + "learning_rate": 1.9371759222019446e-05, + "loss": 1.1906, + "step": 5139 + }, + { + "epoch": 14.005449591280653, + "grad_norm": 10.422962188720703, + "learning_rate": 1.93714513209885e-05, + "loss": 1.2634, + "step": 5140 + }, + { + "epoch": 14.008174386920981, + "grad_norm": 11.841338157653809, + "learning_rate": 1.937114334697299e-05, + "loss": 1.0758, + "step": 5141 + }, + { + "epoch": 14.010899182561309, + "grad_norm": 7.517180919647217, + "learning_rate": 1.9370835299975312e-05, + "loss": 0.9236, + "step": 5142 + }, + { + "epoch": 14.013623978201634, + "grad_norm": 9.28675365447998, + "learning_rate": 1.9370527179997877e-05, + "loss": 1.0269, + "step": 5143 + }, + { + "epoch": 14.016348773841962, + "grad_norm": 8.840786933898926, + "learning_rate": 1.937021898704307e-05, + "loss": 0.9282, + "step": 5144 + }, + { + "epoch": 14.01907356948229, + "grad_norm": 11.340668678283691, + "learning_rate": 1.9369910721113307e-05, + "loss": 1.0544, + "step": 5145 + }, + { + "epoch": 14.021798365122615, + "grad_norm": 8.026557922363281, + "learning_rate": 1.936960238221098e-05, + "loss": 1.0471, + "step": 5146 + }, + { + "epoch": 14.024523160762943, + "grad_norm": 9.061466217041016, + "learning_rate": 1.936929397033849e-05, + "loss": 1.064, + "step": 5147 + }, + { + "epoch": 14.02724795640327, + "grad_norm": 9.586761474609375, + "learning_rate": 1.936898548549824e-05, + "loss": 1.1797, + "step": 5148 + }, + { + "epoch": 14.029972752043596, + "grad_norm": 7.718034267425537, + "learning_rate": 1.9368676927692633e-05, + "loss": 0.8347, + "step": 5149 + }, + { + "epoch": 14.032697547683924, + "grad_norm": 8.380197525024414, + "learning_rate": 1.936836829692407e-05, + "loss": 0.9882, + "step": 5150 + }, + { + "epoch": 14.035422343324251, + "grad_norm": 10.051340103149414, + "learning_rate": 1.9368059593194957e-05, + "loss": 0.9783, + "step": 5151 + }, + { + "epoch": 14.038147138964577, + "grad_norm": 6.907543659210205, + "learning_rate": 1.9367750816507697e-05, + "loss": 0.9395, + "step": 5152 + }, + { + "epoch": 14.040871934604905, + "grad_norm": 8.483818054199219, + "learning_rate": 1.9367441966864696e-05, + "loss": 1.1664, + "step": 5153 + }, + { + "epoch": 14.043596730245232, + "grad_norm": 8.694487571716309, + "learning_rate": 1.9367133044268357e-05, + "loss": 1.072, + "step": 5154 + }, + { + "epoch": 14.046321525885558, + "grad_norm": 9.576281547546387, + "learning_rate": 1.9366824048721092e-05, + "loss": 0.9762, + "step": 5155 + }, + { + "epoch": 14.049046321525886, + "grad_norm": 8.219457626342773, + "learning_rate": 1.9366514980225297e-05, + "loss": 0.9261, + "step": 5156 + }, + { + "epoch": 14.051771117166213, + "grad_norm": 17.113773345947266, + "learning_rate": 1.9366205838783386e-05, + "loss": 0.8933, + "step": 5157 + }, + { + "epoch": 14.054495912806539, + "grad_norm": 9.046813011169434, + "learning_rate": 1.9365896624397767e-05, + "loss": 1.0859, + "step": 5158 + }, + { + "epoch": 14.057220708446867, + "grad_norm": 16.562040328979492, + "learning_rate": 1.9365587337070847e-05, + "loss": 1.1587, + "step": 5159 + }, + { + "epoch": 14.059945504087194, + "grad_norm": 11.743142127990723, + "learning_rate": 1.936527797680503e-05, + "loss": 1.0215, + "step": 5160 + }, + { + "epoch": 14.06267029972752, + "grad_norm": 13.082555770874023, + "learning_rate": 1.9364968543602734e-05, + "loss": 1.2086, + "step": 5161 + }, + { + "epoch": 14.065395095367847, + "grad_norm": 9.03809642791748, + "learning_rate": 1.9364659037466363e-05, + "loss": 1.127, + "step": 5162 + }, + { + "epoch": 14.068119891008175, + "grad_norm": 10.348206520080566, + "learning_rate": 1.936434945839833e-05, + "loss": 0.9873, + "step": 5163 + }, + { + "epoch": 14.0708446866485, + "grad_norm": 9.243765830993652, + "learning_rate": 1.9364039806401044e-05, + "loss": 1.0645, + "step": 5164 + }, + { + "epoch": 14.073569482288828, + "grad_norm": 8.912335395812988, + "learning_rate": 1.9363730081476917e-05, + "loss": 1.0516, + "step": 5165 + }, + { + "epoch": 14.076294277929156, + "grad_norm": 11.13410758972168, + "learning_rate": 1.9363420283628362e-05, + "loss": 1.0215, + "step": 5166 + }, + { + "epoch": 14.079019073569482, + "grad_norm": 19.718351364135742, + "learning_rate": 1.9363110412857792e-05, + "loss": 1.218, + "step": 5167 + }, + { + "epoch": 14.08174386920981, + "grad_norm": 8.111212730407715, + "learning_rate": 1.9362800469167616e-05, + "loss": 0.9565, + "step": 5168 + }, + { + "epoch": 14.084468664850137, + "grad_norm": 21.195087432861328, + "learning_rate": 1.9362490452560253e-05, + "loss": 1.0968, + "step": 5169 + }, + { + "epoch": 14.087193460490463, + "grad_norm": 12.929117202758789, + "learning_rate": 1.936218036303812e-05, + "loss": 1.1819, + "step": 5170 + }, + { + "epoch": 14.08991825613079, + "grad_norm": 12.823680877685547, + "learning_rate": 1.9361870200603622e-05, + "loss": 0.9674, + "step": 5171 + }, + { + "epoch": 14.092643051771118, + "grad_norm": 8.026865005493164, + "learning_rate": 1.9361559965259183e-05, + "loss": 1.0482, + "step": 5172 + }, + { + "epoch": 14.095367847411444, + "grad_norm": 14.824681282043457, + "learning_rate": 1.9361249657007212e-05, + "loss": 1.175, + "step": 5173 + }, + { + "epoch": 14.098092643051771, + "grad_norm": 9.480208396911621, + "learning_rate": 1.9360939275850136e-05, + "loss": 0.9825, + "step": 5174 + }, + { + "epoch": 14.100817438692099, + "grad_norm": 10.715375900268555, + "learning_rate": 1.9360628821790365e-05, + "loss": 0.98, + "step": 5175 + }, + { + "epoch": 14.103542234332425, + "grad_norm": 8.420612335205078, + "learning_rate": 1.9360318294830316e-05, + "loss": 1.0737, + "step": 5176 + }, + { + "epoch": 14.106267029972752, + "grad_norm": 55.007171630859375, + "learning_rate": 1.936000769497241e-05, + "loss": 1.03, + "step": 5177 + }, + { + "epoch": 14.10899182561308, + "grad_norm": 10.606861114501953, + "learning_rate": 1.9359697022219065e-05, + "loss": 1.0549, + "step": 5178 + }, + { + "epoch": 14.111716621253406, + "grad_norm": 11.335735321044922, + "learning_rate": 1.93593862765727e-05, + "loss": 0.9281, + "step": 5179 + }, + { + "epoch": 14.114441416893733, + "grad_norm": 9.67910099029541, + "learning_rate": 1.9359075458035737e-05, + "loss": 1.0305, + "step": 5180 + }, + { + "epoch": 14.11716621253406, + "grad_norm": 11.689078330993652, + "learning_rate": 1.9358764566610598e-05, + "loss": 1.166, + "step": 5181 + }, + { + "epoch": 14.119891008174386, + "grad_norm": 9.712400436401367, + "learning_rate": 1.9358453602299697e-05, + "loss": 1.0057, + "step": 5182 + }, + { + "epoch": 14.122615803814714, + "grad_norm": 8.734127044677734, + "learning_rate": 1.9358142565105463e-05, + "loss": 1.1764, + "step": 5183 + }, + { + "epoch": 14.125340599455042, + "grad_norm": 11.82819938659668, + "learning_rate": 1.9357831455030315e-05, + "loss": 1.1128, + "step": 5184 + }, + { + "epoch": 14.128065395095367, + "grad_norm": 9.787619590759277, + "learning_rate": 1.9357520272076676e-05, + "loss": 1.0128, + "step": 5185 + }, + { + "epoch": 14.130790190735695, + "grad_norm": 10.834694862365723, + "learning_rate": 1.9357209016246972e-05, + "loss": 1.0073, + "step": 5186 + }, + { + "epoch": 14.133514986376023, + "grad_norm": 11.580232620239258, + "learning_rate": 1.9356897687543626e-05, + "loss": 1.1733, + "step": 5187 + }, + { + "epoch": 14.136239782016348, + "grad_norm": 10.885783195495605, + "learning_rate": 1.9356586285969062e-05, + "loss": 1.0463, + "step": 5188 + }, + { + "epoch": 14.138964577656676, + "grad_norm": 11.105716705322266, + "learning_rate": 1.9356274811525707e-05, + "loss": 1.0547, + "step": 5189 + }, + { + "epoch": 14.141689373297003, + "grad_norm": 10.251579284667969, + "learning_rate": 1.935596326421598e-05, + "loss": 1.0901, + "step": 5190 + }, + { + "epoch": 14.14441416893733, + "grad_norm": 9.170507431030273, + "learning_rate": 1.9355651644042312e-05, + "loss": 1.2407, + "step": 5191 + }, + { + "epoch": 14.147138964577657, + "grad_norm": 12.432571411132812, + "learning_rate": 1.9355339951007133e-05, + "loss": 1.2239, + "step": 5192 + }, + { + "epoch": 14.149863760217984, + "grad_norm": 9.303281784057617, + "learning_rate": 1.935502818511287e-05, + "loss": 1.1278, + "step": 5193 + }, + { + "epoch": 14.15258855585831, + "grad_norm": 9.055807113647461, + "learning_rate": 1.9354716346361947e-05, + "loss": 0.8248, + "step": 5194 + }, + { + "epoch": 14.155313351498638, + "grad_norm": 9.458588600158691, + "learning_rate": 1.935440443475679e-05, + "loss": 1.0507, + "step": 5195 + }, + { + "epoch": 14.158038147138965, + "grad_norm": 24.18316650390625, + "learning_rate": 1.9354092450299835e-05, + "loss": 1.2896, + "step": 5196 + }, + { + "epoch": 14.160762942779291, + "grad_norm": 8.916409492492676, + "learning_rate": 1.9353780392993512e-05, + "loss": 1.0306, + "step": 5197 + }, + { + "epoch": 14.163487738419619, + "grad_norm": 8.950216293334961, + "learning_rate": 1.9353468262840242e-05, + "loss": 1.0764, + "step": 5198 + }, + { + "epoch": 14.166212534059946, + "grad_norm": 10.580193519592285, + "learning_rate": 1.9353156059842467e-05, + "loss": 1.1387, + "step": 5199 + }, + { + "epoch": 14.168937329700272, + "grad_norm": 10.426873207092285, + "learning_rate": 1.9352843784002613e-05, + "loss": 0.9557, + "step": 5200 + }, + { + "epoch": 14.1716621253406, + "grad_norm": 14.51240348815918, + "learning_rate": 1.9352531435323113e-05, + "loss": 0.9541, + "step": 5201 + }, + { + "epoch": 14.174386920980927, + "grad_norm": 9.402112007141113, + "learning_rate": 1.9352219013806396e-05, + "loss": 1.006, + "step": 5202 + }, + { + "epoch": 14.177111716621253, + "grad_norm": 23.714242935180664, + "learning_rate": 1.93519065194549e-05, + "loss": 1.0583, + "step": 5203 + }, + { + "epoch": 14.17983651226158, + "grad_norm": 10.282632827758789, + "learning_rate": 1.935159395227106e-05, + "loss": 1.0785, + "step": 5204 + }, + { + "epoch": 14.182561307901908, + "grad_norm": 13.316774368286133, + "learning_rate": 1.9351281312257304e-05, + "loss": 1.032, + "step": 5205 + }, + { + "epoch": 14.185286103542234, + "grad_norm": 11.040825843811035, + "learning_rate": 1.9350968599416073e-05, + "loss": 1.3308, + "step": 5206 + }, + { + "epoch": 14.188010899182562, + "grad_norm": 9.174239158630371, + "learning_rate": 1.9350655813749795e-05, + "loss": 1.0178, + "step": 5207 + }, + { + "epoch": 14.190735694822889, + "grad_norm": 10.617894172668457, + "learning_rate": 1.9350342955260913e-05, + "loss": 0.8774, + "step": 5208 + }, + { + "epoch": 14.193460490463215, + "grad_norm": 7.703207015991211, + "learning_rate": 1.935003002395186e-05, + "loss": 1.0482, + "step": 5209 + }, + { + "epoch": 14.196185286103542, + "grad_norm": 9.032089233398438, + "learning_rate": 1.9349717019825076e-05, + "loss": 1.175, + "step": 5210 + }, + { + "epoch": 14.19891008174387, + "grad_norm": 10.903448104858398, + "learning_rate": 1.9349403942882995e-05, + "loss": 1.0756, + "step": 5211 + }, + { + "epoch": 14.201634877384196, + "grad_norm": 10.451948165893555, + "learning_rate": 1.934909079312806e-05, + "loss": 1.1343, + "step": 5212 + }, + { + "epoch": 14.204359673024523, + "grad_norm": 8.245926856994629, + "learning_rate": 1.9348777570562705e-05, + "loss": 1.23, + "step": 5213 + }, + { + "epoch": 14.207084468664851, + "grad_norm": 9.887392044067383, + "learning_rate": 1.934846427518937e-05, + "loss": 1.0542, + "step": 5214 + }, + { + "epoch": 14.209809264305177, + "grad_norm": 10.74023151397705, + "learning_rate": 1.9348150907010495e-05, + "loss": 1.0374, + "step": 5215 + }, + { + "epoch": 14.212534059945504, + "grad_norm": 12.305845260620117, + "learning_rate": 1.9347837466028524e-05, + "loss": 1.178, + "step": 5216 + }, + { + "epoch": 14.215258855585832, + "grad_norm": 9.770783424377441, + "learning_rate": 1.9347523952245898e-05, + "loss": 1.1133, + "step": 5217 + }, + { + "epoch": 14.217983651226158, + "grad_norm": 9.333532333374023, + "learning_rate": 1.9347210365665052e-05, + "loss": 0.9165, + "step": 5218 + }, + { + "epoch": 14.220708446866485, + "grad_norm": 9.938899040222168, + "learning_rate": 1.9346896706288433e-05, + "loss": 1.1858, + "step": 5219 + }, + { + "epoch": 14.223433242506813, + "grad_norm": 10.495904922485352, + "learning_rate": 1.9346582974118484e-05, + "loss": 1.28, + "step": 5220 + }, + { + "epoch": 14.226158038147139, + "grad_norm": 8.536820411682129, + "learning_rate": 1.934626916915765e-05, + "loss": 1.0775, + "step": 5221 + }, + { + "epoch": 14.228882833787466, + "grad_norm": 8.524038314819336, + "learning_rate": 1.9345955291408368e-05, + "loss": 1.0872, + "step": 5222 + }, + { + "epoch": 14.231607629427794, + "grad_norm": 7.942371845245361, + "learning_rate": 1.934564134087309e-05, + "loss": 1.166, + "step": 5223 + }, + { + "epoch": 14.23433242506812, + "grad_norm": 11.302346229553223, + "learning_rate": 1.9345327317554258e-05, + "loss": 0.9764, + "step": 5224 + }, + { + "epoch": 14.237057220708447, + "grad_norm": 7.489410400390625, + "learning_rate": 1.934501322145432e-05, + "loss": 0.9688, + "step": 5225 + }, + { + "epoch": 14.239782016348773, + "grad_norm": 9.616244316101074, + "learning_rate": 1.9344699052575713e-05, + "loss": 1.0598, + "step": 5226 + }, + { + "epoch": 14.2425068119891, + "grad_norm": 7.459101676940918, + "learning_rate": 1.9344384810920894e-05, + "loss": 0.9845, + "step": 5227 + }, + { + "epoch": 14.245231607629428, + "grad_norm": 7.418712139129639, + "learning_rate": 1.9344070496492307e-05, + "loss": 1.0337, + "step": 5228 + }, + { + "epoch": 14.247956403269754, + "grad_norm": 12.477212905883789, + "learning_rate": 1.93437561092924e-05, + "loss": 0.9674, + "step": 5229 + }, + { + "epoch": 14.250681198910081, + "grad_norm": 10.46294116973877, + "learning_rate": 1.9343441649323623e-05, + "loss": 1.1455, + "step": 5230 + }, + { + "epoch": 14.253405994550409, + "grad_norm": 11.074926376342773, + "learning_rate": 1.9343127116588422e-05, + "loss": 1.0607, + "step": 5231 + }, + { + "epoch": 14.256130790190735, + "grad_norm": 12.724575996398926, + "learning_rate": 1.9342812511089245e-05, + "loss": 1.0946, + "step": 5232 + }, + { + "epoch": 14.258855585831062, + "grad_norm": 11.567410469055176, + "learning_rate": 1.9342497832828545e-05, + "loss": 1.2377, + "step": 5233 + }, + { + "epoch": 14.26158038147139, + "grad_norm": 10.05311107635498, + "learning_rate": 1.9342183081808776e-05, + "loss": 0.9814, + "step": 5234 + }, + { + "epoch": 14.264305177111716, + "grad_norm": 12.47072696685791, + "learning_rate": 1.9341868258032383e-05, + "loss": 1.0944, + "step": 5235 + }, + { + "epoch": 14.267029972752043, + "grad_norm": 9.628125190734863, + "learning_rate": 1.9341553361501823e-05, + "loss": 0.9958, + "step": 5236 + }, + { + "epoch": 14.269754768392371, + "grad_norm": 8.3932523727417, + "learning_rate": 1.9341238392219546e-05, + "loss": 0.9589, + "step": 5237 + }, + { + "epoch": 14.272479564032697, + "grad_norm": 14.278056144714355, + "learning_rate": 1.9340923350188004e-05, + "loss": 1.0369, + "step": 5238 + }, + { + "epoch": 14.275204359673024, + "grad_norm": 13.667935371398926, + "learning_rate": 1.934060823540965e-05, + "loss": 1.0345, + "step": 5239 + }, + { + "epoch": 14.277929155313352, + "grad_norm": 9.29685115814209, + "learning_rate": 1.9340293047886943e-05, + "loss": 1.1643, + "step": 5240 + }, + { + "epoch": 14.280653950953678, + "grad_norm": 8.895401000976562, + "learning_rate": 1.9339977787622332e-05, + "loss": 1.0632, + "step": 5241 + }, + { + "epoch": 14.283378746594005, + "grad_norm": 8.890891075134277, + "learning_rate": 1.9339662454618277e-05, + "loss": 1.0703, + "step": 5242 + }, + { + "epoch": 14.286103542234333, + "grad_norm": 8.847053527832031, + "learning_rate": 1.9339347048877228e-05, + "loss": 0.9144, + "step": 5243 + }, + { + "epoch": 14.288828337874659, + "grad_norm": 9.546551704406738, + "learning_rate": 1.9339031570401647e-05, + "loss": 1.175, + "step": 5244 + }, + { + "epoch": 14.291553133514986, + "grad_norm": 10.097752571105957, + "learning_rate": 1.933871601919399e-05, + "loss": 1.637, + "step": 5245 + }, + { + "epoch": 14.294277929155314, + "grad_norm": 10.346940994262695, + "learning_rate": 1.9338400395256708e-05, + "loss": 1.2756, + "step": 5246 + }, + { + "epoch": 14.29700272479564, + "grad_norm": 12.138782501220703, + "learning_rate": 1.9338084698592266e-05, + "loss": 1.1531, + "step": 5247 + }, + { + "epoch": 14.299727520435967, + "grad_norm": 8.375985145568848, + "learning_rate": 1.9337768929203124e-05, + "loss": 0.8945, + "step": 5248 + }, + { + "epoch": 14.302452316076295, + "grad_norm": 13.717570304870605, + "learning_rate": 1.933745308709174e-05, + "loss": 0.981, + "step": 5249 + }, + { + "epoch": 14.30517711171662, + "grad_norm": 8.631799697875977, + "learning_rate": 1.9337137172260568e-05, + "loss": 1.1099, + "step": 5250 + }, + { + "epoch": 14.307901907356948, + "grad_norm": 7.853982448577881, + "learning_rate": 1.933682118471207e-05, + "loss": 1.0149, + "step": 5251 + }, + { + "epoch": 14.310626702997276, + "grad_norm": 10.202895164489746, + "learning_rate": 1.9336505124448714e-05, + "loss": 1.0979, + "step": 5252 + }, + { + "epoch": 14.313351498637601, + "grad_norm": 9.769791603088379, + "learning_rate": 1.9336188991472956e-05, + "loss": 1.1184, + "step": 5253 + }, + { + "epoch": 14.316076294277929, + "grad_norm": 8.059771537780762, + "learning_rate": 1.9335872785787257e-05, + "loss": 1.0947, + "step": 5254 + }, + { + "epoch": 14.318801089918257, + "grad_norm": 68.8738021850586, + "learning_rate": 1.933555650739408e-05, + "loss": 1.2471, + "step": 5255 + }, + { + "epoch": 14.321525885558582, + "grad_norm": 9.558309555053711, + "learning_rate": 1.933524015629589e-05, + "loss": 1.2317, + "step": 5256 + }, + { + "epoch": 14.32425068119891, + "grad_norm": 8.446417808532715, + "learning_rate": 1.9334923732495153e-05, + "loss": 1.1877, + "step": 5257 + }, + { + "epoch": 14.326975476839237, + "grad_norm": 8.942597389221191, + "learning_rate": 1.9334607235994328e-05, + "loss": 1.1284, + "step": 5258 + }, + { + "epoch": 14.329700272479563, + "grad_norm": 9.941106796264648, + "learning_rate": 1.933429066679588e-05, + "loss": 1.0425, + "step": 5259 + }, + { + "epoch": 14.33242506811989, + "grad_norm": 8.345467567443848, + "learning_rate": 1.9333974024902278e-05, + "loss": 1.0031, + "step": 5260 + }, + { + "epoch": 14.335149863760218, + "grad_norm": 8.661430358886719, + "learning_rate": 1.933365731031599e-05, + "loss": 1.1255, + "step": 5261 + }, + { + "epoch": 14.337874659400544, + "grad_norm": 8.243463516235352, + "learning_rate": 1.9333340523039477e-05, + "loss": 1.0671, + "step": 5262 + }, + { + "epoch": 14.340599455040872, + "grad_norm": 9.933423042297363, + "learning_rate": 1.9333023663075208e-05, + "loss": 0.934, + "step": 5263 + }, + { + "epoch": 14.3433242506812, + "grad_norm": 8.510039329528809, + "learning_rate": 1.9332706730425654e-05, + "loss": 1.0812, + "step": 5264 + }, + { + "epoch": 14.346049046321525, + "grad_norm": 9.866889953613281, + "learning_rate": 1.9332389725093276e-05, + "loss": 1.1134, + "step": 5265 + }, + { + "epoch": 14.348773841961853, + "grad_norm": 8.618088722229004, + "learning_rate": 1.9332072647080548e-05, + "loss": 0.9312, + "step": 5266 + }, + { + "epoch": 14.35149863760218, + "grad_norm": 9.735777854919434, + "learning_rate": 1.933175549638994e-05, + "loss": 0.9116, + "step": 5267 + }, + { + "epoch": 14.354223433242506, + "grad_norm": 13.522176742553711, + "learning_rate": 1.933143827302392e-05, + "loss": 0.99, + "step": 5268 + }, + { + "epoch": 14.356948228882834, + "grad_norm": 12.312538146972656, + "learning_rate": 1.9331120976984962e-05, + "loss": 0.9844, + "step": 5269 + }, + { + "epoch": 14.359673024523161, + "grad_norm": 9.45966625213623, + "learning_rate": 1.933080360827553e-05, + "loss": 1.1396, + "step": 5270 + }, + { + "epoch": 14.362397820163487, + "grad_norm": 9.67317008972168, + "learning_rate": 1.93304861668981e-05, + "loss": 1.0793, + "step": 5271 + }, + { + "epoch": 14.365122615803815, + "grad_norm": 11.211816787719727, + "learning_rate": 1.933016865285515e-05, + "loss": 1.2239, + "step": 5272 + }, + { + "epoch": 14.367847411444142, + "grad_norm": 9.201240539550781, + "learning_rate": 1.9329851066149138e-05, + "loss": 1.0579, + "step": 5273 + }, + { + "epoch": 14.370572207084468, + "grad_norm": 12.017439842224121, + "learning_rate": 1.932953340678255e-05, + "loss": 1.2026, + "step": 5274 + }, + { + "epoch": 14.373297002724795, + "grad_norm": 9.993738174438477, + "learning_rate": 1.9329215674757856e-05, + "loss": 0.9805, + "step": 5275 + }, + { + "epoch": 14.376021798365123, + "grad_norm": 8.909194946289062, + "learning_rate": 1.932889787007753e-05, + "loss": 1.0084, + "step": 5276 + }, + { + "epoch": 14.378746594005449, + "grad_norm": 19.06960105895996, + "learning_rate": 1.932857999274405e-05, + "loss": 1.1138, + "step": 5277 + }, + { + "epoch": 14.381471389645776, + "grad_norm": 10.438451766967773, + "learning_rate": 1.932826204275989e-05, + "loss": 1.0244, + "step": 5278 + }, + { + "epoch": 14.384196185286104, + "grad_norm": 11.111006736755371, + "learning_rate": 1.932794402012752e-05, + "loss": 1.0233, + "step": 5279 + }, + { + "epoch": 14.38692098092643, + "grad_norm": 11.95139217376709, + "learning_rate": 1.932762592484943e-05, + "loss": 1.3044, + "step": 5280 + }, + { + "epoch": 14.389645776566757, + "grad_norm": 12.746063232421875, + "learning_rate": 1.9327307756928082e-05, + "loss": 1.1691, + "step": 5281 + }, + { + "epoch": 14.392370572207085, + "grad_norm": 13.35183334350586, + "learning_rate": 1.9326989516365965e-05, + "loss": 1.2515, + "step": 5282 + }, + { + "epoch": 14.39509536784741, + "grad_norm": 7.97482442855835, + "learning_rate": 1.9326671203165555e-05, + "loss": 0.9849, + "step": 5283 + }, + { + "epoch": 14.397820163487738, + "grad_norm": 11.38698673248291, + "learning_rate": 1.9326352817329325e-05, + "loss": 1.2874, + "step": 5284 + }, + { + "epoch": 14.400544959128066, + "grad_norm": 8.816800117492676, + "learning_rate": 1.9326034358859763e-05, + "loss": 1.072, + "step": 5285 + }, + { + "epoch": 14.403269754768392, + "grad_norm": 9.06088638305664, + "learning_rate": 1.9325715827759347e-05, + "loss": 1.157, + "step": 5286 + }, + { + "epoch": 14.40599455040872, + "grad_norm": 12.826264381408691, + "learning_rate": 1.9325397224030556e-05, + "loss": 0.9587, + "step": 5287 + }, + { + "epoch": 14.408719346049047, + "grad_norm": 8.464082717895508, + "learning_rate": 1.932507854767587e-05, + "loss": 1.0815, + "step": 5288 + }, + { + "epoch": 14.411444141689373, + "grad_norm": 11.152374267578125, + "learning_rate": 1.932475979869777e-05, + "loss": 1.0793, + "step": 5289 + }, + { + "epoch": 14.4141689373297, + "grad_norm": 9.872017860412598, + "learning_rate": 1.9324440977098743e-05, + "loss": 1.2461, + "step": 5290 + }, + { + "epoch": 14.416893732970028, + "grad_norm": 8.444131851196289, + "learning_rate": 1.9324122082881273e-05, + "loss": 1.0906, + "step": 5291 + }, + { + "epoch": 14.419618528610354, + "grad_norm": 13.058818817138672, + "learning_rate": 1.9323803116047835e-05, + "loss": 1.0557, + "step": 5292 + }, + { + "epoch": 14.422343324250681, + "grad_norm": 9.907197952270508, + "learning_rate": 1.932348407660092e-05, + "loss": 1.2539, + "step": 5293 + }, + { + "epoch": 14.425068119891009, + "grad_norm": 8.678665161132812, + "learning_rate": 1.932316496454301e-05, + "loss": 0.843, + "step": 5294 + }, + { + "epoch": 14.427792915531334, + "grad_norm": 10.322772026062012, + "learning_rate": 1.9322845779876594e-05, + "loss": 1.1262, + "step": 5295 + }, + { + "epoch": 14.430517711171662, + "grad_norm": 24.07590103149414, + "learning_rate": 1.9322526522604158e-05, + "loss": 1.002, + "step": 5296 + }, + { + "epoch": 14.43324250681199, + "grad_norm": 11.389932632446289, + "learning_rate": 1.932220719272818e-05, + "loss": 1.0343, + "step": 5297 + }, + { + "epoch": 14.435967302452315, + "grad_norm": 9.001762390136719, + "learning_rate": 1.932188779025115e-05, + "loss": 1.0803, + "step": 5298 + }, + { + "epoch": 14.438692098092643, + "grad_norm": 10.911750793457031, + "learning_rate": 1.9321568315175566e-05, + "loss": 1.0684, + "step": 5299 + }, + { + "epoch": 14.44141689373297, + "grad_norm": 9.265901565551758, + "learning_rate": 1.93212487675039e-05, + "loss": 1.0171, + "step": 5300 + }, + { + "epoch": 14.444141689373296, + "grad_norm": 9.530998229980469, + "learning_rate": 1.9320929147238656e-05, + "loss": 0.9602, + "step": 5301 + }, + { + "epoch": 14.446866485013624, + "grad_norm": 10.691299438476562, + "learning_rate": 1.9320609454382314e-05, + "loss": 0.9978, + "step": 5302 + }, + { + "epoch": 14.449591280653951, + "grad_norm": 11.737393379211426, + "learning_rate": 1.932028968893736e-05, + "loss": 1.0564, + "step": 5303 + }, + { + "epoch": 14.452316076294277, + "grad_norm": 13.94564151763916, + "learning_rate": 1.9319969850906293e-05, + "loss": 1.05, + "step": 5304 + }, + { + "epoch": 14.455040871934605, + "grad_norm": 8.74657154083252, + "learning_rate": 1.9319649940291605e-05, + "loss": 1.0525, + "step": 5305 + }, + { + "epoch": 14.457765667574932, + "grad_norm": 10.81070327758789, + "learning_rate": 1.9319329957095777e-05, + "loss": 1.4153, + "step": 5306 + }, + { + "epoch": 14.460490463215258, + "grad_norm": 9.045839309692383, + "learning_rate": 1.9319009901321312e-05, + "loss": 0.9253, + "step": 5307 + }, + { + "epoch": 14.463215258855586, + "grad_norm": 20.913326263427734, + "learning_rate": 1.9318689772970695e-05, + "loss": 1.1169, + "step": 5308 + }, + { + "epoch": 14.465940054495913, + "grad_norm": 10.087102890014648, + "learning_rate": 1.9318369572046425e-05, + "loss": 1.0671, + "step": 5309 + }, + { + "epoch": 14.46866485013624, + "grad_norm": 8.336085319519043, + "learning_rate": 1.931804929855099e-05, + "loss": 1.223, + "step": 5310 + }, + { + "epoch": 14.471389645776567, + "grad_norm": 11.849065780639648, + "learning_rate": 1.931772895248689e-05, + "loss": 1.0393, + "step": 5311 + }, + { + "epoch": 14.474114441416894, + "grad_norm": 8.905378341674805, + "learning_rate": 1.931740853385661e-05, + "loss": 1.0046, + "step": 5312 + }, + { + "epoch": 14.47683923705722, + "grad_norm": 8.513957023620605, + "learning_rate": 1.9317088042662656e-05, + "loss": 1.1963, + "step": 5313 + }, + { + "epoch": 14.479564032697548, + "grad_norm": 9.680682182312012, + "learning_rate": 1.931676747890752e-05, + "loss": 0.9915, + "step": 5314 + }, + { + "epoch": 14.482288828337875, + "grad_norm": 9.793913841247559, + "learning_rate": 1.93164468425937e-05, + "loss": 1.2289, + "step": 5315 + }, + { + "epoch": 14.485013623978201, + "grad_norm": 8.151663780212402, + "learning_rate": 1.9316126133723694e-05, + "loss": 0.994, + "step": 5316 + }, + { + "epoch": 14.487738419618529, + "grad_norm": 8.099178314208984, + "learning_rate": 1.9315805352299996e-05, + "loss": 0.8774, + "step": 5317 + }, + { + "epoch": 14.490463215258856, + "grad_norm": 14.407559394836426, + "learning_rate": 1.9315484498325103e-05, + "loss": 1.0383, + "step": 5318 + }, + { + "epoch": 14.493188010899182, + "grad_norm": 11.349617004394531, + "learning_rate": 1.9315163571801517e-05, + "loss": 1.0759, + "step": 5319 + }, + { + "epoch": 14.49591280653951, + "grad_norm": 38.68876647949219, + "learning_rate": 1.9314842572731737e-05, + "loss": 1.156, + "step": 5320 + }, + { + "epoch": 14.498637602179837, + "grad_norm": 8.868889808654785, + "learning_rate": 1.9314521501118265e-05, + "loss": 1.0035, + "step": 5321 + }, + { + "epoch": 14.501362397820163, + "grad_norm": 8.173551559448242, + "learning_rate": 1.93142003569636e-05, + "loss": 1.1855, + "step": 5322 + }, + { + "epoch": 14.50408719346049, + "grad_norm": 8.55869197845459, + "learning_rate": 1.931387914027024e-05, + "loss": 1.0449, + "step": 5323 + }, + { + "epoch": 14.506811989100818, + "grad_norm": 12.509915351867676, + "learning_rate": 1.931355785104069e-05, + "loss": 1.0078, + "step": 5324 + }, + { + "epoch": 14.509536784741144, + "grad_norm": 10.232088088989258, + "learning_rate": 1.931323648927745e-05, + "loss": 1.0969, + "step": 5325 + }, + { + "epoch": 14.512261580381471, + "grad_norm": 10.29968547821045, + "learning_rate": 1.9312915054983023e-05, + "loss": 1.1525, + "step": 5326 + }, + { + "epoch": 14.514986376021799, + "grad_norm": 44.228973388671875, + "learning_rate": 1.9312593548159916e-05, + "loss": 1.2103, + "step": 5327 + }, + { + "epoch": 14.517711171662125, + "grad_norm": 20.510353088378906, + "learning_rate": 1.931227196881063e-05, + "loss": 1.0187, + "step": 5328 + }, + { + "epoch": 14.520435967302452, + "grad_norm": 12.056849479675293, + "learning_rate": 1.9311950316937666e-05, + "loss": 0.8915, + "step": 5329 + }, + { + "epoch": 14.52316076294278, + "grad_norm": 12.606382369995117, + "learning_rate": 1.9311628592543538e-05, + "loss": 1.1522, + "step": 5330 + }, + { + "epoch": 14.525885558583106, + "grad_norm": 14.394980430603027, + "learning_rate": 1.9311306795630745e-05, + "loss": 1.1936, + "step": 5331 + }, + { + "epoch": 14.528610354223433, + "grad_norm": 11.048859596252441, + "learning_rate": 1.931098492620179e-05, + "loss": 1.037, + "step": 5332 + }, + { + "epoch": 14.53133514986376, + "grad_norm": 14.999587059020996, + "learning_rate": 1.9310662984259187e-05, + "loss": 1.1234, + "step": 5333 + }, + { + "epoch": 14.534059945504087, + "grad_norm": 10.57614517211914, + "learning_rate": 1.931034096980544e-05, + "loss": 0.8899, + "step": 5334 + }, + { + "epoch": 14.536784741144414, + "grad_norm": 10.451554298400879, + "learning_rate": 1.931001888284306e-05, + "loss": 0.8661, + "step": 5335 + }, + { + "epoch": 14.539509536784742, + "grad_norm": 12.769274711608887, + "learning_rate": 1.9309696723374548e-05, + "loss": 1.1665, + "step": 5336 + }, + { + "epoch": 14.542234332425068, + "grad_norm": 13.212369918823242, + "learning_rate": 1.930937449140242e-05, + "loss": 1.1079, + "step": 5337 + }, + { + "epoch": 14.544959128065395, + "grad_norm": 16.784992218017578, + "learning_rate": 1.9309052186929184e-05, + "loss": 1.1338, + "step": 5338 + }, + { + "epoch": 14.547683923705723, + "grad_norm": 10.934957504272461, + "learning_rate": 1.930872980995735e-05, + "loss": 1.0775, + "step": 5339 + }, + { + "epoch": 14.550408719346049, + "grad_norm": 108.7918701171875, + "learning_rate": 1.930840736048942e-05, + "loss": 0.9453, + "step": 5340 + }, + { + "epoch": 14.553133514986376, + "grad_norm": 10.363018989562988, + "learning_rate": 1.9308084838527922e-05, + "loss": 1.1213, + "step": 5341 + }, + { + "epoch": 14.555858310626704, + "grad_norm": 10.330005645751953, + "learning_rate": 1.9307762244075357e-05, + "loss": 1.2231, + "step": 5342 + }, + { + "epoch": 14.55858310626703, + "grad_norm": 12.0515718460083, + "learning_rate": 1.9307439577134238e-05, + "loss": 1.2269, + "step": 5343 + }, + { + "epoch": 14.561307901907357, + "grad_norm": 9.661890983581543, + "learning_rate": 1.9307116837707078e-05, + "loss": 1.3032, + "step": 5344 + }, + { + "epoch": 14.564032697547685, + "grad_norm": 10.54574966430664, + "learning_rate": 1.9306794025796395e-05, + "loss": 1.1172, + "step": 5345 + }, + { + "epoch": 14.56675749318801, + "grad_norm": 8.823716163635254, + "learning_rate": 1.9306471141404696e-05, + "loss": 1.0186, + "step": 5346 + }, + { + "epoch": 14.569482288828338, + "grad_norm": 9.0007905960083, + "learning_rate": 1.93061481845345e-05, + "loss": 1.1873, + "step": 5347 + }, + { + "epoch": 14.572207084468666, + "grad_norm": 11.603144645690918, + "learning_rate": 1.9305825155188324e-05, + "loss": 1.1558, + "step": 5348 + }, + { + "epoch": 14.574931880108991, + "grad_norm": 11.087784767150879, + "learning_rate": 1.930550205336868e-05, + "loss": 1.1632, + "step": 5349 + }, + { + "epoch": 14.577656675749319, + "grad_norm": 11.974077224731445, + "learning_rate": 1.9305178879078083e-05, + "loss": 1.1041, + "step": 5350 + }, + { + "epoch": 14.580381471389646, + "grad_norm": 10.979742050170898, + "learning_rate": 1.9304855632319052e-05, + "loss": 1.1948, + "step": 5351 + }, + { + "epoch": 14.583106267029972, + "grad_norm": 9.695462226867676, + "learning_rate": 1.930453231309411e-05, + "loss": 1.0532, + "step": 5352 + }, + { + "epoch": 14.5858310626703, + "grad_norm": 16.92827606201172, + "learning_rate": 1.9304208921405766e-05, + "loss": 1.0894, + "step": 5353 + }, + { + "epoch": 14.588555858310627, + "grad_norm": 8.352365493774414, + "learning_rate": 1.9303885457256543e-05, + "loss": 0.8616, + "step": 5354 + }, + { + "epoch": 14.591280653950953, + "grad_norm": 14.493141174316406, + "learning_rate": 1.930356192064896e-05, + "loss": 1.083, + "step": 5355 + }, + { + "epoch": 14.59400544959128, + "grad_norm": 10.147053718566895, + "learning_rate": 1.9303238311585534e-05, + "loss": 1.1628, + "step": 5356 + }, + { + "epoch": 14.596730245231608, + "grad_norm": 10.885664939880371, + "learning_rate": 1.930291463006879e-05, + "loss": 1.1016, + "step": 5357 + }, + { + "epoch": 14.599455040871934, + "grad_norm": 13.00692081451416, + "learning_rate": 1.9302590876101248e-05, + "loss": 1.1027, + "step": 5358 + }, + { + "epoch": 14.602179836512262, + "grad_norm": 9.570802688598633, + "learning_rate": 1.9302267049685424e-05, + "loss": 1.0396, + "step": 5359 + }, + { + "epoch": 14.60490463215259, + "grad_norm": 12.471563339233398, + "learning_rate": 1.9301943150823845e-05, + "loss": 1.1912, + "step": 5360 + }, + { + "epoch": 14.607629427792915, + "grad_norm": 12.29695987701416, + "learning_rate": 1.930161917951903e-05, + "loss": 1.1016, + "step": 5361 + }, + { + "epoch": 14.610354223433243, + "grad_norm": 18.859411239624023, + "learning_rate": 1.9301295135773507e-05, + "loss": 1.21, + "step": 5362 + }, + { + "epoch": 14.61307901907357, + "grad_norm": 9.199820518493652, + "learning_rate": 1.9300971019589796e-05, + "loss": 1.0422, + "step": 5363 + }, + { + "epoch": 14.615803814713896, + "grad_norm": 15.703910827636719, + "learning_rate": 1.9300646830970423e-05, + "loss": 1.1895, + "step": 5364 + }, + { + "epoch": 14.618528610354224, + "grad_norm": 13.497588157653809, + "learning_rate": 1.930032256991791e-05, + "loss": 1.4207, + "step": 5365 + }, + { + "epoch": 14.621253405994551, + "grad_norm": 21.071622848510742, + "learning_rate": 1.9299998236434786e-05, + "loss": 1.1438, + "step": 5366 + }, + { + "epoch": 14.623978201634877, + "grad_norm": 11.96397876739502, + "learning_rate": 1.9299673830523574e-05, + "loss": 1.1494, + "step": 5367 + }, + { + "epoch": 14.626702997275205, + "grad_norm": 7.910435199737549, + "learning_rate": 1.9299349352186803e-05, + "loss": 1.3066, + "step": 5368 + }, + { + "epoch": 14.629427792915532, + "grad_norm": 11.785028457641602, + "learning_rate": 1.9299024801426994e-05, + "loss": 1.24, + "step": 5369 + }, + { + "epoch": 14.632152588555858, + "grad_norm": 13.936634063720703, + "learning_rate": 1.9298700178246685e-05, + "loss": 1.0817, + "step": 5370 + }, + { + "epoch": 14.634877384196185, + "grad_norm": 13.785355567932129, + "learning_rate": 1.9298375482648396e-05, + "loss": 1.0967, + "step": 5371 + }, + { + "epoch": 14.637602179836513, + "grad_norm": 14.386396408081055, + "learning_rate": 1.9298050714634654e-05, + "loss": 1.1433, + "step": 5372 + }, + { + "epoch": 14.640326975476839, + "grad_norm": 9.83299446105957, + "learning_rate": 1.9297725874208e-05, + "loss": 1.1227, + "step": 5373 + }, + { + "epoch": 14.643051771117166, + "grad_norm": 10.26580810546875, + "learning_rate": 1.9297400961370953e-05, + "loss": 1.0359, + "step": 5374 + }, + { + "epoch": 14.645776566757494, + "grad_norm": 8.300336837768555, + "learning_rate": 1.9297075976126044e-05, + "loss": 1.0693, + "step": 5375 + }, + { + "epoch": 14.64850136239782, + "grad_norm": 15.77609634399414, + "learning_rate": 1.9296750918475807e-05, + "loss": 1.1682, + "step": 5376 + }, + { + "epoch": 14.651226158038147, + "grad_norm": 13.076919555664062, + "learning_rate": 1.9296425788422776e-05, + "loss": 1.0071, + "step": 5377 + }, + { + "epoch": 14.653950953678475, + "grad_norm": 9.423595428466797, + "learning_rate": 1.9296100585969478e-05, + "loss": 0.8604, + "step": 5378 + }, + { + "epoch": 14.6566757493188, + "grad_norm": 11.712821006774902, + "learning_rate": 1.9295775311118445e-05, + "loss": 1.2681, + "step": 5379 + }, + { + "epoch": 14.659400544959128, + "grad_norm": 13.311676025390625, + "learning_rate": 1.9295449963872217e-05, + "loss": 1.0983, + "step": 5380 + }, + { + "epoch": 14.662125340599456, + "grad_norm": 11.761080741882324, + "learning_rate": 1.9295124544233322e-05, + "loss": 1.1125, + "step": 5381 + }, + { + "epoch": 14.664850136239782, + "grad_norm": 9.576361656188965, + "learning_rate": 1.92947990522043e-05, + "loss": 1.0984, + "step": 5382 + }, + { + "epoch": 14.66757493188011, + "grad_norm": 38.030128479003906, + "learning_rate": 1.929447348778768e-05, + "loss": 1.2019, + "step": 5383 + }, + { + "epoch": 14.670299727520437, + "grad_norm": 11.681124687194824, + "learning_rate": 1.9294147850985997e-05, + "loss": 0.9224, + "step": 5384 + }, + { + "epoch": 14.673024523160763, + "grad_norm": 11.757031440734863, + "learning_rate": 1.929382214180179e-05, + "loss": 0.9999, + "step": 5385 + }, + { + "epoch": 14.67574931880109, + "grad_norm": 16.173267364501953, + "learning_rate": 1.92934963602376e-05, + "loss": 1.1206, + "step": 5386 + }, + { + "epoch": 14.678474114441418, + "grad_norm": 10.76258659362793, + "learning_rate": 1.9293170506295955e-05, + "loss": 1.177, + "step": 5387 + }, + { + "epoch": 14.681198910081743, + "grad_norm": 12.828961372375488, + "learning_rate": 1.92928445799794e-05, + "loss": 1.079, + "step": 5388 + }, + { + "epoch": 14.683923705722071, + "grad_norm": 12.985787391662598, + "learning_rate": 1.929251858129047e-05, + "loss": 1.1857, + "step": 5389 + }, + { + "epoch": 14.686648501362399, + "grad_norm": 11.821076393127441, + "learning_rate": 1.92921925102317e-05, + "loss": 1.2253, + "step": 5390 + }, + { + "epoch": 14.689373297002724, + "grad_norm": 9.981273651123047, + "learning_rate": 1.929186636680564e-05, + "loss": 1.1775, + "step": 5391 + }, + { + "epoch": 14.692098092643052, + "grad_norm": 8.71783447265625, + "learning_rate": 1.929154015101482e-05, + "loss": 1.1611, + "step": 5392 + }, + { + "epoch": 14.69482288828338, + "grad_norm": 11.263312339782715, + "learning_rate": 1.9291213862861785e-05, + "loss": 1.094, + "step": 5393 + }, + { + "epoch": 14.697547683923705, + "grad_norm": 13.133688926696777, + "learning_rate": 1.9290887502349078e-05, + "loss": 1.167, + "step": 5394 + }, + { + "epoch": 14.700272479564033, + "grad_norm": 9.394452095031738, + "learning_rate": 1.9290561069479237e-05, + "loss": 1.0637, + "step": 5395 + }, + { + "epoch": 14.70299727520436, + "grad_norm": 13.00540542602539, + "learning_rate": 1.9290234564254803e-05, + "loss": 1.1196, + "step": 5396 + }, + { + "epoch": 14.705722070844686, + "grad_norm": 9.813802719116211, + "learning_rate": 1.928990798667832e-05, + "loss": 1.1252, + "step": 5397 + }, + { + "epoch": 14.708446866485014, + "grad_norm": 11.41059398651123, + "learning_rate": 1.9289581336752338e-05, + "loss": 1.0109, + "step": 5398 + }, + { + "epoch": 14.711171662125341, + "grad_norm": 9.798429489135742, + "learning_rate": 1.928925461447939e-05, + "loss": 1.1284, + "step": 5399 + }, + { + "epoch": 14.713896457765667, + "grad_norm": 8.876011848449707, + "learning_rate": 1.9288927819862033e-05, + "loss": 1.1147, + "step": 5400 + }, + { + "epoch": 14.716621253405995, + "grad_norm": 9.106521606445312, + "learning_rate": 1.92886009529028e-05, + "loss": 1.0334, + "step": 5401 + }, + { + "epoch": 14.719346049046322, + "grad_norm": 9.955561637878418, + "learning_rate": 1.9288274013604242e-05, + "loss": 1.1182, + "step": 5402 + }, + { + "epoch": 14.722070844686648, + "grad_norm": 9.079973220825195, + "learning_rate": 1.928794700196891e-05, + "loss": 1.1797, + "step": 5403 + }, + { + "epoch": 14.724795640326976, + "grad_norm": 12.39723014831543, + "learning_rate": 1.9287619917999336e-05, + "loss": 1.1438, + "step": 5404 + }, + { + "epoch": 14.727520435967303, + "grad_norm": 10.512011528015137, + "learning_rate": 1.9287292761698083e-05, + "loss": 1.0942, + "step": 5405 + }, + { + "epoch": 14.730245231607629, + "grad_norm": 12.560011863708496, + "learning_rate": 1.9286965533067694e-05, + "loss": 1.0437, + "step": 5406 + }, + { + "epoch": 14.732970027247957, + "grad_norm": 9.511140823364258, + "learning_rate": 1.9286638232110714e-05, + "loss": 1.1846, + "step": 5407 + }, + { + "epoch": 14.735694822888284, + "grad_norm": 10.107234001159668, + "learning_rate": 1.9286310858829696e-05, + "loss": 1.2512, + "step": 5408 + }, + { + "epoch": 14.73841961852861, + "grad_norm": 10.85128402709961, + "learning_rate": 1.9285983413227186e-05, + "loss": 0.8578, + "step": 5409 + }, + { + "epoch": 14.741144414168938, + "grad_norm": 11.938522338867188, + "learning_rate": 1.928565589530574e-05, + "loss": 1.0198, + "step": 5410 + }, + { + "epoch": 14.743869209809265, + "grad_norm": 11.250466346740723, + "learning_rate": 1.9285328305067898e-05, + "loss": 1.2422, + "step": 5411 + }, + { + "epoch": 14.746594005449591, + "grad_norm": 9.212725639343262, + "learning_rate": 1.928500064251622e-05, + "loss": 1.2889, + "step": 5412 + }, + { + "epoch": 14.749318801089919, + "grad_norm": 7.821893692016602, + "learning_rate": 1.9284672907653258e-05, + "loss": 1.0786, + "step": 5413 + }, + { + "epoch": 14.752043596730246, + "grad_norm": 9.918364524841309, + "learning_rate": 1.928434510048156e-05, + "loss": 1.1282, + "step": 5414 + }, + { + "epoch": 14.754768392370572, + "grad_norm": 9.928297996520996, + "learning_rate": 1.9284017221003686e-05, + "loss": 1.1211, + "step": 5415 + }, + { + "epoch": 14.7574931880109, + "grad_norm": 8.590800285339355, + "learning_rate": 1.928368926922218e-05, + "loss": 1.1864, + "step": 5416 + }, + { + "epoch": 14.760217983651227, + "grad_norm": 8.307841300964355, + "learning_rate": 1.92833612451396e-05, + "loss": 0.9934, + "step": 5417 + }, + { + "epoch": 14.762942779291553, + "grad_norm": 8.209846496582031, + "learning_rate": 1.9283033148758506e-05, + "loss": 1.0151, + "step": 5418 + }, + { + "epoch": 14.76566757493188, + "grad_norm": 9.439775466918945, + "learning_rate": 1.9282704980081446e-05, + "loss": 1.1469, + "step": 5419 + }, + { + "epoch": 14.768392370572208, + "grad_norm": 9.905940055847168, + "learning_rate": 1.928237673911098e-05, + "loss": 1.1277, + "step": 5420 + }, + { + "epoch": 14.771117166212534, + "grad_norm": 10.38306999206543, + "learning_rate": 1.928204842584966e-05, + "loss": 1.0771, + "step": 5421 + }, + { + "epoch": 14.773841961852861, + "grad_norm": 10.64194393157959, + "learning_rate": 1.928172004030005e-05, + "loss": 1.1511, + "step": 5422 + }, + { + "epoch": 14.776566757493189, + "grad_norm": 9.811735153198242, + "learning_rate": 1.9281391582464697e-05, + "loss": 1.2218, + "step": 5423 + }, + { + "epoch": 14.779291553133515, + "grad_norm": 10.465387344360352, + "learning_rate": 1.9281063052346168e-05, + "loss": 0.9645, + "step": 5424 + }, + { + "epoch": 14.782016348773842, + "grad_norm": 9.601802825927734, + "learning_rate": 1.928073444994702e-05, + "loss": 1.1152, + "step": 5425 + }, + { + "epoch": 14.78474114441417, + "grad_norm": 8.191433906555176, + "learning_rate": 1.928040577526981e-05, + "loss": 1.0205, + "step": 5426 + }, + { + "epoch": 14.787465940054496, + "grad_norm": 8.16183090209961, + "learning_rate": 1.9280077028317096e-05, + "loss": 1.1672, + "step": 5427 + }, + { + "epoch": 14.790190735694823, + "grad_norm": 13.249311447143555, + "learning_rate": 1.927974820909144e-05, + "loss": 1.1494, + "step": 5428 + }, + { + "epoch": 14.79291553133515, + "grad_norm": 7.822423458099365, + "learning_rate": 1.927941931759541e-05, + "loss": 1.1196, + "step": 5429 + }, + { + "epoch": 14.795640326975477, + "grad_norm": 7.371486186981201, + "learning_rate": 1.9279090353831557e-05, + "loss": 0.9851, + "step": 5430 + }, + { + "epoch": 14.798365122615804, + "grad_norm": 9.159686088562012, + "learning_rate": 1.9278761317802448e-05, + "loss": 1.1333, + "step": 5431 + }, + { + "epoch": 14.80108991825613, + "grad_norm": 14.047561645507812, + "learning_rate": 1.9278432209510644e-05, + "loss": 1.1741, + "step": 5432 + }, + { + "epoch": 14.803814713896458, + "grad_norm": 12.84555435180664, + "learning_rate": 1.9278103028958707e-05, + "loss": 1.0486, + "step": 5433 + }, + { + "epoch": 14.806539509536785, + "grad_norm": 8.609007835388184, + "learning_rate": 1.9277773776149208e-05, + "loss": 1.0444, + "step": 5434 + }, + { + "epoch": 14.809264305177111, + "grad_norm": 8.697768211364746, + "learning_rate": 1.92774444510847e-05, + "loss": 1.1321, + "step": 5435 + }, + { + "epoch": 14.811989100817438, + "grad_norm": 7.1575798988342285, + "learning_rate": 1.927711505376775e-05, + "loss": 1.1589, + "step": 5436 + }, + { + "epoch": 14.814713896457766, + "grad_norm": 32.84316635131836, + "learning_rate": 1.9276785584200935e-05, + "loss": 1.0726, + "step": 5437 + }, + { + "epoch": 14.817438692098092, + "grad_norm": 9.116987228393555, + "learning_rate": 1.9276456042386806e-05, + "loss": 1.0488, + "step": 5438 + }, + { + "epoch": 14.82016348773842, + "grad_norm": 8.860197067260742, + "learning_rate": 1.927612642832794e-05, + "loss": 1.098, + "step": 5439 + }, + { + "epoch": 14.822888283378747, + "grad_norm": 9.601526260375977, + "learning_rate": 1.9275796742026898e-05, + "loss": 1.1243, + "step": 5440 + }, + { + "epoch": 14.825613079019073, + "grad_norm": 11.47438907623291, + "learning_rate": 1.9275466983486247e-05, + "loss": 1.1287, + "step": 5441 + }, + { + "epoch": 14.8283378746594, + "grad_norm": 8.937363624572754, + "learning_rate": 1.9275137152708564e-05, + "loss": 0.9294, + "step": 5442 + }, + { + "epoch": 14.831062670299728, + "grad_norm": 9.600807189941406, + "learning_rate": 1.9274807249696405e-05, + "loss": 1.077, + "step": 5443 + }, + { + "epoch": 14.833787465940054, + "grad_norm": 8.64490795135498, + "learning_rate": 1.927447727445235e-05, + "loss": 0.9917, + "step": 5444 + }, + { + "epoch": 14.836512261580381, + "grad_norm": 9.722396850585938, + "learning_rate": 1.9274147226978962e-05, + "loss": 0.9272, + "step": 5445 + }, + { + "epoch": 14.839237057220709, + "grad_norm": 9.325379371643066, + "learning_rate": 1.9273817107278815e-05, + "loss": 1.0829, + "step": 5446 + }, + { + "epoch": 14.841961852861035, + "grad_norm": 9.744324684143066, + "learning_rate": 1.927348691535448e-05, + "loss": 1.0204, + "step": 5447 + }, + { + "epoch": 14.844686648501362, + "grad_norm": 10.210845947265625, + "learning_rate": 1.9273156651208525e-05, + "loss": 1.2598, + "step": 5448 + }, + { + "epoch": 14.84741144414169, + "grad_norm": 8.943734169006348, + "learning_rate": 1.9272826314843526e-05, + "loss": 1.0222, + "step": 5449 + }, + { + "epoch": 14.850136239782016, + "grad_norm": 7.680088520050049, + "learning_rate": 1.9272495906262053e-05, + "loss": 0.9257, + "step": 5450 + }, + { + "epoch": 14.852861035422343, + "grad_norm": 11.96497631072998, + "learning_rate": 1.927216542546668e-05, + "loss": 1.1292, + "step": 5451 + }, + { + "epoch": 14.85558583106267, + "grad_norm": 7.999666213989258, + "learning_rate": 1.9271834872459982e-05, + "loss": 1.0208, + "step": 5452 + }, + { + "epoch": 14.858310626702997, + "grad_norm": 10.969223976135254, + "learning_rate": 1.9271504247244534e-05, + "loss": 1.1418, + "step": 5453 + }, + { + "epoch": 14.861035422343324, + "grad_norm": 10.95656967163086, + "learning_rate": 1.927117354982291e-05, + "loss": 1.1616, + "step": 5454 + }, + { + "epoch": 14.863760217983652, + "grad_norm": 11.002049446105957, + "learning_rate": 1.927084278019768e-05, + "loss": 1.04, + "step": 5455 + }, + { + "epoch": 14.866485013623977, + "grad_norm": 9.948211669921875, + "learning_rate": 1.9270511938371425e-05, + "loss": 1.1589, + "step": 5456 + }, + { + "epoch": 14.869209809264305, + "grad_norm": 7.003767967224121, + "learning_rate": 1.9270181024346727e-05, + "loss": 1.054, + "step": 5457 + }, + { + "epoch": 14.871934604904633, + "grad_norm": 9.24045181274414, + "learning_rate": 1.9269850038126152e-05, + "loss": 0.9512, + "step": 5458 + }, + { + "epoch": 14.874659400544958, + "grad_norm": 9.06789493560791, + "learning_rate": 1.9269518979712285e-05, + "loss": 1.1877, + "step": 5459 + }, + { + "epoch": 14.877384196185286, + "grad_norm": 10.27806282043457, + "learning_rate": 1.9269187849107703e-05, + "loss": 1.1566, + "step": 5460 + }, + { + "epoch": 14.880108991825614, + "grad_norm": 8.048421859741211, + "learning_rate": 1.9268856646314983e-05, + "loss": 1.1638, + "step": 5461 + }, + { + "epoch": 14.88283378746594, + "grad_norm": 11.141575813293457, + "learning_rate": 1.926852537133671e-05, + "loss": 1.2466, + "step": 5462 + }, + { + "epoch": 14.885558583106267, + "grad_norm": 8.194379806518555, + "learning_rate": 1.926819402417546e-05, + "loss": 1.1511, + "step": 5463 + }, + { + "epoch": 14.888283378746594, + "grad_norm": 8.322203636169434, + "learning_rate": 1.9267862604833808e-05, + "loss": 1.0703, + "step": 5464 + }, + { + "epoch": 14.89100817438692, + "grad_norm": 8.79293155670166, + "learning_rate": 1.9267531113314343e-05, + "loss": 1.2595, + "step": 5465 + }, + { + "epoch": 14.893732970027248, + "grad_norm": 12.21040153503418, + "learning_rate": 1.9267199549619643e-05, + "loss": 1.0713, + "step": 5466 + }, + { + "epoch": 14.896457765667575, + "grad_norm": 13.462485313415527, + "learning_rate": 1.926686791375229e-05, + "loss": 1.0867, + "step": 5467 + }, + { + "epoch": 14.899182561307901, + "grad_norm": 8.758882522583008, + "learning_rate": 1.926653620571487e-05, + "loss": 1.1934, + "step": 5468 + }, + { + "epoch": 14.901907356948229, + "grad_norm": 8.370561599731445, + "learning_rate": 1.9266204425509962e-05, + "loss": 1.1484, + "step": 5469 + }, + { + "epoch": 14.904632152588556, + "grad_norm": 9.9232816696167, + "learning_rate": 1.9265872573140156e-05, + "loss": 1.0056, + "step": 5470 + }, + { + "epoch": 14.907356948228882, + "grad_norm": 9.87440013885498, + "learning_rate": 1.926554064860803e-05, + "loss": 1.1371, + "step": 5471 + }, + { + "epoch": 14.91008174386921, + "grad_norm": 9.33785343170166, + "learning_rate": 1.9265208651916172e-05, + "loss": 1.063, + "step": 5472 + }, + { + "epoch": 14.912806539509537, + "grad_norm": 16.72821044921875, + "learning_rate": 1.9264876583067167e-05, + "loss": 1.2517, + "step": 5473 + }, + { + "epoch": 14.915531335149863, + "grad_norm": 9.422157287597656, + "learning_rate": 1.92645444420636e-05, + "loss": 1.1331, + "step": 5474 + }, + { + "epoch": 14.91825613079019, + "grad_norm": 8.592704772949219, + "learning_rate": 1.9264212228908063e-05, + "loss": 1.0295, + "step": 5475 + }, + { + "epoch": 14.920980926430518, + "grad_norm": 8.709903717041016, + "learning_rate": 1.9263879943603136e-05, + "loss": 1.0198, + "step": 5476 + }, + { + "epoch": 14.923705722070844, + "grad_norm": 8.811495780944824, + "learning_rate": 1.9263547586151412e-05, + "loss": 0.9832, + "step": 5477 + }, + { + "epoch": 14.926430517711172, + "grad_norm": 10.670900344848633, + "learning_rate": 1.9263215156555477e-05, + "loss": 1.1501, + "step": 5478 + }, + { + "epoch": 14.9291553133515, + "grad_norm": 9.27827262878418, + "learning_rate": 1.9262882654817918e-05, + "loss": 1.157, + "step": 5479 + }, + { + "epoch": 14.931880108991825, + "grad_norm": 11.302102088928223, + "learning_rate": 1.926255008094133e-05, + "loss": 1.0518, + "step": 5480 + }, + { + "epoch": 14.934604904632153, + "grad_norm": 7.121042728424072, + "learning_rate": 1.92622174349283e-05, + "loss": 0.9431, + "step": 5481 + }, + { + "epoch": 14.93732970027248, + "grad_norm": 9.873361587524414, + "learning_rate": 1.9261884716781417e-05, + "loss": 1.1199, + "step": 5482 + }, + { + "epoch": 14.940054495912806, + "grad_norm": 10.81009578704834, + "learning_rate": 1.9261551926503277e-05, + "loss": 1.1157, + "step": 5483 + }, + { + "epoch": 14.942779291553133, + "grad_norm": 10.118577003479004, + "learning_rate": 1.9261219064096467e-05, + "loss": 1.0876, + "step": 5484 + }, + { + "epoch": 14.945504087193461, + "grad_norm": 9.304665565490723, + "learning_rate": 1.926088612956358e-05, + "loss": 1.1548, + "step": 5485 + }, + { + "epoch": 14.948228882833787, + "grad_norm": 8.310667991638184, + "learning_rate": 1.926055312290721e-05, + "loss": 1.0819, + "step": 5486 + }, + { + "epoch": 14.950953678474114, + "grad_norm": 10.15754508972168, + "learning_rate": 1.9260220044129953e-05, + "loss": 0.9282, + "step": 5487 + }, + { + "epoch": 14.953678474114442, + "grad_norm": 10.331604957580566, + "learning_rate": 1.9259886893234397e-05, + "loss": 1.1792, + "step": 5488 + }, + { + "epoch": 14.956403269754768, + "grad_norm": 10.211618423461914, + "learning_rate": 1.925955367022314e-05, + "loss": 1.0898, + "step": 5489 + }, + { + "epoch": 14.959128065395095, + "grad_norm": 11.046704292297363, + "learning_rate": 1.925922037509878e-05, + "loss": 1.0498, + "step": 5490 + }, + { + "epoch": 14.961852861035423, + "grad_norm": 13.784923553466797, + "learning_rate": 1.925888700786391e-05, + "loss": 0.9541, + "step": 5491 + }, + { + "epoch": 14.964577656675749, + "grad_norm": 14.446078300476074, + "learning_rate": 1.925855356852112e-05, + "loss": 1.0426, + "step": 5492 + }, + { + "epoch": 14.967302452316076, + "grad_norm": 13.812178611755371, + "learning_rate": 1.925822005707302e-05, + "loss": 1.2158, + "step": 5493 + }, + { + "epoch": 14.970027247956404, + "grad_norm": 9.299683570861816, + "learning_rate": 1.9257886473522194e-05, + "loss": 1.2102, + "step": 5494 + }, + { + "epoch": 14.97275204359673, + "grad_norm": 11.779254913330078, + "learning_rate": 1.925755281787125e-05, + "loss": 1.1792, + "step": 5495 + }, + { + "epoch": 14.975476839237057, + "grad_norm": 15.099937438964844, + "learning_rate": 1.9257219090122782e-05, + "loss": 1.0396, + "step": 5496 + }, + { + "epoch": 14.978201634877385, + "grad_norm": 21.414133071899414, + "learning_rate": 1.925688529027939e-05, + "loss": 1.3333, + "step": 5497 + }, + { + "epoch": 14.98092643051771, + "grad_norm": 12.682548522949219, + "learning_rate": 1.925655141834367e-05, + "loss": 1.3135, + "step": 5498 + }, + { + "epoch": 14.983651226158038, + "grad_norm": 9.636043548583984, + "learning_rate": 1.9256217474318227e-05, + "loss": 1.1958, + "step": 5499 + }, + { + "epoch": 14.986376021798366, + "grad_norm": 9.636250495910645, + "learning_rate": 1.9255883458205664e-05, + "loss": 0.9243, + "step": 5500 + }, + { + "epoch": 14.989100817438691, + "grad_norm": 17.597333908081055, + "learning_rate": 1.9255549370008575e-05, + "loss": 1.0493, + "step": 5501 + }, + { + "epoch": 14.991825613079019, + "grad_norm": 8.619144439697266, + "learning_rate": 1.925521520972957e-05, + "loss": 1.1733, + "step": 5502 + }, + { + "epoch": 14.994550408719347, + "grad_norm": 10.077827453613281, + "learning_rate": 1.925488097737124e-05, + "loss": 1.0237, + "step": 5503 + }, + { + "epoch": 14.997275204359672, + "grad_norm": 8.45253849029541, + "learning_rate": 1.92545466729362e-05, + "loss": 1.1523, + "step": 5504 + }, + { + "epoch": 15.0, + "grad_norm": 9.242919921875, + "learning_rate": 1.9254212296427043e-05, + "loss": 1.1511, + "step": 5505 + }, + { + "epoch": 15.002724795640328, + "grad_norm": 9.065591812133789, + "learning_rate": 1.925387784784638e-05, + "loss": 0.8765, + "step": 5506 + }, + { + "epoch": 15.005449591280653, + "grad_norm": 9.483454704284668, + "learning_rate": 1.925354332719682e-05, + "loss": 0.8127, + "step": 5507 + }, + { + "epoch": 15.008174386920981, + "grad_norm": 9.035008430480957, + "learning_rate": 1.9253208734480953e-05, + "loss": 1.0515, + "step": 5508 + }, + { + "epoch": 15.010899182561309, + "grad_norm": 10.661617279052734, + "learning_rate": 1.9252874069701405e-05, + "loss": 0.9171, + "step": 5509 + }, + { + "epoch": 15.013623978201634, + "grad_norm": 8.760483741760254, + "learning_rate": 1.9252539332860762e-05, + "loss": 1.2288, + "step": 5510 + }, + { + "epoch": 15.016348773841962, + "grad_norm": 7.86459493637085, + "learning_rate": 1.9252204523961645e-05, + "loss": 0.906, + "step": 5511 + }, + { + "epoch": 15.01907356948229, + "grad_norm": 10.616339683532715, + "learning_rate": 1.9251869643006657e-05, + "loss": 1.2582, + "step": 5512 + }, + { + "epoch": 15.021798365122615, + "grad_norm": 7.371670722961426, + "learning_rate": 1.9251534689998406e-05, + "loss": 1.0967, + "step": 5513 + }, + { + "epoch": 15.024523160762943, + "grad_norm": 6.8104567527771, + "learning_rate": 1.92511996649395e-05, + "loss": 0.828, + "step": 5514 + }, + { + "epoch": 15.02724795640327, + "grad_norm": 12.358208656311035, + "learning_rate": 1.925086456783255e-05, + "loss": 1.0417, + "step": 5515 + }, + { + "epoch": 15.029972752043596, + "grad_norm": 8.836557388305664, + "learning_rate": 1.925052939868016e-05, + "loss": 1.0027, + "step": 5516 + }, + { + "epoch": 15.032697547683924, + "grad_norm": 9.613363265991211, + "learning_rate": 1.925019415748495e-05, + "loss": 1.0148, + "step": 5517 + }, + { + "epoch": 15.035422343324251, + "grad_norm": 8.410662651062012, + "learning_rate": 1.924985884424952e-05, + "loss": 0.9382, + "step": 5518 + }, + { + "epoch": 15.038147138964577, + "grad_norm": 8.761898040771484, + "learning_rate": 1.9249523458976494e-05, + "loss": 0.9354, + "step": 5519 + }, + { + "epoch": 15.040871934604905, + "grad_norm": 10.815780639648438, + "learning_rate": 1.9249188001668474e-05, + "loss": 0.8989, + "step": 5520 + }, + { + "epoch": 15.043596730245232, + "grad_norm": 8.083906173706055, + "learning_rate": 1.9248852472328075e-05, + "loss": 1.0005, + "step": 5521 + }, + { + "epoch": 15.046321525885558, + "grad_norm": 7.896905422210693, + "learning_rate": 1.924851687095791e-05, + "loss": 1.0674, + "step": 5522 + }, + { + "epoch": 15.049046321525886, + "grad_norm": 7.164858818054199, + "learning_rate": 1.9248181197560594e-05, + "loss": 0.9547, + "step": 5523 + }, + { + "epoch": 15.051771117166213, + "grad_norm": 11.201558113098145, + "learning_rate": 1.924784545213874e-05, + "loss": 0.9178, + "step": 5524 + }, + { + "epoch": 15.054495912806539, + "grad_norm": 9.608845710754395, + "learning_rate": 1.9247509634694963e-05, + "loss": 0.993, + "step": 5525 + }, + { + "epoch": 15.057220708446867, + "grad_norm": 9.189961433410645, + "learning_rate": 1.924717374523188e-05, + "loss": 1.0779, + "step": 5526 + }, + { + "epoch": 15.059945504087194, + "grad_norm": 8.895902633666992, + "learning_rate": 1.9246837783752106e-05, + "loss": 1.0948, + "step": 5527 + }, + { + "epoch": 15.06267029972752, + "grad_norm": 8.975088119506836, + "learning_rate": 1.9246501750258256e-05, + "loss": 0.959, + "step": 5528 + }, + { + "epoch": 15.065395095367847, + "grad_norm": 11.457137107849121, + "learning_rate": 1.9246165644752944e-05, + "loss": 0.8561, + "step": 5529 + }, + { + "epoch": 15.068119891008175, + "grad_norm": 8.237933158874512, + "learning_rate": 1.92458294672388e-05, + "loss": 0.9904, + "step": 5530 + }, + { + "epoch": 15.0708446866485, + "grad_norm": 12.692983627319336, + "learning_rate": 1.9245493217718426e-05, + "loss": 1.02, + "step": 5531 + }, + { + "epoch": 15.073569482288828, + "grad_norm": 8.939153671264648, + "learning_rate": 1.924515689619445e-05, + "loss": 0.9595, + "step": 5532 + }, + { + "epoch": 15.076294277929156, + "grad_norm": 7.779260635375977, + "learning_rate": 1.9244820502669494e-05, + "loss": 1.1637, + "step": 5533 + }, + { + "epoch": 15.079019073569482, + "grad_norm": 13.962143898010254, + "learning_rate": 1.924448403714617e-05, + "loss": 1.0122, + "step": 5534 + }, + { + "epoch": 15.08174386920981, + "grad_norm": 27.474210739135742, + "learning_rate": 1.9244147499627103e-05, + "loss": 0.9863, + "step": 5535 + }, + { + "epoch": 15.084468664850137, + "grad_norm": 11.234265327453613, + "learning_rate": 1.924381089011491e-05, + "loss": 1.0011, + "step": 5536 + }, + { + "epoch": 15.087193460490463, + "grad_norm": 25.47540855407715, + "learning_rate": 1.924347420861222e-05, + "loss": 0.9214, + "step": 5537 + }, + { + "epoch": 15.08991825613079, + "grad_norm": 9.881484985351562, + "learning_rate": 1.9243137455121648e-05, + "loss": 0.9729, + "step": 5538 + }, + { + "epoch": 15.092643051771118, + "grad_norm": 7.067080497741699, + "learning_rate": 1.9242800629645815e-05, + "loss": 0.9155, + "step": 5539 + }, + { + "epoch": 15.095367847411444, + "grad_norm": 8.203058242797852, + "learning_rate": 1.9242463732187355e-05, + "loss": 0.9041, + "step": 5540 + }, + { + "epoch": 15.098092643051771, + "grad_norm": 11.838784217834473, + "learning_rate": 1.924212676274888e-05, + "loss": 1.014, + "step": 5541 + }, + { + "epoch": 15.100817438692099, + "grad_norm": 8.50169849395752, + "learning_rate": 1.9241789721333023e-05, + "loss": 0.9708, + "step": 5542 + }, + { + "epoch": 15.103542234332425, + "grad_norm": 9.780434608459473, + "learning_rate": 1.9241452607942405e-05, + "loss": 0.99, + "step": 5543 + }, + { + "epoch": 15.106267029972752, + "grad_norm": 10.974543571472168, + "learning_rate": 1.9241115422579647e-05, + "loss": 1.0862, + "step": 5544 + }, + { + "epoch": 15.10899182561308, + "grad_norm": 9.12978744506836, + "learning_rate": 1.9240778165247384e-05, + "loss": 1.0861, + "step": 5545 + }, + { + "epoch": 15.111716621253406, + "grad_norm": 10.310650825500488, + "learning_rate": 1.9240440835948236e-05, + "loss": 1.0051, + "step": 5546 + }, + { + "epoch": 15.114441416893733, + "grad_norm": 13.019513130187988, + "learning_rate": 1.924010343468483e-05, + "loss": 0.9302, + "step": 5547 + }, + { + "epoch": 15.11716621253406, + "grad_norm": 14.484766006469727, + "learning_rate": 1.92397659614598e-05, + "loss": 1.1006, + "step": 5548 + }, + { + "epoch": 15.119891008174386, + "grad_norm": 11.86329174041748, + "learning_rate": 1.923942841627577e-05, + "loss": 1.0583, + "step": 5549 + }, + { + "epoch": 15.122615803814714, + "grad_norm": 13.653573989868164, + "learning_rate": 1.9239090799135365e-05, + "loss": 1.0862, + "step": 5550 + }, + { + "epoch": 15.125340599455042, + "grad_norm": 13.406563758850098, + "learning_rate": 1.923875311004122e-05, + "loss": 0.9261, + "step": 5551 + }, + { + "epoch": 15.128065395095367, + "grad_norm": 13.019432067871094, + "learning_rate": 1.9238415348995965e-05, + "loss": 1.0138, + "step": 5552 + }, + { + "epoch": 15.130790190735695, + "grad_norm": 12.109644889831543, + "learning_rate": 1.9238077516002228e-05, + "loss": 1.1106, + "step": 5553 + }, + { + "epoch": 15.133514986376023, + "grad_norm": 13.985251426696777, + "learning_rate": 1.9237739611062637e-05, + "loss": 0.9958, + "step": 5554 + }, + { + "epoch": 15.136239782016348, + "grad_norm": 12.948760986328125, + "learning_rate": 1.923740163417983e-05, + "loss": 1.1196, + "step": 5555 + }, + { + "epoch": 15.138964577656676, + "grad_norm": 12.464645385742188, + "learning_rate": 1.9237063585356438e-05, + "loss": 0.9337, + "step": 5556 + }, + { + "epoch": 15.141689373297003, + "grad_norm": 19.540958404541016, + "learning_rate": 1.923672546459509e-05, + "loss": 1.0425, + "step": 5557 + }, + { + "epoch": 15.14441416893733, + "grad_norm": 11.664422988891602, + "learning_rate": 1.9236387271898422e-05, + "loss": 0.9451, + "step": 5558 + }, + { + "epoch": 15.147138964577657, + "grad_norm": 14.192788124084473, + "learning_rate": 1.9236049007269065e-05, + "loss": 1.0309, + "step": 5559 + }, + { + "epoch": 15.149863760217984, + "grad_norm": 10.858256340026855, + "learning_rate": 1.923571067070966e-05, + "loss": 0.983, + "step": 5560 + }, + { + "epoch": 15.15258855585831, + "grad_norm": 62.61029052734375, + "learning_rate": 1.9235372262222836e-05, + "loss": 1.1512, + "step": 5561 + }, + { + "epoch": 15.155313351498638, + "grad_norm": 13.153077125549316, + "learning_rate": 1.923503378181123e-05, + "loss": 1.0171, + "step": 5562 + }, + { + "epoch": 15.158038147138965, + "grad_norm": 14.244160652160645, + "learning_rate": 1.9234695229477475e-05, + "loss": 0.9473, + "step": 5563 + }, + { + "epoch": 15.160762942779291, + "grad_norm": 11.219650268554688, + "learning_rate": 1.9234356605224214e-05, + "loss": 1.182, + "step": 5564 + }, + { + "epoch": 15.163487738419619, + "grad_norm": 10.995183944702148, + "learning_rate": 1.923401790905408e-05, + "loss": 1.0027, + "step": 5565 + }, + { + "epoch": 15.166212534059946, + "grad_norm": 66.59759521484375, + "learning_rate": 1.9233679140969712e-05, + "loss": 1.0862, + "step": 5566 + }, + { + "epoch": 15.168937329700272, + "grad_norm": 10.47517204284668, + "learning_rate": 1.9233340300973748e-05, + "loss": 1.0009, + "step": 5567 + }, + { + "epoch": 15.1716621253406, + "grad_norm": 9.122160911560059, + "learning_rate": 1.923300138906883e-05, + "loss": 0.9331, + "step": 5568 + }, + { + "epoch": 15.174386920980927, + "grad_norm": 13.863876342773438, + "learning_rate": 1.9232662405257587e-05, + "loss": 1.0895, + "step": 5569 + }, + { + "epoch": 15.177111716621253, + "grad_norm": 30.79233169555664, + "learning_rate": 1.9232323349542672e-05, + "loss": 0.9667, + "step": 5570 + }, + { + "epoch": 15.17983651226158, + "grad_norm": 29.254474639892578, + "learning_rate": 1.923198422192672e-05, + "loss": 0.8047, + "step": 5571 + }, + { + "epoch": 15.182561307901908, + "grad_norm": 13.909764289855957, + "learning_rate": 1.9231645022412367e-05, + "loss": 1.157, + "step": 5572 + }, + { + "epoch": 15.185286103542234, + "grad_norm": 9.685226440429688, + "learning_rate": 1.9231305751002264e-05, + "loss": 1.0886, + "step": 5573 + }, + { + "epoch": 15.188010899182562, + "grad_norm": 11.024321556091309, + "learning_rate": 1.9230966407699048e-05, + "loss": 1.0128, + "step": 5574 + }, + { + "epoch": 15.190735694822889, + "grad_norm": 11.645596504211426, + "learning_rate": 1.9230626992505363e-05, + "loss": 1.0615, + "step": 5575 + }, + { + "epoch": 15.193460490463215, + "grad_norm": 34.92819595336914, + "learning_rate": 1.9230287505423854e-05, + "loss": 0.9623, + "step": 5576 + }, + { + "epoch": 15.196185286103542, + "grad_norm": 11.23338794708252, + "learning_rate": 1.922994794645716e-05, + "loss": 1.1057, + "step": 5577 + }, + { + "epoch": 15.19891008174387, + "grad_norm": 11.245293617248535, + "learning_rate": 1.9229608315607927e-05, + "loss": 1.0365, + "step": 5578 + }, + { + "epoch": 15.201634877384196, + "grad_norm": 9.669820785522461, + "learning_rate": 1.9229268612878805e-05, + "loss": 1.1202, + "step": 5579 + }, + { + "epoch": 15.204359673024523, + "grad_norm": 12.526248931884766, + "learning_rate": 1.9228928838272436e-05, + "loss": 0.9048, + "step": 5580 + }, + { + "epoch": 15.207084468664851, + "grad_norm": 9.201279640197754, + "learning_rate": 1.9228588991791462e-05, + "loss": 1.1516, + "step": 5581 + }, + { + "epoch": 15.209809264305177, + "grad_norm": 8.671073913574219, + "learning_rate": 1.922824907343854e-05, + "loss": 0.9691, + "step": 5582 + }, + { + "epoch": 15.212534059945504, + "grad_norm": 11.62646484375, + "learning_rate": 1.9227909083216305e-05, + "loss": 1.1575, + "step": 5583 + }, + { + "epoch": 15.215258855585832, + "grad_norm": 8.900074005126953, + "learning_rate": 1.9227569021127418e-05, + "loss": 1.0645, + "step": 5584 + }, + { + "epoch": 15.217983651226158, + "grad_norm": 11.487918853759766, + "learning_rate": 1.9227228887174517e-05, + "loss": 1.0321, + "step": 5585 + }, + { + "epoch": 15.220708446866485, + "grad_norm": 9.938650131225586, + "learning_rate": 1.9226888681360253e-05, + "loss": 1.1611, + "step": 5586 + }, + { + "epoch": 15.223433242506813, + "grad_norm": 12.60831356048584, + "learning_rate": 1.9226548403687277e-05, + "loss": 1.0646, + "step": 5587 + }, + { + "epoch": 15.226158038147139, + "grad_norm": 12.61571979522705, + "learning_rate": 1.922620805415824e-05, + "loss": 1.1956, + "step": 5588 + }, + { + "epoch": 15.228882833787466, + "grad_norm": 14.253225326538086, + "learning_rate": 1.9225867632775792e-05, + "loss": 1.0023, + "step": 5589 + }, + { + "epoch": 15.231607629427794, + "grad_norm": 9.755847930908203, + "learning_rate": 1.922552713954258e-05, + "loss": 1.2346, + "step": 5590 + }, + { + "epoch": 15.23433242506812, + "grad_norm": 8.390456199645996, + "learning_rate": 1.9225186574461267e-05, + "loss": 0.9659, + "step": 5591 + }, + { + "epoch": 15.237057220708447, + "grad_norm": 11.750336647033691, + "learning_rate": 1.9224845937534493e-05, + "loss": 0.9033, + "step": 5592 + }, + { + "epoch": 15.239782016348773, + "grad_norm": 8.2207612991333, + "learning_rate": 1.9224505228764916e-05, + "loss": 1.0713, + "step": 5593 + }, + { + "epoch": 15.2425068119891, + "grad_norm": 9.45234203338623, + "learning_rate": 1.9224164448155188e-05, + "loss": 0.9524, + "step": 5594 + }, + { + "epoch": 15.245231607629428, + "grad_norm": 12.078112602233887, + "learning_rate": 1.9223823595707965e-05, + "loss": 1.0212, + "step": 5595 + }, + { + "epoch": 15.247956403269754, + "grad_norm": 9.097121238708496, + "learning_rate": 1.9223482671425904e-05, + "loss": 0.9946, + "step": 5596 + }, + { + "epoch": 15.250681198910081, + "grad_norm": 10.710465431213379, + "learning_rate": 1.9223141675311655e-05, + "loss": 0.8982, + "step": 5597 + }, + { + "epoch": 15.253405994550409, + "grad_norm": 8.28371524810791, + "learning_rate": 1.9222800607367877e-05, + "loss": 1.0732, + "step": 5598 + }, + { + "epoch": 15.256130790190735, + "grad_norm": 9.326583862304688, + "learning_rate": 1.9222459467597222e-05, + "loss": 1.0354, + "step": 5599 + }, + { + "epoch": 15.258855585831062, + "grad_norm": 11.349653244018555, + "learning_rate": 1.9222118256002348e-05, + "loss": 1.0374, + "step": 5600 + }, + { + "epoch": 15.26158038147139, + "grad_norm": 23.970081329345703, + "learning_rate": 1.9221776972585917e-05, + "loss": 1.1165, + "step": 5601 + }, + { + "epoch": 15.264305177111716, + "grad_norm": 9.690476417541504, + "learning_rate": 1.9221435617350583e-05, + "loss": 0.9819, + "step": 5602 + }, + { + "epoch": 15.267029972752043, + "grad_norm": 9.96845531463623, + "learning_rate": 1.9221094190299004e-05, + "loss": 1.0791, + "step": 5603 + }, + { + "epoch": 15.269754768392371, + "grad_norm": 8.391413688659668, + "learning_rate": 1.922075269143384e-05, + "loss": 0.7684, + "step": 5604 + }, + { + "epoch": 15.272479564032697, + "grad_norm": 11.63350772857666, + "learning_rate": 1.9220411120757753e-05, + "loss": 0.844, + "step": 5605 + }, + { + "epoch": 15.275204359673024, + "grad_norm": 10.096068382263184, + "learning_rate": 1.92200694782734e-05, + "loss": 1.0132, + "step": 5606 + }, + { + "epoch": 15.277929155313352, + "grad_norm": 15.669937133789062, + "learning_rate": 1.9219727763983443e-05, + "loss": 0.9551, + "step": 5607 + }, + { + "epoch": 15.280653950953678, + "grad_norm": 11.468816757202148, + "learning_rate": 1.9219385977890542e-05, + "loss": 0.9557, + "step": 5608 + }, + { + "epoch": 15.283378746594005, + "grad_norm": 13.702680587768555, + "learning_rate": 1.9219044119997362e-05, + "loss": 1.2427, + "step": 5609 + }, + { + "epoch": 15.286103542234333, + "grad_norm": 9.633628845214844, + "learning_rate": 1.9218702190306563e-05, + "loss": 0.9138, + "step": 5610 + }, + { + "epoch": 15.288828337874659, + "grad_norm": 9.522684097290039, + "learning_rate": 1.9218360188820804e-05, + "loss": 1.0321, + "step": 5611 + }, + { + "epoch": 15.291553133514986, + "grad_norm": 10.326404571533203, + "learning_rate": 1.9218018115542755e-05, + "loss": 1.0386, + "step": 5612 + }, + { + "epoch": 15.294277929155314, + "grad_norm": 10.368290901184082, + "learning_rate": 1.9217675970475076e-05, + "loss": 1.1053, + "step": 5613 + }, + { + "epoch": 15.29700272479564, + "grad_norm": 9.028491973876953, + "learning_rate": 1.9217333753620436e-05, + "loss": 1.0016, + "step": 5614 + }, + { + "epoch": 15.299727520435967, + "grad_norm": 11.764110565185547, + "learning_rate": 1.9216991464981496e-05, + "loss": 1.1145, + "step": 5615 + }, + { + "epoch": 15.302452316076295, + "grad_norm": 12.641221046447754, + "learning_rate": 1.9216649104560924e-05, + "loss": 1.2463, + "step": 5616 + }, + { + "epoch": 15.30517711171662, + "grad_norm": 22.181150436401367, + "learning_rate": 1.9216306672361385e-05, + "loss": 0.9446, + "step": 5617 + }, + { + "epoch": 15.307901907356948, + "grad_norm": 8.716134071350098, + "learning_rate": 1.9215964168385547e-05, + "loss": 1.0924, + "step": 5618 + }, + { + "epoch": 15.310626702997276, + "grad_norm": 7.8823113441467285, + "learning_rate": 1.9215621592636075e-05, + "loss": 1.0894, + "step": 5619 + }, + { + "epoch": 15.313351498637601, + "grad_norm": 8.83913516998291, + "learning_rate": 1.9215278945115638e-05, + "loss": 1.0728, + "step": 5620 + }, + { + "epoch": 15.316076294277929, + "grad_norm": 9.809870719909668, + "learning_rate": 1.9214936225826905e-05, + "loss": 0.9838, + "step": 5621 + }, + { + "epoch": 15.318801089918257, + "grad_norm": 8.821391105651855, + "learning_rate": 1.9214593434772547e-05, + "loss": 0.9503, + "step": 5622 + }, + { + "epoch": 15.321525885558582, + "grad_norm": 11.356760025024414, + "learning_rate": 1.9214250571955233e-05, + "loss": 1.1288, + "step": 5623 + }, + { + "epoch": 15.32425068119891, + "grad_norm": 15.601412773132324, + "learning_rate": 1.921390763737763e-05, + "loss": 0.8372, + "step": 5624 + }, + { + "epoch": 15.326975476839237, + "grad_norm": 10.478775024414062, + "learning_rate": 1.9213564631042412e-05, + "loss": 1.1282, + "step": 5625 + }, + { + "epoch": 15.329700272479563, + "grad_norm": 9.698952674865723, + "learning_rate": 1.9213221552952248e-05, + "loss": 1.0259, + "step": 5626 + }, + { + "epoch": 15.33242506811989, + "grad_norm": 8.53939151763916, + "learning_rate": 1.921287840310981e-05, + "loss": 0.9272, + "step": 5627 + }, + { + "epoch": 15.335149863760218, + "grad_norm": 10.980330467224121, + "learning_rate": 1.9212535181517773e-05, + "loss": 0.9717, + "step": 5628 + }, + { + "epoch": 15.337874659400544, + "grad_norm": 18.005285263061523, + "learning_rate": 1.9212191888178807e-05, + "loss": 1.0106, + "step": 5629 + }, + { + "epoch": 15.340599455040872, + "grad_norm": 9.591465950012207, + "learning_rate": 1.9211848523095594e-05, + "loss": 1.0352, + "step": 5630 + }, + { + "epoch": 15.3433242506812, + "grad_norm": 8.144366264343262, + "learning_rate": 1.9211505086270795e-05, + "loss": 0.9304, + "step": 5631 + }, + { + "epoch": 15.346049046321525, + "grad_norm": 13.091651916503906, + "learning_rate": 1.9211161577707092e-05, + "loss": 1.0085, + "step": 5632 + }, + { + "epoch": 15.348773841961853, + "grad_norm": 10.374743461608887, + "learning_rate": 1.9210817997407156e-05, + "loss": 0.9946, + "step": 5633 + }, + { + "epoch": 15.35149863760218, + "grad_norm": 9.456803321838379, + "learning_rate": 1.921047434537367e-05, + "loss": 1.0366, + "step": 5634 + }, + { + "epoch": 15.354223433242506, + "grad_norm": 13.099303245544434, + "learning_rate": 1.9210130621609307e-05, + "loss": 0.9717, + "step": 5635 + }, + { + "epoch": 15.356948228882834, + "grad_norm": 48.675018310546875, + "learning_rate": 1.9209786826116738e-05, + "loss": 1.0432, + "step": 5636 + }, + { + "epoch": 15.359673024523161, + "grad_norm": 13.054349899291992, + "learning_rate": 1.920944295889865e-05, + "loss": 0.96, + "step": 5637 + }, + { + "epoch": 15.362397820163487, + "grad_norm": 10.781517028808594, + "learning_rate": 1.9209099019957715e-05, + "loss": 1.1687, + "step": 5638 + }, + { + "epoch": 15.365122615803815, + "grad_norm": 17.755901336669922, + "learning_rate": 1.9208755009296615e-05, + "loss": 0.9841, + "step": 5639 + }, + { + "epoch": 15.367847411444142, + "grad_norm": 18.320762634277344, + "learning_rate": 1.9208410926918025e-05, + "loss": 0.9952, + "step": 5640 + }, + { + "epoch": 15.370572207084468, + "grad_norm": 9.680475234985352, + "learning_rate": 1.9208066772824628e-05, + "loss": 0.8379, + "step": 5641 + }, + { + "epoch": 15.373297002724795, + "grad_norm": 12.532292366027832, + "learning_rate": 1.9207722547019104e-05, + "loss": 1.1055, + "step": 5642 + }, + { + "epoch": 15.376021798365123, + "grad_norm": 9.265933990478516, + "learning_rate": 1.9207378249504134e-05, + "loss": 0.9614, + "step": 5643 + }, + { + "epoch": 15.378746594005449, + "grad_norm": 21.329524993896484, + "learning_rate": 1.9207033880282397e-05, + "loss": 0.9939, + "step": 5644 + }, + { + "epoch": 15.381471389645776, + "grad_norm": 33.45063400268555, + "learning_rate": 1.9206689439356576e-05, + "loss": 1.0686, + "step": 5645 + }, + { + "epoch": 15.384196185286104, + "grad_norm": 27.425533294677734, + "learning_rate": 1.9206344926729355e-05, + "loss": 1.006, + "step": 5646 + }, + { + "epoch": 15.38692098092643, + "grad_norm": 10.662958145141602, + "learning_rate": 1.9206000342403415e-05, + "loss": 1.0957, + "step": 5647 + }, + { + "epoch": 15.389645776566757, + "grad_norm": 11.13443374633789, + "learning_rate": 1.920565568638144e-05, + "loss": 1.188, + "step": 5648 + }, + { + "epoch": 15.392370572207085, + "grad_norm": 11.14825439453125, + "learning_rate": 1.9205310958666118e-05, + "loss": 1.075, + "step": 5649 + }, + { + "epoch": 15.39509536784741, + "grad_norm": 14.481292724609375, + "learning_rate": 1.9204966159260128e-05, + "loss": 1.1101, + "step": 5650 + }, + { + "epoch": 15.397820163487738, + "grad_norm": 11.095571517944336, + "learning_rate": 1.9204621288166158e-05, + "loss": 0.9299, + "step": 5651 + }, + { + "epoch": 15.400544959128066, + "grad_norm": 11.267986297607422, + "learning_rate": 1.9204276345386893e-05, + "loss": 1.0908, + "step": 5652 + }, + { + "epoch": 15.403269754768392, + "grad_norm": 9.950570106506348, + "learning_rate": 1.9203931330925024e-05, + "loss": 1.1143, + "step": 5653 + }, + { + "epoch": 15.40599455040872, + "grad_norm": 13.616087913513184, + "learning_rate": 1.920358624478323e-05, + "loss": 1.1476, + "step": 5654 + }, + { + "epoch": 15.408719346049047, + "grad_norm": 9.59421443939209, + "learning_rate": 1.9203241086964203e-05, + "loss": 0.9622, + "step": 5655 + }, + { + "epoch": 15.411444141689373, + "grad_norm": 11.054874420166016, + "learning_rate": 1.920289585747063e-05, + "loss": 1.1445, + "step": 5656 + }, + { + "epoch": 15.4141689373297, + "grad_norm": 13.57754135131836, + "learning_rate": 1.9202550556305203e-05, + "loss": 0.9258, + "step": 5657 + }, + { + "epoch": 15.416893732970028, + "grad_norm": 17.204612731933594, + "learning_rate": 1.9202205183470607e-05, + "loss": 1.0242, + "step": 5658 + }, + { + "epoch": 15.419618528610354, + "grad_norm": 13.986005783081055, + "learning_rate": 1.9201859738969532e-05, + "loss": 1.0354, + "step": 5659 + }, + { + "epoch": 15.422343324250681, + "grad_norm": 16.004863739013672, + "learning_rate": 1.9201514222804672e-05, + "loss": 1.0708, + "step": 5660 + }, + { + "epoch": 15.425068119891009, + "grad_norm": 26.976064682006836, + "learning_rate": 1.9201168634978714e-05, + "loss": 1.1501, + "step": 5661 + }, + { + "epoch": 15.427792915531334, + "grad_norm": 11.839661598205566, + "learning_rate": 1.920082297549435e-05, + "loss": 1.0608, + "step": 5662 + }, + { + "epoch": 15.430517711171662, + "grad_norm": 10.757123947143555, + "learning_rate": 1.9200477244354274e-05, + "loss": 1.2283, + "step": 5663 + }, + { + "epoch": 15.43324250681199, + "grad_norm": 18.2895565032959, + "learning_rate": 1.920013144156118e-05, + "loss": 1.0442, + "step": 5664 + }, + { + "epoch": 15.435967302452315, + "grad_norm": 31.786094665527344, + "learning_rate": 1.9199785567117755e-05, + "loss": 1.1907, + "step": 5665 + }, + { + "epoch": 15.438692098092643, + "grad_norm": 72.43460083007812, + "learning_rate": 1.9199439621026696e-05, + "loss": 1.0413, + "step": 5666 + }, + { + "epoch": 15.44141689373297, + "grad_norm": 71.09246826171875, + "learning_rate": 1.9199093603290697e-05, + "loss": 1.1392, + "step": 5667 + }, + { + "epoch": 15.444141689373296, + "grad_norm": 10.77194595336914, + "learning_rate": 1.9198747513912455e-05, + "loss": 0.9873, + "step": 5668 + }, + { + "epoch": 15.446866485013624, + "grad_norm": 10.256016731262207, + "learning_rate": 1.9198401352894663e-05, + "loss": 0.88, + "step": 5669 + }, + { + "epoch": 15.449591280653951, + "grad_norm": 41.68864059448242, + "learning_rate": 1.9198055120240012e-05, + "loss": 1.0861, + "step": 5670 + }, + { + "epoch": 15.452316076294277, + "grad_norm": 13.512534141540527, + "learning_rate": 1.919770881595121e-05, + "loss": 0.9462, + "step": 5671 + }, + { + "epoch": 15.455040871934605, + "grad_norm": 11.331838607788086, + "learning_rate": 1.9197362440030946e-05, + "loss": 0.9468, + "step": 5672 + }, + { + "epoch": 15.457765667574932, + "grad_norm": 13.011062622070312, + "learning_rate": 1.9197015992481918e-05, + "loss": 1.0844, + "step": 5673 + }, + { + "epoch": 15.460490463215258, + "grad_norm": 24.373592376708984, + "learning_rate": 1.919666947330683e-05, + "loss": 0.9351, + "step": 5674 + }, + { + "epoch": 15.463215258855586, + "grad_norm": 17.608154296875, + "learning_rate": 1.9196322882508372e-05, + "loss": 0.9045, + "step": 5675 + }, + { + "epoch": 15.465940054495913, + "grad_norm": 13.437183380126953, + "learning_rate": 1.919597622008925e-05, + "loss": 1.1609, + "step": 5676 + }, + { + "epoch": 15.46866485013624, + "grad_norm": 13.064347267150879, + "learning_rate": 1.919562948605216e-05, + "loss": 1.0714, + "step": 5677 + }, + { + "epoch": 15.471389645776567, + "grad_norm": 27.0733642578125, + "learning_rate": 1.9195282680399804e-05, + "loss": 1.1477, + "step": 5678 + }, + { + "epoch": 15.474114441416894, + "grad_norm": 15.739130020141602, + "learning_rate": 1.919493580313488e-05, + "loss": 1.0966, + "step": 5679 + }, + { + "epoch": 15.47683923705722, + "grad_norm": 14.389317512512207, + "learning_rate": 1.919458885426009e-05, + "loss": 0.9873, + "step": 5680 + }, + { + "epoch": 15.479564032697548, + "grad_norm": 10.674415588378906, + "learning_rate": 1.9194241833778148e-05, + "loss": 1.1765, + "step": 5681 + }, + { + "epoch": 15.482288828337875, + "grad_norm": 33.03879928588867, + "learning_rate": 1.9193894741691735e-05, + "loss": 1.0614, + "step": 5682 + }, + { + "epoch": 15.485013623978201, + "grad_norm": 8.198208808898926, + "learning_rate": 1.9193547578003574e-05, + "loss": 1.0408, + "step": 5683 + }, + { + "epoch": 15.487738419618529, + "grad_norm": 10.565143585205078, + "learning_rate": 1.9193200342716355e-05, + "loss": 0.9724, + "step": 5684 + }, + { + "epoch": 15.490463215258856, + "grad_norm": 15.008692741394043, + "learning_rate": 1.919285303583279e-05, + "loss": 1.1655, + "step": 5685 + }, + { + "epoch": 15.493188010899182, + "grad_norm": 10.448790550231934, + "learning_rate": 1.919250565735558e-05, + "loss": 0.9971, + "step": 5686 + }, + { + "epoch": 15.49591280653951, + "grad_norm": 13.054065704345703, + "learning_rate": 1.9192158207287435e-05, + "loss": 1.0354, + "step": 5687 + }, + { + "epoch": 15.498637602179837, + "grad_norm": 12.612138748168945, + "learning_rate": 1.9191810685631055e-05, + "loss": 1.1664, + "step": 5688 + }, + { + "epoch": 15.501362397820163, + "grad_norm": 13.168205261230469, + "learning_rate": 1.919146309238915e-05, + "loss": 1.0864, + "step": 5689 + }, + { + "epoch": 15.50408719346049, + "grad_norm": 13.737235069274902, + "learning_rate": 1.9191115427564425e-05, + "loss": 1.0398, + "step": 5690 + }, + { + "epoch": 15.506811989100818, + "grad_norm": 10.856537818908691, + "learning_rate": 1.9190767691159592e-05, + "loss": 1.0736, + "step": 5691 + }, + { + "epoch": 15.509536784741144, + "grad_norm": 18.237037658691406, + "learning_rate": 1.9190419883177355e-05, + "loss": 0.9568, + "step": 5692 + }, + { + "epoch": 15.512261580381471, + "grad_norm": 9.727873802185059, + "learning_rate": 1.919007200362042e-05, + "loss": 1.1021, + "step": 5693 + }, + { + "epoch": 15.514986376021799, + "grad_norm": 9.597294807434082, + "learning_rate": 1.9189724052491502e-05, + "loss": 1.1595, + "step": 5694 + }, + { + "epoch": 15.517711171662125, + "grad_norm": 18.482219696044922, + "learning_rate": 1.918937602979331e-05, + "loss": 1.1152, + "step": 5695 + }, + { + "epoch": 15.520435967302452, + "grad_norm": 9.99679183959961, + "learning_rate": 1.9189027935528553e-05, + "loss": 0.9644, + "step": 5696 + }, + { + "epoch": 15.52316076294278, + "grad_norm": 9.244872093200684, + "learning_rate": 1.9188679769699944e-05, + "loss": 0.998, + "step": 5697 + }, + { + "epoch": 15.525885558583106, + "grad_norm": 24.489723205566406, + "learning_rate": 1.918833153231019e-05, + "loss": 0.972, + "step": 5698 + }, + { + "epoch": 15.528610354223433, + "grad_norm": 10.590883255004883, + "learning_rate": 1.9187983223362006e-05, + "loss": 1.0823, + "step": 5699 + }, + { + "epoch": 15.53133514986376, + "grad_norm": 10.565340995788574, + "learning_rate": 1.9187634842858104e-05, + "loss": 0.9884, + "step": 5700 + }, + { + "epoch": 15.534059945504087, + "grad_norm": 10.080450057983398, + "learning_rate": 1.91872863908012e-05, + "loss": 0.9827, + "step": 5701 + }, + { + "epoch": 15.536784741144414, + "grad_norm": 11.24704647064209, + "learning_rate": 1.9186937867194e-05, + "loss": 1.0967, + "step": 5702 + }, + { + "epoch": 15.539509536784742, + "grad_norm": 11.711875915527344, + "learning_rate": 1.9186589272039227e-05, + "loss": 1.1519, + "step": 5703 + }, + { + "epoch": 15.542234332425068, + "grad_norm": 10.722929954528809, + "learning_rate": 1.9186240605339596e-05, + "loss": 1.1758, + "step": 5704 + }, + { + "epoch": 15.544959128065395, + "grad_norm": 9.224250793457031, + "learning_rate": 1.9185891867097813e-05, + "loss": 0.9614, + "step": 5705 + }, + { + "epoch": 15.547683923705723, + "grad_norm": 14.218178749084473, + "learning_rate": 1.9185543057316604e-05, + "loss": 1.014, + "step": 5706 + }, + { + "epoch": 15.550408719346049, + "grad_norm": 9.43051815032959, + "learning_rate": 1.9185194175998682e-05, + "loss": 1.0627, + "step": 5707 + }, + { + "epoch": 15.553133514986376, + "grad_norm": 9.282830238342285, + "learning_rate": 1.9184845223146757e-05, + "loss": 1.162, + "step": 5708 + }, + { + "epoch": 15.555858310626704, + "grad_norm": 9.06210708618164, + "learning_rate": 1.9184496198763557e-05, + "loss": 1.0413, + "step": 5709 + }, + { + "epoch": 15.55858310626703, + "grad_norm": 10.454787254333496, + "learning_rate": 1.9184147102851796e-05, + "loss": 1.0507, + "step": 5710 + }, + { + "epoch": 15.561307901907357, + "grad_norm": 9.729334831237793, + "learning_rate": 1.9183797935414194e-05, + "loss": 0.9071, + "step": 5711 + }, + { + "epoch": 15.564032697547685, + "grad_norm": 11.212459564208984, + "learning_rate": 1.918344869645347e-05, + "loss": 0.8904, + "step": 5712 + }, + { + "epoch": 15.56675749318801, + "grad_norm": 9.800729751586914, + "learning_rate": 1.918309938597234e-05, + "loss": 1.1301, + "step": 5713 + }, + { + "epoch": 15.569482288828338, + "grad_norm": 11.547163009643555, + "learning_rate": 1.918275000397353e-05, + "loss": 1.1277, + "step": 5714 + }, + { + "epoch": 15.572207084468666, + "grad_norm": 11.262359619140625, + "learning_rate": 1.9182400550459758e-05, + "loss": 1.1111, + "step": 5715 + }, + { + "epoch": 15.574931880108991, + "grad_norm": 9.875480651855469, + "learning_rate": 1.9182051025433743e-05, + "loss": 1.0226, + "step": 5716 + }, + { + "epoch": 15.577656675749319, + "grad_norm": 10.523189544677734, + "learning_rate": 1.9181701428898215e-05, + "loss": 1.1477, + "step": 5717 + }, + { + "epoch": 15.580381471389646, + "grad_norm": 11.124797821044922, + "learning_rate": 1.9181351760855888e-05, + "loss": 1.2227, + "step": 5718 + }, + { + "epoch": 15.583106267029972, + "grad_norm": 9.22188949584961, + "learning_rate": 1.918100202130949e-05, + "loss": 1.1023, + "step": 5719 + }, + { + "epoch": 15.5858310626703, + "grad_norm": 12.09113883972168, + "learning_rate": 1.9180652210261743e-05, + "loss": 0.9634, + "step": 5720 + }, + { + "epoch": 15.588555858310627, + "grad_norm": 10.632393836975098, + "learning_rate": 1.9180302327715376e-05, + "loss": 1.2341, + "step": 5721 + }, + { + "epoch": 15.591280653950953, + "grad_norm": 60.9536247253418, + "learning_rate": 1.9179952373673106e-05, + "loss": 1.1792, + "step": 5722 + }, + { + "epoch": 15.59400544959128, + "grad_norm": 10.613637924194336, + "learning_rate": 1.9179602348137664e-05, + "loss": 1.0394, + "step": 5723 + }, + { + "epoch": 15.596730245231608, + "grad_norm": 11.657779693603516, + "learning_rate": 1.9179252251111774e-05, + "loss": 1.0682, + "step": 5724 + }, + { + "epoch": 15.599455040871934, + "grad_norm": 15.660120010375977, + "learning_rate": 1.917890208259816e-05, + "loss": 1.1211, + "step": 5725 + }, + { + "epoch": 15.602179836512262, + "grad_norm": 13.824321746826172, + "learning_rate": 1.917855184259956e-05, + "loss": 1.0676, + "step": 5726 + }, + { + "epoch": 15.60490463215259, + "grad_norm": 9.168793678283691, + "learning_rate": 1.9178201531118686e-05, + "loss": 0.9479, + "step": 5727 + }, + { + "epoch": 15.607629427792915, + "grad_norm": 9.639008522033691, + "learning_rate": 1.9177851148158274e-05, + "loss": 1.0037, + "step": 5728 + }, + { + "epoch": 15.610354223433243, + "grad_norm": 8.819302558898926, + "learning_rate": 1.917750069372106e-05, + "loss": 1.0223, + "step": 5729 + }, + { + "epoch": 15.61307901907357, + "grad_norm": 10.01408863067627, + "learning_rate": 1.9177150167809756e-05, + "loss": 1.2766, + "step": 5730 + }, + { + "epoch": 15.615803814713896, + "grad_norm": 12.288567543029785, + "learning_rate": 1.9176799570427108e-05, + "loss": 1.063, + "step": 5731 + }, + { + "epoch": 15.618528610354224, + "grad_norm": 9.187858581542969, + "learning_rate": 1.9176448901575838e-05, + "loss": 0.9091, + "step": 5732 + }, + { + "epoch": 15.621253405994551, + "grad_norm": 8.205780982971191, + "learning_rate": 1.9176098161258684e-05, + "loss": 0.8153, + "step": 5733 + }, + { + "epoch": 15.623978201634877, + "grad_norm": 9.210580825805664, + "learning_rate": 1.9175747349478366e-05, + "loss": 0.9578, + "step": 5734 + }, + { + "epoch": 15.626702997275205, + "grad_norm": 11.467032432556152, + "learning_rate": 1.917539646623763e-05, + "loss": 0.9211, + "step": 5735 + }, + { + "epoch": 15.629427792915532, + "grad_norm": 13.662873268127441, + "learning_rate": 1.9175045511539197e-05, + "loss": 0.8729, + "step": 5736 + }, + { + "epoch": 15.632152588555858, + "grad_norm": 8.510534286499023, + "learning_rate": 1.9174694485385805e-05, + "loss": 1.0953, + "step": 5737 + }, + { + "epoch": 15.634877384196185, + "grad_norm": 8.807907104492188, + "learning_rate": 1.917434338778019e-05, + "loss": 1.0469, + "step": 5738 + }, + { + "epoch": 15.637602179836513, + "grad_norm": 18.483234405517578, + "learning_rate": 1.917399221872508e-05, + "loss": 0.9, + "step": 5739 + }, + { + "epoch": 15.640326975476839, + "grad_norm": 7.845697402954102, + "learning_rate": 1.9173640978223214e-05, + "loss": 1.042, + "step": 5740 + }, + { + "epoch": 15.643051771117166, + "grad_norm": 14.4625883102417, + "learning_rate": 1.917328966627733e-05, + "loss": 1.0551, + "step": 5741 + }, + { + "epoch": 15.645776566757494, + "grad_norm": 9.872694969177246, + "learning_rate": 1.9172938282890164e-05, + "loss": 1.0273, + "step": 5742 + }, + { + "epoch": 15.64850136239782, + "grad_norm": 10.579270362854004, + "learning_rate": 1.9172586828064446e-05, + "loss": 1.0469, + "step": 5743 + }, + { + "epoch": 15.651226158038147, + "grad_norm": 8.047989845275879, + "learning_rate": 1.9172235301802916e-05, + "loss": 0.9785, + "step": 5744 + }, + { + "epoch": 15.653950953678475, + "grad_norm": 12.386167526245117, + "learning_rate": 1.9171883704108316e-05, + "loss": 1.1707, + "step": 5745 + }, + { + "epoch": 15.6566757493188, + "grad_norm": 7.95110559463501, + "learning_rate": 1.9171532034983377e-05, + "loss": 0.9547, + "step": 5746 + }, + { + "epoch": 15.659400544959128, + "grad_norm": 8.568359375, + "learning_rate": 1.9171180294430847e-05, + "loss": 1.0623, + "step": 5747 + }, + { + "epoch": 15.662125340599456, + "grad_norm": 9.228265762329102, + "learning_rate": 1.9170828482453456e-05, + "loss": 1.03, + "step": 5748 + }, + { + "epoch": 15.664850136239782, + "grad_norm": 14.048735618591309, + "learning_rate": 1.9170476599053952e-05, + "loss": 1.1896, + "step": 5749 + }, + { + "epoch": 15.66757493188011, + "grad_norm": 16.577896118164062, + "learning_rate": 1.9170124644235066e-05, + "loss": 1.2175, + "step": 5750 + }, + { + "epoch": 15.670299727520437, + "grad_norm": 13.842279434204102, + "learning_rate": 1.9169772617999545e-05, + "loss": 1.1901, + "step": 5751 + }, + { + "epoch": 15.673024523160763, + "grad_norm": 10.956024169921875, + "learning_rate": 1.9169420520350135e-05, + "loss": 1.0266, + "step": 5752 + }, + { + "epoch": 15.67574931880109, + "grad_norm": 10.104551315307617, + "learning_rate": 1.916906835128957e-05, + "loss": 0.9318, + "step": 5753 + }, + { + "epoch": 15.678474114441418, + "grad_norm": 11.581619262695312, + "learning_rate": 1.9168716110820592e-05, + "loss": 1.0981, + "step": 5754 + }, + { + "epoch": 15.681198910081743, + "grad_norm": 34.04673385620117, + "learning_rate": 1.9168363798945955e-05, + "loss": 1.1523, + "step": 5755 + }, + { + "epoch": 15.683923705722071, + "grad_norm": 9.896060943603516, + "learning_rate": 1.9168011415668392e-05, + "loss": 0.8792, + "step": 5756 + }, + { + "epoch": 15.686648501362399, + "grad_norm": 11.737502098083496, + "learning_rate": 1.916765896099065e-05, + "loss": 1.1477, + "step": 5757 + }, + { + "epoch": 15.689373297002724, + "grad_norm": 8.23998737335205, + "learning_rate": 1.9167306434915475e-05, + "loss": 0.9487, + "step": 5758 + }, + { + "epoch": 15.692098092643052, + "grad_norm": 8.44018840789795, + "learning_rate": 1.9166953837445618e-05, + "loss": 1.004, + "step": 5759 + }, + { + "epoch": 15.69482288828338, + "grad_norm": 10.327585220336914, + "learning_rate": 1.9166601168583815e-05, + "loss": 1.2854, + "step": 5760 + }, + { + "epoch": 15.697547683923705, + "grad_norm": 11.30803394317627, + "learning_rate": 1.9166248428332816e-05, + "loss": 1.1277, + "step": 5761 + }, + { + "epoch": 15.700272479564033, + "grad_norm": 15.84594440460205, + "learning_rate": 1.9165895616695373e-05, + "loss": 0.996, + "step": 5762 + }, + { + "epoch": 15.70299727520436, + "grad_norm": 20.89583396911621, + "learning_rate": 1.9165542733674226e-05, + "loss": 1.0647, + "step": 5763 + }, + { + "epoch": 15.705722070844686, + "grad_norm": 9.654314041137695, + "learning_rate": 1.916518977927213e-05, + "loss": 1.0873, + "step": 5764 + }, + { + "epoch": 15.708446866485014, + "grad_norm": 8.791511535644531, + "learning_rate": 1.9164836753491834e-05, + "loss": 1.0981, + "step": 5765 + }, + { + "epoch": 15.711171662125341, + "grad_norm": 9.795890808105469, + "learning_rate": 1.916448365633608e-05, + "loss": 1.1212, + "step": 5766 + }, + { + "epoch": 15.713896457765667, + "grad_norm": 8.347766876220703, + "learning_rate": 1.9164130487807623e-05, + "loss": 0.9233, + "step": 5767 + }, + { + "epoch": 15.716621253405995, + "grad_norm": 9.630997657775879, + "learning_rate": 1.916377724790921e-05, + "loss": 1.2072, + "step": 5768 + }, + { + "epoch": 15.719346049046322, + "grad_norm": 8.77739143371582, + "learning_rate": 1.9163423936643598e-05, + "loss": 1.1823, + "step": 5769 + }, + { + "epoch": 15.722070844686648, + "grad_norm": 8.231311798095703, + "learning_rate": 1.9163070554013535e-05, + "loss": 0.9652, + "step": 5770 + }, + { + "epoch": 15.724795640326976, + "grad_norm": 10.8486328125, + "learning_rate": 1.9162717100021772e-05, + "loss": 1.074, + "step": 5771 + }, + { + "epoch": 15.727520435967303, + "grad_norm": 8.435831069946289, + "learning_rate": 1.9162363574671062e-05, + "loss": 0.9534, + "step": 5772 + }, + { + "epoch": 15.730245231607629, + "grad_norm": 8.546896934509277, + "learning_rate": 1.9162009977964165e-05, + "loss": 1.0242, + "step": 5773 + }, + { + "epoch": 15.732970027247957, + "grad_norm": 16.247638702392578, + "learning_rate": 1.9161656309903825e-05, + "loss": 1.0422, + "step": 5774 + }, + { + "epoch": 15.735694822888284, + "grad_norm": 13.46705150604248, + "learning_rate": 1.91613025704928e-05, + "loss": 1.0439, + "step": 5775 + }, + { + "epoch": 15.73841961852861, + "grad_norm": 12.30317497253418, + "learning_rate": 1.916094875973385e-05, + "loss": 1.1267, + "step": 5776 + }, + { + "epoch": 15.741144414168938, + "grad_norm": 9.070901870727539, + "learning_rate": 1.916059487762972e-05, + "loss": 1.0928, + "step": 5777 + }, + { + "epoch": 15.743869209809265, + "grad_norm": 8.931979179382324, + "learning_rate": 1.9160240924183174e-05, + "loss": 1.1189, + "step": 5778 + }, + { + "epoch": 15.746594005449591, + "grad_norm": 9.261917114257812, + "learning_rate": 1.9159886899396966e-05, + "loss": 1.0011, + "step": 5779 + }, + { + "epoch": 15.749318801089919, + "grad_norm": 14.735495567321777, + "learning_rate": 1.9159532803273856e-05, + "loss": 0.8273, + "step": 5780 + }, + { + "epoch": 15.752043596730246, + "grad_norm": 12.524917602539062, + "learning_rate": 1.91591786358166e-05, + "loss": 1.0941, + "step": 5781 + }, + { + "epoch": 15.754768392370572, + "grad_norm": 9.117819786071777, + "learning_rate": 1.9158824397027954e-05, + "loss": 1.0586, + "step": 5782 + }, + { + "epoch": 15.7574931880109, + "grad_norm": 253.52011108398438, + "learning_rate": 1.9158470086910677e-05, + "loss": 1.1418, + "step": 5783 + }, + { + "epoch": 15.760217983651227, + "grad_norm": 11.384540557861328, + "learning_rate": 1.9158115705467528e-05, + "loss": 0.9756, + "step": 5784 + }, + { + "epoch": 15.762942779291553, + "grad_norm": 13.110880851745605, + "learning_rate": 1.9157761252701273e-05, + "loss": 0.955, + "step": 5785 + }, + { + "epoch": 15.76566757493188, + "grad_norm": 10.360495567321777, + "learning_rate": 1.915740672861467e-05, + "loss": 1.2449, + "step": 5786 + }, + { + "epoch": 15.768392370572208, + "grad_norm": 11.14963436126709, + "learning_rate": 1.915705213321047e-05, + "loss": 1.0106, + "step": 5787 + }, + { + "epoch": 15.771117166212534, + "grad_norm": 11.102007865905762, + "learning_rate": 1.9156697466491447e-05, + "loss": 1.11, + "step": 5788 + }, + { + "epoch": 15.773841961852861, + "grad_norm": 11.817999839782715, + "learning_rate": 1.915634272846036e-05, + "loss": 1.0494, + "step": 5789 + }, + { + "epoch": 15.776566757493189, + "grad_norm": 13.184379577636719, + "learning_rate": 1.9155987919119973e-05, + "loss": 1.1912, + "step": 5790 + }, + { + "epoch": 15.779291553133515, + "grad_norm": 10.445209503173828, + "learning_rate": 1.915563303847304e-05, + "loss": 1.0676, + "step": 5791 + }, + { + "epoch": 15.782016348773842, + "grad_norm": 17.510478973388672, + "learning_rate": 1.9155278086522334e-05, + "loss": 1.0464, + "step": 5792 + }, + { + "epoch": 15.78474114441417, + "grad_norm": 12.840875625610352, + "learning_rate": 1.915492306327062e-05, + "loss": 1.2336, + "step": 5793 + }, + { + "epoch": 15.787465940054496, + "grad_norm": 13.593019485473633, + "learning_rate": 1.9154567968720656e-05, + "loss": 0.9667, + "step": 5794 + }, + { + "epoch": 15.790190735694823, + "grad_norm": 13.132856369018555, + "learning_rate": 1.9154212802875215e-05, + "loss": 1.0829, + "step": 5795 + }, + { + "epoch": 15.79291553133515, + "grad_norm": 19.62708282470703, + "learning_rate": 1.9153857565737058e-05, + "loss": 1.007, + "step": 5796 + }, + { + "epoch": 15.795640326975477, + "grad_norm": 12.598803520202637, + "learning_rate": 1.9153502257308952e-05, + "loss": 1.0894, + "step": 5797 + }, + { + "epoch": 15.798365122615804, + "grad_norm": 12.247570991516113, + "learning_rate": 1.9153146877593666e-05, + "loss": 1.2468, + "step": 5798 + }, + { + "epoch": 15.80108991825613, + "grad_norm": 11.259017944335938, + "learning_rate": 1.9152791426593964e-05, + "loss": 0.8749, + "step": 5799 + }, + { + "epoch": 15.803814713896458, + "grad_norm": 15.317924499511719, + "learning_rate": 1.9152435904312617e-05, + "loss": 1.0837, + "step": 5800 + }, + { + "epoch": 15.806539509536785, + "grad_norm": 10.472589492797852, + "learning_rate": 1.9152080310752398e-05, + "loss": 1.1927, + "step": 5801 + }, + { + "epoch": 15.809264305177111, + "grad_norm": 8.946378707885742, + "learning_rate": 1.9151724645916067e-05, + "loss": 0.9634, + "step": 5802 + }, + { + "epoch": 15.811989100817438, + "grad_norm": 9.994170188903809, + "learning_rate": 1.9151368909806403e-05, + "loss": 1.1936, + "step": 5803 + }, + { + "epoch": 15.814713896457766, + "grad_norm": 9.011474609375, + "learning_rate": 1.9151013102426174e-05, + "loss": 0.9994, + "step": 5804 + }, + { + "epoch": 15.817438692098092, + "grad_norm": 13.082215309143066, + "learning_rate": 1.9150657223778144e-05, + "loss": 1.1785, + "step": 5805 + }, + { + "epoch": 15.82016348773842, + "grad_norm": 13.153779983520508, + "learning_rate": 1.9150301273865093e-05, + "loss": 1.2297, + "step": 5806 + }, + { + "epoch": 15.822888283378747, + "grad_norm": 12.095719337463379, + "learning_rate": 1.914994525268979e-05, + "loss": 1.0507, + "step": 5807 + }, + { + "epoch": 15.825613079019073, + "grad_norm": 14.634735107421875, + "learning_rate": 1.914958916025501e-05, + "loss": 1.0647, + "step": 5808 + }, + { + "epoch": 15.8283378746594, + "grad_norm": 19.04387855529785, + "learning_rate": 1.914923299656352e-05, + "loss": 1.1753, + "step": 5809 + }, + { + "epoch": 15.831062670299728, + "grad_norm": 12.531530380249023, + "learning_rate": 1.91488767616181e-05, + "loss": 0.8816, + "step": 5810 + }, + { + "epoch": 15.833787465940054, + "grad_norm": 15.612229347229004, + "learning_rate": 1.914852045542152e-05, + "loss": 1.1462, + "step": 5811 + }, + { + "epoch": 15.836512261580381, + "grad_norm": 8.871306419372559, + "learning_rate": 1.914816407797656e-05, + "loss": 1.1921, + "step": 5812 + }, + { + "epoch": 15.839237057220709, + "grad_norm": 9.51230525970459, + "learning_rate": 1.9147807629285993e-05, + "loss": 0.8789, + "step": 5813 + }, + { + "epoch": 15.841961852861035, + "grad_norm": 8.646533012390137, + "learning_rate": 1.9147451109352592e-05, + "loss": 0.8663, + "step": 5814 + }, + { + "epoch": 15.844686648501362, + "grad_norm": 14.684822082519531, + "learning_rate": 1.9147094518179136e-05, + "loss": 1.115, + "step": 5815 + }, + { + "epoch": 15.84741144414169, + "grad_norm": 11.252645492553711, + "learning_rate": 1.9146737855768407e-05, + "loss": 1.1289, + "step": 5816 + }, + { + "epoch": 15.850136239782016, + "grad_norm": 16.818647384643555, + "learning_rate": 1.9146381122123176e-05, + "loss": 1.0566, + "step": 5817 + }, + { + "epoch": 15.852861035422343, + "grad_norm": 12.027950286865234, + "learning_rate": 1.9146024317246217e-05, + "loss": 1.1055, + "step": 5818 + }, + { + "epoch": 15.85558583106267, + "grad_norm": 10.26107120513916, + "learning_rate": 1.914566744114032e-05, + "loss": 0.9465, + "step": 5819 + }, + { + "epoch": 15.858310626702997, + "grad_norm": 9.16214370727539, + "learning_rate": 1.9145310493808264e-05, + "loss": 0.881, + "step": 5820 + }, + { + "epoch": 15.861035422343324, + "grad_norm": 18.3576602935791, + "learning_rate": 1.9144953475252818e-05, + "loss": 0.9797, + "step": 5821 + }, + { + "epoch": 15.863760217983652, + "grad_norm": 11.488898277282715, + "learning_rate": 1.914459638547677e-05, + "loss": 1.2394, + "step": 5822 + }, + { + "epoch": 15.866485013623977, + "grad_norm": 10.461718559265137, + "learning_rate": 1.91442392244829e-05, + "loss": 0.8883, + "step": 5823 + }, + { + "epoch": 15.869209809264305, + "grad_norm": 12.152205467224121, + "learning_rate": 1.9143881992273988e-05, + "loss": 1.011, + "step": 5824 + }, + { + "epoch": 15.871934604904633, + "grad_norm": 12.241488456726074, + "learning_rate": 1.914352468885282e-05, + "loss": 1.0708, + "step": 5825 + }, + { + "epoch": 15.874659400544958, + "grad_norm": 9.718058586120605, + "learning_rate": 1.9143167314222172e-05, + "loss": 1.0092, + "step": 5826 + }, + { + "epoch": 15.877384196185286, + "grad_norm": 14.82849407196045, + "learning_rate": 1.9142809868384836e-05, + "loss": 1.0952, + "step": 5827 + }, + { + "epoch": 15.880108991825614, + "grad_norm": 9.937234878540039, + "learning_rate": 1.9142452351343585e-05, + "loss": 1.1174, + "step": 5828 + }, + { + "epoch": 15.88283378746594, + "grad_norm": 8.828649520874023, + "learning_rate": 1.9142094763101216e-05, + "loss": 1.2395, + "step": 5829 + }, + { + "epoch": 15.885558583106267, + "grad_norm": 13.135193824768066, + "learning_rate": 1.9141737103660503e-05, + "loss": 1.1481, + "step": 5830 + }, + { + "epoch": 15.888283378746594, + "grad_norm": 9.514058113098145, + "learning_rate": 1.9141379373024235e-05, + "loss": 0.9443, + "step": 5831 + }, + { + "epoch": 15.89100817438692, + "grad_norm": 10.643321990966797, + "learning_rate": 1.9141021571195204e-05, + "loss": 1.0137, + "step": 5832 + }, + { + "epoch": 15.893732970027248, + "grad_norm": 11.337188720703125, + "learning_rate": 1.9140663698176183e-05, + "loss": 1.0775, + "step": 5833 + }, + { + "epoch": 15.896457765667575, + "grad_norm": 12.842183113098145, + "learning_rate": 1.9140305753969977e-05, + "loss": 1.0387, + "step": 5834 + }, + { + "epoch": 15.899182561307901, + "grad_norm": 9.45815658569336, + "learning_rate": 1.913994773857936e-05, + "loss": 1.291, + "step": 5835 + }, + { + "epoch": 15.901907356948229, + "grad_norm": 10.153657913208008, + "learning_rate": 1.913958965200712e-05, + "loss": 1.1455, + "step": 5836 + }, + { + "epoch": 15.904632152588556, + "grad_norm": 11.954771041870117, + "learning_rate": 1.9139231494256054e-05, + "loss": 1.2424, + "step": 5837 + }, + { + "epoch": 15.907356948228882, + "grad_norm": 9.33283519744873, + "learning_rate": 1.9138873265328944e-05, + "loss": 0.9509, + "step": 5838 + }, + { + "epoch": 15.91008174386921, + "grad_norm": 11.959882736206055, + "learning_rate": 1.9138514965228587e-05, + "loss": 1.1006, + "step": 5839 + }, + { + "epoch": 15.912806539509537, + "grad_norm": 10.285158157348633, + "learning_rate": 1.9138156593957767e-05, + "loss": 1.1519, + "step": 5840 + }, + { + "epoch": 15.915531335149863, + "grad_norm": 11.74209213256836, + "learning_rate": 1.913779815151928e-05, + "loss": 1.0012, + "step": 5841 + }, + { + "epoch": 15.91825613079019, + "grad_norm": 15.43689250946045, + "learning_rate": 1.9137439637915912e-05, + "loss": 0.9618, + "step": 5842 + }, + { + "epoch": 15.920980926430518, + "grad_norm": 34.82831954956055, + "learning_rate": 1.9137081053150465e-05, + "loss": 1.1279, + "step": 5843 + }, + { + "epoch": 15.923705722070844, + "grad_norm": 17.277294158935547, + "learning_rate": 1.913672239722572e-05, + "loss": 1.1492, + "step": 5844 + }, + { + "epoch": 15.926430517711172, + "grad_norm": 11.406451225280762, + "learning_rate": 1.9136363670144472e-05, + "loss": 1.1479, + "step": 5845 + }, + { + "epoch": 15.9291553133515, + "grad_norm": 8.550233840942383, + "learning_rate": 1.913600487190952e-05, + "loss": 0.9703, + "step": 5846 + }, + { + "epoch": 15.931880108991825, + "grad_norm": 7.3839616775512695, + "learning_rate": 1.913564600252366e-05, + "loss": 0.9032, + "step": 5847 + }, + { + "epoch": 15.934604904632153, + "grad_norm": 12.862568855285645, + "learning_rate": 1.9135287061989677e-05, + "loss": 1.1243, + "step": 5848 + }, + { + "epoch": 15.93732970027248, + "grad_norm": 8.45930290222168, + "learning_rate": 1.9134928050310374e-05, + "loss": 1.1049, + "step": 5849 + }, + { + "epoch": 15.940054495912806, + "grad_norm": 8.572096824645996, + "learning_rate": 1.9134568967488548e-05, + "loss": 0.9646, + "step": 5850 + }, + { + "epoch": 15.942779291553133, + "grad_norm": 11.794368743896484, + "learning_rate": 1.9134209813526992e-05, + "loss": 1.0782, + "step": 5851 + }, + { + "epoch": 15.945504087193461, + "grad_norm": 10.465714454650879, + "learning_rate": 1.9133850588428503e-05, + "loss": 1.1124, + "step": 5852 + }, + { + "epoch": 15.948228882833787, + "grad_norm": 10.074355125427246, + "learning_rate": 1.9133491292195878e-05, + "loss": 1.0828, + "step": 5853 + }, + { + "epoch": 15.950953678474114, + "grad_norm": 26.048002243041992, + "learning_rate": 1.9133131924831917e-05, + "loss": 1.0967, + "step": 5854 + }, + { + "epoch": 15.953678474114442, + "grad_norm": 15.029605865478516, + "learning_rate": 1.913277248633942e-05, + "loss": 0.9686, + "step": 5855 + }, + { + "epoch": 15.956403269754768, + "grad_norm": 9.323305130004883, + "learning_rate": 1.9132412976721185e-05, + "loss": 1.1111, + "step": 5856 + }, + { + "epoch": 15.959128065395095, + "grad_norm": 11.37041187286377, + "learning_rate": 1.9132053395980013e-05, + "loss": 1.1589, + "step": 5857 + }, + { + "epoch": 15.961852861035423, + "grad_norm": 10.822033882141113, + "learning_rate": 1.91316937441187e-05, + "loss": 0.9663, + "step": 5858 + }, + { + "epoch": 15.964577656675749, + "grad_norm": 18.556129455566406, + "learning_rate": 1.9131334021140052e-05, + "loss": 0.9749, + "step": 5859 + }, + { + "epoch": 15.967302452316076, + "grad_norm": 9.88136100769043, + "learning_rate": 1.913097422704687e-05, + "loss": 1.0925, + "step": 5860 + }, + { + "epoch": 15.970027247956404, + "grad_norm": 10.482797622680664, + "learning_rate": 1.913061436184195e-05, + "loss": 1.2273, + "step": 5861 + }, + { + "epoch": 15.97275204359673, + "grad_norm": 8.020975112915039, + "learning_rate": 1.9130254425528102e-05, + "loss": 0.9597, + "step": 5862 + }, + { + "epoch": 15.975476839237057, + "grad_norm": 9.891862869262695, + "learning_rate": 1.912989441810813e-05, + "loss": 0.9469, + "step": 5863 + }, + { + "epoch": 15.978201634877385, + "grad_norm": 12.917484283447266, + "learning_rate": 1.912953433958483e-05, + "loss": 1.0291, + "step": 5864 + }, + { + "epoch": 15.98092643051771, + "grad_norm": 7.872670650482178, + "learning_rate": 1.9129174189961008e-05, + "loss": 1.1296, + "step": 5865 + }, + { + "epoch": 15.983651226158038, + "grad_norm": 10.53221607208252, + "learning_rate": 1.9128813969239477e-05, + "loss": 1.0547, + "step": 5866 + }, + { + "epoch": 15.986376021798366, + "grad_norm": 11.600288391113281, + "learning_rate": 1.9128453677423032e-05, + "loss": 1.1653, + "step": 5867 + }, + { + "epoch": 15.989100817438691, + "grad_norm": 8.572115898132324, + "learning_rate": 1.9128093314514485e-05, + "loss": 1.001, + "step": 5868 + }, + { + "epoch": 15.991825613079019, + "grad_norm": 9.913413047790527, + "learning_rate": 1.912773288051664e-05, + "loss": 0.8827, + "step": 5869 + }, + { + "epoch": 15.994550408719347, + "grad_norm": 11.46878719329834, + "learning_rate": 1.912737237543231e-05, + "loss": 1.1794, + "step": 5870 + }, + { + "epoch": 15.997275204359672, + "grad_norm": 9.363706588745117, + "learning_rate": 1.9127011799264292e-05, + "loss": 0.9863, + "step": 5871 + }, + { + "epoch": 16.0, + "grad_norm": 9.271892547607422, + "learning_rate": 1.9126651152015404e-05, + "loss": 0.953, + "step": 5872 + }, + { + "epoch": 16.002724795640326, + "grad_norm": 15.289605140686035, + "learning_rate": 1.9126290433688448e-05, + "loss": 1.0168, + "step": 5873 + }, + { + "epoch": 16.005449591280655, + "grad_norm": 9.585624694824219, + "learning_rate": 1.9125929644286235e-05, + "loss": 1.0023, + "step": 5874 + }, + { + "epoch": 16.00817438692098, + "grad_norm": 8.111566543579102, + "learning_rate": 1.9125568783811578e-05, + "loss": 0.8453, + "step": 5875 + }, + { + "epoch": 16.010899182561307, + "grad_norm": 9.225383758544922, + "learning_rate": 1.9125207852267286e-05, + "loss": 0.9338, + "step": 5876 + }, + { + "epoch": 16.013623978201636, + "grad_norm": 53.07051467895508, + "learning_rate": 1.9124846849656164e-05, + "loss": 0.988, + "step": 5877 + }, + { + "epoch": 16.016348773841962, + "grad_norm": 24.62909507751465, + "learning_rate": 1.9124485775981034e-05, + "loss": 1.0154, + "step": 5878 + }, + { + "epoch": 16.019073569482288, + "grad_norm": 8.376246452331543, + "learning_rate": 1.9124124631244698e-05, + "loss": 0.9277, + "step": 5879 + }, + { + "epoch": 16.021798365122617, + "grad_norm": 8.503561973571777, + "learning_rate": 1.9123763415449972e-05, + "loss": 1.1198, + "step": 5880 + }, + { + "epoch": 16.024523160762943, + "grad_norm": 20.052303314208984, + "learning_rate": 1.9123402128599675e-05, + "loss": 0.8531, + "step": 5881 + }, + { + "epoch": 16.02724795640327, + "grad_norm": 11.620841979980469, + "learning_rate": 1.9123040770696616e-05, + "loss": 0.9486, + "step": 5882 + }, + { + "epoch": 16.029972752043598, + "grad_norm": 9.297019004821777, + "learning_rate": 1.9122679341743606e-05, + "loss": 0.913, + "step": 5883 + }, + { + "epoch": 16.032697547683924, + "grad_norm": 7.423447132110596, + "learning_rate": 1.912231784174346e-05, + "loss": 0.9808, + "step": 5884 + }, + { + "epoch": 16.03542234332425, + "grad_norm": 9.530950546264648, + "learning_rate": 1.9121956270699005e-05, + "loss": 0.9365, + "step": 5885 + }, + { + "epoch": 16.03814713896458, + "grad_norm": 8.53531265258789, + "learning_rate": 1.9121594628613044e-05, + "loss": 0.8394, + "step": 5886 + }, + { + "epoch": 16.040871934604905, + "grad_norm": 9.881158828735352, + "learning_rate": 1.91212329154884e-05, + "loss": 1.0618, + "step": 5887 + }, + { + "epoch": 16.04359673024523, + "grad_norm": 7.604527950286865, + "learning_rate": 1.912087113132788e-05, + "loss": 0.8291, + "step": 5888 + }, + { + "epoch": 16.04632152588556, + "grad_norm": 9.686923027038574, + "learning_rate": 1.9120509276134315e-05, + "loss": 1.0725, + "step": 5889 + }, + { + "epoch": 16.049046321525886, + "grad_norm": 9.359725952148438, + "learning_rate": 1.9120147349910515e-05, + "loss": 1.0834, + "step": 5890 + }, + { + "epoch": 16.05177111716621, + "grad_norm": 21.178882598876953, + "learning_rate": 1.9119785352659303e-05, + "loss": 0.9655, + "step": 5891 + }, + { + "epoch": 16.05449591280654, + "grad_norm": 8.237728118896484, + "learning_rate": 1.9119423284383494e-05, + "loss": 1.085, + "step": 5892 + }, + { + "epoch": 16.057220708446867, + "grad_norm": 9.693185806274414, + "learning_rate": 1.9119061145085913e-05, + "loss": 0.8539, + "step": 5893 + }, + { + "epoch": 16.059945504087192, + "grad_norm": 8.249167442321777, + "learning_rate": 1.9118698934769374e-05, + "loss": 1.0244, + "step": 5894 + }, + { + "epoch": 16.06267029972752, + "grad_norm": 15.477276802062988, + "learning_rate": 1.91183366534367e-05, + "loss": 1.1104, + "step": 5895 + }, + { + "epoch": 16.065395095367847, + "grad_norm": 9.014497756958008, + "learning_rate": 1.911797430109072e-05, + "loss": 0.932, + "step": 5896 + }, + { + "epoch": 16.068119891008173, + "grad_norm": 21.939722061157227, + "learning_rate": 1.9117611877734244e-05, + "loss": 0.9706, + "step": 5897 + }, + { + "epoch": 16.070844686648503, + "grad_norm": 10.217493057250977, + "learning_rate": 1.9117249383370105e-05, + "loss": 0.9189, + "step": 5898 + }, + { + "epoch": 16.07356948228883, + "grad_norm": 9.95344066619873, + "learning_rate": 1.9116886818001118e-05, + "loss": 0.975, + "step": 5899 + }, + { + "epoch": 16.076294277929154, + "grad_norm": 18.62358283996582, + "learning_rate": 1.9116524181630106e-05, + "loss": 1.1211, + "step": 5900 + }, + { + "epoch": 16.079019073569484, + "grad_norm": 9.568658828735352, + "learning_rate": 1.9116161474259902e-05, + "loss": 1.1132, + "step": 5901 + }, + { + "epoch": 16.08174386920981, + "grad_norm": 11.954379081726074, + "learning_rate": 1.9115798695893327e-05, + "loss": 1.0265, + "step": 5902 + }, + { + "epoch": 16.084468664850135, + "grad_norm": 8.741806983947754, + "learning_rate": 1.9115435846533204e-05, + "loss": 1.0, + "step": 5903 + }, + { + "epoch": 16.087193460490465, + "grad_norm": 10.515434265136719, + "learning_rate": 1.9115072926182358e-05, + "loss": 0.886, + "step": 5904 + }, + { + "epoch": 16.08991825613079, + "grad_norm": 10.62269115447998, + "learning_rate": 1.911470993484362e-05, + "loss": 0.8505, + "step": 5905 + }, + { + "epoch": 16.092643051771116, + "grad_norm": 7.906174659729004, + "learning_rate": 1.911434687251981e-05, + "loss": 0.8514, + "step": 5906 + }, + { + "epoch": 16.095367847411445, + "grad_norm": 8.911808967590332, + "learning_rate": 1.9113983739213765e-05, + "loss": 0.9045, + "step": 5907 + }, + { + "epoch": 16.09809264305177, + "grad_norm": 8.223689079284668, + "learning_rate": 1.9113620534928307e-05, + "loss": 0.8833, + "step": 5908 + }, + { + "epoch": 16.100817438692097, + "grad_norm": 8.558938980102539, + "learning_rate": 1.9113257259666262e-05, + "loss": 1.0228, + "step": 5909 + }, + { + "epoch": 16.103542234332426, + "grad_norm": 19.754425048828125, + "learning_rate": 1.9112893913430466e-05, + "loss": 0.9375, + "step": 5910 + }, + { + "epoch": 16.106267029972752, + "grad_norm": 8.726752281188965, + "learning_rate": 1.9112530496223748e-05, + "loss": 1.1094, + "step": 5911 + }, + { + "epoch": 16.108991825613078, + "grad_norm": 44.32742691040039, + "learning_rate": 1.911216700804893e-05, + "loss": 0.84, + "step": 5912 + }, + { + "epoch": 16.111716621253407, + "grad_norm": 9.230029106140137, + "learning_rate": 1.911180344890885e-05, + "loss": 0.8795, + "step": 5913 + }, + { + "epoch": 16.114441416893733, + "grad_norm": 9.848237991333008, + "learning_rate": 1.9111439818806338e-05, + "loss": 0.9354, + "step": 5914 + }, + { + "epoch": 16.11716621253406, + "grad_norm": 8.80485725402832, + "learning_rate": 1.911107611774423e-05, + "loss": 0.7859, + "step": 5915 + }, + { + "epoch": 16.11989100817439, + "grad_norm": 8.519614219665527, + "learning_rate": 1.911071234572535e-05, + "loss": 0.9137, + "step": 5916 + }, + { + "epoch": 16.122615803814714, + "grad_norm": 7.780332088470459, + "learning_rate": 1.9110348502752537e-05, + "loss": 0.9954, + "step": 5917 + }, + { + "epoch": 16.12534059945504, + "grad_norm": 8.060101509094238, + "learning_rate": 1.9109984588828622e-05, + "loss": 0.8457, + "step": 5918 + }, + { + "epoch": 16.12806539509537, + "grad_norm": 11.73392391204834, + "learning_rate": 1.9109620603956442e-05, + "loss": 0.9453, + "step": 5919 + }, + { + "epoch": 16.130790190735695, + "grad_norm": 9.113224983215332, + "learning_rate": 1.9109256548138832e-05, + "loss": 0.9738, + "step": 5920 + }, + { + "epoch": 16.13351498637602, + "grad_norm": 10.089421272277832, + "learning_rate": 1.910889242137862e-05, + "loss": 0.968, + "step": 5921 + }, + { + "epoch": 16.13623978201635, + "grad_norm": 9.667669296264648, + "learning_rate": 1.9108528223678652e-05, + "loss": 0.9104, + "step": 5922 + }, + { + "epoch": 16.138964577656676, + "grad_norm": 8.784872055053711, + "learning_rate": 1.9108163955041754e-05, + "loss": 0.863, + "step": 5923 + }, + { + "epoch": 16.141689373297, + "grad_norm": 7.899500846862793, + "learning_rate": 1.9107799615470773e-05, + "loss": 1.0374, + "step": 5924 + }, + { + "epoch": 16.14441416893733, + "grad_norm": 8.752492904663086, + "learning_rate": 1.9107435204968538e-05, + "loss": 0.9602, + "step": 5925 + }, + { + "epoch": 16.147138964577657, + "grad_norm": 9.13194465637207, + "learning_rate": 1.910707072353789e-05, + "loss": 0.9746, + "step": 5926 + }, + { + "epoch": 16.149863760217983, + "grad_norm": 8.339265823364258, + "learning_rate": 1.9106706171181673e-05, + "loss": 0.9867, + "step": 5927 + }, + { + "epoch": 16.152588555858312, + "grad_norm": 10.599468231201172, + "learning_rate": 1.910634154790272e-05, + "loss": 1.0702, + "step": 5928 + }, + { + "epoch": 16.155313351498638, + "grad_norm": 9.619460105895996, + "learning_rate": 1.9105976853703875e-05, + "loss": 1.0261, + "step": 5929 + }, + { + "epoch": 16.158038147138964, + "grad_norm": 9.088080406188965, + "learning_rate": 1.910561208858797e-05, + "loss": 1.0629, + "step": 5930 + }, + { + "epoch": 16.160762942779293, + "grad_norm": 23.779102325439453, + "learning_rate": 1.910524725255785e-05, + "loss": 0.8628, + "step": 5931 + }, + { + "epoch": 16.16348773841962, + "grad_norm": 9.341630935668945, + "learning_rate": 1.9104882345616363e-05, + "loss": 0.972, + "step": 5932 + }, + { + "epoch": 16.166212534059945, + "grad_norm": 9.080842018127441, + "learning_rate": 1.9104517367766344e-05, + "loss": 0.9935, + "step": 5933 + }, + { + "epoch": 16.168937329700274, + "grad_norm": 8.801554679870605, + "learning_rate": 1.9104152319010634e-05, + "loss": 1.0988, + "step": 5934 + }, + { + "epoch": 16.1716621253406, + "grad_norm": 9.890647888183594, + "learning_rate": 1.9103787199352077e-05, + "loss": 0.8812, + "step": 5935 + }, + { + "epoch": 16.174386920980925, + "grad_norm": 8.447457313537598, + "learning_rate": 1.9103422008793524e-05, + "loss": 1.0991, + "step": 5936 + }, + { + "epoch": 16.177111716621255, + "grad_norm": 8.268943786621094, + "learning_rate": 1.9103056747337813e-05, + "loss": 1.067, + "step": 5937 + }, + { + "epoch": 16.17983651226158, + "grad_norm": 9.503392219543457, + "learning_rate": 1.9102691414987785e-05, + "loss": 0.9934, + "step": 5938 + }, + { + "epoch": 16.182561307901906, + "grad_norm": 9.845125198364258, + "learning_rate": 1.910232601174629e-05, + "loss": 0.9785, + "step": 5939 + }, + { + "epoch": 16.185286103542236, + "grad_norm": 11.63794231414795, + "learning_rate": 1.9101960537616174e-05, + "loss": 1.0958, + "step": 5940 + }, + { + "epoch": 16.18801089918256, + "grad_norm": 9.296601295471191, + "learning_rate": 1.9101594992600283e-05, + "loss": 1.1799, + "step": 5941 + }, + { + "epoch": 16.190735694822887, + "grad_norm": 10.46290397644043, + "learning_rate": 1.9101229376701463e-05, + "loss": 0.9753, + "step": 5942 + }, + { + "epoch": 16.193460490463217, + "grad_norm": 9.994993209838867, + "learning_rate": 1.910086368992256e-05, + "loss": 0.9448, + "step": 5943 + }, + { + "epoch": 16.196185286103542, + "grad_norm": 9.466861724853516, + "learning_rate": 1.9100497932266423e-05, + "loss": 0.9169, + "step": 5944 + }, + { + "epoch": 16.19891008174387, + "grad_norm": 8.074040412902832, + "learning_rate": 1.9100132103735906e-05, + "loss": 0.8988, + "step": 5945 + }, + { + "epoch": 16.201634877384198, + "grad_norm": 8.387664794921875, + "learning_rate": 1.9099766204333847e-05, + "loss": 1.0031, + "step": 5946 + }, + { + "epoch": 16.204359673024523, + "grad_norm": 18.077465057373047, + "learning_rate": 1.9099400234063107e-05, + "loss": 1.0066, + "step": 5947 + }, + { + "epoch": 16.20708446866485, + "grad_norm": 13.21737289428711, + "learning_rate": 1.9099034192926527e-05, + "loss": 1.0029, + "step": 5948 + }, + { + "epoch": 16.20980926430518, + "grad_norm": 8.066934585571289, + "learning_rate": 1.909866808092696e-05, + "loss": 1.0518, + "step": 5949 + }, + { + "epoch": 16.212534059945504, + "grad_norm": 9.0236177444458, + "learning_rate": 1.9098301898067264e-05, + "loss": 0.8417, + "step": 5950 + }, + { + "epoch": 16.21525885558583, + "grad_norm": 9.770105361938477, + "learning_rate": 1.9097935644350284e-05, + "loss": 0.9471, + "step": 5951 + }, + { + "epoch": 16.21798365122616, + "grad_norm": 8.485394477844238, + "learning_rate": 1.909756931977887e-05, + "loss": 0.9606, + "step": 5952 + }, + { + "epoch": 16.220708446866485, + "grad_norm": 8.218755722045898, + "learning_rate": 1.9097202924355884e-05, + "loss": 1.0961, + "step": 5953 + }, + { + "epoch": 16.22343324250681, + "grad_norm": 9.037432670593262, + "learning_rate": 1.909683645808417e-05, + "loss": 1.0549, + "step": 5954 + }, + { + "epoch": 16.22615803814714, + "grad_norm": 11.103666305541992, + "learning_rate": 1.9096469920966592e-05, + "loss": 1.0444, + "step": 5955 + }, + { + "epoch": 16.228882833787466, + "grad_norm": 7.901222229003906, + "learning_rate": 1.9096103313005992e-05, + "loss": 0.9113, + "step": 5956 + }, + { + "epoch": 16.231607629427792, + "grad_norm": 8.758397102355957, + "learning_rate": 1.909573663420524e-05, + "loss": 0.8389, + "step": 5957 + }, + { + "epoch": 16.23433242506812, + "grad_norm": 9.530460357666016, + "learning_rate": 1.9095369884567178e-05, + "loss": 0.9973, + "step": 5958 + }, + { + "epoch": 16.237057220708447, + "grad_norm": 9.2470703125, + "learning_rate": 1.909500306409467e-05, + "loss": 1.0751, + "step": 5959 + }, + { + "epoch": 16.239782016348773, + "grad_norm": 8.239962577819824, + "learning_rate": 1.909463617279057e-05, + "loss": 0.7488, + "step": 5960 + }, + { + "epoch": 16.242506811989102, + "grad_norm": 9.150911331176758, + "learning_rate": 1.9094269210657737e-05, + "loss": 1.0393, + "step": 5961 + }, + { + "epoch": 16.245231607629428, + "grad_norm": 8.832514762878418, + "learning_rate": 1.9093902177699028e-05, + "loss": 1.0737, + "step": 5962 + }, + { + "epoch": 16.247956403269754, + "grad_norm": 25.83500862121582, + "learning_rate": 1.9093535073917304e-05, + "loss": 1.0029, + "step": 5963 + }, + { + "epoch": 16.250681198910083, + "grad_norm": 9.633893966674805, + "learning_rate": 1.9093167899315417e-05, + "loss": 1.0497, + "step": 5964 + }, + { + "epoch": 16.25340599455041, + "grad_norm": 10.280200004577637, + "learning_rate": 1.9092800653896236e-05, + "loss": 0.9462, + "step": 5965 + }, + { + "epoch": 16.256130790190735, + "grad_norm": 8.123982429504395, + "learning_rate": 1.9092433337662614e-05, + "loss": 0.8857, + "step": 5966 + }, + { + "epoch": 16.258855585831064, + "grad_norm": 7.409641742706299, + "learning_rate": 1.909206595061741e-05, + "loss": 0.8341, + "step": 5967 + }, + { + "epoch": 16.26158038147139, + "grad_norm": 10.250338554382324, + "learning_rate": 1.9091698492763494e-05, + "loss": 1.106, + "step": 5968 + }, + { + "epoch": 16.264305177111716, + "grad_norm": 7.752365589141846, + "learning_rate": 1.909133096410372e-05, + "loss": 0.9622, + "step": 5969 + }, + { + "epoch": 16.267029972752045, + "grad_norm": 8.367024421691895, + "learning_rate": 1.9090963364640954e-05, + "loss": 0.9623, + "step": 5970 + }, + { + "epoch": 16.26975476839237, + "grad_norm": 9.059532165527344, + "learning_rate": 1.909059569437806e-05, + "loss": 1.0144, + "step": 5971 + }, + { + "epoch": 16.272479564032697, + "grad_norm": 8.470860481262207, + "learning_rate": 1.9090227953317896e-05, + "loss": 0.9541, + "step": 5972 + }, + { + "epoch": 16.275204359673026, + "grad_norm": 8.233183860778809, + "learning_rate": 1.908986014146333e-05, + "loss": 0.9636, + "step": 5973 + }, + { + "epoch": 16.277929155313352, + "grad_norm": 8.340307235717773, + "learning_rate": 1.9089492258817225e-05, + "loss": 0.9459, + "step": 5974 + }, + { + "epoch": 16.280653950953678, + "grad_norm": 8.482439994812012, + "learning_rate": 1.908912430538245e-05, + "loss": 0.9739, + "step": 5975 + }, + { + "epoch": 16.283378746594007, + "grad_norm": 8.190013885498047, + "learning_rate": 1.9088756281161866e-05, + "loss": 0.876, + "step": 5976 + }, + { + "epoch": 16.286103542234333, + "grad_norm": 8.862380027770996, + "learning_rate": 1.908838818615834e-05, + "loss": 1.0016, + "step": 5977 + }, + { + "epoch": 16.28882833787466, + "grad_norm": 9.875590324401855, + "learning_rate": 1.908802002037474e-05, + "loss": 0.9709, + "step": 5978 + }, + { + "epoch": 16.291553133514988, + "grad_norm": 8.948189735412598, + "learning_rate": 1.908765178381393e-05, + "loss": 0.7603, + "step": 5979 + }, + { + "epoch": 16.294277929155314, + "grad_norm": 7.790036678314209, + "learning_rate": 1.9087283476478784e-05, + "loss": 1.0806, + "step": 5980 + }, + { + "epoch": 16.29700272479564, + "grad_norm": 19.806018829345703, + "learning_rate": 1.9086915098372166e-05, + "loss": 1.0457, + "step": 5981 + }, + { + "epoch": 16.29972752043597, + "grad_norm": 9.134679794311523, + "learning_rate": 1.9086546649496943e-05, + "loss": 0.8326, + "step": 5982 + }, + { + "epoch": 16.302452316076295, + "grad_norm": 9.624375343322754, + "learning_rate": 1.908617812985599e-05, + "loss": 1.0908, + "step": 5983 + }, + { + "epoch": 16.30517711171662, + "grad_norm": 8.333988189697266, + "learning_rate": 1.9085809539452174e-05, + "loss": 0.9963, + "step": 5984 + }, + { + "epoch": 16.30790190735695, + "grad_norm": 8.44038200378418, + "learning_rate": 1.9085440878288363e-05, + "loss": 0.9639, + "step": 5985 + }, + { + "epoch": 16.310626702997276, + "grad_norm": 7.278705596923828, + "learning_rate": 1.9085072146367434e-05, + "loss": 1.0146, + "step": 5986 + }, + { + "epoch": 16.3133514986376, + "grad_norm": 6.198719024658203, + "learning_rate": 1.9084703343692253e-05, + "loss": 0.9016, + "step": 5987 + }, + { + "epoch": 16.31607629427793, + "grad_norm": 8.337554931640625, + "learning_rate": 1.90843344702657e-05, + "loss": 0.8571, + "step": 5988 + }, + { + "epoch": 16.318801089918257, + "grad_norm": 8.546713829040527, + "learning_rate": 1.9083965526090635e-05, + "loss": 1.0874, + "step": 5989 + }, + { + "epoch": 16.321525885558582, + "grad_norm": 8.65063762664795, + "learning_rate": 1.908359651116994e-05, + "loss": 1.2061, + "step": 5990 + }, + { + "epoch": 16.32425068119891, + "grad_norm": 7.996217250823975, + "learning_rate": 1.908322742550649e-05, + "loss": 0.8696, + "step": 5991 + }, + { + "epoch": 16.326975476839237, + "grad_norm": 8.911670684814453, + "learning_rate": 1.9082858269103162e-05, + "loss": 1.0651, + "step": 5992 + }, + { + "epoch": 16.329700272479563, + "grad_norm": 23.596555709838867, + "learning_rate": 1.908248904196282e-05, + "loss": 1.0306, + "step": 5993 + }, + { + "epoch": 16.332425068119893, + "grad_norm": 7.521470069885254, + "learning_rate": 1.9082119744088348e-05, + "loss": 1.0576, + "step": 5994 + }, + { + "epoch": 16.33514986376022, + "grad_norm": 7.754633903503418, + "learning_rate": 1.9081750375482618e-05, + "loss": 0.8788, + "step": 5995 + }, + { + "epoch": 16.337874659400544, + "grad_norm": 9.71580982208252, + "learning_rate": 1.908138093614851e-05, + "loss": 1.104, + "step": 5996 + }, + { + "epoch": 16.340599455040874, + "grad_norm": 8.19369888305664, + "learning_rate": 1.90810114260889e-05, + "loss": 0.972, + "step": 5997 + }, + { + "epoch": 16.3433242506812, + "grad_norm": 7.382881164550781, + "learning_rate": 1.908064184530666e-05, + "loss": 0.8334, + "step": 5998 + }, + { + "epoch": 16.346049046321525, + "grad_norm": 11.877547264099121, + "learning_rate": 1.908027219380468e-05, + "loss": 0.861, + "step": 5999 + }, + { + "epoch": 16.348773841961854, + "grad_norm": 7.584044933319092, + "learning_rate": 1.907990247158583e-05, + "loss": 0.8782, + "step": 6000 + }, + { + "epoch": 16.35149863760218, + "grad_norm": 7.831441879272461, + "learning_rate": 1.907953267865299e-05, + "loss": 0.9613, + "step": 6001 + }, + { + "epoch": 16.354223433242506, + "grad_norm": 8.159957885742188, + "learning_rate": 1.9079162815009045e-05, + "loss": 1.0771, + "step": 6002 + }, + { + "epoch": 16.356948228882835, + "grad_norm": 8.454666137695312, + "learning_rate": 1.9078792880656868e-05, + "loss": 0.821, + "step": 6003 + }, + { + "epoch": 16.35967302452316, + "grad_norm": 7.667445659637451, + "learning_rate": 1.907842287559935e-05, + "loss": 1.0226, + "step": 6004 + }, + { + "epoch": 16.362397820163487, + "grad_norm": 8.185620307922363, + "learning_rate": 1.9078052799839363e-05, + "loss": 0.9062, + "step": 6005 + }, + { + "epoch": 16.365122615803816, + "grad_norm": 9.708785057067871, + "learning_rate": 1.9077682653379795e-05, + "loss": 0.9871, + "step": 6006 + }, + { + "epoch": 16.367847411444142, + "grad_norm": 8.769133567810059, + "learning_rate": 1.9077312436223524e-05, + "loss": 0.9122, + "step": 6007 + }, + { + "epoch": 16.370572207084468, + "grad_norm": 8.197275161743164, + "learning_rate": 1.907694214837344e-05, + "loss": 0.9888, + "step": 6008 + }, + { + "epoch": 16.373297002724797, + "grad_norm": 7.544145584106445, + "learning_rate": 1.9076571789832416e-05, + "loss": 1.0267, + "step": 6009 + }, + { + "epoch": 16.376021798365123, + "grad_norm": 8.935723304748535, + "learning_rate": 1.9076201360603347e-05, + "loss": 0.9645, + "step": 6010 + }, + { + "epoch": 16.37874659400545, + "grad_norm": 9.968594551086426, + "learning_rate": 1.9075830860689114e-05, + "loss": 1.0848, + "step": 6011 + }, + { + "epoch": 16.381471389645778, + "grad_norm": 8.968193054199219, + "learning_rate": 1.9075460290092604e-05, + "loss": 0.9851, + "step": 6012 + }, + { + "epoch": 16.384196185286104, + "grad_norm": 9.305635452270508, + "learning_rate": 1.9075089648816697e-05, + "loss": 1.1685, + "step": 6013 + }, + { + "epoch": 16.38692098092643, + "grad_norm": 11.007704734802246, + "learning_rate": 1.907471893686429e-05, + "loss": 0.8275, + "step": 6014 + }, + { + "epoch": 16.38964577656676, + "grad_norm": 9.118929862976074, + "learning_rate": 1.907434815423826e-05, + "loss": 1.014, + "step": 6015 + }, + { + "epoch": 16.392370572207085, + "grad_norm": 8.24226188659668, + "learning_rate": 1.9073977300941497e-05, + "loss": 0.8677, + "step": 6016 + }, + { + "epoch": 16.39509536784741, + "grad_norm": 7.754024505615234, + "learning_rate": 1.9073606376976895e-05, + "loss": 1.0286, + "step": 6017 + }, + { + "epoch": 16.39782016348774, + "grad_norm": 9.166144371032715, + "learning_rate": 1.9073235382347336e-05, + "loss": 1.0774, + "step": 6018 + }, + { + "epoch": 16.400544959128066, + "grad_norm": 7.809909343719482, + "learning_rate": 1.907286431705571e-05, + "loss": 0.8898, + "step": 6019 + }, + { + "epoch": 16.40326975476839, + "grad_norm": 8.78017807006836, + "learning_rate": 1.9072493181104916e-05, + "loss": 0.9423, + "step": 6020 + }, + { + "epoch": 16.40599455040872, + "grad_norm": 10.937439918518066, + "learning_rate": 1.907212197449783e-05, + "loss": 0.9635, + "step": 6021 + }, + { + "epoch": 16.408719346049047, + "grad_norm": 8.849957466125488, + "learning_rate": 1.907175069723735e-05, + "loss": 1.0122, + "step": 6022 + }, + { + "epoch": 16.411444141689373, + "grad_norm": 8.172831535339355, + "learning_rate": 1.9071379349326373e-05, + "loss": 0.9895, + "step": 6023 + }, + { + "epoch": 16.414168937329702, + "grad_norm": 8.49582290649414, + "learning_rate": 1.9071007930767782e-05, + "loss": 0.9797, + "step": 6024 + }, + { + "epoch": 16.416893732970028, + "grad_norm": 9.933019638061523, + "learning_rate": 1.9070636441564474e-05, + "loss": 1.2769, + "step": 6025 + }, + { + "epoch": 16.419618528610354, + "grad_norm": 8.22047233581543, + "learning_rate": 1.907026488171934e-05, + "loss": 0.8754, + "step": 6026 + }, + { + "epoch": 16.422343324250683, + "grad_norm": 8.400115013122559, + "learning_rate": 1.9069893251235277e-05, + "loss": 1.0231, + "step": 6027 + }, + { + "epoch": 16.42506811989101, + "grad_norm": 7.147830963134766, + "learning_rate": 1.9069521550115175e-05, + "loss": 1.0021, + "step": 6028 + }, + { + "epoch": 16.427792915531334, + "grad_norm": 7.267785549163818, + "learning_rate": 1.9069149778361934e-05, + "loss": 0.8904, + "step": 6029 + }, + { + "epoch": 16.430517711171664, + "grad_norm": 9.049951553344727, + "learning_rate": 1.9068777935978444e-05, + "loss": 0.9927, + "step": 6030 + }, + { + "epoch": 16.43324250681199, + "grad_norm": 9.180093765258789, + "learning_rate": 1.9068406022967605e-05, + "loss": 1.0958, + "step": 6031 + }, + { + "epoch": 16.435967302452315, + "grad_norm": 8.235403060913086, + "learning_rate": 1.906803403933231e-05, + "loss": 1.249, + "step": 6032 + }, + { + "epoch": 16.438692098092645, + "grad_norm": 10.791427612304688, + "learning_rate": 1.906766198507546e-05, + "loss": 1.0869, + "step": 6033 + }, + { + "epoch": 16.44141689373297, + "grad_norm": 6.91215705871582, + "learning_rate": 1.9067289860199945e-05, + "loss": 1.085, + "step": 6034 + }, + { + "epoch": 16.444141689373296, + "grad_norm": 8.863093376159668, + "learning_rate": 1.9066917664708674e-05, + "loss": 0.99, + "step": 6035 + }, + { + "epoch": 16.446866485013626, + "grad_norm": 7.740184307098389, + "learning_rate": 1.9066545398604538e-05, + "loss": 0.9575, + "step": 6036 + }, + { + "epoch": 16.44959128065395, + "grad_norm": 7.676769733428955, + "learning_rate": 1.9066173061890438e-05, + "loss": 1.0483, + "step": 6037 + }, + { + "epoch": 16.452316076294277, + "grad_norm": 15.380928993225098, + "learning_rate": 1.9065800654569277e-05, + "loss": 0.8556, + "step": 6038 + }, + { + "epoch": 16.455040871934607, + "grad_norm": 9.415081977844238, + "learning_rate": 1.906542817664395e-05, + "loss": 0.8867, + "step": 6039 + }, + { + "epoch": 16.457765667574932, + "grad_norm": 7.816688537597656, + "learning_rate": 1.9065055628117358e-05, + "loss": 0.9417, + "step": 6040 + }, + { + "epoch": 16.460490463215258, + "grad_norm": 8.097055435180664, + "learning_rate": 1.9064683008992407e-05, + "loss": 0.8629, + "step": 6041 + }, + { + "epoch": 16.463215258855588, + "grad_norm": 9.544647216796875, + "learning_rate": 1.9064310319271997e-05, + "loss": 1.0793, + "step": 6042 + }, + { + "epoch": 16.465940054495913, + "grad_norm": 8.068865776062012, + "learning_rate": 1.906393755895903e-05, + "loss": 0.9089, + "step": 6043 + }, + { + "epoch": 16.46866485013624, + "grad_norm": 9.3299560546875, + "learning_rate": 1.906356472805641e-05, + "loss": 1.1665, + "step": 6044 + }, + { + "epoch": 16.47138964577657, + "grad_norm": 9.5327730178833, + "learning_rate": 1.9063191826567035e-05, + "loss": 0.8313, + "step": 6045 + }, + { + "epoch": 16.474114441416894, + "grad_norm": 8.465132713317871, + "learning_rate": 1.9062818854493816e-05, + "loss": 0.9471, + "step": 6046 + }, + { + "epoch": 16.47683923705722, + "grad_norm": 7.73591947555542, + "learning_rate": 1.9062445811839655e-05, + "loss": 0.8947, + "step": 6047 + }, + { + "epoch": 16.479564032697546, + "grad_norm": 8.444184303283691, + "learning_rate": 1.9062072698607457e-05, + "loss": 1.0015, + "step": 6048 + }, + { + "epoch": 16.482288828337875, + "grad_norm": 7.189904689788818, + "learning_rate": 1.9061699514800128e-05, + "loss": 0.8428, + "step": 6049 + }, + { + "epoch": 16.4850136239782, + "grad_norm": 10.970808029174805, + "learning_rate": 1.906132626042058e-05, + "loss": 0.9288, + "step": 6050 + }, + { + "epoch": 16.48773841961853, + "grad_norm": 9.308109283447266, + "learning_rate": 1.906095293547171e-05, + "loss": 0.89, + "step": 6051 + }, + { + "epoch": 16.490463215258856, + "grad_norm": 8.384902000427246, + "learning_rate": 1.906057953995643e-05, + "loss": 0.9181, + "step": 6052 + }, + { + "epoch": 16.493188010899182, + "grad_norm": 9.699617385864258, + "learning_rate": 1.9060206073877655e-05, + "loss": 0.9622, + "step": 6053 + }, + { + "epoch": 16.495912806539508, + "grad_norm": 10.59549331665039, + "learning_rate": 1.9059832537238278e-05, + "loss": 0.9661, + "step": 6054 + }, + { + "epoch": 16.498637602179837, + "grad_norm": 8.202498435974121, + "learning_rate": 1.9059458930041222e-05, + "loss": 0.9198, + "step": 6055 + }, + { + "epoch": 16.501362397820163, + "grad_norm": 10.255706787109375, + "learning_rate": 1.9059085252289388e-05, + "loss": 0.8696, + "step": 6056 + }, + { + "epoch": 16.504087193460492, + "grad_norm": 7.805537700653076, + "learning_rate": 1.9058711503985692e-05, + "loss": 0.9667, + "step": 6057 + }, + { + "epoch": 16.506811989100818, + "grad_norm": 8.793238639831543, + "learning_rate": 1.9058337685133043e-05, + "loss": 0.952, + "step": 6058 + }, + { + "epoch": 16.509536784741144, + "grad_norm": 9.71096134185791, + "learning_rate": 1.905796379573435e-05, + "loss": 1.3391, + "step": 6059 + }, + { + "epoch": 16.51226158038147, + "grad_norm": 9.125404357910156, + "learning_rate": 1.9057589835792524e-05, + "loss": 1.2024, + "step": 6060 + }, + { + "epoch": 16.5149863760218, + "grad_norm": 7.917983531951904, + "learning_rate": 1.9057215805310485e-05, + "loss": 0.9601, + "step": 6061 + }, + { + "epoch": 16.517711171662125, + "grad_norm": 8.468579292297363, + "learning_rate": 1.9056841704291137e-05, + "loss": 0.9695, + "step": 6062 + }, + { + "epoch": 16.520435967302454, + "grad_norm": 8.051939964294434, + "learning_rate": 1.90564675327374e-05, + "loss": 0.9247, + "step": 6063 + }, + { + "epoch": 16.52316076294278, + "grad_norm": 8.476173400878906, + "learning_rate": 1.9056093290652186e-05, + "loss": 0.9005, + "step": 6064 + }, + { + "epoch": 16.525885558583106, + "grad_norm": 9.824795722961426, + "learning_rate": 1.9055718978038404e-05, + "loss": 0.9658, + "step": 6065 + }, + { + "epoch": 16.52861035422343, + "grad_norm": 9.040727615356445, + "learning_rate": 1.9055344594898978e-05, + "loss": 1.0005, + "step": 6066 + }, + { + "epoch": 16.53133514986376, + "grad_norm": 9.851045608520508, + "learning_rate": 1.905497014123682e-05, + "loss": 0.8988, + "step": 6067 + }, + { + "epoch": 16.534059945504087, + "grad_norm": 8.072575569152832, + "learning_rate": 1.9054595617054844e-05, + "loss": 0.9775, + "step": 6068 + }, + { + "epoch": 16.536784741144416, + "grad_norm": 10.031383514404297, + "learning_rate": 1.905422102235597e-05, + "loss": 1.0728, + "step": 6069 + }, + { + "epoch": 16.539509536784742, + "grad_norm": 11.542708396911621, + "learning_rate": 1.9053846357143114e-05, + "loss": 0.9026, + "step": 6070 + }, + { + "epoch": 16.542234332425068, + "grad_norm": 8.84055233001709, + "learning_rate": 1.9053471621419193e-05, + "loss": 1.0281, + "step": 6071 + }, + { + "epoch": 16.544959128065393, + "grad_norm": 9.412172317504883, + "learning_rate": 1.9053096815187125e-05, + "loss": 1.2434, + "step": 6072 + }, + { + "epoch": 16.547683923705723, + "grad_norm": 10.151601791381836, + "learning_rate": 1.9052721938449834e-05, + "loss": 1.189, + "step": 6073 + }, + { + "epoch": 16.55040871934605, + "grad_norm": 13.779661178588867, + "learning_rate": 1.9052346991210237e-05, + "loss": 1.0056, + "step": 6074 + }, + { + "epoch": 16.553133514986374, + "grad_norm": 8.894524574279785, + "learning_rate": 1.905197197347125e-05, + "loss": 1.0266, + "step": 6075 + }, + { + "epoch": 16.555858310626704, + "grad_norm": 13.412213325500488, + "learning_rate": 1.9051596885235795e-05, + "loss": 0.9729, + "step": 6076 + }, + { + "epoch": 16.55858310626703, + "grad_norm": 8.03742504119873, + "learning_rate": 1.9051221726506795e-05, + "loss": 0.9557, + "step": 6077 + }, + { + "epoch": 16.561307901907355, + "grad_norm": 11.525594711303711, + "learning_rate": 1.9050846497287175e-05, + "loss": 0.9634, + "step": 6078 + }, + { + "epoch": 16.564032697547685, + "grad_norm": 9.7057523727417, + "learning_rate": 1.905047119757985e-05, + "loss": 1.1147, + "step": 6079 + }, + { + "epoch": 16.56675749318801, + "grad_norm": 8.049863815307617, + "learning_rate": 1.9050095827387748e-05, + "loss": 1.092, + "step": 6080 + }, + { + "epoch": 16.569482288828336, + "grad_norm": 8.248735427856445, + "learning_rate": 1.9049720386713796e-05, + "loss": 1.0129, + "step": 6081 + }, + { + "epoch": 16.572207084468666, + "grad_norm": 9.346665382385254, + "learning_rate": 1.9049344875560906e-05, + "loss": 0.9362, + "step": 6082 + }, + { + "epoch": 16.57493188010899, + "grad_norm": 9.57408332824707, + "learning_rate": 1.9048969293932012e-05, + "loss": 1.2029, + "step": 6083 + }, + { + "epoch": 16.577656675749317, + "grad_norm": 8.063798904418945, + "learning_rate": 1.9048593641830034e-05, + "loss": 0.9291, + "step": 6084 + }, + { + "epoch": 16.580381471389646, + "grad_norm": 7.972892761230469, + "learning_rate": 1.9048217919257907e-05, + "loss": 1.1289, + "step": 6085 + }, + { + "epoch": 16.583106267029972, + "grad_norm": 7.366415977478027, + "learning_rate": 1.9047842126218544e-05, + "loss": 0.8733, + "step": 6086 + }, + { + "epoch": 16.585831062670298, + "grad_norm": 8.68867015838623, + "learning_rate": 1.904746626271488e-05, + "loss": 0.8827, + "step": 6087 + }, + { + "epoch": 16.588555858310627, + "grad_norm": 9.911465644836426, + "learning_rate": 1.9047090328749837e-05, + "loss": 0.8958, + "step": 6088 + }, + { + "epoch": 16.591280653950953, + "grad_norm": 7.827071189880371, + "learning_rate": 1.9046714324326347e-05, + "loss": 1.0327, + "step": 6089 + }, + { + "epoch": 16.59400544959128, + "grad_norm": 7.7089409828186035, + "learning_rate": 1.9046338249447335e-05, + "loss": 1.0076, + "step": 6090 + }, + { + "epoch": 16.59673024523161, + "grad_norm": 8.589584350585938, + "learning_rate": 1.9045962104115738e-05, + "loss": 0.9946, + "step": 6091 + }, + { + "epoch": 16.599455040871934, + "grad_norm": 8.614899635314941, + "learning_rate": 1.9045585888334475e-05, + "loss": 0.8456, + "step": 6092 + }, + { + "epoch": 16.60217983651226, + "grad_norm": 8.168996810913086, + "learning_rate": 1.904520960210648e-05, + "loss": 1.0383, + "step": 6093 + }, + { + "epoch": 16.60490463215259, + "grad_norm": 6.833440780639648, + "learning_rate": 1.9044833245434686e-05, + "loss": 0.8608, + "step": 6094 + }, + { + "epoch": 16.607629427792915, + "grad_norm": 8.260551452636719, + "learning_rate": 1.904445681832202e-05, + "loss": 1.0952, + "step": 6095 + }, + { + "epoch": 16.61035422343324, + "grad_norm": 7.668336391448975, + "learning_rate": 1.9044080320771416e-05, + "loss": 1.1274, + "step": 6096 + }, + { + "epoch": 16.61307901907357, + "grad_norm": 6.161644458770752, + "learning_rate": 1.9043703752785804e-05, + "loss": 0.8849, + "step": 6097 + }, + { + "epoch": 16.615803814713896, + "grad_norm": 8.076497077941895, + "learning_rate": 1.9043327114368118e-05, + "loss": 0.9469, + "step": 6098 + }, + { + "epoch": 16.618528610354222, + "grad_norm": 13.970622062683105, + "learning_rate": 1.9042950405521296e-05, + "loss": 1.0378, + "step": 6099 + }, + { + "epoch": 16.62125340599455, + "grad_norm": 7.201518535614014, + "learning_rate": 1.9042573626248266e-05, + "loss": 0.9572, + "step": 6100 + }, + { + "epoch": 16.623978201634877, + "grad_norm": 9.967567443847656, + "learning_rate": 1.904219677655196e-05, + "loss": 1.0217, + "step": 6101 + }, + { + "epoch": 16.626702997275203, + "grad_norm": 7.625209808349609, + "learning_rate": 1.9041819856435318e-05, + "loss": 1.0759, + "step": 6102 + }, + { + "epoch": 16.629427792915532, + "grad_norm": 8.119585037231445, + "learning_rate": 1.9041442865901276e-05, + "loss": 1.0013, + "step": 6103 + }, + { + "epoch": 16.632152588555858, + "grad_norm": 8.203313827514648, + "learning_rate": 1.9041065804952764e-05, + "loss": 1.0774, + "step": 6104 + }, + { + "epoch": 16.634877384196184, + "grad_norm": 10.273894309997559, + "learning_rate": 1.9040688673592725e-05, + "loss": 1.0244, + "step": 6105 + }, + { + "epoch": 16.637602179836513, + "grad_norm": 6.8131103515625, + "learning_rate": 1.9040311471824092e-05, + "loss": 0.97, + "step": 6106 + }, + { + "epoch": 16.64032697547684, + "grad_norm": 10.750165939331055, + "learning_rate": 1.903993419964981e-05, + "loss": 1.0129, + "step": 6107 + }, + { + "epoch": 16.643051771117165, + "grad_norm": 8.18924331665039, + "learning_rate": 1.9039556857072808e-05, + "loss": 0.959, + "step": 6108 + }, + { + "epoch": 16.645776566757494, + "grad_norm": 7.18798303604126, + "learning_rate": 1.9039179444096025e-05, + "loss": 1.1155, + "step": 6109 + }, + { + "epoch": 16.64850136239782, + "grad_norm": 8.120108604431152, + "learning_rate": 1.9038801960722405e-05, + "loss": 1.0562, + "step": 6110 + }, + { + "epoch": 16.651226158038146, + "grad_norm": 9.277802467346191, + "learning_rate": 1.903842440695489e-05, + "loss": 0.9187, + "step": 6111 + }, + { + "epoch": 16.653950953678475, + "grad_norm": 9.661819458007812, + "learning_rate": 1.903804678279641e-05, + "loss": 1.0353, + "step": 6112 + }, + { + "epoch": 16.6566757493188, + "grad_norm": 7.471489906311035, + "learning_rate": 1.903766908824992e-05, + "loss": 0.9988, + "step": 6113 + }, + { + "epoch": 16.659400544959126, + "grad_norm": 8.371833801269531, + "learning_rate": 1.9037291323318348e-05, + "loss": 0.9868, + "step": 6114 + }, + { + "epoch": 16.662125340599456, + "grad_norm": 7.713346004486084, + "learning_rate": 1.9036913488004646e-05, + "loss": 0.8154, + "step": 6115 + }, + { + "epoch": 16.66485013623978, + "grad_norm": 7.333027362823486, + "learning_rate": 1.903653558231175e-05, + "loss": 1.0903, + "step": 6116 + }, + { + "epoch": 16.667574931880107, + "grad_norm": 7.406708717346191, + "learning_rate": 1.9036157606242603e-05, + "loss": 0.9045, + "step": 6117 + }, + { + "epoch": 16.670299727520437, + "grad_norm": 10.05079174041748, + "learning_rate": 1.903577955980016e-05, + "loss": 1.0574, + "step": 6118 + }, + { + "epoch": 16.673024523160763, + "grad_norm": 7.7181878089904785, + "learning_rate": 1.903540144298735e-05, + "loss": 1.1055, + "step": 6119 + }, + { + "epoch": 16.67574931880109, + "grad_norm": 8.098625183105469, + "learning_rate": 1.9035023255807124e-05, + "loss": 0.8563, + "step": 6120 + }, + { + "epoch": 16.678474114441418, + "grad_norm": 8.74626636505127, + "learning_rate": 1.903464499826243e-05, + "loss": 0.9667, + "step": 6121 + }, + { + "epoch": 16.681198910081743, + "grad_norm": 8.023555755615234, + "learning_rate": 1.903426667035621e-05, + "loss": 0.8154, + "step": 6122 + }, + { + "epoch": 16.68392370572207, + "grad_norm": 9.104249954223633, + "learning_rate": 1.9033888272091416e-05, + "loss": 0.967, + "step": 6123 + }, + { + "epoch": 16.6866485013624, + "grad_norm": 8.570528030395508, + "learning_rate": 1.9033509803470986e-05, + "loss": 1.1956, + "step": 6124 + }, + { + "epoch": 16.689373297002724, + "grad_norm": 8.387625694274902, + "learning_rate": 1.9033131264497876e-05, + "loss": 1.1216, + "step": 6125 + }, + { + "epoch": 16.69209809264305, + "grad_norm": 6.991154193878174, + "learning_rate": 1.9032752655175025e-05, + "loss": 0.9769, + "step": 6126 + }, + { + "epoch": 16.69482288828338, + "grad_norm": 8.776601791381836, + "learning_rate": 1.9032373975505393e-05, + "loss": 1.0464, + "step": 6127 + }, + { + "epoch": 16.697547683923705, + "grad_norm": 9.082233428955078, + "learning_rate": 1.903199522549192e-05, + "loss": 0.864, + "step": 6128 + }, + { + "epoch": 16.70027247956403, + "grad_norm": 10.216814994812012, + "learning_rate": 1.9031616405137563e-05, + "loss": 1.1111, + "step": 6129 + }, + { + "epoch": 16.70299727520436, + "grad_norm": 8.663824081420898, + "learning_rate": 1.9031237514445264e-05, + "loss": 0.897, + "step": 6130 + }, + { + "epoch": 16.705722070844686, + "grad_norm": 8.798577308654785, + "learning_rate": 1.9030858553417978e-05, + "loss": 0.8569, + "step": 6131 + }, + { + "epoch": 16.708446866485012, + "grad_norm": 9.070158958435059, + "learning_rate": 1.9030479522058656e-05, + "loss": 1.0791, + "step": 6132 + }, + { + "epoch": 16.71117166212534, + "grad_norm": 8.712905883789062, + "learning_rate": 1.9030100420370254e-05, + "loss": 0.8652, + "step": 6133 + }, + { + "epoch": 16.713896457765667, + "grad_norm": 8.393935203552246, + "learning_rate": 1.9029721248355718e-05, + "loss": 0.9224, + "step": 6134 + }, + { + "epoch": 16.716621253405993, + "grad_norm": 7.922507286071777, + "learning_rate": 1.9029342006018002e-05, + "loss": 0.8901, + "step": 6135 + }, + { + "epoch": 16.719346049046322, + "grad_norm": 8.726856231689453, + "learning_rate": 1.9028962693360062e-05, + "loss": 1.0376, + "step": 6136 + }, + { + "epoch": 16.722070844686648, + "grad_norm": 7.232251167297363, + "learning_rate": 1.9028583310384852e-05, + "loss": 0.8041, + "step": 6137 + }, + { + "epoch": 16.724795640326974, + "grad_norm": 8.879591941833496, + "learning_rate": 1.9028203857095326e-05, + "loss": 1.2061, + "step": 6138 + }, + { + "epoch": 16.727520435967303, + "grad_norm": 8.938133239746094, + "learning_rate": 1.902782433349444e-05, + "loss": 0.9741, + "step": 6139 + }, + { + "epoch": 16.73024523160763, + "grad_norm": 9.896289825439453, + "learning_rate": 1.9027444739585145e-05, + "loss": 0.905, + "step": 6140 + }, + { + "epoch": 16.732970027247955, + "grad_norm": 8.938760757446289, + "learning_rate": 1.9027065075370405e-05, + "loss": 0.8906, + "step": 6141 + }, + { + "epoch": 16.735694822888284, + "grad_norm": 7.5377984046936035, + "learning_rate": 1.9026685340853167e-05, + "loss": 0.8879, + "step": 6142 + }, + { + "epoch": 16.73841961852861, + "grad_norm": 8.72514533996582, + "learning_rate": 1.90263055360364e-05, + "loss": 1.0676, + "step": 6143 + }, + { + "epoch": 16.741144414168936, + "grad_norm": 8.462060928344727, + "learning_rate": 1.9025925660923053e-05, + "loss": 1.0444, + "step": 6144 + }, + { + "epoch": 16.743869209809265, + "grad_norm": 8.33977222442627, + "learning_rate": 1.902554571551609e-05, + "loss": 0.8572, + "step": 6145 + }, + { + "epoch": 16.74659400544959, + "grad_norm": 8.435555458068848, + "learning_rate": 1.902516569981846e-05, + "loss": 1.0098, + "step": 6146 + }, + { + "epoch": 16.749318801089917, + "grad_norm": 8.936212539672852, + "learning_rate": 1.902478561383314e-05, + "loss": 0.9421, + "step": 6147 + }, + { + "epoch": 16.752043596730246, + "grad_norm": 7.517622947692871, + "learning_rate": 1.9024405457563072e-05, + "loss": 0.9481, + "step": 6148 + }, + { + "epoch": 16.754768392370572, + "grad_norm": 8.736359596252441, + "learning_rate": 1.902402523101123e-05, + "loss": 1.2015, + "step": 6149 + }, + { + "epoch": 16.757493188010898, + "grad_norm": 9.770566940307617, + "learning_rate": 1.9023644934180568e-05, + "loss": 0.8751, + "step": 6150 + }, + { + "epoch": 16.760217983651227, + "grad_norm": 6.670861721038818, + "learning_rate": 1.902326456707405e-05, + "loss": 0.9161, + "step": 6151 + }, + { + "epoch": 16.762942779291553, + "grad_norm": 10.840482711791992, + "learning_rate": 1.902288412969464e-05, + "loss": 0.8964, + "step": 6152 + }, + { + "epoch": 16.76566757493188, + "grad_norm": 8.162219047546387, + "learning_rate": 1.9022503622045297e-05, + "loss": 0.9651, + "step": 6153 + }, + { + "epoch": 16.768392370572208, + "grad_norm": 10.338919639587402, + "learning_rate": 1.9022123044128985e-05, + "loss": 1.0435, + "step": 6154 + }, + { + "epoch": 16.771117166212534, + "grad_norm": 7.12001371383667, + "learning_rate": 1.9021742395948668e-05, + "loss": 0.944, + "step": 6155 + }, + { + "epoch": 16.77384196185286, + "grad_norm": 8.560159683227539, + "learning_rate": 1.9021361677507316e-05, + "loss": 1.1262, + "step": 6156 + }, + { + "epoch": 16.77656675749319, + "grad_norm": 18.946989059448242, + "learning_rate": 1.902098088880789e-05, + "loss": 0.8376, + "step": 6157 + }, + { + "epoch": 16.779291553133515, + "grad_norm": 9.131311416625977, + "learning_rate": 1.902060002985335e-05, + "loss": 0.9604, + "step": 6158 + }, + { + "epoch": 16.78201634877384, + "grad_norm": 7.698740005493164, + "learning_rate": 1.9020219100646667e-05, + "loss": 0.9002, + "step": 6159 + }, + { + "epoch": 16.78474114441417, + "grad_norm": 14.020658493041992, + "learning_rate": 1.9019838101190812e-05, + "loss": 1.1304, + "step": 6160 + }, + { + "epoch": 16.787465940054496, + "grad_norm": 17.247962951660156, + "learning_rate": 1.9019457031488747e-05, + "loss": 0.9744, + "step": 6161 + }, + { + "epoch": 16.79019073569482, + "grad_norm": 9.009391784667969, + "learning_rate": 1.901907589154344e-05, + "loss": 0.786, + "step": 6162 + }, + { + "epoch": 16.79291553133515, + "grad_norm": 11.710041999816895, + "learning_rate": 1.9018694681357865e-05, + "loss": 1.1375, + "step": 6163 + }, + { + "epoch": 16.795640326975477, + "grad_norm": 8.075738906860352, + "learning_rate": 1.901831340093498e-05, + "loss": 0.9253, + "step": 6164 + }, + { + "epoch": 16.798365122615802, + "grad_norm": 8.50547981262207, + "learning_rate": 1.9017932050277762e-05, + "loss": 0.9177, + "step": 6165 + }, + { + "epoch": 16.80108991825613, + "grad_norm": 8.390825271606445, + "learning_rate": 1.901755062938918e-05, + "loss": 0.9508, + "step": 6166 + }, + { + "epoch": 16.803814713896458, + "grad_norm": 7.8770599365234375, + "learning_rate": 1.9017169138272203e-05, + "loss": 0.9116, + "step": 6167 + }, + { + "epoch": 16.806539509536783, + "grad_norm": 7.977993011474609, + "learning_rate": 1.9016787576929805e-05, + "loss": 0.9384, + "step": 6168 + }, + { + "epoch": 16.809264305177113, + "grad_norm": 8.234292984008789, + "learning_rate": 1.901640594536495e-05, + "loss": 0.9983, + "step": 6169 + }, + { + "epoch": 16.81198910081744, + "grad_norm": 16.994550704956055, + "learning_rate": 1.9016024243580626e-05, + "loss": 0.8649, + "step": 6170 + }, + { + "epoch": 16.814713896457764, + "grad_norm": 7.928983211517334, + "learning_rate": 1.9015642471579786e-05, + "loss": 1.0641, + "step": 6171 + }, + { + "epoch": 16.817438692098094, + "grad_norm": 6.782833576202393, + "learning_rate": 1.9015260629365417e-05, + "loss": 0.978, + "step": 6172 + }, + { + "epoch": 16.82016348773842, + "grad_norm": 7.612330436706543, + "learning_rate": 1.9014878716940487e-05, + "loss": 0.9536, + "step": 6173 + }, + { + "epoch": 16.822888283378745, + "grad_norm": 9.662505149841309, + "learning_rate": 1.9014496734307974e-05, + "loss": 0.8308, + "step": 6174 + }, + { + "epoch": 16.825613079019075, + "grad_norm": 9.241847038269043, + "learning_rate": 1.9014114681470847e-05, + "loss": 1.126, + "step": 6175 + }, + { + "epoch": 16.8283378746594, + "grad_norm": 11.356974601745605, + "learning_rate": 1.9013732558432086e-05, + "loss": 1.1019, + "step": 6176 + }, + { + "epoch": 16.831062670299726, + "grad_norm": 8.605137825012207, + "learning_rate": 1.901335036519467e-05, + "loss": 0.9619, + "step": 6177 + }, + { + "epoch": 16.833787465940055, + "grad_norm": 9.019730567932129, + "learning_rate": 1.9012968101761567e-05, + "loss": 1.014, + "step": 6178 + }, + { + "epoch": 16.83651226158038, + "grad_norm": 8.747864723205566, + "learning_rate": 1.901258576813576e-05, + "loss": 1.1597, + "step": 6179 + }, + { + "epoch": 16.839237057220707, + "grad_norm": 8.210248947143555, + "learning_rate": 1.9012203364320223e-05, + "loss": 0.9534, + "step": 6180 + }, + { + "epoch": 16.841961852861036, + "grad_norm": 8.457579612731934, + "learning_rate": 1.901182089031794e-05, + "loss": 0.9187, + "step": 6181 + }, + { + "epoch": 16.844686648501362, + "grad_norm": 7.20169734954834, + "learning_rate": 1.9011438346131882e-05, + "loss": 0.9009, + "step": 6182 + }, + { + "epoch": 16.847411444141688, + "grad_norm": 7.486141681671143, + "learning_rate": 1.9011055731765036e-05, + "loss": 0.894, + "step": 6183 + }, + { + "epoch": 16.850136239782017, + "grad_norm": 7.9857177734375, + "learning_rate": 1.9010673047220373e-05, + "loss": 1.1331, + "step": 6184 + }, + { + "epoch": 16.852861035422343, + "grad_norm": 11.257291793823242, + "learning_rate": 1.9010290292500883e-05, + "loss": 0.9967, + "step": 6185 + }, + { + "epoch": 16.85558583106267, + "grad_norm": 8.070331573486328, + "learning_rate": 1.9009907467609544e-05, + "loss": 0.8953, + "step": 6186 + }, + { + "epoch": 16.858310626703, + "grad_norm": 7.690113067626953, + "learning_rate": 1.900952457254933e-05, + "loss": 1.0862, + "step": 6187 + }, + { + "epoch": 16.861035422343324, + "grad_norm": 8.162193298339844, + "learning_rate": 1.900914160732323e-05, + "loss": 1.0521, + "step": 6188 + }, + { + "epoch": 16.86376021798365, + "grad_norm": 8.463749885559082, + "learning_rate": 1.900875857193423e-05, + "loss": 0.9612, + "step": 6189 + }, + { + "epoch": 16.86648501362398, + "grad_norm": 7.926802158355713, + "learning_rate": 1.90083754663853e-05, + "loss": 1.0518, + "step": 6190 + }, + { + "epoch": 16.869209809264305, + "grad_norm": 9.436305046081543, + "learning_rate": 1.9007992290679437e-05, + "loss": 0.9889, + "step": 6191 + }, + { + "epoch": 16.87193460490463, + "grad_norm": 6.777631759643555, + "learning_rate": 1.900760904481962e-05, + "loss": 0.861, + "step": 6192 + }, + { + "epoch": 16.87465940054496, + "grad_norm": 6.63100528717041, + "learning_rate": 1.900722572880883e-05, + "loss": 0.9363, + "step": 6193 + }, + { + "epoch": 16.877384196185286, + "grad_norm": 9.927841186523438, + "learning_rate": 1.900684234265006e-05, + "loss": 1.0352, + "step": 6194 + }, + { + "epoch": 16.88010899182561, + "grad_norm": 9.591605186462402, + "learning_rate": 1.900645888634629e-05, + "loss": 1.0769, + "step": 6195 + }, + { + "epoch": 16.88283378746594, + "grad_norm": 8.075156211853027, + "learning_rate": 1.9006075359900507e-05, + "loss": 0.8705, + "step": 6196 + }, + { + "epoch": 16.885558583106267, + "grad_norm": 8.7380952835083, + "learning_rate": 1.9005691763315703e-05, + "loss": 0.8654, + "step": 6197 + }, + { + "epoch": 16.888283378746593, + "grad_norm": 9.685803413391113, + "learning_rate": 1.9005308096594856e-05, + "loss": 0.9965, + "step": 6198 + }, + { + "epoch": 16.891008174386922, + "grad_norm": 9.106147766113281, + "learning_rate": 1.9004924359740965e-05, + "loss": 0.9927, + "step": 6199 + }, + { + "epoch": 16.893732970027248, + "grad_norm": 9.183213233947754, + "learning_rate": 1.9004540552757008e-05, + "loss": 0.9373, + "step": 6200 + }, + { + "epoch": 16.896457765667574, + "grad_norm": 10.00035572052002, + "learning_rate": 1.900415667564598e-05, + "loss": 1.0916, + "step": 6201 + }, + { + "epoch": 16.899182561307903, + "grad_norm": 7.394097805023193, + "learning_rate": 1.900377272841087e-05, + "loss": 0.856, + "step": 6202 + }, + { + "epoch": 16.90190735694823, + "grad_norm": 8.062369346618652, + "learning_rate": 1.900338871105467e-05, + "loss": 1.0668, + "step": 6203 + }, + { + "epoch": 16.904632152588555, + "grad_norm": 9.141656875610352, + "learning_rate": 1.9003004623580365e-05, + "loss": 1.0283, + "step": 6204 + }, + { + "epoch": 16.907356948228884, + "grad_norm": 9.296113967895508, + "learning_rate": 1.9002620465990952e-05, + "loss": 0.9728, + "step": 6205 + }, + { + "epoch": 16.91008174386921, + "grad_norm": 7.998512268066406, + "learning_rate": 1.900223623828942e-05, + "loss": 0.99, + "step": 6206 + }, + { + "epoch": 16.912806539509535, + "grad_norm": 6.6857829093933105, + "learning_rate": 1.9001851940478765e-05, + "loss": 0.9277, + "step": 6207 + }, + { + "epoch": 16.915531335149865, + "grad_norm": 8.054292678833008, + "learning_rate": 1.9001467572561974e-05, + "loss": 1.0079, + "step": 6208 + }, + { + "epoch": 16.91825613079019, + "grad_norm": 7.670961380004883, + "learning_rate": 1.900108313454204e-05, + "loss": 0.8792, + "step": 6209 + }, + { + "epoch": 16.920980926430516, + "grad_norm": 12.54238510131836, + "learning_rate": 1.9000698626421966e-05, + "loss": 1.0015, + "step": 6210 + }, + { + "epoch": 16.923705722070846, + "grad_norm": 8.54481029510498, + "learning_rate": 1.9000314048204736e-05, + "loss": 0.9761, + "step": 6211 + }, + { + "epoch": 16.92643051771117, + "grad_norm": 7.279057025909424, + "learning_rate": 1.899992939989335e-05, + "loss": 1.0864, + "step": 6212 + }, + { + "epoch": 16.929155313351497, + "grad_norm": 11.931070327758789, + "learning_rate": 1.8999544681490807e-05, + "loss": 0.9958, + "step": 6213 + }, + { + "epoch": 16.931880108991827, + "grad_norm": 8.158348083496094, + "learning_rate": 1.89991598930001e-05, + "loss": 0.9166, + "step": 6214 + }, + { + "epoch": 16.934604904632153, + "grad_norm": 9.551117897033691, + "learning_rate": 1.8998775034424222e-05, + "loss": 1.1122, + "step": 6215 + }, + { + "epoch": 16.93732970027248, + "grad_norm": 8.071077346801758, + "learning_rate": 1.8998390105766175e-05, + "loss": 0.8949, + "step": 6216 + }, + { + "epoch": 16.940054495912808, + "grad_norm": 8.414925575256348, + "learning_rate": 1.8998005107028956e-05, + "loss": 0.8184, + "step": 6217 + }, + { + "epoch": 16.942779291553133, + "grad_norm": 8.011565208435059, + "learning_rate": 1.8997620038215562e-05, + "loss": 0.9697, + "step": 6218 + }, + { + "epoch": 16.94550408719346, + "grad_norm": 15.543701171875, + "learning_rate": 1.8997234899328997e-05, + "loss": 0.9996, + "step": 6219 + }, + { + "epoch": 16.94822888283379, + "grad_norm": 18.687339782714844, + "learning_rate": 1.899684969037225e-05, + "loss": 0.816, + "step": 6220 + }, + { + "epoch": 16.950953678474114, + "grad_norm": 9.535623550415039, + "learning_rate": 1.899646441134833e-05, + "loss": 0.9839, + "step": 6221 + }, + { + "epoch": 16.95367847411444, + "grad_norm": 9.265975952148438, + "learning_rate": 1.8996079062260234e-05, + "loss": 1.0645, + "step": 6222 + }, + { + "epoch": 16.95640326975477, + "grad_norm": 8.745752334594727, + "learning_rate": 1.8995693643110964e-05, + "loss": 1.0349, + "step": 6223 + }, + { + "epoch": 16.959128065395095, + "grad_norm": 7.420135498046875, + "learning_rate": 1.899530815390352e-05, + "loss": 0.8781, + "step": 6224 + }, + { + "epoch": 16.96185286103542, + "grad_norm": 8.341424942016602, + "learning_rate": 1.8994922594640907e-05, + "loss": 0.9097, + "step": 6225 + }, + { + "epoch": 16.96457765667575, + "grad_norm": 7.917690753936768, + "learning_rate": 1.899453696532613e-05, + "loss": 1.1034, + "step": 6226 + }, + { + "epoch": 16.967302452316076, + "grad_norm": 8.074682235717773, + "learning_rate": 1.8994151265962184e-05, + "loss": 1.0903, + "step": 6227 + }, + { + "epoch": 16.970027247956402, + "grad_norm": 7.362932205200195, + "learning_rate": 1.8993765496552078e-05, + "loss": 0.9917, + "step": 6228 + }, + { + "epoch": 16.97275204359673, + "grad_norm": 8.595783233642578, + "learning_rate": 1.8993379657098815e-05, + "loss": 0.8716, + "step": 6229 + }, + { + "epoch": 16.975476839237057, + "grad_norm": 9.306862831115723, + "learning_rate": 1.89929937476054e-05, + "loss": 0.9995, + "step": 6230 + }, + { + "epoch": 16.978201634877383, + "grad_norm": 8.560187339782715, + "learning_rate": 1.899260776807484e-05, + "loss": 1.1692, + "step": 6231 + }, + { + "epoch": 16.980926430517712, + "grad_norm": 20.176673889160156, + "learning_rate": 1.8992221718510143e-05, + "loss": 0.8344, + "step": 6232 + }, + { + "epoch": 16.983651226158038, + "grad_norm": 8.303386688232422, + "learning_rate": 1.8991835598914313e-05, + "loss": 1.0613, + "step": 6233 + }, + { + "epoch": 16.986376021798364, + "grad_norm": 9.151183128356934, + "learning_rate": 1.8991449409290355e-05, + "loss": 1.098, + "step": 6234 + }, + { + "epoch": 16.989100817438693, + "grad_norm": 7.211446285247803, + "learning_rate": 1.8991063149641276e-05, + "loss": 1.0529, + "step": 6235 + }, + { + "epoch": 16.99182561307902, + "grad_norm": 9.654312133789062, + "learning_rate": 1.8990676819970087e-05, + "loss": 1.0745, + "step": 6236 + }, + { + "epoch": 16.994550408719345, + "grad_norm": 7.851251602172852, + "learning_rate": 1.89902904202798e-05, + "loss": 0.7695, + "step": 6237 + }, + { + "epoch": 16.997275204359674, + "grad_norm": 9.32390022277832, + "learning_rate": 1.8989903950573422e-05, + "loss": 1.0144, + "step": 6238 + }, + { + "epoch": 17.0, + "grad_norm": 8.421369552612305, + "learning_rate": 1.8989517410853956e-05, + "loss": 0.8492, + "step": 6239 + }, + { + "epoch": 17.002724795640326, + "grad_norm": 10.002796173095703, + "learning_rate": 1.898913080112442e-05, + "loss": 0.9569, + "step": 6240 + }, + { + "epoch": 17.005449591280655, + "grad_norm": 13.980656623840332, + "learning_rate": 1.898874412138782e-05, + "loss": 0.9341, + "step": 6241 + }, + { + "epoch": 17.00817438692098, + "grad_norm": 7.3156561851501465, + "learning_rate": 1.8988357371647173e-05, + "loss": 0.8428, + "step": 6242 + }, + { + "epoch": 17.010899182561307, + "grad_norm": 7.414515018463135, + "learning_rate": 1.898797055190549e-05, + "loss": 0.8074, + "step": 6243 + }, + { + "epoch": 17.013623978201636, + "grad_norm": 8.65429401397705, + "learning_rate": 1.8987583662165775e-05, + "loss": 0.7615, + "step": 6244 + }, + { + "epoch": 17.016348773841962, + "grad_norm": 7.639221668243408, + "learning_rate": 1.8987196702431053e-05, + "loss": 0.7936, + "step": 6245 + }, + { + "epoch": 17.019073569482288, + "grad_norm": 7.511865615844727, + "learning_rate": 1.8986809672704328e-05, + "loss": 0.7023, + "step": 6246 + }, + { + "epoch": 17.021798365122617, + "grad_norm": 6.386614799499512, + "learning_rate": 1.8986422572988626e-05, + "loss": 0.8512, + "step": 6247 + }, + { + "epoch": 17.024523160762943, + "grad_norm": 8.6180419921875, + "learning_rate": 1.8986035403286948e-05, + "loss": 1.0215, + "step": 6248 + }, + { + "epoch": 17.02724795640327, + "grad_norm": 9.61176872253418, + "learning_rate": 1.8985648163602318e-05, + "loss": 0.9308, + "step": 6249 + }, + { + "epoch": 17.029972752043598, + "grad_norm": 7.482372283935547, + "learning_rate": 1.898526085393775e-05, + "loss": 0.9282, + "step": 6250 + }, + { + "epoch": 17.032697547683924, + "grad_norm": 8.454015731811523, + "learning_rate": 1.8984873474296256e-05, + "loss": 0.7462, + "step": 6251 + }, + { + "epoch": 17.03542234332425, + "grad_norm": 7.860104560852051, + "learning_rate": 1.898448602468086e-05, + "loss": 0.9888, + "step": 6252 + }, + { + "epoch": 17.03814713896458, + "grad_norm": 8.912753105163574, + "learning_rate": 1.8984098505094574e-05, + "loss": 0.6791, + "step": 6253 + }, + { + "epoch": 17.040871934604905, + "grad_norm": 8.656185150146484, + "learning_rate": 1.898371091554042e-05, + "loss": 0.8683, + "step": 6254 + }, + { + "epoch": 17.04359673024523, + "grad_norm": 7.228968143463135, + "learning_rate": 1.8983323256021412e-05, + "loss": 0.8091, + "step": 6255 + }, + { + "epoch": 17.04632152588556, + "grad_norm": 7.749083995819092, + "learning_rate": 1.8982935526540572e-05, + "loss": 0.901, + "step": 6256 + }, + { + "epoch": 17.049046321525886, + "grad_norm": 8.07095718383789, + "learning_rate": 1.898254772710092e-05, + "loss": 0.8671, + "step": 6257 + }, + { + "epoch": 17.05177111716621, + "grad_norm": 8.128870010375977, + "learning_rate": 1.8982159857705475e-05, + "loss": 0.8062, + "step": 6258 + }, + { + "epoch": 17.05449591280654, + "grad_norm": 8.751575469970703, + "learning_rate": 1.8981771918357257e-05, + "loss": 0.9467, + "step": 6259 + }, + { + "epoch": 17.057220708446867, + "grad_norm": 6.564663410186768, + "learning_rate": 1.898138390905929e-05, + "loss": 1.0685, + "step": 6260 + }, + { + "epoch": 17.059945504087192, + "grad_norm": 11.437712669372559, + "learning_rate": 1.8980995829814593e-05, + "loss": 1.0762, + "step": 6261 + }, + { + "epoch": 17.06267029972752, + "grad_norm": 9.941190719604492, + "learning_rate": 1.8980607680626194e-05, + "loss": 0.713, + "step": 6262 + }, + { + "epoch": 17.065395095367847, + "grad_norm": 8.763118743896484, + "learning_rate": 1.8980219461497106e-05, + "loss": 0.7267, + "step": 6263 + }, + { + "epoch": 17.068119891008173, + "grad_norm": 8.583393096923828, + "learning_rate": 1.8979831172430364e-05, + "loss": 0.9388, + "step": 6264 + }, + { + "epoch": 17.070844686648503, + "grad_norm": 10.55490779876709, + "learning_rate": 1.897944281342898e-05, + "loss": 0.8036, + "step": 6265 + }, + { + "epoch": 17.07356948228883, + "grad_norm": 6.606943130493164, + "learning_rate": 1.8979054384495987e-05, + "loss": 0.8143, + "step": 6266 + }, + { + "epoch": 17.076294277929154, + "grad_norm": 8.044092178344727, + "learning_rate": 1.8978665885634406e-05, + "loss": 0.8848, + "step": 6267 + }, + { + "epoch": 17.079019073569484, + "grad_norm": 8.02966594696045, + "learning_rate": 1.8978277316847265e-05, + "loss": 0.8705, + "step": 6268 + }, + { + "epoch": 17.08174386920981, + "grad_norm": 7.176367282867432, + "learning_rate": 1.897788867813759e-05, + "loss": 0.874, + "step": 6269 + }, + { + "epoch": 17.084468664850135, + "grad_norm": 8.880574226379395, + "learning_rate": 1.8977499969508405e-05, + "loss": 0.9612, + "step": 6270 + }, + { + "epoch": 17.087193460490465, + "grad_norm": 8.524381637573242, + "learning_rate": 1.897711119096274e-05, + "loss": 0.7632, + "step": 6271 + }, + { + "epoch": 17.08991825613079, + "grad_norm": 7.7911810874938965, + "learning_rate": 1.897672234250362e-05, + "loss": 0.8545, + "step": 6272 + }, + { + "epoch": 17.092643051771116, + "grad_norm": 6.824251174926758, + "learning_rate": 1.897633342413408e-05, + "loss": 0.7018, + "step": 6273 + }, + { + "epoch": 17.095367847411445, + "grad_norm": 8.821577072143555, + "learning_rate": 1.897594443585714e-05, + "loss": 0.916, + "step": 6274 + }, + { + "epoch": 17.09809264305177, + "grad_norm": 10.299895286560059, + "learning_rate": 1.8975555377675835e-05, + "loss": 0.8342, + "step": 6275 + }, + { + "epoch": 17.100817438692097, + "grad_norm": 17.8612117767334, + "learning_rate": 1.8975166249593194e-05, + "loss": 0.8192, + "step": 6276 + }, + { + "epoch": 17.103542234332426, + "grad_norm": 8.529385566711426, + "learning_rate": 1.897477705161225e-05, + "loss": 0.858, + "step": 6277 + }, + { + "epoch": 17.106267029972752, + "grad_norm": 6.327038288116455, + "learning_rate": 1.8974387783736022e-05, + "loss": 0.9072, + "step": 6278 + }, + { + "epoch": 17.108991825613078, + "grad_norm": 7.227954864501953, + "learning_rate": 1.897399844596756e-05, + "loss": 0.9475, + "step": 6279 + }, + { + "epoch": 17.111716621253407, + "grad_norm": 8.278307914733887, + "learning_rate": 1.8973609038309883e-05, + "loss": 0.8021, + "step": 6280 + }, + { + "epoch": 17.114441416893733, + "grad_norm": 8.912012100219727, + "learning_rate": 1.897321956076603e-05, + "loss": 0.8528, + "step": 6281 + }, + { + "epoch": 17.11716621253406, + "grad_norm": 8.555465698242188, + "learning_rate": 1.897283001333903e-05, + "loss": 0.7938, + "step": 6282 + }, + { + "epoch": 17.11989100817439, + "grad_norm": 11.952853202819824, + "learning_rate": 1.8972440396031916e-05, + "loss": 0.96, + "step": 6283 + }, + { + "epoch": 17.122615803814714, + "grad_norm": 7.701216220855713, + "learning_rate": 1.897205070884773e-05, + "loss": 0.8625, + "step": 6284 + }, + { + "epoch": 17.12534059945504, + "grad_norm": 9.567951202392578, + "learning_rate": 1.89716609517895e-05, + "loss": 1.071, + "step": 6285 + }, + { + "epoch": 17.12806539509537, + "grad_norm": 7.93927526473999, + "learning_rate": 1.8971271124860263e-05, + "loss": 1.0347, + "step": 6286 + }, + { + "epoch": 17.130790190735695, + "grad_norm": 8.100805282592773, + "learning_rate": 1.8970881228063055e-05, + "loss": 0.7579, + "step": 6287 + }, + { + "epoch": 17.13351498637602, + "grad_norm": 8.478625297546387, + "learning_rate": 1.8970491261400913e-05, + "loss": 0.9678, + "step": 6288 + }, + { + "epoch": 17.13623978201635, + "grad_norm": 8.492572784423828, + "learning_rate": 1.8970101224876872e-05, + "loss": 0.8484, + "step": 6289 + }, + { + "epoch": 17.138964577656676, + "grad_norm": 8.242562294006348, + "learning_rate": 1.8969711118493976e-05, + "loss": 0.9191, + "step": 6290 + }, + { + "epoch": 17.141689373297, + "grad_norm": 9.903480529785156, + "learning_rate": 1.8969320942255252e-05, + "loss": 0.9205, + "step": 6291 + }, + { + "epoch": 17.14441416893733, + "grad_norm": 8.240567207336426, + "learning_rate": 1.896893069616375e-05, + "loss": 0.8055, + "step": 6292 + }, + { + "epoch": 17.147138964577657, + "grad_norm": 9.593177795410156, + "learning_rate": 1.89685403802225e-05, + "loss": 1.0905, + "step": 6293 + }, + { + "epoch": 17.149863760217983, + "grad_norm": 7.517264366149902, + "learning_rate": 1.8968149994434552e-05, + "loss": 0.8064, + "step": 6294 + }, + { + "epoch": 17.152588555858312, + "grad_norm": 8.686984062194824, + "learning_rate": 1.896775953880294e-05, + "loss": 0.9446, + "step": 6295 + }, + { + "epoch": 17.155313351498638, + "grad_norm": 8.225557327270508, + "learning_rate": 1.8967369013330702e-05, + "loss": 0.8792, + "step": 6296 + }, + { + "epoch": 17.158038147138964, + "grad_norm": 8.14830493927002, + "learning_rate": 1.8966978418020883e-05, + "loss": 0.924, + "step": 6297 + }, + { + "epoch": 17.160762942779293, + "grad_norm": 7.562781810760498, + "learning_rate": 1.8966587752876524e-05, + "loss": 0.895, + "step": 6298 + }, + { + "epoch": 17.16348773841962, + "grad_norm": 8.645089149475098, + "learning_rate": 1.8966197017900672e-05, + "loss": 0.9468, + "step": 6299 + }, + { + "epoch": 17.166212534059945, + "grad_norm": 10.737967491149902, + "learning_rate": 1.8965806213096363e-05, + "loss": 0.8529, + "step": 6300 + }, + { + "epoch": 17.168937329700274, + "grad_norm": 9.399730682373047, + "learning_rate": 1.8965415338466645e-05, + "loss": 0.9579, + "step": 6301 + }, + { + "epoch": 17.1716621253406, + "grad_norm": 7.219324588775635, + "learning_rate": 1.896502439401456e-05, + "loss": 0.8975, + "step": 6302 + }, + { + "epoch": 17.174386920980925, + "grad_norm": 9.04008960723877, + "learning_rate": 1.8964633379743154e-05, + "loss": 0.927, + "step": 6303 + }, + { + "epoch": 17.177111716621255, + "grad_norm": 7.370367527008057, + "learning_rate": 1.8964242295655473e-05, + "loss": 0.7427, + "step": 6304 + }, + { + "epoch": 17.17983651226158, + "grad_norm": 9.304048538208008, + "learning_rate": 1.8963851141754558e-05, + "loss": 1.1201, + "step": 6305 + }, + { + "epoch": 17.182561307901906, + "grad_norm": 7.377665042877197, + "learning_rate": 1.8963459918043463e-05, + "loss": 0.9453, + "step": 6306 + }, + { + "epoch": 17.185286103542236, + "grad_norm": 7.910454273223877, + "learning_rate": 1.896306862452523e-05, + "loss": 0.7621, + "step": 6307 + }, + { + "epoch": 17.18801089918256, + "grad_norm": 10.67541790008545, + "learning_rate": 1.8962677261202905e-05, + "loss": 1.0029, + "step": 6308 + }, + { + "epoch": 17.190735694822887, + "grad_norm": 9.604737281799316, + "learning_rate": 1.896228582807954e-05, + "loss": 0.876, + "step": 6309 + }, + { + "epoch": 17.193460490463217, + "grad_norm": 10.053817749023438, + "learning_rate": 1.896189432515818e-05, + "loss": 0.8694, + "step": 6310 + }, + { + "epoch": 17.196185286103542, + "grad_norm": 9.115626335144043, + "learning_rate": 1.8961502752441875e-05, + "loss": 0.9108, + "step": 6311 + }, + { + "epoch": 17.19891008174387, + "grad_norm": 7.803097724914551, + "learning_rate": 1.8961111109933673e-05, + "loss": 1.002, + "step": 6312 + }, + { + "epoch": 17.201634877384198, + "grad_norm": 9.898059844970703, + "learning_rate": 1.896071939763663e-05, + "loss": 0.9833, + "step": 6313 + }, + { + "epoch": 17.204359673024523, + "grad_norm": 9.695001602172852, + "learning_rate": 1.8960327615553794e-05, + "loss": 0.8746, + "step": 6314 + }, + { + "epoch": 17.20708446866485, + "grad_norm": 7.691354274749756, + "learning_rate": 1.8959935763688212e-05, + "loss": 0.991, + "step": 6315 + }, + { + "epoch": 17.20980926430518, + "grad_norm": 9.531713485717773, + "learning_rate": 1.895954384204294e-05, + "loss": 0.8604, + "step": 6316 + }, + { + "epoch": 17.212534059945504, + "grad_norm": 8.945476531982422, + "learning_rate": 1.8959151850621025e-05, + "loss": 0.9231, + "step": 6317 + }, + { + "epoch": 17.21525885558583, + "grad_norm": 8.44931411743164, + "learning_rate": 1.895875978942553e-05, + "loss": 0.9095, + "step": 6318 + }, + { + "epoch": 17.21798365122616, + "grad_norm": 12.240138053894043, + "learning_rate": 1.8958367658459494e-05, + "loss": 0.8, + "step": 6319 + }, + { + "epoch": 17.220708446866485, + "grad_norm": 9.020398139953613, + "learning_rate": 1.8957975457725985e-05, + "loss": 0.9055, + "step": 6320 + }, + { + "epoch": 17.22343324250681, + "grad_norm": 10.042925834655762, + "learning_rate": 1.895758318722805e-05, + "loss": 1.037, + "step": 6321 + }, + { + "epoch": 17.22615803814714, + "grad_norm": 10.284613609313965, + "learning_rate": 1.8957190846968747e-05, + "loss": 0.8844, + "step": 6322 + }, + { + "epoch": 17.228882833787466, + "grad_norm": 8.101875305175781, + "learning_rate": 1.895679843695113e-05, + "loss": 0.8673, + "step": 6323 + }, + { + "epoch": 17.231607629427792, + "grad_norm": 8.890040397644043, + "learning_rate": 1.8956405957178253e-05, + "loss": 1.0253, + "step": 6324 + }, + { + "epoch": 17.23433242506812, + "grad_norm": 9.763956069946289, + "learning_rate": 1.8956013407653175e-05, + "loss": 0.7611, + "step": 6325 + }, + { + "epoch": 17.237057220708447, + "grad_norm": 11.538614273071289, + "learning_rate": 1.895562078837895e-05, + "loss": 1.0217, + "step": 6326 + }, + { + "epoch": 17.239782016348773, + "grad_norm": 7.710923194885254, + "learning_rate": 1.8955228099358646e-05, + "loss": 0.9299, + "step": 6327 + }, + { + "epoch": 17.242506811989102, + "grad_norm": 7.830203056335449, + "learning_rate": 1.8954835340595305e-05, + "loss": 0.8936, + "step": 6328 + }, + { + "epoch": 17.245231607629428, + "grad_norm": 8.240415573120117, + "learning_rate": 1.8954442512092e-05, + "loss": 0.7858, + "step": 6329 + }, + { + "epoch": 17.247956403269754, + "grad_norm": 9.944801330566406, + "learning_rate": 1.8954049613851783e-05, + "loss": 1.1096, + "step": 6330 + }, + { + "epoch": 17.250681198910083, + "grad_norm": 11.277527809143066, + "learning_rate": 1.895365664587772e-05, + "loss": 1.0118, + "step": 6331 + }, + { + "epoch": 17.25340599455041, + "grad_norm": 8.25351619720459, + "learning_rate": 1.8953263608172864e-05, + "loss": 0.9305, + "step": 6332 + }, + { + "epoch": 17.256130790190735, + "grad_norm": 13.284163475036621, + "learning_rate": 1.895287050074028e-05, + "loss": 0.9869, + "step": 6333 + }, + { + "epoch": 17.258855585831064, + "grad_norm": 11.260553359985352, + "learning_rate": 1.8952477323583024e-05, + "loss": 0.864, + "step": 6334 + }, + { + "epoch": 17.26158038147139, + "grad_norm": 6.351672649383545, + "learning_rate": 1.895208407670417e-05, + "loss": 0.811, + "step": 6335 + }, + { + "epoch": 17.264305177111716, + "grad_norm": 9.822250366210938, + "learning_rate": 1.895169076010677e-05, + "loss": 0.9417, + "step": 6336 + }, + { + "epoch": 17.267029972752045, + "grad_norm": 8.968976974487305, + "learning_rate": 1.895129737379389e-05, + "loss": 1.0801, + "step": 6337 + }, + { + "epoch": 17.26975476839237, + "grad_norm": 9.320754051208496, + "learning_rate": 1.8950903917768594e-05, + "loss": 0.9358, + "step": 6338 + }, + { + "epoch": 17.272479564032697, + "grad_norm": 9.100393295288086, + "learning_rate": 1.8950510392033945e-05, + "loss": 1.0525, + "step": 6339 + }, + { + "epoch": 17.275204359673026, + "grad_norm": 10.278422355651855, + "learning_rate": 1.8950116796593013e-05, + "loss": 0.8978, + "step": 6340 + }, + { + "epoch": 17.277929155313352, + "grad_norm": 9.044394493103027, + "learning_rate": 1.894972313144886e-05, + "loss": 0.8734, + "step": 6341 + }, + { + "epoch": 17.280653950953678, + "grad_norm": 9.296480178833008, + "learning_rate": 1.8949329396604544e-05, + "loss": 0.8167, + "step": 6342 + }, + { + "epoch": 17.283378746594007, + "grad_norm": 10.087651252746582, + "learning_rate": 1.8948935592063145e-05, + "loss": 0.9, + "step": 6343 + }, + { + "epoch": 17.286103542234333, + "grad_norm": 9.543252944946289, + "learning_rate": 1.8948541717827723e-05, + "loss": 0.995, + "step": 6344 + }, + { + "epoch": 17.28882833787466, + "grad_norm": 7.406209468841553, + "learning_rate": 1.8948147773901343e-05, + "loss": 0.9407, + "step": 6345 + }, + { + "epoch": 17.291553133514988, + "grad_norm": 10.631805419921875, + "learning_rate": 1.894775376028708e-05, + "loss": 0.8137, + "step": 6346 + }, + { + "epoch": 17.294277929155314, + "grad_norm": 7.886234283447266, + "learning_rate": 1.8947359676988e-05, + "loss": 0.7477, + "step": 6347 + }, + { + "epoch": 17.29700272479564, + "grad_norm": 7.540974140167236, + "learning_rate": 1.8946965524007166e-05, + "loss": 0.8324, + "step": 6348 + }, + { + "epoch": 17.29972752043597, + "grad_norm": 8.333446502685547, + "learning_rate": 1.8946571301347654e-05, + "loss": 0.8212, + "step": 6349 + }, + { + "epoch": 17.302452316076295, + "grad_norm": 8.617403030395508, + "learning_rate": 1.894617700901253e-05, + "loss": 1.0049, + "step": 6350 + }, + { + "epoch": 17.30517711171662, + "grad_norm": 9.715551376342773, + "learning_rate": 1.894578264700487e-05, + "loss": 0.8395, + "step": 6351 + }, + { + "epoch": 17.30790190735695, + "grad_norm": 10.217767715454102, + "learning_rate": 1.8945388215327746e-05, + "loss": 0.9055, + "step": 6352 + }, + { + "epoch": 17.310626702997276, + "grad_norm": 102.19203186035156, + "learning_rate": 1.8944993713984224e-05, + "loss": 1.031, + "step": 6353 + }, + { + "epoch": 17.3133514986376, + "grad_norm": 8.108960151672363, + "learning_rate": 1.8944599142977378e-05, + "loss": 0.8411, + "step": 6354 + }, + { + "epoch": 17.31607629427793, + "grad_norm": 9.639787673950195, + "learning_rate": 1.8944204502310282e-05, + "loss": 0.9253, + "step": 6355 + }, + { + "epoch": 17.318801089918257, + "grad_norm": 8.786418914794922, + "learning_rate": 1.894380979198601e-05, + "loss": 0.9468, + "step": 6356 + }, + { + "epoch": 17.321525885558582, + "grad_norm": 9.127197265625, + "learning_rate": 1.8943415012007634e-05, + "loss": 0.9567, + "step": 6357 + }, + { + "epoch": 17.32425068119891, + "grad_norm": 9.39046859741211, + "learning_rate": 1.8943020162378228e-05, + "loss": 0.8103, + "step": 6358 + }, + { + "epoch": 17.326975476839237, + "grad_norm": 9.742119789123535, + "learning_rate": 1.8942625243100874e-05, + "loss": 0.9304, + "step": 6359 + }, + { + "epoch": 17.329700272479563, + "grad_norm": 7.917878150939941, + "learning_rate": 1.8942230254178638e-05, + "loss": 0.8494, + "step": 6360 + }, + { + "epoch": 17.332425068119893, + "grad_norm": 8.42175579071045, + "learning_rate": 1.8941835195614603e-05, + "loss": 0.9329, + "step": 6361 + }, + { + "epoch": 17.33514986376022, + "grad_norm": 10.603105545043945, + "learning_rate": 1.894144006741184e-05, + "loss": 0.9562, + "step": 6362 + }, + { + "epoch": 17.337874659400544, + "grad_norm": 8.681341171264648, + "learning_rate": 1.8941044869573433e-05, + "loss": 0.9583, + "step": 6363 + }, + { + "epoch": 17.340599455040874, + "grad_norm": 10.419084548950195, + "learning_rate": 1.8940649602102454e-05, + "loss": 0.8289, + "step": 6364 + }, + { + "epoch": 17.3433242506812, + "grad_norm": 10.981396675109863, + "learning_rate": 1.8940254265001986e-05, + "loss": 0.92, + "step": 6365 + }, + { + "epoch": 17.346049046321525, + "grad_norm": 11.663156509399414, + "learning_rate": 1.8939858858275104e-05, + "loss": 1.0793, + "step": 6366 + }, + { + "epoch": 17.348773841961854, + "grad_norm": 8.68185043334961, + "learning_rate": 1.893946338192489e-05, + "loss": 1.0023, + "step": 6367 + }, + { + "epoch": 17.35149863760218, + "grad_norm": 8.913244247436523, + "learning_rate": 1.8939067835954423e-05, + "loss": 0.8899, + "step": 6368 + }, + { + "epoch": 17.354223433242506, + "grad_norm": 10.504867553710938, + "learning_rate": 1.8938672220366784e-05, + "loss": 0.8185, + "step": 6369 + }, + { + "epoch": 17.356948228882835, + "grad_norm": 9.94072437286377, + "learning_rate": 1.893827653516505e-05, + "loss": 0.9678, + "step": 6370 + }, + { + "epoch": 17.35967302452316, + "grad_norm": 8.40544605255127, + "learning_rate": 1.8937880780352307e-05, + "loss": 1.281, + "step": 6371 + }, + { + "epoch": 17.362397820163487, + "grad_norm": 8.515037536621094, + "learning_rate": 1.893748495593164e-05, + "loss": 0.9246, + "step": 6372 + }, + { + "epoch": 17.365122615803816, + "grad_norm": 10.380634307861328, + "learning_rate": 1.8937089061906123e-05, + "loss": 1.0804, + "step": 6373 + }, + { + "epoch": 17.367847411444142, + "grad_norm": 8.567737579345703, + "learning_rate": 1.8936693098278846e-05, + "loss": 1.0319, + "step": 6374 + }, + { + "epoch": 17.370572207084468, + "grad_norm": 9.313538551330566, + "learning_rate": 1.893629706505289e-05, + "loss": 1.0248, + "step": 6375 + }, + { + "epoch": 17.373297002724797, + "grad_norm": 7.999496936798096, + "learning_rate": 1.8935900962231342e-05, + "loss": 0.9978, + "step": 6376 + }, + { + "epoch": 17.376021798365123, + "grad_norm": 64.70576477050781, + "learning_rate": 1.8935504789817284e-05, + "loss": 0.8835, + "step": 6377 + }, + { + "epoch": 17.37874659400545, + "grad_norm": 7.945390224456787, + "learning_rate": 1.89351085478138e-05, + "loss": 0.891, + "step": 6378 + }, + { + "epoch": 17.381471389645778, + "grad_norm": 10.59921932220459, + "learning_rate": 1.8934712236223984e-05, + "loss": 0.8534, + "step": 6379 + }, + { + "epoch": 17.384196185286104, + "grad_norm": 9.016999244689941, + "learning_rate": 1.893431585505091e-05, + "loss": 0.8776, + "step": 6380 + }, + { + "epoch": 17.38692098092643, + "grad_norm": 9.705224990844727, + "learning_rate": 1.8933919404297676e-05, + "loss": 0.9087, + "step": 6381 + }, + { + "epoch": 17.38964577656676, + "grad_norm": 8.3832426071167, + "learning_rate": 1.8933522883967363e-05, + "loss": 0.8979, + "step": 6382 + }, + { + "epoch": 17.392370572207085, + "grad_norm": 8.460915565490723, + "learning_rate": 1.893312629406306e-05, + "loss": 0.9712, + "step": 6383 + }, + { + "epoch": 17.39509536784741, + "grad_norm": 11.178568840026855, + "learning_rate": 1.8932729634587863e-05, + "loss": 0.9543, + "step": 6384 + }, + { + "epoch": 17.39782016348774, + "grad_norm": 8.727524757385254, + "learning_rate": 1.893233290554485e-05, + "loss": 0.9111, + "step": 6385 + }, + { + "epoch": 17.400544959128066, + "grad_norm": 9.653977394104004, + "learning_rate": 1.8931936106937116e-05, + "loss": 0.8831, + "step": 6386 + }, + { + "epoch": 17.40326975476839, + "grad_norm": 8.617438316345215, + "learning_rate": 1.8931539238767753e-05, + "loss": 0.8729, + "step": 6387 + }, + { + "epoch": 17.40599455040872, + "grad_norm": 11.906661033630371, + "learning_rate": 1.893114230103985e-05, + "loss": 0.8965, + "step": 6388 + }, + { + "epoch": 17.408719346049047, + "grad_norm": 8.372017860412598, + "learning_rate": 1.8930745293756496e-05, + "loss": 0.9081, + "step": 6389 + }, + { + "epoch": 17.411444141689373, + "grad_norm": 10.073421478271484, + "learning_rate": 1.8930348216920786e-05, + "loss": 0.8654, + "step": 6390 + }, + { + "epoch": 17.414168937329702, + "grad_norm": 10.309469223022461, + "learning_rate": 1.8929951070535814e-05, + "loss": 1.1105, + "step": 6391 + }, + { + "epoch": 17.416893732970028, + "grad_norm": 8.19256591796875, + "learning_rate": 1.8929553854604667e-05, + "loss": 0.9758, + "step": 6392 + }, + { + "epoch": 17.419618528610354, + "grad_norm": 8.794842720031738, + "learning_rate": 1.892915656913044e-05, + "loss": 0.8052, + "step": 6393 + }, + { + "epoch": 17.422343324250683, + "grad_norm": 9.917633056640625, + "learning_rate": 1.8928759214116236e-05, + "loss": 1.0466, + "step": 6394 + }, + { + "epoch": 17.42506811989101, + "grad_norm": 7.508038520812988, + "learning_rate": 1.8928361789565136e-05, + "loss": 0.8617, + "step": 6395 + }, + { + "epoch": 17.427792915531334, + "grad_norm": 10.217451095581055, + "learning_rate": 1.8927964295480244e-05, + "loss": 0.9473, + "step": 6396 + }, + { + "epoch": 17.430517711171664, + "grad_norm": 9.991721153259277, + "learning_rate": 1.8927566731864658e-05, + "loss": 1.0593, + "step": 6397 + }, + { + "epoch": 17.43324250681199, + "grad_norm": 7.884134292602539, + "learning_rate": 1.8927169098721462e-05, + "loss": 1.0217, + "step": 6398 + }, + { + "epoch": 17.435967302452315, + "grad_norm": 9.229854583740234, + "learning_rate": 1.892677139605377e-05, + "loss": 1.0544, + "step": 6399 + }, + { + "epoch": 17.438692098092645, + "grad_norm": 10.268136024475098, + "learning_rate": 1.892637362386466e-05, + "loss": 0.9286, + "step": 6400 + }, + { + "epoch": 17.44141689373297, + "grad_norm": 10.877610206604004, + "learning_rate": 1.8925975782157243e-05, + "loss": 1.0356, + "step": 6401 + }, + { + "epoch": 17.444141689373296, + "grad_norm": 10.455604553222656, + "learning_rate": 1.8925577870934612e-05, + "loss": 0.809, + "step": 6402 + }, + { + "epoch": 17.446866485013626, + "grad_norm": 8.860418319702148, + "learning_rate": 1.8925179890199873e-05, + "loss": 0.9276, + "step": 6403 + }, + { + "epoch": 17.44959128065395, + "grad_norm": 8.77723503112793, + "learning_rate": 1.8924781839956116e-05, + "loss": 1.0107, + "step": 6404 + }, + { + "epoch": 17.452316076294277, + "grad_norm": 9.204261779785156, + "learning_rate": 1.8924383720206445e-05, + "loss": 1.035, + "step": 6405 + }, + { + "epoch": 17.455040871934607, + "grad_norm": 10.360713005065918, + "learning_rate": 1.8923985530953963e-05, + "loss": 0.999, + "step": 6406 + }, + { + "epoch": 17.457765667574932, + "grad_norm": 12.03943920135498, + "learning_rate": 1.892358727220177e-05, + "loss": 0.9657, + "step": 6407 + }, + { + "epoch": 17.460490463215258, + "grad_norm": 9.930057525634766, + "learning_rate": 1.892318894395296e-05, + "loss": 1.1375, + "step": 6408 + }, + { + "epoch": 17.463215258855588, + "grad_norm": 7.339794158935547, + "learning_rate": 1.892279054621065e-05, + "loss": 0.7582, + "step": 6409 + }, + { + "epoch": 17.465940054495913, + "grad_norm": 13.046171188354492, + "learning_rate": 1.892239207897793e-05, + "loss": 0.934, + "step": 6410 + }, + { + "epoch": 17.46866485013624, + "grad_norm": 8.831766128540039, + "learning_rate": 1.892199354225791e-05, + "loss": 0.9197, + "step": 6411 + }, + { + "epoch": 17.47138964577657, + "grad_norm": 8.978260040283203, + "learning_rate": 1.8921594936053686e-05, + "loss": 1.1469, + "step": 6412 + }, + { + "epoch": 17.474114441416894, + "grad_norm": 8.057010650634766, + "learning_rate": 1.8921196260368374e-05, + "loss": 0.7601, + "step": 6413 + }, + { + "epoch": 17.47683923705722, + "grad_norm": 10.006945610046387, + "learning_rate": 1.892079751520507e-05, + "loss": 0.7833, + "step": 6414 + }, + { + "epoch": 17.479564032697546, + "grad_norm": 9.494051933288574, + "learning_rate": 1.8920398700566884e-05, + "loss": 0.8442, + "step": 6415 + }, + { + "epoch": 17.482288828337875, + "grad_norm": 10.400253295898438, + "learning_rate": 1.8919999816456917e-05, + "loss": 0.9158, + "step": 6416 + }, + { + "epoch": 17.4850136239782, + "grad_norm": 10.488839149475098, + "learning_rate": 1.8919600862878282e-05, + "loss": 0.8466, + "step": 6417 + }, + { + "epoch": 17.48773841961853, + "grad_norm": 7.895549774169922, + "learning_rate": 1.8919201839834078e-05, + "loss": 1.0416, + "step": 6418 + }, + { + "epoch": 17.490463215258856, + "grad_norm": 9.203743934631348, + "learning_rate": 1.891880274732742e-05, + "loss": 0.908, + "step": 6419 + }, + { + "epoch": 17.493188010899182, + "grad_norm": 6.967998027801514, + "learning_rate": 1.891840358536141e-05, + "loss": 0.7302, + "step": 6420 + }, + { + "epoch": 17.495912806539508, + "grad_norm": 7.7992329597473145, + "learning_rate": 1.8918004353939166e-05, + "loss": 0.8354, + "step": 6421 + }, + { + "epoch": 17.498637602179837, + "grad_norm": 10.46932315826416, + "learning_rate": 1.891760505306379e-05, + "loss": 0.958, + "step": 6422 + }, + { + "epoch": 17.501362397820163, + "grad_norm": 10.07521915435791, + "learning_rate": 1.8917205682738387e-05, + "loss": 0.8993, + "step": 6423 + }, + { + "epoch": 17.504087193460492, + "grad_norm": 8.106224060058594, + "learning_rate": 1.891680624296608e-05, + "loss": 0.9456, + "step": 6424 + }, + { + "epoch": 17.506811989100818, + "grad_norm": 14.495341300964355, + "learning_rate": 1.891640673374997e-05, + "loss": 1.0131, + "step": 6425 + }, + { + "epoch": 17.509536784741144, + "grad_norm": 9.03091049194336, + "learning_rate": 1.8916007155093168e-05, + "loss": 0.9318, + "step": 6426 + }, + { + "epoch": 17.51226158038147, + "grad_norm": 9.570588111877441, + "learning_rate": 1.8915607506998796e-05, + "loss": 1.0874, + "step": 6427 + }, + { + "epoch": 17.5149863760218, + "grad_norm": 13.135885238647461, + "learning_rate": 1.8915207789469954e-05, + "loss": 0.9535, + "step": 6428 + }, + { + "epoch": 17.517711171662125, + "grad_norm": 7.8600664138793945, + "learning_rate": 1.891480800250976e-05, + "loss": 0.8834, + "step": 6429 + }, + { + "epoch": 17.520435967302454, + "grad_norm": 12.449604034423828, + "learning_rate": 1.8914408146121333e-05, + "loss": 0.9648, + "step": 6430 + }, + { + "epoch": 17.52316076294278, + "grad_norm": 8.533634185791016, + "learning_rate": 1.891400822030778e-05, + "loss": 1.0886, + "step": 6431 + }, + { + "epoch": 17.525885558583106, + "grad_norm": 9.208283424377441, + "learning_rate": 1.891360822507222e-05, + "loss": 0.9509, + "step": 6432 + }, + { + "epoch": 17.52861035422343, + "grad_norm": 8.09561824798584, + "learning_rate": 1.8913208160417763e-05, + "loss": 0.9425, + "step": 6433 + }, + { + "epoch": 17.53133514986376, + "grad_norm": 10.107198715209961, + "learning_rate": 1.8912808026347527e-05, + "loss": 0.9836, + "step": 6434 + }, + { + "epoch": 17.534059945504087, + "grad_norm": 8.906506538391113, + "learning_rate": 1.8912407822864632e-05, + "loss": 0.8306, + "step": 6435 + }, + { + "epoch": 17.536784741144416, + "grad_norm": 8.324662208557129, + "learning_rate": 1.891200754997219e-05, + "loss": 0.9647, + "step": 6436 + }, + { + "epoch": 17.539509536784742, + "grad_norm": 6.878514289855957, + "learning_rate": 1.8911607207673318e-05, + "loss": 0.7291, + "step": 6437 + }, + { + "epoch": 17.542234332425068, + "grad_norm": 9.264095306396484, + "learning_rate": 1.891120679597114e-05, + "loss": 1.0203, + "step": 6438 + }, + { + "epoch": 17.544959128065393, + "grad_norm": 10.99022102355957, + "learning_rate": 1.891080631486877e-05, + "loss": 0.9336, + "step": 6439 + }, + { + "epoch": 17.547683923705723, + "grad_norm": 9.272268295288086, + "learning_rate": 1.8910405764369326e-05, + "loss": 1.0581, + "step": 6440 + }, + { + "epoch": 17.55040871934605, + "grad_norm": 10.952085494995117, + "learning_rate": 1.891000514447593e-05, + "loss": 0.8505, + "step": 6441 + }, + { + "epoch": 17.553133514986374, + "grad_norm": 8.9260892868042, + "learning_rate": 1.8909604455191698e-05, + "loss": 0.7598, + "step": 6442 + }, + { + "epoch": 17.555858310626704, + "grad_norm": 9.91944408416748, + "learning_rate": 1.8909203696519753e-05, + "loss": 0.9639, + "step": 6443 + }, + { + "epoch": 17.55858310626703, + "grad_norm": 10.126349449157715, + "learning_rate": 1.890880286846322e-05, + "loss": 1.0109, + "step": 6444 + }, + { + "epoch": 17.561307901907355, + "grad_norm": 7.965224742889404, + "learning_rate": 1.8908401971025214e-05, + "loss": 0.7958, + "step": 6445 + }, + { + "epoch": 17.564032697547685, + "grad_norm": 9.00943374633789, + "learning_rate": 1.890800100420886e-05, + "loss": 0.8862, + "step": 6446 + }, + { + "epoch": 17.56675749318801, + "grad_norm": 12.013262748718262, + "learning_rate": 1.8907599968017284e-05, + "loss": 0.9553, + "step": 6447 + }, + { + "epoch": 17.569482288828336, + "grad_norm": 8.990498542785645, + "learning_rate": 1.8907198862453604e-05, + "loss": 1.1107, + "step": 6448 + }, + { + "epoch": 17.572207084468666, + "grad_norm": 9.534433364868164, + "learning_rate": 1.8906797687520944e-05, + "loss": 0.9305, + "step": 6449 + }, + { + "epoch": 17.57493188010899, + "grad_norm": 8.413612365722656, + "learning_rate": 1.8906396443222436e-05, + "loss": 0.8855, + "step": 6450 + }, + { + "epoch": 17.577656675749317, + "grad_norm": 9.258137702941895, + "learning_rate": 1.8905995129561195e-05, + "loss": 1.0669, + "step": 6451 + }, + { + "epoch": 17.580381471389646, + "grad_norm": 8.99902057647705, + "learning_rate": 1.890559374654035e-05, + "loss": 0.9724, + "step": 6452 + }, + { + "epoch": 17.583106267029972, + "grad_norm": 8.523558616638184, + "learning_rate": 1.8905192294163028e-05, + "loss": 0.8833, + "step": 6453 + }, + { + "epoch": 17.585831062670298, + "grad_norm": 8.714370727539062, + "learning_rate": 1.8904790772432355e-05, + "loss": 1.0326, + "step": 6454 + }, + { + "epoch": 17.588555858310627, + "grad_norm": 10.08273696899414, + "learning_rate": 1.890438918135146e-05, + "loss": 1.0527, + "step": 6455 + }, + { + "epoch": 17.591280653950953, + "grad_norm": 8.469697952270508, + "learning_rate": 1.8903987520923465e-05, + "loss": 0.9312, + "step": 6456 + }, + { + "epoch": 17.59400544959128, + "grad_norm": 8.257137298583984, + "learning_rate": 1.8903585791151506e-05, + "loss": 0.998, + "step": 6457 + }, + { + "epoch": 17.59673024523161, + "grad_norm": 8.074660301208496, + "learning_rate": 1.8903183992038705e-05, + "loss": 0.8622, + "step": 6458 + }, + { + "epoch": 17.599455040871934, + "grad_norm": 18.93331527709961, + "learning_rate": 1.8902782123588194e-05, + "loss": 1.0923, + "step": 6459 + }, + { + "epoch": 17.60217983651226, + "grad_norm": 6.862919807434082, + "learning_rate": 1.8902380185803103e-05, + "loss": 0.8423, + "step": 6460 + }, + { + "epoch": 17.60490463215259, + "grad_norm": 6.449989318847656, + "learning_rate": 1.8901978178686563e-05, + "loss": 0.962, + "step": 6461 + }, + { + "epoch": 17.607629427792915, + "grad_norm": 7.540862083435059, + "learning_rate": 1.8901576102241698e-05, + "loss": 0.9778, + "step": 6462 + }, + { + "epoch": 17.61035422343324, + "grad_norm": 8.875688552856445, + "learning_rate": 1.890117395647165e-05, + "loss": 0.9824, + "step": 6463 + }, + { + "epoch": 17.61307901907357, + "grad_norm": 8.375256538391113, + "learning_rate": 1.8900771741379544e-05, + "loss": 1.0098, + "step": 6464 + }, + { + "epoch": 17.615803814713896, + "grad_norm": 9.36380386352539, + "learning_rate": 1.8900369456968513e-05, + "loss": 0.9539, + "step": 6465 + }, + { + "epoch": 17.618528610354222, + "grad_norm": 8.860440254211426, + "learning_rate": 1.8899967103241693e-05, + "loss": 0.8457, + "step": 6466 + }, + { + "epoch": 17.62125340599455, + "grad_norm": 7.205599784851074, + "learning_rate": 1.8899564680202215e-05, + "loss": 1.0072, + "step": 6467 + }, + { + "epoch": 17.623978201634877, + "grad_norm": 9.090911865234375, + "learning_rate": 1.8899162187853215e-05, + "loss": 0.9652, + "step": 6468 + }, + { + "epoch": 17.626702997275203, + "grad_norm": 11.18416976928711, + "learning_rate": 1.889875962619782e-05, + "loss": 0.9319, + "step": 6469 + }, + { + "epoch": 17.629427792915532, + "grad_norm": 7.465579986572266, + "learning_rate": 1.889835699523918e-05, + "loss": 0.9143, + "step": 6470 + }, + { + "epoch": 17.632152588555858, + "grad_norm": 8.837275505065918, + "learning_rate": 1.889795429498042e-05, + "loss": 0.9601, + "step": 6471 + }, + { + "epoch": 17.634877384196184, + "grad_norm": 8.674745559692383, + "learning_rate": 1.8897551525424674e-05, + "loss": 0.9813, + "step": 6472 + }, + { + "epoch": 17.637602179836513, + "grad_norm": 7.9291839599609375, + "learning_rate": 1.889714868657509e-05, + "loss": 0.9471, + "step": 6473 + }, + { + "epoch": 17.64032697547684, + "grad_norm": 9.651131629943848, + "learning_rate": 1.8896745778434793e-05, + "loss": 0.8705, + "step": 6474 + }, + { + "epoch": 17.643051771117165, + "grad_norm": 7.559269428253174, + "learning_rate": 1.8896342801006927e-05, + "loss": 0.8284, + "step": 6475 + }, + { + "epoch": 17.645776566757494, + "grad_norm": 10.888666152954102, + "learning_rate": 1.8895939754294627e-05, + "loss": 0.8474, + "step": 6476 + }, + { + "epoch": 17.64850136239782, + "grad_norm": 8.872111320495605, + "learning_rate": 1.889553663830104e-05, + "loss": 0.9799, + "step": 6477 + }, + { + "epoch": 17.651226158038146, + "grad_norm": 11.895491600036621, + "learning_rate": 1.88951334530293e-05, + "loss": 1.1519, + "step": 6478 + }, + { + "epoch": 17.653950953678475, + "grad_norm": 17.710891723632812, + "learning_rate": 1.8894730198482543e-05, + "loss": 1.0701, + "step": 6479 + }, + { + "epoch": 17.6566757493188, + "grad_norm": 8.096800804138184, + "learning_rate": 1.889432687466391e-05, + "loss": 0.7501, + "step": 6480 + }, + { + "epoch": 17.659400544959126, + "grad_norm": 9.141026496887207, + "learning_rate": 1.8893923481576555e-05, + "loss": 0.9192, + "step": 6481 + }, + { + "epoch": 17.662125340599456, + "grad_norm": 8.910099029541016, + "learning_rate": 1.8893520019223605e-05, + "loss": 0.9043, + "step": 6482 + }, + { + "epoch": 17.66485013623978, + "grad_norm": 8.54745101928711, + "learning_rate": 1.889311648760821e-05, + "loss": 1.0664, + "step": 6483 + }, + { + "epoch": 17.667574931880107, + "grad_norm": 7.215934753417969, + "learning_rate": 1.8892712886733506e-05, + "loss": 1.1074, + "step": 6484 + }, + { + "epoch": 17.670299727520437, + "grad_norm": 10.302400588989258, + "learning_rate": 1.8892309216602642e-05, + "loss": 0.9835, + "step": 6485 + }, + { + "epoch": 17.673024523160763, + "grad_norm": 7.602528095245361, + "learning_rate": 1.889190547721876e-05, + "loss": 0.9707, + "step": 6486 + }, + { + "epoch": 17.67574931880109, + "grad_norm": 9.652894020080566, + "learning_rate": 1.8891501668585006e-05, + "loss": 0.9296, + "step": 6487 + }, + { + "epoch": 17.678474114441418, + "grad_norm": 7.052173614501953, + "learning_rate": 1.8891097790704522e-05, + "loss": 0.9863, + "step": 6488 + }, + { + "epoch": 17.681198910081743, + "grad_norm": 9.30596923828125, + "learning_rate": 1.8890693843580454e-05, + "loss": 0.8997, + "step": 6489 + }, + { + "epoch": 17.68392370572207, + "grad_norm": 11.857169151306152, + "learning_rate": 1.8890289827215952e-05, + "loss": 1.0737, + "step": 6490 + }, + { + "epoch": 17.6866485013624, + "grad_norm": 11.911252975463867, + "learning_rate": 1.8889885741614153e-05, + "loss": 1.144, + "step": 6491 + }, + { + "epoch": 17.689373297002724, + "grad_norm": 8.49942398071289, + "learning_rate": 1.8889481586778212e-05, + "loss": 1.0328, + "step": 6492 + }, + { + "epoch": 17.69209809264305, + "grad_norm": 7.845510959625244, + "learning_rate": 1.8889077362711277e-05, + "loss": 0.7596, + "step": 6493 + }, + { + "epoch": 17.69482288828338, + "grad_norm": 11.397034645080566, + "learning_rate": 1.888867306941649e-05, + "loss": 1.0274, + "step": 6494 + }, + { + "epoch": 17.697547683923705, + "grad_norm": 9.5137357711792, + "learning_rate": 1.8888268706897007e-05, + "loss": 1.0266, + "step": 6495 + }, + { + "epoch": 17.70027247956403, + "grad_norm": 8.97117805480957, + "learning_rate": 1.888786427515597e-05, + "loss": 0.8964, + "step": 6496 + }, + { + "epoch": 17.70299727520436, + "grad_norm": 8.997941970825195, + "learning_rate": 1.8887459774196536e-05, + "loss": 1.072, + "step": 6497 + }, + { + "epoch": 17.705722070844686, + "grad_norm": 7.437220573425293, + "learning_rate": 1.888705520402185e-05, + "loss": 0.8298, + "step": 6498 + }, + { + "epoch": 17.708446866485012, + "grad_norm": 7.677548408508301, + "learning_rate": 1.888665056463506e-05, + "loss": 1.0582, + "step": 6499 + }, + { + "epoch": 17.71117166212534, + "grad_norm": 8.739337921142578, + "learning_rate": 1.888624585603933e-05, + "loss": 0.9309, + "step": 6500 + }, + { + "epoch": 17.713896457765667, + "grad_norm": 10.512234687805176, + "learning_rate": 1.888584107823779e-05, + "loss": 0.9874, + "step": 6501 + }, + { + "epoch": 17.716621253405993, + "grad_norm": 9.074308395385742, + "learning_rate": 1.8885436231233617e-05, + "loss": 1.1477, + "step": 6502 + }, + { + "epoch": 17.719346049046322, + "grad_norm": 9.153244972229004, + "learning_rate": 1.888503131502995e-05, + "loss": 0.9447, + "step": 6503 + }, + { + "epoch": 17.722070844686648, + "grad_norm": 8.506519317626953, + "learning_rate": 1.8884626329629942e-05, + "loss": 1.1488, + "step": 6504 + }, + { + "epoch": 17.724795640326974, + "grad_norm": 11.738155364990234, + "learning_rate": 1.8884221275036753e-05, + "loss": 0.743, + "step": 6505 + }, + { + "epoch": 17.727520435967303, + "grad_norm": 7.9107489585876465, + "learning_rate": 1.8883816151253532e-05, + "loss": 0.8867, + "step": 6506 + }, + { + "epoch": 17.73024523160763, + "grad_norm": 7.033042907714844, + "learning_rate": 1.888341095828344e-05, + "loss": 0.9698, + "step": 6507 + }, + { + "epoch": 17.732970027247955, + "grad_norm": 10.325312614440918, + "learning_rate": 1.888300569612963e-05, + "loss": 0.9685, + "step": 6508 + }, + { + "epoch": 17.735694822888284, + "grad_norm": 8.544760704040527, + "learning_rate": 1.8882600364795255e-05, + "loss": 1.1158, + "step": 6509 + }, + { + "epoch": 17.73841961852861, + "grad_norm": 8.458165168762207, + "learning_rate": 1.8882194964283473e-05, + "loss": 0.7937, + "step": 6510 + }, + { + "epoch": 17.741144414168936, + "grad_norm": 7.65460205078125, + "learning_rate": 1.888178949459745e-05, + "loss": 0.7695, + "step": 6511 + }, + { + "epoch": 17.743869209809265, + "grad_norm": 17.94519805908203, + "learning_rate": 1.8881383955740324e-05, + "loss": 1.012, + "step": 6512 + }, + { + "epoch": 17.74659400544959, + "grad_norm": 8.303767204284668, + "learning_rate": 1.8880978347715272e-05, + "loss": 0.8011, + "step": 6513 + }, + { + "epoch": 17.749318801089917, + "grad_norm": 9.062012672424316, + "learning_rate": 1.888057267052545e-05, + "loss": 0.9065, + "step": 6514 + }, + { + "epoch": 17.752043596730246, + "grad_norm": 9.889007568359375, + "learning_rate": 1.888016692417401e-05, + "loss": 0.9719, + "step": 6515 + }, + { + "epoch": 17.754768392370572, + "grad_norm": 9.427414894104004, + "learning_rate": 1.8879761108664114e-05, + "loss": 0.9438, + "step": 6516 + }, + { + "epoch": 17.757493188010898, + "grad_norm": 12.378963470458984, + "learning_rate": 1.8879355223998928e-05, + "loss": 0.8348, + "step": 6517 + }, + { + "epoch": 17.760217983651227, + "grad_norm": 7.321284770965576, + "learning_rate": 1.8878949270181606e-05, + "loss": 0.9183, + "step": 6518 + }, + { + "epoch": 17.762942779291553, + "grad_norm": 12.255606651306152, + "learning_rate": 1.8878543247215314e-05, + "loss": 1.0635, + "step": 6519 + }, + { + "epoch": 17.76566757493188, + "grad_norm": 7.989128589630127, + "learning_rate": 1.8878137155103214e-05, + "loss": 0.8168, + "step": 6520 + }, + { + "epoch": 17.768392370572208, + "grad_norm": 7.796993732452393, + "learning_rate": 1.887773099384847e-05, + "loss": 0.8943, + "step": 6521 + }, + { + "epoch": 17.771117166212534, + "grad_norm": 9.63947582244873, + "learning_rate": 1.887732476345424e-05, + "loss": 1.1299, + "step": 6522 + }, + { + "epoch": 17.77384196185286, + "grad_norm": 9.127558708190918, + "learning_rate": 1.887691846392369e-05, + "loss": 0.9191, + "step": 6523 + }, + { + "epoch": 17.77656675749319, + "grad_norm": 6.981589317321777, + "learning_rate": 1.8876512095259986e-05, + "loss": 0.7831, + "step": 6524 + }, + { + "epoch": 17.779291553133515, + "grad_norm": 10.201642036437988, + "learning_rate": 1.8876105657466287e-05, + "loss": 0.8218, + "step": 6525 + }, + { + "epoch": 17.78201634877384, + "grad_norm": 7.945437908172607, + "learning_rate": 1.8875699150545768e-05, + "loss": 0.9926, + "step": 6526 + }, + { + "epoch": 17.78474114441417, + "grad_norm": 13.129316329956055, + "learning_rate": 1.887529257450159e-05, + "loss": 1.011, + "step": 6527 + }, + { + "epoch": 17.787465940054496, + "grad_norm": 7.099358558654785, + "learning_rate": 1.8874885929336916e-05, + "loss": 0.9521, + "step": 6528 + }, + { + "epoch": 17.79019073569482, + "grad_norm": 8.41981029510498, + "learning_rate": 1.8874479215054916e-05, + "loss": 0.8042, + "step": 6529 + }, + { + "epoch": 17.79291553133515, + "grad_norm": 7.612015247344971, + "learning_rate": 1.887407243165876e-05, + "loss": 1.0214, + "step": 6530 + }, + { + "epoch": 17.795640326975477, + "grad_norm": 7.234619140625, + "learning_rate": 1.887366557915161e-05, + "loss": 1.1766, + "step": 6531 + }, + { + "epoch": 17.798365122615802, + "grad_norm": 10.151055335998535, + "learning_rate": 1.8873258657536643e-05, + "loss": 0.7668, + "step": 6532 + }, + { + "epoch": 17.80108991825613, + "grad_norm": 11.343910217285156, + "learning_rate": 1.8872851666817017e-05, + "loss": 0.9978, + "step": 6533 + }, + { + "epoch": 17.803814713896458, + "grad_norm": 7.596022605895996, + "learning_rate": 1.8872444606995915e-05, + "loss": 0.8854, + "step": 6534 + }, + { + "epoch": 17.806539509536783, + "grad_norm": 11.584070205688477, + "learning_rate": 1.8872037478076494e-05, + "loss": 1.0798, + "step": 6535 + }, + { + "epoch": 17.809264305177113, + "grad_norm": 11.176453590393066, + "learning_rate": 1.8871630280061933e-05, + "loss": 0.9156, + "step": 6536 + }, + { + "epoch": 17.81198910081744, + "grad_norm": 7.551270961761475, + "learning_rate": 1.8871223012955402e-05, + "loss": 0.813, + "step": 6537 + }, + { + "epoch": 17.814713896457764, + "grad_norm": 7.892640113830566, + "learning_rate": 1.887081567676007e-05, + "loss": 0.7803, + "step": 6538 + }, + { + "epoch": 17.817438692098094, + "grad_norm": 8.432889938354492, + "learning_rate": 1.887040827147911e-05, + "loss": 1.0027, + "step": 6539 + }, + { + "epoch": 17.82016348773842, + "grad_norm": 10.599292755126953, + "learning_rate": 1.88700007971157e-05, + "loss": 0.9885, + "step": 6540 + }, + { + "epoch": 17.822888283378745, + "grad_norm": 13.277148246765137, + "learning_rate": 1.8869593253673005e-05, + "loss": 0.8337, + "step": 6541 + }, + { + "epoch": 17.825613079019075, + "grad_norm": 10.260055541992188, + "learning_rate": 1.8869185641154204e-05, + "loss": 1.01, + "step": 6542 + }, + { + "epoch": 17.8283378746594, + "grad_norm": 11.372323989868164, + "learning_rate": 1.8868777959562472e-05, + "loss": 1.0792, + "step": 6543 + }, + { + "epoch": 17.831062670299726, + "grad_norm": 9.509187698364258, + "learning_rate": 1.886837020890098e-05, + "loss": 0.9797, + "step": 6544 + }, + { + "epoch": 17.833787465940055, + "grad_norm": 7.478908538818359, + "learning_rate": 1.8867962389172912e-05, + "loss": 0.8768, + "step": 6545 + }, + { + "epoch": 17.83651226158038, + "grad_norm": 7.537795543670654, + "learning_rate": 1.8867554500381433e-05, + "loss": 0.9341, + "step": 6546 + }, + { + "epoch": 17.839237057220707, + "grad_norm": 6.650048732757568, + "learning_rate": 1.886714654252973e-05, + "loss": 0.697, + "step": 6547 + }, + { + "epoch": 17.841961852861036, + "grad_norm": 8.197768211364746, + "learning_rate": 1.886673851562097e-05, + "loss": 0.8198, + "step": 6548 + }, + { + "epoch": 17.844686648501362, + "grad_norm": 7.36025333404541, + "learning_rate": 1.8866330419658338e-05, + "loss": 1.0024, + "step": 6549 + }, + { + "epoch": 17.847411444141688, + "grad_norm": 7.918854236602783, + "learning_rate": 1.8865922254645008e-05, + "loss": 0.9758, + "step": 6550 + }, + { + "epoch": 17.850136239782017, + "grad_norm": 11.31563663482666, + "learning_rate": 1.8865514020584164e-05, + "loss": 1.0156, + "step": 6551 + }, + { + "epoch": 17.852861035422343, + "grad_norm": 9.666770935058594, + "learning_rate": 1.886510571747898e-05, + "loss": 1.0446, + "step": 6552 + }, + { + "epoch": 17.85558583106267, + "grad_norm": 10.833832740783691, + "learning_rate": 1.886469734533264e-05, + "loss": 0.8052, + "step": 6553 + }, + { + "epoch": 17.858310626703, + "grad_norm": 9.465039253234863, + "learning_rate": 1.886428890414832e-05, + "loss": 0.9031, + "step": 6554 + }, + { + "epoch": 17.861035422343324, + "grad_norm": 12.025474548339844, + "learning_rate": 1.8863880393929202e-05, + "loss": 0.8853, + "step": 6555 + }, + { + "epoch": 17.86376021798365, + "grad_norm": 9.478365898132324, + "learning_rate": 1.8863471814678475e-05, + "loss": 0.9048, + "step": 6556 + }, + { + "epoch": 17.86648501362398, + "grad_norm": 8.645143508911133, + "learning_rate": 1.886306316639931e-05, + "loss": 0.9694, + "step": 6557 + }, + { + "epoch": 17.869209809264305, + "grad_norm": 9.461164474487305, + "learning_rate": 1.8862654449094892e-05, + "loss": 0.9735, + "step": 6558 + }, + { + "epoch": 17.87193460490463, + "grad_norm": 7.370994567871094, + "learning_rate": 1.886224566276841e-05, + "loss": 0.7737, + "step": 6559 + }, + { + "epoch": 17.87465940054496, + "grad_norm": 8.07332992553711, + "learning_rate": 1.8861836807423045e-05, + "loss": 0.8976, + "step": 6560 + }, + { + "epoch": 17.877384196185286, + "grad_norm": 8.453144073486328, + "learning_rate": 1.8861427883061977e-05, + "loss": 0.9255, + "step": 6561 + }, + { + "epoch": 17.88010899182561, + "grad_norm": 7.679013252258301, + "learning_rate": 1.8861018889688395e-05, + "loss": 0.7972, + "step": 6562 + }, + { + "epoch": 17.88283378746594, + "grad_norm": 9.931220054626465, + "learning_rate": 1.8860609827305487e-05, + "loss": 1.0492, + "step": 6563 + }, + { + "epoch": 17.885558583106267, + "grad_norm": 8.279606819152832, + "learning_rate": 1.886020069591643e-05, + "loss": 1.0369, + "step": 6564 + }, + { + "epoch": 17.888283378746593, + "grad_norm": 10.057707786560059, + "learning_rate": 1.885979149552442e-05, + "loss": 1.0364, + "step": 6565 + }, + { + "epoch": 17.891008174386922, + "grad_norm": 7.192422866821289, + "learning_rate": 1.8859382226132635e-05, + "loss": 0.9194, + "step": 6566 + }, + { + "epoch": 17.893732970027248, + "grad_norm": 9.681727409362793, + "learning_rate": 1.8858972887744268e-05, + "loss": 1.0321, + "step": 6567 + }, + { + "epoch": 17.896457765667574, + "grad_norm": 18.173507690429688, + "learning_rate": 1.8858563480362503e-05, + "loss": 0.9209, + "step": 6568 + }, + { + "epoch": 17.899182561307903, + "grad_norm": 8.38066291809082, + "learning_rate": 1.885815400399053e-05, + "loss": 0.908, + "step": 6569 + }, + { + "epoch": 17.90190735694823, + "grad_norm": 8.17420482635498, + "learning_rate": 1.885774445863154e-05, + "loss": 0.939, + "step": 6570 + }, + { + "epoch": 17.904632152588555, + "grad_norm": 7.61351203918457, + "learning_rate": 1.8857334844288723e-05, + "loss": 0.9016, + "step": 6571 + }, + { + "epoch": 17.907356948228884, + "grad_norm": 7.483287811279297, + "learning_rate": 1.8856925160965267e-05, + "loss": 0.9607, + "step": 6572 + }, + { + "epoch": 17.91008174386921, + "grad_norm": 8.12373161315918, + "learning_rate": 1.8856515408664363e-05, + "loss": 0.9045, + "step": 6573 + }, + { + "epoch": 17.912806539509535, + "grad_norm": 10.766953468322754, + "learning_rate": 1.88561055873892e-05, + "loss": 1.0854, + "step": 6574 + }, + { + "epoch": 17.915531335149865, + "grad_norm": 7.82476806640625, + "learning_rate": 1.8855695697142972e-05, + "loss": 1.0293, + "step": 6575 + }, + { + "epoch": 17.91825613079019, + "grad_norm": 13.205169677734375, + "learning_rate": 1.8855285737928874e-05, + "loss": 1.1251, + "step": 6576 + }, + { + "epoch": 17.920980926430516, + "grad_norm": 8.568056106567383, + "learning_rate": 1.8854875709750092e-05, + "loss": 0.9249, + "step": 6577 + }, + { + "epoch": 17.923705722070846, + "grad_norm": 9.343592643737793, + "learning_rate": 1.8854465612609828e-05, + "loss": 1.0399, + "step": 6578 + }, + { + "epoch": 17.92643051771117, + "grad_norm": 8.471595764160156, + "learning_rate": 1.8854055446511267e-05, + "loss": 0.7042, + "step": 6579 + }, + { + "epoch": 17.929155313351497, + "grad_norm": 8.00652027130127, + "learning_rate": 1.8853645211457606e-05, + "loss": 1.0095, + "step": 6580 + }, + { + "epoch": 17.931880108991827, + "grad_norm": 8.351338386535645, + "learning_rate": 1.8853234907452042e-05, + "loss": 1.0315, + "step": 6581 + }, + { + "epoch": 17.934604904632153, + "grad_norm": 9.317249298095703, + "learning_rate": 1.8852824534497772e-05, + "loss": 0.9215, + "step": 6582 + }, + { + "epoch": 17.93732970027248, + "grad_norm": 10.584437370300293, + "learning_rate": 1.8852414092597985e-05, + "loss": 0.7916, + "step": 6583 + }, + { + "epoch": 17.940054495912808, + "grad_norm": 6.993414402008057, + "learning_rate": 1.8852003581755886e-05, + "loss": 0.9595, + "step": 6584 + }, + { + "epoch": 17.942779291553133, + "grad_norm": 7.56000280380249, + "learning_rate": 1.8851593001974663e-05, + "loss": 0.8101, + "step": 6585 + }, + { + "epoch": 17.94550408719346, + "grad_norm": 9.294096946716309, + "learning_rate": 1.8851182353257524e-05, + "loss": 1.0363, + "step": 6586 + }, + { + "epoch": 17.94822888283379, + "grad_norm": 7.075156211853027, + "learning_rate": 1.885077163560766e-05, + "loss": 0.7717, + "step": 6587 + }, + { + "epoch": 17.950953678474114, + "grad_norm": 8.787549018859863, + "learning_rate": 1.885036084902827e-05, + "loss": 0.8955, + "step": 6588 + }, + { + "epoch": 17.95367847411444, + "grad_norm": 9.324135780334473, + "learning_rate": 1.8849949993522557e-05, + "loss": 1.0061, + "step": 6589 + }, + { + "epoch": 17.95640326975477, + "grad_norm": 12.604859352111816, + "learning_rate": 1.8849539069093717e-05, + "loss": 0.9661, + "step": 6590 + }, + { + "epoch": 17.959128065395095, + "grad_norm": 8.067110061645508, + "learning_rate": 1.884912807574495e-05, + "loss": 0.9313, + "step": 6591 + }, + { + "epoch": 17.96185286103542, + "grad_norm": 8.262900352478027, + "learning_rate": 1.884871701347946e-05, + "loss": 0.9541, + "step": 6592 + }, + { + "epoch": 17.96457765667575, + "grad_norm": 9.744215965270996, + "learning_rate": 1.884830588230045e-05, + "loss": 0.989, + "step": 6593 + }, + { + "epoch": 17.967302452316076, + "grad_norm": 7.75123405456543, + "learning_rate": 1.8847894682211113e-05, + "loss": 0.9637, + "step": 6594 + }, + { + "epoch": 17.970027247956402, + "grad_norm": 8.812027931213379, + "learning_rate": 1.884748341321466e-05, + "loss": 0.925, + "step": 6595 + }, + { + "epoch": 17.97275204359673, + "grad_norm": 7.7459588050842285, + "learning_rate": 1.8847072075314288e-05, + "loss": 0.9319, + "step": 6596 + }, + { + "epoch": 17.975476839237057, + "grad_norm": 8.137155532836914, + "learning_rate": 1.8846660668513206e-05, + "loss": 0.8538, + "step": 6597 + }, + { + "epoch": 17.978201634877383, + "grad_norm": 10.407999992370605, + "learning_rate": 1.8846249192814613e-05, + "loss": 1.0244, + "step": 6598 + }, + { + "epoch": 17.980926430517712, + "grad_norm": 8.504861831665039, + "learning_rate": 1.884583764822172e-05, + "loss": 0.8186, + "step": 6599 + }, + { + "epoch": 17.983651226158038, + "grad_norm": 8.649380683898926, + "learning_rate": 1.8845426034737724e-05, + "loss": 0.7762, + "step": 6600 + }, + { + "epoch": 17.986376021798364, + "grad_norm": 7.561326503753662, + "learning_rate": 1.8845014352365836e-05, + "loss": 0.8407, + "step": 6601 + }, + { + "epoch": 17.989100817438693, + "grad_norm": 7.720953464508057, + "learning_rate": 1.8844602601109265e-05, + "loss": 0.9877, + "step": 6602 + }, + { + "epoch": 17.99182561307902, + "grad_norm": 9.713851928710938, + "learning_rate": 1.884419078097121e-05, + "loss": 1.0118, + "step": 6603 + }, + { + "epoch": 17.994550408719345, + "grad_norm": 8.336447715759277, + "learning_rate": 1.8843778891954883e-05, + "loss": 0.8303, + "step": 6604 + }, + { + "epoch": 17.997275204359674, + "grad_norm": 8.688618659973145, + "learning_rate": 1.884336693406349e-05, + "loss": 1.0134, + "step": 6605 + }, + { + "epoch": 18.0, + "grad_norm": 12.853461265563965, + "learning_rate": 1.8842954907300236e-05, + "loss": 1.071, + "step": 6606 + }, + { + "epoch": 18.002724795640326, + "grad_norm": 7.621571063995361, + "learning_rate": 1.884254281166834e-05, + "loss": 0.8401, + "step": 6607 + }, + { + "epoch": 18.005449591280655, + "grad_norm": 6.969585418701172, + "learning_rate": 1.8842130647171003e-05, + "loss": 0.7584, + "step": 6608 + }, + { + "epoch": 18.00817438692098, + "grad_norm": 9.190740585327148, + "learning_rate": 1.8841718413811433e-05, + "loss": 0.9208, + "step": 6609 + }, + { + "epoch": 18.010899182561307, + "grad_norm": 7.002579689025879, + "learning_rate": 1.884130611159285e-05, + "loss": 0.8711, + "step": 6610 + }, + { + "epoch": 18.013623978201636, + "grad_norm": 9.554093360900879, + "learning_rate": 1.8840893740518458e-05, + "loss": 0.8696, + "step": 6611 + }, + { + "epoch": 18.016348773841962, + "grad_norm": 7.839029788970947, + "learning_rate": 1.8840481300591473e-05, + "loss": 0.691, + "step": 6612 + }, + { + "epoch": 18.019073569482288, + "grad_norm": 9.62078857421875, + "learning_rate": 1.88400687918151e-05, + "loss": 1.0929, + "step": 6613 + }, + { + "epoch": 18.021798365122617, + "grad_norm": 8.053839683532715, + "learning_rate": 1.8839656214192557e-05, + "loss": 0.7987, + "step": 6614 + }, + { + "epoch": 18.024523160762943, + "grad_norm": 7.5099663734436035, + "learning_rate": 1.8839243567727053e-05, + "loss": 0.8634, + "step": 6615 + }, + { + "epoch": 18.02724795640327, + "grad_norm": 7.961956024169922, + "learning_rate": 1.8838830852421807e-05, + "loss": 0.816, + "step": 6616 + }, + { + "epoch": 18.029972752043598, + "grad_norm": 7.8157958984375, + "learning_rate": 1.8838418068280032e-05, + "loss": 0.7692, + "step": 6617 + }, + { + "epoch": 18.032697547683924, + "grad_norm": 8.519083976745605, + "learning_rate": 1.883800521530494e-05, + "loss": 0.8165, + "step": 6618 + }, + { + "epoch": 18.03542234332425, + "grad_norm": 8.912421226501465, + "learning_rate": 1.8837592293499747e-05, + "loss": 0.8987, + "step": 6619 + }, + { + "epoch": 18.03814713896458, + "grad_norm": 7.688618183135986, + "learning_rate": 1.883717930286767e-05, + "loss": 0.8966, + "step": 6620 + }, + { + "epoch": 18.040871934604905, + "grad_norm": 8.02383804321289, + "learning_rate": 1.8836766243411932e-05, + "loss": 0.8664, + "step": 6621 + }, + { + "epoch": 18.04359673024523, + "grad_norm": 7.162313461303711, + "learning_rate": 1.8836353115135735e-05, + "loss": 0.764, + "step": 6622 + }, + { + "epoch": 18.04632152588556, + "grad_norm": 8.650481224060059, + "learning_rate": 1.8835939918042308e-05, + "loss": 0.8461, + "step": 6623 + }, + { + "epoch": 18.049046321525886, + "grad_norm": 9.792577743530273, + "learning_rate": 1.883552665213486e-05, + "loss": 0.903, + "step": 6624 + }, + { + "epoch": 18.05177111716621, + "grad_norm": 9.125471115112305, + "learning_rate": 1.883511331741662e-05, + "loss": 0.837, + "step": 6625 + }, + { + "epoch": 18.05449591280654, + "grad_norm": 7.903054237365723, + "learning_rate": 1.88346999138908e-05, + "loss": 0.7997, + "step": 6626 + }, + { + "epoch": 18.057220708446867, + "grad_norm": 7.64015007019043, + "learning_rate": 1.8834286441560622e-05, + "loss": 0.8661, + "step": 6627 + }, + { + "epoch": 18.059945504087192, + "grad_norm": 7.844747543334961, + "learning_rate": 1.8833872900429307e-05, + "loss": 1.0045, + "step": 6628 + }, + { + "epoch": 18.06267029972752, + "grad_norm": 7.97361946105957, + "learning_rate": 1.8833459290500073e-05, + "loss": 0.8038, + "step": 6629 + }, + { + "epoch": 18.065395095367847, + "grad_norm": 8.794074058532715, + "learning_rate": 1.8833045611776143e-05, + "loss": 1.0504, + "step": 6630 + }, + { + "epoch": 18.068119891008173, + "grad_norm": 7.852278709411621, + "learning_rate": 1.883263186426073e-05, + "loss": 0.8947, + "step": 6631 + }, + { + "epoch": 18.070844686648503, + "grad_norm": 9.553807258605957, + "learning_rate": 1.8832218047957072e-05, + "loss": 0.7778, + "step": 6632 + }, + { + "epoch": 18.07356948228883, + "grad_norm": 8.006525039672852, + "learning_rate": 1.883180416286839e-05, + "loss": 0.936, + "step": 6633 + }, + { + "epoch": 18.076294277929154, + "grad_norm": 8.542932510375977, + "learning_rate": 1.8831390208997892e-05, + "loss": 0.6926, + "step": 6634 + }, + { + "epoch": 18.079019073569484, + "grad_norm": 7.582610130310059, + "learning_rate": 1.883097618634881e-05, + "loss": 0.7317, + "step": 6635 + }, + { + "epoch": 18.08174386920981, + "grad_norm": 7.989914894104004, + "learning_rate": 1.8830562094924375e-05, + "loss": 0.8495, + "step": 6636 + }, + { + "epoch": 18.084468664850135, + "grad_norm": 8.978856086730957, + "learning_rate": 1.8830147934727806e-05, + "loss": 0.8517, + "step": 6637 + }, + { + "epoch": 18.087193460490465, + "grad_norm": 8.952409744262695, + "learning_rate": 1.882973370576233e-05, + "loss": 0.8947, + "step": 6638 + }, + { + "epoch": 18.08991825613079, + "grad_norm": 7.963160037994385, + "learning_rate": 1.882931940803117e-05, + "loss": 0.7739, + "step": 6639 + }, + { + "epoch": 18.092643051771116, + "grad_norm": 8.281893730163574, + "learning_rate": 1.8828905041537556e-05, + "loss": 0.7975, + "step": 6640 + }, + { + "epoch": 18.095367847411445, + "grad_norm": 8.743407249450684, + "learning_rate": 1.882849060628471e-05, + "loss": 0.8799, + "step": 6641 + }, + { + "epoch": 18.09809264305177, + "grad_norm": 9.185464859008789, + "learning_rate": 1.882807610227587e-05, + "loss": 0.9502, + "step": 6642 + }, + { + "epoch": 18.100817438692097, + "grad_norm": 10.43502426147461, + "learning_rate": 1.882766152951425e-05, + "loss": 0.9673, + "step": 6643 + }, + { + "epoch": 18.103542234332426, + "grad_norm": 7.852787971496582, + "learning_rate": 1.882724688800309e-05, + "loss": 0.9082, + "step": 6644 + }, + { + "epoch": 18.106267029972752, + "grad_norm": 8.680418014526367, + "learning_rate": 1.8826832177745617e-05, + "loss": 0.9612, + "step": 6645 + }, + { + "epoch": 18.108991825613078, + "grad_norm": 11.557866096496582, + "learning_rate": 1.882641739874506e-05, + "loss": 0.8992, + "step": 6646 + }, + { + "epoch": 18.111716621253407, + "grad_norm": 9.403258323669434, + "learning_rate": 1.882600255100464e-05, + "loss": 0.8704, + "step": 6647 + }, + { + "epoch": 18.114441416893733, + "grad_norm": 6.144392013549805, + "learning_rate": 1.8825587634527603e-05, + "loss": 0.8552, + "step": 6648 + }, + { + "epoch": 18.11716621253406, + "grad_norm": 7.077390670776367, + "learning_rate": 1.8825172649317172e-05, + "loss": 0.8794, + "step": 6649 + }, + { + "epoch": 18.11989100817439, + "grad_norm": 8.0903902053833, + "learning_rate": 1.882475759537658e-05, + "loss": 0.958, + "step": 6650 + }, + { + "epoch": 18.122615803814714, + "grad_norm": 7.654234409332275, + "learning_rate": 1.882434247270906e-05, + "loss": 0.9238, + "step": 6651 + }, + { + "epoch": 18.12534059945504, + "grad_norm": 7.101521015167236, + "learning_rate": 1.8823927281317848e-05, + "loss": 0.9688, + "step": 6652 + }, + { + "epoch": 18.12806539509537, + "grad_norm": 7.770018577575684, + "learning_rate": 1.882351202120617e-05, + "loss": 0.6746, + "step": 6653 + }, + { + "epoch": 18.130790190735695, + "grad_norm": 10.246801376342773, + "learning_rate": 1.882309669237727e-05, + "loss": 0.908, + "step": 6654 + }, + { + "epoch": 18.13351498637602, + "grad_norm": 7.705492973327637, + "learning_rate": 1.882268129483437e-05, + "loss": 0.7057, + "step": 6655 + }, + { + "epoch": 18.13623978201635, + "grad_norm": 10.161961555480957, + "learning_rate": 1.8822265828580716e-05, + "loss": 0.8679, + "step": 6656 + }, + { + "epoch": 18.138964577656676, + "grad_norm": 7.283121585845947, + "learning_rate": 1.8821850293619536e-05, + "loss": 0.9399, + "step": 6657 + }, + { + "epoch": 18.141689373297, + "grad_norm": 8.794880867004395, + "learning_rate": 1.8821434689954074e-05, + "loss": 0.7854, + "step": 6658 + }, + { + "epoch": 18.14441416893733, + "grad_norm": 7.504270553588867, + "learning_rate": 1.8821019017587562e-05, + "loss": 0.8784, + "step": 6659 + }, + { + "epoch": 18.147138964577657, + "grad_norm": 7.3743438720703125, + "learning_rate": 1.882060327652324e-05, + "loss": 0.9117, + "step": 6660 + }, + { + "epoch": 18.149863760217983, + "grad_norm": 8.664271354675293, + "learning_rate": 1.8820187466764337e-05, + "loss": 0.849, + "step": 6661 + }, + { + "epoch": 18.152588555858312, + "grad_norm": 8.355574607849121, + "learning_rate": 1.88197715883141e-05, + "loss": 0.8354, + "step": 6662 + }, + { + "epoch": 18.155313351498638, + "grad_norm": 7.7394514083862305, + "learning_rate": 1.8819355641175767e-05, + "loss": 0.7986, + "step": 6663 + }, + { + "epoch": 18.158038147138964, + "grad_norm": 8.34272575378418, + "learning_rate": 1.8818939625352577e-05, + "loss": 0.7178, + "step": 6664 + }, + { + "epoch": 18.160762942779293, + "grad_norm": 7.23603630065918, + "learning_rate": 1.8818523540847768e-05, + "loss": 0.8145, + "step": 6665 + }, + { + "epoch": 18.16348773841962, + "grad_norm": 7.129431247711182, + "learning_rate": 1.8818107387664582e-05, + "loss": 0.6943, + "step": 6666 + }, + { + "epoch": 18.166212534059945, + "grad_norm": 9.455894470214844, + "learning_rate": 1.881769116580626e-05, + "loss": 0.9041, + "step": 6667 + }, + { + "epoch": 18.168937329700274, + "grad_norm": 8.3630952835083, + "learning_rate": 1.881727487527604e-05, + "loss": 1.0199, + "step": 6668 + }, + { + "epoch": 18.1716621253406, + "grad_norm": 9.230984687805176, + "learning_rate": 1.881685851607717e-05, + "loss": 0.9042, + "step": 6669 + }, + { + "epoch": 18.174386920980925, + "grad_norm": 6.956221580505371, + "learning_rate": 1.881644208821289e-05, + "loss": 0.6833, + "step": 6670 + }, + { + "epoch": 18.177111716621255, + "grad_norm": 8.737435340881348, + "learning_rate": 1.881602559168644e-05, + "loss": 1.0133, + "step": 6671 + }, + { + "epoch": 18.17983651226158, + "grad_norm": 7.035590171813965, + "learning_rate": 1.881560902650107e-05, + "loss": 0.8278, + "step": 6672 + }, + { + "epoch": 18.182561307901906, + "grad_norm": 13.982083320617676, + "learning_rate": 1.881519239266002e-05, + "loss": 1.0471, + "step": 6673 + }, + { + "epoch": 18.185286103542236, + "grad_norm": 7.48789119720459, + "learning_rate": 1.8814775690166535e-05, + "loss": 0.8416, + "step": 6674 + }, + { + "epoch": 18.18801089918256, + "grad_norm": 6.988489627838135, + "learning_rate": 1.8814358919023855e-05, + "loss": 0.7903, + "step": 6675 + }, + { + "epoch": 18.190735694822887, + "grad_norm": 13.37846851348877, + "learning_rate": 1.8813942079235237e-05, + "loss": 0.6805, + "step": 6676 + }, + { + "epoch": 18.193460490463217, + "grad_norm": 9.722649574279785, + "learning_rate": 1.881352517080392e-05, + "loss": 1.0209, + "step": 6677 + }, + { + "epoch": 18.196185286103542, + "grad_norm": 9.827420234680176, + "learning_rate": 1.8813108193733155e-05, + "loss": 0.83, + "step": 6678 + }, + { + "epoch": 18.19891008174387, + "grad_norm": 8.813655853271484, + "learning_rate": 1.8812691148026186e-05, + "loss": 0.828, + "step": 6679 + }, + { + "epoch": 18.201634877384198, + "grad_norm": 7.097906112670898, + "learning_rate": 1.881227403368626e-05, + "loss": 0.7917, + "step": 6680 + }, + { + "epoch": 18.204359673024523, + "grad_norm": 7.607766151428223, + "learning_rate": 1.881185685071663e-05, + "loss": 0.8481, + "step": 6681 + }, + { + "epoch": 18.20708446866485, + "grad_norm": 7.371726036071777, + "learning_rate": 1.8811439599120543e-05, + "loss": 0.8933, + "step": 6682 + }, + { + "epoch": 18.20980926430518, + "grad_norm": 7.199708938598633, + "learning_rate": 1.8811022278901244e-05, + "loss": 0.9622, + "step": 6683 + }, + { + "epoch": 18.212534059945504, + "grad_norm": 7.4748663902282715, + "learning_rate": 1.881060489006199e-05, + "loss": 1.014, + "step": 6684 + }, + { + "epoch": 18.21525885558583, + "grad_norm": 8.907736778259277, + "learning_rate": 1.881018743260603e-05, + "loss": 0.7926, + "step": 6685 + }, + { + "epoch": 18.21798365122616, + "grad_norm": 6.982027530670166, + "learning_rate": 1.880976990653661e-05, + "loss": 0.9241, + "step": 6686 + }, + { + "epoch": 18.220708446866485, + "grad_norm": 8.772224426269531, + "learning_rate": 1.8809352311856987e-05, + "loss": 0.7861, + "step": 6687 + }, + { + "epoch": 18.22343324250681, + "grad_norm": 9.9409818649292, + "learning_rate": 1.8808934648570412e-05, + "loss": 0.7244, + "step": 6688 + }, + { + "epoch": 18.22615803814714, + "grad_norm": 7.434682846069336, + "learning_rate": 1.8808516916680138e-05, + "loss": 0.9373, + "step": 6689 + }, + { + "epoch": 18.228882833787466, + "grad_norm": 7.6927642822265625, + "learning_rate": 1.880809911618942e-05, + "loss": 0.9325, + "step": 6690 + }, + { + "epoch": 18.231607629427792, + "grad_norm": 10.556446075439453, + "learning_rate": 1.8807681247101507e-05, + "loss": 0.9557, + "step": 6691 + }, + { + "epoch": 18.23433242506812, + "grad_norm": 8.532793998718262, + "learning_rate": 1.8807263309419656e-05, + "loss": 0.7985, + "step": 6692 + }, + { + "epoch": 18.237057220708447, + "grad_norm": 6.721668243408203, + "learning_rate": 1.8806845303147123e-05, + "loss": 0.902, + "step": 6693 + }, + { + "epoch": 18.239782016348773, + "grad_norm": 8.049880981445312, + "learning_rate": 1.880642722828716e-05, + "loss": 0.8823, + "step": 6694 + }, + { + "epoch": 18.242506811989102, + "grad_norm": 10.84933853149414, + "learning_rate": 1.8806009084843025e-05, + "loss": 0.8455, + "step": 6695 + }, + { + "epoch": 18.245231607629428, + "grad_norm": 9.497926712036133, + "learning_rate": 1.8805590872817976e-05, + "loss": 0.8737, + "step": 6696 + }, + { + "epoch": 18.247956403269754, + "grad_norm": 8.234804153442383, + "learning_rate": 1.880517259221527e-05, + "loss": 0.724, + "step": 6697 + }, + { + "epoch": 18.250681198910083, + "grad_norm": 8.508273124694824, + "learning_rate": 1.880475424303816e-05, + "loss": 0.7722, + "step": 6698 + }, + { + "epoch": 18.25340599455041, + "grad_norm": 9.23184871673584, + "learning_rate": 1.880433582528991e-05, + "loss": 0.8793, + "step": 6699 + }, + { + "epoch": 18.256130790190735, + "grad_norm": 8.031156539916992, + "learning_rate": 1.8803917338973778e-05, + "loss": 0.7725, + "step": 6700 + }, + { + "epoch": 18.258855585831064, + "grad_norm": 8.23066520690918, + "learning_rate": 1.8803498784093014e-05, + "loss": 0.9756, + "step": 6701 + }, + { + "epoch": 18.26158038147139, + "grad_norm": 8.178288459777832, + "learning_rate": 1.880308016065089e-05, + "loss": 0.835, + "step": 6702 + }, + { + "epoch": 18.264305177111716, + "grad_norm": 7.084980487823486, + "learning_rate": 1.880266146865066e-05, + "loss": 0.6921, + "step": 6703 + }, + { + "epoch": 18.267029972752045, + "grad_norm": 7.853808403015137, + "learning_rate": 1.8802242708095586e-05, + "loss": 0.8521, + "step": 6704 + }, + { + "epoch": 18.26975476839237, + "grad_norm": 9.48322582244873, + "learning_rate": 1.880182387898893e-05, + "loss": 0.9736, + "step": 6705 + }, + { + "epoch": 18.272479564032697, + "grad_norm": 8.77895450592041, + "learning_rate": 1.880140498133395e-05, + "loss": 0.963, + "step": 6706 + }, + { + "epoch": 18.275204359673026, + "grad_norm": 7.374267101287842, + "learning_rate": 1.8800986015133914e-05, + "loss": 0.9132, + "step": 6707 + }, + { + "epoch": 18.277929155313352, + "grad_norm": 8.246108055114746, + "learning_rate": 1.8800566980392082e-05, + "loss": 0.8914, + "step": 6708 + }, + { + "epoch": 18.280653950953678, + "grad_norm": 8.349637985229492, + "learning_rate": 1.8800147877111716e-05, + "loss": 0.7456, + "step": 6709 + }, + { + "epoch": 18.283378746594007, + "grad_norm": 9.123753547668457, + "learning_rate": 1.8799728705296084e-05, + "loss": 0.8217, + "step": 6710 + }, + { + "epoch": 18.286103542234333, + "grad_norm": 6.784246444702148, + "learning_rate": 1.8799309464948446e-05, + "loss": 0.8553, + "step": 6711 + }, + { + "epoch": 18.28882833787466, + "grad_norm": 7.580383777618408, + "learning_rate": 1.8798890156072068e-05, + "loss": 0.7469, + "step": 6712 + }, + { + "epoch": 18.291553133514988, + "grad_norm": 11.182293891906738, + "learning_rate": 1.879847077867022e-05, + "loss": 0.8315, + "step": 6713 + }, + { + "epoch": 18.294277929155314, + "grad_norm": 9.869726181030273, + "learning_rate": 1.879805133274616e-05, + "loss": 0.8164, + "step": 6714 + }, + { + "epoch": 18.29700272479564, + "grad_norm": 7.502408504486084, + "learning_rate": 1.8797631818303164e-05, + "loss": 0.9302, + "step": 6715 + }, + { + "epoch": 18.29972752043597, + "grad_norm": 8.410951614379883, + "learning_rate": 1.8797212235344492e-05, + "loss": 0.774, + "step": 6716 + }, + { + "epoch": 18.302452316076295, + "grad_norm": 7.368539333343506, + "learning_rate": 1.8796792583873418e-05, + "loss": 1.0969, + "step": 6717 + }, + { + "epoch": 18.30517711171662, + "grad_norm": 8.469276428222656, + "learning_rate": 1.87963728638932e-05, + "loss": 0.9127, + "step": 6718 + }, + { + "epoch": 18.30790190735695, + "grad_norm": 11.788848876953125, + "learning_rate": 1.8795953075407117e-05, + "loss": 0.8334, + "step": 6719 + }, + { + "epoch": 18.310626702997276, + "grad_norm": 7.8592047691345215, + "learning_rate": 1.8795533218418437e-05, + "loss": 0.8579, + "step": 6720 + }, + { + "epoch": 18.3133514986376, + "grad_norm": 8.544289588928223, + "learning_rate": 1.8795113292930425e-05, + "loss": 0.8611, + "step": 6721 + }, + { + "epoch": 18.31607629427793, + "grad_norm": 8.519726753234863, + "learning_rate": 1.8794693298946352e-05, + "loss": 0.8892, + "step": 6722 + }, + { + "epoch": 18.318801089918257, + "grad_norm": 10.280699729919434, + "learning_rate": 1.8794273236469495e-05, + "loss": 0.9015, + "step": 6723 + }, + { + "epoch": 18.321525885558582, + "grad_norm": 8.979537010192871, + "learning_rate": 1.8793853105503118e-05, + "loss": 0.9293, + "step": 6724 + }, + { + "epoch": 18.32425068119891, + "grad_norm": 6.912249565124512, + "learning_rate": 1.8793432906050496e-05, + "loss": 0.84, + "step": 6725 + }, + { + "epoch": 18.326975476839237, + "grad_norm": 6.5656256675720215, + "learning_rate": 1.87930126381149e-05, + "loss": 0.7482, + "step": 6726 + }, + { + "epoch": 18.329700272479563, + "grad_norm": 6.806774616241455, + "learning_rate": 1.879259230169961e-05, + "loss": 0.8, + "step": 6727 + }, + { + "epoch": 18.332425068119893, + "grad_norm": 15.59570026397705, + "learning_rate": 1.8792171896807886e-05, + "loss": 0.9402, + "step": 6728 + }, + { + "epoch": 18.33514986376022, + "grad_norm": 8.757286071777344, + "learning_rate": 1.879175142344302e-05, + "loss": 0.9177, + "step": 6729 + }, + { + "epoch": 18.337874659400544, + "grad_norm": 8.42879867553711, + "learning_rate": 1.8791330881608266e-05, + "loss": 0.8497, + "step": 6730 + }, + { + "epoch": 18.340599455040874, + "grad_norm": 7.903569221496582, + "learning_rate": 1.879091027130692e-05, + "loss": 0.7772, + "step": 6731 + }, + { + "epoch": 18.3433242506812, + "grad_norm": 6.854870319366455, + "learning_rate": 1.8790489592542243e-05, + "loss": 1.0813, + "step": 6732 + }, + { + "epoch": 18.346049046321525, + "grad_norm": 12.01852798461914, + "learning_rate": 1.8790068845317516e-05, + "loss": 0.9101, + "step": 6733 + }, + { + "epoch": 18.348773841961854, + "grad_norm": 8.10268497467041, + "learning_rate": 1.8789648029636014e-05, + "loss": 0.8087, + "step": 6734 + }, + { + "epoch": 18.35149863760218, + "grad_norm": 7.030385494232178, + "learning_rate": 1.8789227145501023e-05, + "loss": 0.6307, + "step": 6735 + }, + { + "epoch": 18.354223433242506, + "grad_norm": 8.755697250366211, + "learning_rate": 1.8788806192915804e-05, + "loss": 0.8468, + "step": 6736 + }, + { + "epoch": 18.356948228882835, + "grad_norm": 7.640406608581543, + "learning_rate": 1.8788385171883653e-05, + "loss": 1.0275, + "step": 6737 + }, + { + "epoch": 18.35967302452316, + "grad_norm": 6.8547515869140625, + "learning_rate": 1.878796408240784e-05, + "loss": 0.7567, + "step": 6738 + }, + { + "epoch": 18.362397820163487, + "grad_norm": 13.387345314025879, + "learning_rate": 1.878754292449164e-05, + "loss": 0.9679, + "step": 6739 + }, + { + "epoch": 18.365122615803816, + "grad_norm": 8.199585914611816, + "learning_rate": 1.8787121698138344e-05, + "loss": 0.8151, + "step": 6740 + }, + { + "epoch": 18.367847411444142, + "grad_norm": 9.504558563232422, + "learning_rate": 1.8786700403351226e-05, + "loss": 0.983, + "step": 6741 + }, + { + "epoch": 18.370572207084468, + "grad_norm": 7.679377555847168, + "learning_rate": 1.878627904013357e-05, + "loss": 0.8545, + "step": 6742 + }, + { + "epoch": 18.373297002724797, + "grad_norm": 11.670575141906738, + "learning_rate": 1.878585760848865e-05, + "loss": 0.7836, + "step": 6743 + }, + { + "epoch": 18.376021798365123, + "grad_norm": 8.45013427734375, + "learning_rate": 1.878543610841976e-05, + "loss": 0.8475, + "step": 6744 + }, + { + "epoch": 18.37874659400545, + "grad_norm": 9.006660461425781, + "learning_rate": 1.878501453993017e-05, + "loss": 0.9005, + "step": 6745 + }, + { + "epoch": 18.381471389645778, + "grad_norm": 7.631886005401611, + "learning_rate": 1.8784592903023175e-05, + "loss": 0.8474, + "step": 6746 + }, + { + "epoch": 18.384196185286104, + "grad_norm": 6.807475566864014, + "learning_rate": 1.8784171197702053e-05, + "loss": 0.7784, + "step": 6747 + }, + { + "epoch": 18.38692098092643, + "grad_norm": 8.734243392944336, + "learning_rate": 1.8783749423970085e-05, + "loss": 0.8893, + "step": 6748 + }, + { + "epoch": 18.38964577656676, + "grad_norm": 10.451774597167969, + "learning_rate": 1.878332758183056e-05, + "loss": 0.9891, + "step": 6749 + }, + { + "epoch": 18.392370572207085, + "grad_norm": 7.548184394836426, + "learning_rate": 1.8782905671286763e-05, + "loss": 0.9047, + "step": 6750 + }, + { + "epoch": 18.39509536784741, + "grad_norm": 7.679628849029541, + "learning_rate": 1.878248369234198e-05, + "loss": 0.9084, + "step": 6751 + }, + { + "epoch": 18.39782016348774, + "grad_norm": 7.905241966247559, + "learning_rate": 1.8782061644999497e-05, + "loss": 0.9534, + "step": 6752 + }, + { + "epoch": 18.400544959128066, + "grad_norm": 7.051769733428955, + "learning_rate": 1.8781639529262598e-05, + "loss": 0.7361, + "step": 6753 + }, + { + "epoch": 18.40326975476839, + "grad_norm": 10.122602462768555, + "learning_rate": 1.8781217345134574e-05, + "loss": 0.8901, + "step": 6754 + }, + { + "epoch": 18.40599455040872, + "grad_norm": 9.768773078918457, + "learning_rate": 1.8780795092618717e-05, + "loss": 0.8539, + "step": 6755 + }, + { + "epoch": 18.408719346049047, + "grad_norm": 9.212475776672363, + "learning_rate": 1.8780372771718302e-05, + "loss": 1.0101, + "step": 6756 + }, + { + "epoch": 18.411444141689373, + "grad_norm": 6.382621765136719, + "learning_rate": 1.8779950382436632e-05, + "loss": 0.7898, + "step": 6757 + }, + { + "epoch": 18.414168937329702, + "grad_norm": 8.457864761352539, + "learning_rate": 1.8779527924776988e-05, + "loss": 0.948, + "step": 6758 + }, + { + "epoch": 18.416893732970028, + "grad_norm": 8.18539810180664, + "learning_rate": 1.877910539874267e-05, + "loss": 0.8048, + "step": 6759 + }, + { + "epoch": 18.419618528610354, + "grad_norm": 7.24704122543335, + "learning_rate": 1.877868280433695e-05, + "loss": 0.8054, + "step": 6760 + }, + { + "epoch": 18.422343324250683, + "grad_norm": 10.048449516296387, + "learning_rate": 1.877826014156314e-05, + "loss": 0.9694, + "step": 6761 + }, + { + "epoch": 18.42506811989101, + "grad_norm": 8.157830238342285, + "learning_rate": 1.877783741042452e-05, + "loss": 0.9662, + "step": 6762 + }, + { + "epoch": 18.427792915531334, + "grad_norm": 7.6305928230285645, + "learning_rate": 1.8777414610924386e-05, + "loss": 0.7234, + "step": 6763 + }, + { + "epoch": 18.430517711171664, + "grad_norm": 9.370262145996094, + "learning_rate": 1.8776991743066025e-05, + "loss": 0.9136, + "step": 6764 + }, + { + "epoch": 18.43324250681199, + "grad_norm": 8.10416030883789, + "learning_rate": 1.8776568806852738e-05, + "loss": 0.7332, + "step": 6765 + }, + { + "epoch": 18.435967302452315, + "grad_norm": 7.520824909210205, + "learning_rate": 1.8776145802287816e-05, + "loss": 0.8267, + "step": 6766 + }, + { + "epoch": 18.438692098092645, + "grad_norm": 8.330543518066406, + "learning_rate": 1.8775722729374552e-05, + "loss": 0.8585, + "step": 6767 + }, + { + "epoch": 18.44141689373297, + "grad_norm": 7.984499931335449, + "learning_rate": 1.8775299588116243e-05, + "loss": 0.7097, + "step": 6768 + }, + { + "epoch": 18.444141689373296, + "grad_norm": 7.713501453399658, + "learning_rate": 1.877487637851618e-05, + "loss": 0.8645, + "step": 6769 + }, + { + "epoch": 18.446866485013626, + "grad_norm": 7.1620283126831055, + "learning_rate": 1.8774453100577664e-05, + "loss": 1.0524, + "step": 6770 + }, + { + "epoch": 18.44959128065395, + "grad_norm": 7.688859462738037, + "learning_rate": 1.8774029754303995e-05, + "loss": 0.833, + "step": 6771 + }, + { + "epoch": 18.452316076294277, + "grad_norm": 7.874576568603516, + "learning_rate": 1.877360633969846e-05, + "loss": 0.8827, + "step": 6772 + }, + { + "epoch": 18.455040871934607, + "grad_norm": 8.26817512512207, + "learning_rate": 1.877318285676436e-05, + "loss": 0.8549, + "step": 6773 + }, + { + "epoch": 18.457765667574932, + "grad_norm": 7.061283111572266, + "learning_rate": 1.8772759305504996e-05, + "loss": 0.7936, + "step": 6774 + }, + { + "epoch": 18.460490463215258, + "grad_norm": 12.622628211975098, + "learning_rate": 1.877233568592366e-05, + "loss": 0.9607, + "step": 6775 + }, + { + "epoch": 18.463215258855588, + "grad_norm": 8.405427932739258, + "learning_rate": 1.877191199802366e-05, + "loss": 0.9612, + "step": 6776 + }, + { + "epoch": 18.465940054495913, + "grad_norm": 9.933815956115723, + "learning_rate": 1.8771488241808295e-05, + "loss": 0.7939, + "step": 6777 + }, + { + "epoch": 18.46866485013624, + "grad_norm": 6.550434112548828, + "learning_rate": 1.8771064417280856e-05, + "loss": 0.9353, + "step": 6778 + }, + { + "epoch": 18.47138964577657, + "grad_norm": 10.655665397644043, + "learning_rate": 1.8770640524444653e-05, + "loss": 0.9561, + "step": 6779 + }, + { + "epoch": 18.474114441416894, + "grad_norm": 7.041699409484863, + "learning_rate": 1.8770216563302984e-05, + "loss": 0.7959, + "step": 6780 + }, + { + "epoch": 18.47683923705722, + "grad_norm": 8.465987205505371, + "learning_rate": 1.876979253385915e-05, + "loss": 0.8094, + "step": 6781 + }, + { + "epoch": 18.479564032697546, + "grad_norm": 9.416106224060059, + "learning_rate": 1.8769368436116454e-05, + "loss": 0.7689, + "step": 6782 + }, + { + "epoch": 18.482288828337875, + "grad_norm": 9.46136474609375, + "learning_rate": 1.87689442700782e-05, + "loss": 0.9694, + "step": 6783 + }, + { + "epoch": 18.4850136239782, + "grad_norm": 9.132607460021973, + "learning_rate": 1.876852003574769e-05, + "loss": 0.8503, + "step": 6784 + }, + { + "epoch": 18.48773841961853, + "grad_norm": 10.33657169342041, + "learning_rate": 1.8768095733128226e-05, + "loss": 0.907, + "step": 6785 + }, + { + "epoch": 18.490463215258856, + "grad_norm": 8.639205932617188, + "learning_rate": 1.8767671362223117e-05, + "loss": 0.8226, + "step": 6786 + }, + { + "epoch": 18.493188010899182, + "grad_norm": 8.91231632232666, + "learning_rate": 1.8767246923035663e-05, + "loss": 0.9209, + "step": 6787 + }, + { + "epoch": 18.495912806539508, + "grad_norm": 7.934805393218994, + "learning_rate": 1.8766822415569175e-05, + "loss": 0.8568, + "step": 6788 + }, + { + "epoch": 18.498637602179837, + "grad_norm": 8.37930965423584, + "learning_rate": 1.8766397839826952e-05, + "loss": 0.886, + "step": 6789 + }, + { + "epoch": 18.501362397820163, + "grad_norm": 8.110930442810059, + "learning_rate": 1.876597319581231e-05, + "loss": 0.8521, + "step": 6790 + }, + { + "epoch": 18.504087193460492, + "grad_norm": 7.500209331512451, + "learning_rate": 1.8765548483528548e-05, + "loss": 0.8661, + "step": 6791 + }, + { + "epoch": 18.506811989100818, + "grad_norm": 7.315430641174316, + "learning_rate": 1.876512370297898e-05, + "loss": 0.78, + "step": 6792 + }, + { + "epoch": 18.509536784741144, + "grad_norm": 7.014491081237793, + "learning_rate": 1.8764698854166904e-05, + "loss": 0.9225, + "step": 6793 + }, + { + "epoch": 18.51226158038147, + "grad_norm": 6.934720039367676, + "learning_rate": 1.8764273937095642e-05, + "loss": 0.8499, + "step": 6794 + }, + { + "epoch": 18.5149863760218, + "grad_norm": 7.059356689453125, + "learning_rate": 1.876384895176849e-05, + "loss": 0.8367, + "step": 6795 + }, + { + "epoch": 18.517711171662125, + "grad_norm": 9.518843650817871, + "learning_rate": 1.876342389818877e-05, + "loss": 0.8096, + "step": 6796 + }, + { + "epoch": 18.520435967302454, + "grad_norm": 7.209913730621338, + "learning_rate": 1.8762998776359785e-05, + "loss": 0.8041, + "step": 6797 + }, + { + "epoch": 18.52316076294278, + "grad_norm": 7.684715747833252, + "learning_rate": 1.8762573586284847e-05, + "loss": 0.9806, + "step": 6798 + }, + { + "epoch": 18.525885558583106, + "grad_norm": 7.682023048400879, + "learning_rate": 1.876214832796727e-05, + "loss": 0.7159, + "step": 6799 + }, + { + "epoch": 18.52861035422343, + "grad_norm": 9.923916816711426, + "learning_rate": 1.876172300141036e-05, + "loss": 0.9024, + "step": 6800 + }, + { + "epoch": 18.53133514986376, + "grad_norm": 8.820189476013184, + "learning_rate": 1.8761297606617436e-05, + "loss": 0.8292, + "step": 6801 + }, + { + "epoch": 18.534059945504087, + "grad_norm": 9.852216720581055, + "learning_rate": 1.876087214359181e-05, + "loss": 0.8995, + "step": 6802 + }, + { + "epoch": 18.536784741144416, + "grad_norm": 7.489625453948975, + "learning_rate": 1.876044661233679e-05, + "loss": 0.9141, + "step": 6803 + }, + { + "epoch": 18.539509536784742, + "grad_norm": 8.809782981872559, + "learning_rate": 1.8760021012855694e-05, + "loss": 1.0233, + "step": 6804 + }, + { + "epoch": 18.542234332425068, + "grad_norm": 8.199651718139648, + "learning_rate": 1.875959534515184e-05, + "loss": 0.8774, + "step": 6805 + }, + { + "epoch": 18.544959128065393, + "grad_norm": 10.005997657775879, + "learning_rate": 1.8759169609228536e-05, + "loss": 0.8667, + "step": 6806 + }, + { + "epoch": 18.547683923705723, + "grad_norm": 8.236612319946289, + "learning_rate": 1.8758743805089104e-05, + "loss": 0.7457, + "step": 6807 + }, + { + "epoch": 18.55040871934605, + "grad_norm": 8.340702056884766, + "learning_rate": 1.8758317932736855e-05, + "loss": 0.8894, + "step": 6808 + }, + { + "epoch": 18.553133514986374, + "grad_norm": 8.727513313293457, + "learning_rate": 1.8757891992175106e-05, + "loss": 0.9464, + "step": 6809 + }, + { + "epoch": 18.555858310626704, + "grad_norm": 8.727365493774414, + "learning_rate": 1.875746598340718e-05, + "loss": 0.9033, + "step": 6810 + }, + { + "epoch": 18.55858310626703, + "grad_norm": 8.104939460754395, + "learning_rate": 1.8757039906436388e-05, + "loss": 0.8466, + "step": 6811 + }, + { + "epoch": 18.561307901907355, + "grad_norm": 7.656373500823975, + "learning_rate": 1.8756613761266052e-05, + "loss": 0.9034, + "step": 6812 + }, + { + "epoch": 18.564032697547685, + "grad_norm": 10.777390480041504, + "learning_rate": 1.875618754789949e-05, + "loss": 0.9558, + "step": 6813 + }, + { + "epoch": 18.56675749318801, + "grad_norm": 7.567367076873779, + "learning_rate": 1.8755761266340018e-05, + "loss": 0.8656, + "step": 6814 + }, + { + "epoch": 18.569482288828336, + "grad_norm": 7.490059852600098, + "learning_rate": 1.8755334916590964e-05, + "loss": 0.9022, + "step": 6815 + }, + { + "epoch": 18.572207084468666, + "grad_norm": 8.64775276184082, + "learning_rate": 1.875490849865564e-05, + "loss": 1.0067, + "step": 6816 + }, + { + "epoch": 18.57493188010899, + "grad_norm": 8.965628623962402, + "learning_rate": 1.8754482012537374e-05, + "loss": 0.921, + "step": 6817 + }, + { + "epoch": 18.577656675749317, + "grad_norm": 9.244271278381348, + "learning_rate": 1.875405545823948e-05, + "loss": 0.6953, + "step": 6818 + }, + { + "epoch": 18.580381471389646, + "grad_norm": 8.459924697875977, + "learning_rate": 1.8753628835765284e-05, + "loss": 0.8523, + "step": 6819 + }, + { + "epoch": 18.583106267029972, + "grad_norm": 8.601913452148438, + "learning_rate": 1.875320214511811e-05, + "loss": 0.8688, + "step": 6820 + }, + { + "epoch": 18.585831062670298, + "grad_norm": 8.533843994140625, + "learning_rate": 1.875277538630128e-05, + "loss": 0.7902, + "step": 6821 + }, + { + "epoch": 18.588555858310627, + "grad_norm": 7.612013339996338, + "learning_rate": 1.8752348559318116e-05, + "loss": 0.7195, + "step": 6822 + }, + { + "epoch": 18.591280653950953, + "grad_norm": 7.308195114135742, + "learning_rate": 1.8751921664171944e-05, + "loss": 0.6616, + "step": 6823 + }, + { + "epoch": 18.59400544959128, + "grad_norm": 8.093254089355469, + "learning_rate": 1.8751494700866088e-05, + "loss": 0.8279, + "step": 6824 + }, + { + "epoch": 18.59673024523161, + "grad_norm": 7.823365688323975, + "learning_rate": 1.875106766940387e-05, + "loss": 1.1262, + "step": 6825 + }, + { + "epoch": 18.599455040871934, + "grad_norm": 7.550796985626221, + "learning_rate": 1.8750640569788624e-05, + "loss": 0.8933, + "step": 6826 + }, + { + "epoch": 18.60217983651226, + "grad_norm": 7.996880054473877, + "learning_rate": 1.8750213402023664e-05, + "loss": 0.8503, + "step": 6827 + }, + { + "epoch": 18.60490463215259, + "grad_norm": 9.51594066619873, + "learning_rate": 1.874978616611233e-05, + "loss": 0.9055, + "step": 6828 + }, + { + "epoch": 18.607629427792915, + "grad_norm": 8.002632141113281, + "learning_rate": 1.874935886205794e-05, + "loss": 0.797, + "step": 6829 + }, + { + "epoch": 18.61035422343324, + "grad_norm": 7.839196681976318, + "learning_rate": 1.8748931489863823e-05, + "loss": 0.932, + "step": 6830 + }, + { + "epoch": 18.61307901907357, + "grad_norm": 8.164216995239258, + "learning_rate": 1.874850404953331e-05, + "loss": 0.8767, + "step": 6831 + }, + { + "epoch": 18.615803814713896, + "grad_norm": 9.41263198852539, + "learning_rate": 1.8748076541069734e-05, + "loss": 0.9336, + "step": 6832 + }, + { + "epoch": 18.618528610354222, + "grad_norm": 8.057923316955566, + "learning_rate": 1.874764896447641e-05, + "loss": 0.8961, + "step": 6833 + }, + { + "epoch": 18.62125340599455, + "grad_norm": 8.388008117675781, + "learning_rate": 1.8747221319756686e-05, + "loss": 0.8668, + "step": 6834 + }, + { + "epoch": 18.623978201634877, + "grad_norm": 8.542396545410156, + "learning_rate": 1.874679360691388e-05, + "loss": 0.9678, + "step": 6835 + }, + { + "epoch": 18.626702997275203, + "grad_norm": 8.668232917785645, + "learning_rate": 1.874636582595133e-05, + "loss": 0.976, + "step": 6836 + }, + { + "epoch": 18.629427792915532, + "grad_norm": 6.552305698394775, + "learning_rate": 1.874593797687236e-05, + "loss": 0.72, + "step": 6837 + }, + { + "epoch": 18.632152588555858, + "grad_norm": 9.538304328918457, + "learning_rate": 1.874551005968031e-05, + "loss": 0.91, + "step": 6838 + }, + { + "epoch": 18.634877384196184, + "grad_norm": 8.393935203552246, + "learning_rate": 1.8745082074378507e-05, + "loss": 0.9698, + "step": 6839 + }, + { + "epoch": 18.637602179836513, + "grad_norm": 8.084198951721191, + "learning_rate": 1.8744654020970284e-05, + "loss": 0.9087, + "step": 6840 + }, + { + "epoch": 18.64032697547684, + "grad_norm": 7.184995651245117, + "learning_rate": 1.8744225899458982e-05, + "loss": 0.6638, + "step": 6841 + }, + { + "epoch": 18.643051771117165, + "grad_norm": 7.042233467102051, + "learning_rate": 1.874379770984793e-05, + "loss": 0.7306, + "step": 6842 + }, + { + "epoch": 18.645776566757494, + "grad_norm": 7.042173385620117, + "learning_rate": 1.8743369452140457e-05, + "loss": 0.879, + "step": 6843 + }, + { + "epoch": 18.64850136239782, + "grad_norm": 7.013894081115723, + "learning_rate": 1.874294112633991e-05, + "loss": 0.8345, + "step": 6844 + }, + { + "epoch": 18.651226158038146, + "grad_norm": 8.85759162902832, + "learning_rate": 1.874251273244962e-05, + "loss": 0.8652, + "step": 6845 + }, + { + "epoch": 18.653950953678475, + "grad_norm": 7.782415866851807, + "learning_rate": 1.874208427047292e-05, + "loss": 0.9827, + "step": 6846 + }, + { + "epoch": 18.6566757493188, + "grad_norm": 7.596438884735107, + "learning_rate": 1.8741655740413143e-05, + "loss": 0.9199, + "step": 6847 + }, + { + "epoch": 18.659400544959126, + "grad_norm": 7.295292854309082, + "learning_rate": 1.874122714227364e-05, + "loss": 1.0024, + "step": 6848 + }, + { + "epoch": 18.662125340599456, + "grad_norm": 7.571012496948242, + "learning_rate": 1.8740798476057737e-05, + "loss": 0.9304, + "step": 6849 + }, + { + "epoch": 18.66485013623978, + "grad_norm": 7.809437274932861, + "learning_rate": 1.874036974176878e-05, + "loss": 0.755, + "step": 6850 + }, + { + "epoch": 18.667574931880107, + "grad_norm": 8.06397533416748, + "learning_rate": 1.8739940939410102e-05, + "loss": 0.8961, + "step": 6851 + }, + { + "epoch": 18.670299727520437, + "grad_norm": 8.416884422302246, + "learning_rate": 1.8739512068985052e-05, + "loss": 0.9575, + "step": 6852 + }, + { + "epoch": 18.673024523160763, + "grad_norm": 9.632649421691895, + "learning_rate": 1.8739083130496957e-05, + "loss": 0.9338, + "step": 6853 + }, + { + "epoch": 18.67574931880109, + "grad_norm": 7.96435546875, + "learning_rate": 1.8738654123949165e-05, + "loss": 0.9298, + "step": 6854 + }, + { + "epoch": 18.678474114441418, + "grad_norm": 9.763521194458008, + "learning_rate": 1.8738225049345017e-05, + "loss": 0.7675, + "step": 6855 + }, + { + "epoch": 18.681198910081743, + "grad_norm": 7.3949384689331055, + "learning_rate": 1.873779590668785e-05, + "loss": 0.7509, + "step": 6856 + }, + { + "epoch": 18.68392370572207, + "grad_norm": 7.49371862411499, + "learning_rate": 1.873736669598101e-05, + "loss": 0.7791, + "step": 6857 + }, + { + "epoch": 18.6866485013624, + "grad_norm": 8.469500541687012, + "learning_rate": 1.8736937417227845e-05, + "loss": 1.0149, + "step": 6858 + }, + { + "epoch": 18.689373297002724, + "grad_norm": 6.933372497558594, + "learning_rate": 1.873650807043169e-05, + "loss": 0.7024, + "step": 6859 + }, + { + "epoch": 18.69209809264305, + "grad_norm": 7.969101428985596, + "learning_rate": 1.873607865559589e-05, + "loss": 1.2202, + "step": 6860 + }, + { + "epoch": 18.69482288828338, + "grad_norm": 8.198660850524902, + "learning_rate": 1.8735649172723792e-05, + "loss": 0.8574, + "step": 6861 + }, + { + "epoch": 18.697547683923705, + "grad_norm": 8.389801025390625, + "learning_rate": 1.8735219621818737e-05, + "loss": 0.807, + "step": 6862 + }, + { + "epoch": 18.70027247956403, + "grad_norm": 7.781229019165039, + "learning_rate": 1.8734790002884074e-05, + "loss": 0.7609, + "step": 6863 + }, + { + "epoch": 18.70299727520436, + "grad_norm": 8.59720516204834, + "learning_rate": 1.8734360315923146e-05, + "loss": 0.8466, + "step": 6864 + }, + { + "epoch": 18.705722070844686, + "grad_norm": 16.442710876464844, + "learning_rate": 1.8733930560939305e-05, + "loss": 0.9008, + "step": 6865 + }, + { + "epoch": 18.708446866485012, + "grad_norm": 9.491679191589355, + "learning_rate": 1.873350073793589e-05, + "loss": 0.9946, + "step": 6866 + }, + { + "epoch": 18.71117166212534, + "grad_norm": 7.669342994689941, + "learning_rate": 1.8733070846916253e-05, + "loss": 0.8419, + "step": 6867 + }, + { + "epoch": 18.713896457765667, + "grad_norm": 7.897876262664795, + "learning_rate": 1.8732640887883744e-05, + "loss": 0.8983, + "step": 6868 + }, + { + "epoch": 18.716621253405993, + "grad_norm": 7.866222381591797, + "learning_rate": 1.8732210860841706e-05, + "loss": 0.882, + "step": 6869 + }, + { + "epoch": 18.719346049046322, + "grad_norm": 7.729693412780762, + "learning_rate": 1.8731780765793493e-05, + "loss": 0.9286, + "step": 6870 + }, + { + "epoch": 18.722070844686648, + "grad_norm": 6.747142314910889, + "learning_rate": 1.8731350602742453e-05, + "loss": 0.975, + "step": 6871 + }, + { + "epoch": 18.724795640326974, + "grad_norm": 7.245094299316406, + "learning_rate": 1.8730920371691934e-05, + "loss": 0.9503, + "step": 6872 + }, + { + "epoch": 18.727520435967303, + "grad_norm": 9.75373649597168, + "learning_rate": 1.8730490072645285e-05, + "loss": 0.8794, + "step": 6873 + }, + { + "epoch": 18.73024523160763, + "grad_norm": 8.557443618774414, + "learning_rate": 1.8730059705605862e-05, + "loss": 0.7939, + "step": 6874 + }, + { + "epoch": 18.732970027247955, + "grad_norm": 8.528529167175293, + "learning_rate": 1.8729629270577018e-05, + "loss": 0.8118, + "step": 6875 + }, + { + "epoch": 18.735694822888284, + "grad_norm": 8.50214958190918, + "learning_rate": 1.8729198767562102e-05, + "loss": 0.8206, + "step": 6876 + }, + { + "epoch": 18.73841961852861, + "grad_norm": 7.377909183502197, + "learning_rate": 1.8728768196564467e-05, + "loss": 0.724, + "step": 6877 + }, + { + "epoch": 18.741144414168936, + "grad_norm": 9.095946311950684, + "learning_rate": 1.8728337557587464e-05, + "loss": 0.89, + "step": 6878 + }, + { + "epoch": 18.743869209809265, + "grad_norm": 6.619362831115723, + "learning_rate": 1.872790685063445e-05, + "loss": 0.8712, + "step": 6879 + }, + { + "epoch": 18.74659400544959, + "grad_norm": 8.90834903717041, + "learning_rate": 1.8727476075708778e-05, + "loss": 0.9437, + "step": 6880 + }, + { + "epoch": 18.749318801089917, + "grad_norm": 7.974592685699463, + "learning_rate": 1.8727045232813804e-05, + "loss": 0.7578, + "step": 6881 + }, + { + "epoch": 18.752043596730246, + "grad_norm": 15.871769905090332, + "learning_rate": 1.872661432195288e-05, + "loss": 0.8325, + "step": 6882 + }, + { + "epoch": 18.754768392370572, + "grad_norm": 7.1992692947387695, + "learning_rate": 1.8726183343129368e-05, + "loss": 0.9443, + "step": 6883 + }, + { + "epoch": 18.757493188010898, + "grad_norm": 8.193685531616211, + "learning_rate": 1.872575229634662e-05, + "loss": 1.0295, + "step": 6884 + }, + { + "epoch": 18.760217983651227, + "grad_norm": 7.6046342849731445, + "learning_rate": 1.8725321181607993e-05, + "loss": 0.8723, + "step": 6885 + }, + { + "epoch": 18.762942779291553, + "grad_norm": 9.461565017700195, + "learning_rate": 1.8724889998916845e-05, + "loss": 1.074, + "step": 6886 + }, + { + "epoch": 18.76566757493188, + "grad_norm": 9.257078170776367, + "learning_rate": 1.8724458748276534e-05, + "loss": 0.9036, + "step": 6887 + }, + { + "epoch": 18.768392370572208, + "grad_norm": 8.74255657196045, + "learning_rate": 1.8724027429690422e-05, + "loss": 0.7805, + "step": 6888 + }, + { + "epoch": 18.771117166212534, + "grad_norm": 8.370862007141113, + "learning_rate": 1.8723596043161865e-05, + "loss": 0.7791, + "step": 6889 + }, + { + "epoch": 18.77384196185286, + "grad_norm": 11.671736717224121, + "learning_rate": 1.872316458869422e-05, + "loss": 0.8114, + "step": 6890 + }, + { + "epoch": 18.77656675749319, + "grad_norm": 7.444977283477783, + "learning_rate": 1.872273306629085e-05, + "loss": 0.9426, + "step": 6891 + }, + { + "epoch": 18.779291553133515, + "grad_norm": 8.131038665771484, + "learning_rate": 1.872230147595512e-05, + "loss": 0.8264, + "step": 6892 + }, + { + "epoch": 18.78201634877384, + "grad_norm": 13.566511154174805, + "learning_rate": 1.872186981769038e-05, + "loss": 0.7626, + "step": 6893 + }, + { + "epoch": 18.78474114441417, + "grad_norm": 8.058342933654785, + "learning_rate": 1.8721438091500003e-05, + "loss": 0.9114, + "step": 6894 + }, + { + "epoch": 18.787465940054496, + "grad_norm": 7.539575099945068, + "learning_rate": 1.8721006297387348e-05, + "loss": 1.0406, + "step": 6895 + }, + { + "epoch": 18.79019073569482, + "grad_norm": 9.61542797088623, + "learning_rate": 1.8720574435355776e-05, + "loss": 0.8738, + "step": 6896 + }, + { + "epoch": 18.79291553133515, + "grad_norm": 7.583422660827637, + "learning_rate": 1.8720142505408648e-05, + "loss": 0.9052, + "step": 6897 + }, + { + "epoch": 18.795640326975477, + "grad_norm": 7.3413472175598145, + "learning_rate": 1.8719710507549332e-05, + "loss": 0.8181, + "step": 6898 + }, + { + "epoch": 18.798365122615802, + "grad_norm": 8.460395812988281, + "learning_rate": 1.8719278441781193e-05, + "loss": 0.9628, + "step": 6899 + }, + { + "epoch": 18.80108991825613, + "grad_norm": 8.27148151397705, + "learning_rate": 1.871884630810759e-05, + "loss": 0.8704, + "step": 6900 + }, + { + "epoch": 18.803814713896458, + "grad_norm": 8.32595443725586, + "learning_rate": 1.8718414106531898e-05, + "loss": 0.8131, + "step": 6901 + }, + { + "epoch": 18.806539509536783, + "grad_norm": 8.904982566833496, + "learning_rate": 1.8717981837057475e-05, + "loss": 0.939, + "step": 6902 + }, + { + "epoch": 18.809264305177113, + "grad_norm": 7.2709221839904785, + "learning_rate": 1.871754949968769e-05, + "loss": 0.8385, + "step": 6903 + }, + { + "epoch": 18.81198910081744, + "grad_norm": 8.22236442565918, + "learning_rate": 1.871711709442591e-05, + "loss": 0.814, + "step": 6904 + }, + { + "epoch": 18.814713896457764, + "grad_norm": 8.144975662231445, + "learning_rate": 1.87166846212755e-05, + "loss": 0.9263, + "step": 6905 + }, + { + "epoch": 18.817438692098094, + "grad_norm": 10.323326110839844, + "learning_rate": 1.8716252080239835e-05, + "loss": 0.8673, + "step": 6906 + }, + { + "epoch": 18.82016348773842, + "grad_norm": 10.343846321105957, + "learning_rate": 1.8715819471322278e-05, + "loss": 1.0734, + "step": 6907 + }, + { + "epoch": 18.822888283378745, + "grad_norm": 13.378046989440918, + "learning_rate": 1.87153867945262e-05, + "loss": 0.9152, + "step": 6908 + }, + { + "epoch": 18.825613079019075, + "grad_norm": 8.570001602172852, + "learning_rate": 1.871495404985497e-05, + "loss": 0.8552, + "step": 6909 + }, + { + "epoch": 18.8283378746594, + "grad_norm": 8.434952735900879, + "learning_rate": 1.8714521237311956e-05, + "loss": 0.8588, + "step": 6910 + }, + { + "epoch": 18.831062670299726, + "grad_norm": 6.612369060516357, + "learning_rate": 1.8714088356900536e-05, + "loss": 1.0029, + "step": 6911 + }, + { + "epoch": 18.833787465940055, + "grad_norm": 12.763958930969238, + "learning_rate": 1.8713655408624073e-05, + "loss": 0.8953, + "step": 6912 + }, + { + "epoch": 18.83651226158038, + "grad_norm": 11.677885055541992, + "learning_rate": 1.8713222392485943e-05, + "loss": 0.751, + "step": 6913 + }, + { + "epoch": 18.839237057220707, + "grad_norm": 8.051769256591797, + "learning_rate": 1.8712789308489516e-05, + "loss": 0.9045, + "step": 6914 + }, + { + "epoch": 18.841961852861036, + "grad_norm": 10.129505157470703, + "learning_rate": 1.8712356156638164e-05, + "loss": 0.9486, + "step": 6915 + }, + { + "epoch": 18.844686648501362, + "grad_norm": 7.85394287109375, + "learning_rate": 1.871192293693527e-05, + "loss": 0.9458, + "step": 6916 + }, + { + "epoch": 18.847411444141688, + "grad_norm": 11.273139953613281, + "learning_rate": 1.8711489649384194e-05, + "loss": 0.8696, + "step": 6917 + }, + { + "epoch": 18.850136239782017, + "grad_norm": 8.475065231323242, + "learning_rate": 1.8711056293988318e-05, + "loss": 0.9227, + "step": 6918 + }, + { + "epoch": 18.852861035422343, + "grad_norm": 8.927240371704102, + "learning_rate": 1.871062287075102e-05, + "loss": 0.7208, + "step": 6919 + }, + { + "epoch": 18.85558583106267, + "grad_norm": 10.094076156616211, + "learning_rate": 1.8710189379675667e-05, + "loss": 0.9561, + "step": 6920 + }, + { + "epoch": 18.858310626703, + "grad_norm": 8.230749130249023, + "learning_rate": 1.870975582076564e-05, + "loss": 0.9272, + "step": 6921 + }, + { + "epoch": 18.861035422343324, + "grad_norm": 8.077170372009277, + "learning_rate": 1.870932219402432e-05, + "loss": 0.947, + "step": 6922 + }, + { + "epoch": 18.86376021798365, + "grad_norm": 9.002728462219238, + "learning_rate": 1.8708888499455075e-05, + "loss": 0.8989, + "step": 6923 + }, + { + "epoch": 18.86648501362398, + "grad_norm": 8.719640731811523, + "learning_rate": 1.8708454737061284e-05, + "loss": 0.8878, + "step": 6924 + }, + { + "epoch": 18.869209809264305, + "grad_norm": 8.23000431060791, + "learning_rate": 1.870802090684633e-05, + "loss": 0.7559, + "step": 6925 + }, + { + "epoch": 18.87193460490463, + "grad_norm": 7.957650184631348, + "learning_rate": 1.8707587008813593e-05, + "loss": 0.8157, + "step": 6926 + }, + { + "epoch": 18.87465940054496, + "grad_norm": 9.691078186035156, + "learning_rate": 1.8707153042966445e-05, + "loss": 0.9717, + "step": 6927 + }, + { + "epoch": 18.877384196185286, + "grad_norm": 7.17464017868042, + "learning_rate": 1.870671900930827e-05, + "loss": 0.989, + "step": 6928 + }, + { + "epoch": 18.88010899182561, + "grad_norm": 8.259840965270996, + "learning_rate": 1.8706284907842446e-05, + "loss": 0.9609, + "step": 6929 + }, + { + "epoch": 18.88283378746594, + "grad_norm": 7.825801372528076, + "learning_rate": 1.8705850738572357e-05, + "loss": 0.7622, + "step": 6930 + }, + { + "epoch": 18.885558583106267, + "grad_norm": 9.720499038696289, + "learning_rate": 1.8705416501501383e-05, + "loss": 0.7961, + "step": 6931 + }, + { + "epoch": 18.888283378746593, + "grad_norm": 8.514625549316406, + "learning_rate": 1.8704982196632904e-05, + "loss": 0.7432, + "step": 6932 + }, + { + "epoch": 18.891008174386922, + "grad_norm": 9.289460182189941, + "learning_rate": 1.8704547823970306e-05, + "loss": 0.8408, + "step": 6933 + }, + { + "epoch": 18.893732970027248, + "grad_norm": 10.373196601867676, + "learning_rate": 1.8704113383516967e-05, + "loss": 0.9124, + "step": 6934 + }, + { + "epoch": 18.896457765667574, + "grad_norm": 9.915992736816406, + "learning_rate": 1.8703678875276277e-05, + "loss": 0.8114, + "step": 6935 + }, + { + "epoch": 18.899182561307903, + "grad_norm": 8.494244575500488, + "learning_rate": 1.8703244299251612e-05, + "loss": 0.9077, + "step": 6936 + }, + { + "epoch": 18.90190735694823, + "grad_norm": 8.14223575592041, + "learning_rate": 1.8702809655446364e-05, + "loss": 1.0366, + "step": 6937 + }, + { + "epoch": 18.904632152588555, + "grad_norm": 9.234797477722168, + "learning_rate": 1.8702374943863912e-05, + "loss": 0.825, + "step": 6938 + }, + { + "epoch": 18.907356948228884, + "grad_norm": 10.01010513305664, + "learning_rate": 1.8701940164507646e-05, + "loss": 1.0437, + "step": 6939 + }, + { + "epoch": 18.91008174386921, + "grad_norm": 8.667445182800293, + "learning_rate": 1.870150531738095e-05, + "loss": 0.9082, + "step": 6940 + }, + { + "epoch": 18.912806539509535, + "grad_norm": 8.761026382446289, + "learning_rate": 1.8701070402487208e-05, + "loss": 0.8855, + "step": 6941 + }, + { + "epoch": 18.915531335149865, + "grad_norm": 9.522194862365723, + "learning_rate": 1.8700635419829808e-05, + "loss": 1.02, + "step": 6942 + }, + { + "epoch": 18.91825613079019, + "grad_norm": 9.89741325378418, + "learning_rate": 1.8700200369412143e-05, + "loss": 1.1108, + "step": 6943 + }, + { + "epoch": 18.920980926430516, + "grad_norm": 7.780826568603516, + "learning_rate": 1.86997652512376e-05, + "loss": 0.8074, + "step": 6944 + }, + { + "epoch": 18.923705722070846, + "grad_norm": 6.950511455535889, + "learning_rate": 1.869933006530956e-05, + "loss": 0.8043, + "step": 6945 + }, + { + "epoch": 18.92643051771117, + "grad_norm": 7.270721912384033, + "learning_rate": 1.869889481163142e-05, + "loss": 0.8287, + "step": 6946 + }, + { + "epoch": 18.929155313351497, + "grad_norm": 9.197299003601074, + "learning_rate": 1.8698459490206568e-05, + "loss": 0.8691, + "step": 6947 + }, + { + "epoch": 18.931880108991827, + "grad_norm": 7.520884037017822, + "learning_rate": 1.8698024101038395e-05, + "loss": 0.7726, + "step": 6948 + }, + { + "epoch": 18.934604904632153, + "grad_norm": 8.074854850769043, + "learning_rate": 1.8697588644130283e-05, + "loss": 0.8833, + "step": 6949 + }, + { + "epoch": 18.93732970027248, + "grad_norm": 11.02020263671875, + "learning_rate": 1.8697153119485638e-05, + "loss": 1.0754, + "step": 6950 + }, + { + "epoch": 18.940054495912808, + "grad_norm": 10.82308578491211, + "learning_rate": 1.869671752710784e-05, + "loss": 1.0528, + "step": 6951 + }, + { + "epoch": 18.942779291553133, + "grad_norm": 8.439906120300293, + "learning_rate": 1.869628186700029e-05, + "loss": 0.812, + "step": 6952 + }, + { + "epoch": 18.94550408719346, + "grad_norm": 9.263603210449219, + "learning_rate": 1.8695846139166372e-05, + "loss": 0.9401, + "step": 6953 + }, + { + "epoch": 18.94822888283379, + "grad_norm": 8.745004653930664, + "learning_rate": 1.8695410343609487e-05, + "loss": 0.8589, + "step": 6954 + }, + { + "epoch": 18.950953678474114, + "grad_norm": 8.685702323913574, + "learning_rate": 1.8694974480333027e-05, + "loss": 0.8623, + "step": 6955 + }, + { + "epoch": 18.95367847411444, + "grad_norm": 8.876229286193848, + "learning_rate": 1.8694538549340385e-05, + "loss": 0.6804, + "step": 6956 + }, + { + "epoch": 18.95640326975477, + "grad_norm": 10.44974136352539, + "learning_rate": 1.8694102550634953e-05, + "loss": 0.9973, + "step": 6957 + }, + { + "epoch": 18.959128065395095, + "grad_norm": 9.667427062988281, + "learning_rate": 1.8693666484220134e-05, + "loss": 1.0387, + "step": 6958 + }, + { + "epoch": 18.96185286103542, + "grad_norm": 7.096478462219238, + "learning_rate": 1.8693230350099318e-05, + "loss": 0.7067, + "step": 6959 + }, + { + "epoch": 18.96457765667575, + "grad_norm": 7.511812686920166, + "learning_rate": 1.8692794148275904e-05, + "loss": 0.7866, + "step": 6960 + }, + { + "epoch": 18.967302452316076, + "grad_norm": 10.978753089904785, + "learning_rate": 1.869235787875329e-05, + "loss": 0.761, + "step": 6961 + }, + { + "epoch": 18.970027247956402, + "grad_norm": 7.78998327255249, + "learning_rate": 1.8691921541534876e-05, + "loss": 0.8462, + "step": 6962 + }, + { + "epoch": 18.97275204359673, + "grad_norm": 7.815904140472412, + "learning_rate": 1.869148513662405e-05, + "loss": 0.9651, + "step": 6963 + }, + { + "epoch": 18.975476839237057, + "grad_norm": 8.173052787780762, + "learning_rate": 1.869104866402422e-05, + "loss": 0.85, + "step": 6964 + }, + { + "epoch": 18.978201634877383, + "grad_norm": 10.576380729675293, + "learning_rate": 1.8690612123738784e-05, + "loss": 0.9049, + "step": 6965 + }, + { + "epoch": 18.980926430517712, + "grad_norm": 8.267260551452637, + "learning_rate": 1.869017551577114e-05, + "loss": 0.8013, + "step": 6966 + }, + { + "epoch": 18.983651226158038, + "grad_norm": 7.477278709411621, + "learning_rate": 1.8689738840124688e-05, + "loss": 0.7417, + "step": 6967 + }, + { + "epoch": 18.986376021798364, + "grad_norm": 10.80232048034668, + "learning_rate": 1.868930209680283e-05, + "loss": 0.7968, + "step": 6968 + }, + { + "epoch": 18.989100817438693, + "grad_norm": 9.751068115234375, + "learning_rate": 1.8688865285808968e-05, + "loss": 1.0911, + "step": 6969 + }, + { + "epoch": 18.99182561307902, + "grad_norm": 8.407898902893066, + "learning_rate": 1.8688428407146504e-05, + "loss": 0.8999, + "step": 6970 + }, + { + "epoch": 18.994550408719345, + "grad_norm": 9.125184059143066, + "learning_rate": 1.8687991460818836e-05, + "loss": 0.7819, + "step": 6971 + }, + { + "epoch": 18.997275204359674, + "grad_norm": 10.857903480529785, + "learning_rate": 1.868755444682937e-05, + "loss": 0.8312, + "step": 6972 + }, + { + "epoch": 19.0, + "grad_norm": 7.471215724945068, + "learning_rate": 1.8687117365181514e-05, + "loss": 0.8665, + "step": 6973 + }, + { + "epoch": 19.002724795640326, + "grad_norm": 7.7133469581604, + "learning_rate": 1.8686680215878663e-05, + "loss": 0.8215, + "step": 6974 + }, + { + "epoch": 19.005449591280655, + "grad_norm": 8.016887664794922, + "learning_rate": 1.8686242998924226e-05, + "loss": 0.7863, + "step": 6975 + }, + { + "epoch": 19.00817438692098, + "grad_norm": 9.045573234558105, + "learning_rate": 1.868580571432161e-05, + "loss": 0.9286, + "step": 6976 + }, + { + "epoch": 19.010899182561307, + "grad_norm": 8.61864185333252, + "learning_rate": 1.868536836207422e-05, + "loss": 0.9485, + "step": 6977 + }, + { + "epoch": 19.013623978201636, + "grad_norm": 9.215364456176758, + "learning_rate": 1.8684930942185457e-05, + "loss": 0.8007, + "step": 6978 + }, + { + "epoch": 19.016348773841962, + "grad_norm": 9.163359642028809, + "learning_rate": 1.8684493454658736e-05, + "loss": 0.795, + "step": 6979 + }, + { + "epoch": 19.019073569482288, + "grad_norm": 6.857732772827148, + "learning_rate": 1.8684055899497456e-05, + "loss": 0.65, + "step": 6980 + }, + { + "epoch": 19.021798365122617, + "grad_norm": 9.368291854858398, + "learning_rate": 1.8683618276705028e-05, + "loss": 0.8838, + "step": 6981 + }, + { + "epoch": 19.024523160762943, + "grad_norm": 8.756336212158203, + "learning_rate": 1.8683180586284862e-05, + "loss": 0.8461, + "step": 6982 + }, + { + "epoch": 19.02724795640327, + "grad_norm": 6.407591342926025, + "learning_rate": 1.8682742828240364e-05, + "loss": 0.855, + "step": 6983 + }, + { + "epoch": 19.029972752043598, + "grad_norm": 6.976788520812988, + "learning_rate": 1.8682305002574942e-05, + "loss": 0.9747, + "step": 6984 + }, + { + "epoch": 19.032697547683924, + "grad_norm": 11.912771224975586, + "learning_rate": 1.8681867109292012e-05, + "loss": 0.7258, + "step": 6985 + }, + { + "epoch": 19.03542234332425, + "grad_norm": 10.014404296875, + "learning_rate": 1.868142914839498e-05, + "loss": 0.8751, + "step": 6986 + }, + { + "epoch": 19.03814713896458, + "grad_norm": 10.036844253540039, + "learning_rate": 1.8680991119887256e-05, + "loss": 0.8563, + "step": 6987 + }, + { + "epoch": 19.040871934604905, + "grad_norm": 7.314995288848877, + "learning_rate": 1.868055302377225e-05, + "loss": 0.8879, + "step": 6988 + }, + { + "epoch": 19.04359673024523, + "grad_norm": 11.716142654418945, + "learning_rate": 1.8680114860053384e-05, + "loss": 0.7828, + "step": 6989 + }, + { + "epoch": 19.04632152588556, + "grad_norm": 7.671077251434326, + "learning_rate": 1.867967662873406e-05, + "loss": 0.8896, + "step": 6990 + }, + { + "epoch": 19.049046321525886, + "grad_norm": 7.949674129486084, + "learning_rate": 1.867923832981769e-05, + "loss": 0.8278, + "step": 6991 + }, + { + "epoch": 19.05177111716621, + "grad_norm": 9.292261123657227, + "learning_rate": 1.8678799963307693e-05, + "loss": 0.7715, + "step": 6992 + }, + { + "epoch": 19.05449591280654, + "grad_norm": 12.970134735107422, + "learning_rate": 1.867836152920748e-05, + "loss": 0.7914, + "step": 6993 + }, + { + "epoch": 19.057220708446867, + "grad_norm": 7.971855640411377, + "learning_rate": 1.867792302752047e-05, + "loss": 0.844, + "step": 6994 + }, + { + "epoch": 19.059945504087192, + "grad_norm": 9.02824878692627, + "learning_rate": 1.867748445825007e-05, + "loss": 0.6703, + "step": 6995 + }, + { + "epoch": 19.06267029972752, + "grad_norm": 7.739848613739014, + "learning_rate": 1.8677045821399705e-05, + "loss": 0.7098, + "step": 6996 + }, + { + "epoch": 19.065395095367847, + "grad_norm": 7.71321439743042, + "learning_rate": 1.8676607116972786e-05, + "loss": 0.871, + "step": 6997 + }, + { + "epoch": 19.068119891008173, + "grad_norm": 9.267059326171875, + "learning_rate": 1.8676168344972726e-05, + "loss": 0.8959, + "step": 6998 + }, + { + "epoch": 19.070844686648503, + "grad_norm": 7.251643180847168, + "learning_rate": 1.867572950540295e-05, + "loss": 0.8425, + "step": 6999 + }, + { + "epoch": 19.07356948228883, + "grad_norm": 8.379535675048828, + "learning_rate": 1.8675290598266872e-05, + "loss": 0.7917, + "step": 7000 + }, + { + "epoch": 19.076294277929154, + "grad_norm": 10.302045822143555, + "learning_rate": 1.8674851623567908e-05, + "loss": 0.879, + "step": 7001 + }, + { + "epoch": 19.079019073569484, + "grad_norm": 10.175151824951172, + "learning_rate": 1.8674412581309477e-05, + "loss": 0.9104, + "step": 7002 + }, + { + "epoch": 19.08174386920981, + "grad_norm": 8.297521591186523, + "learning_rate": 1.8673973471495005e-05, + "loss": 0.7986, + "step": 7003 + }, + { + "epoch": 19.084468664850135, + "grad_norm": 11.142738342285156, + "learning_rate": 1.8673534294127905e-05, + "loss": 0.9346, + "step": 7004 + }, + { + "epoch": 19.087193460490465, + "grad_norm": 7.376419544219971, + "learning_rate": 1.8673095049211597e-05, + "loss": 0.6486, + "step": 7005 + }, + { + "epoch": 19.08991825613079, + "grad_norm": 7.580418586730957, + "learning_rate": 1.8672655736749507e-05, + "loss": 0.918, + "step": 7006 + }, + { + "epoch": 19.092643051771116, + "grad_norm": 8.258780479431152, + "learning_rate": 1.867221635674505e-05, + "loss": 0.8269, + "step": 7007 + }, + { + "epoch": 19.095367847411445, + "grad_norm": 12.455347061157227, + "learning_rate": 1.867177690920165e-05, + "loss": 0.9009, + "step": 7008 + }, + { + "epoch": 19.09809264305177, + "grad_norm": 6.943690776824951, + "learning_rate": 1.8671337394122733e-05, + "loss": 0.6227, + "step": 7009 + }, + { + "epoch": 19.100817438692097, + "grad_norm": 8.154997825622559, + "learning_rate": 1.867089781151172e-05, + "loss": 0.7135, + "step": 7010 + }, + { + "epoch": 19.103542234332426, + "grad_norm": 7.797388553619385, + "learning_rate": 1.8670458161372033e-05, + "loss": 0.89, + "step": 7011 + }, + { + "epoch": 19.106267029972752, + "grad_norm": 10.197694778442383, + "learning_rate": 1.8670018443707098e-05, + "loss": 0.8024, + "step": 7012 + }, + { + "epoch": 19.108991825613078, + "grad_norm": 7.500790596008301, + "learning_rate": 1.866957865852034e-05, + "loss": 0.7478, + "step": 7013 + }, + { + "epoch": 19.111716621253407, + "grad_norm": 8.322009086608887, + "learning_rate": 1.866913880581518e-05, + "loss": 0.8334, + "step": 7014 + }, + { + "epoch": 19.114441416893733, + "grad_norm": 8.339186668395996, + "learning_rate": 1.8668698885595045e-05, + "loss": 0.8549, + "step": 7015 + }, + { + "epoch": 19.11716621253406, + "grad_norm": 7.383385181427002, + "learning_rate": 1.866825889786336e-05, + "loss": 0.8645, + "step": 7016 + }, + { + "epoch": 19.11989100817439, + "grad_norm": 7.881433486938477, + "learning_rate": 1.866781884262356e-05, + "loss": 0.7115, + "step": 7017 + }, + { + "epoch": 19.122615803814714, + "grad_norm": 7.964922904968262, + "learning_rate": 1.866737871987906e-05, + "loss": 0.808, + "step": 7018 + }, + { + "epoch": 19.12534059945504, + "grad_norm": 7.4784650802612305, + "learning_rate": 1.86669385296333e-05, + "loss": 0.7885, + "step": 7019 + }, + { + "epoch": 19.12806539509537, + "grad_norm": 9.835017204284668, + "learning_rate": 1.8666498271889698e-05, + "loss": 0.6842, + "step": 7020 + }, + { + "epoch": 19.130790190735695, + "grad_norm": 9.407984733581543, + "learning_rate": 1.8666057946651682e-05, + "loss": 0.6931, + "step": 7021 + }, + { + "epoch": 19.13351498637602, + "grad_norm": 9.08998966217041, + "learning_rate": 1.866561755392269e-05, + "loss": 0.8494, + "step": 7022 + }, + { + "epoch": 19.13623978201635, + "grad_norm": 8.443471908569336, + "learning_rate": 1.866517709370615e-05, + "loss": 0.6473, + "step": 7023 + }, + { + "epoch": 19.138964577656676, + "grad_norm": 10.57610034942627, + "learning_rate": 1.8664736566005487e-05, + "loss": 0.7864, + "step": 7024 + }, + { + "epoch": 19.141689373297, + "grad_norm": 8.669187545776367, + "learning_rate": 1.8664295970824136e-05, + "loss": 0.7316, + "step": 7025 + }, + { + "epoch": 19.14441416893733, + "grad_norm": 8.262614250183105, + "learning_rate": 1.8663855308165524e-05, + "loss": 0.9006, + "step": 7026 + }, + { + "epoch": 19.147138964577657, + "grad_norm": 7.1119842529296875, + "learning_rate": 1.8663414578033084e-05, + "loss": 0.8217, + "step": 7027 + }, + { + "epoch": 19.149863760217983, + "grad_norm": 10.65214729309082, + "learning_rate": 1.8662973780430256e-05, + "loss": 0.9548, + "step": 7028 + }, + { + "epoch": 19.152588555858312, + "grad_norm": 9.513092041015625, + "learning_rate": 1.8662532915360466e-05, + "loss": 0.8422, + "step": 7029 + }, + { + "epoch": 19.155313351498638, + "grad_norm": 11.064226150512695, + "learning_rate": 1.8662091982827142e-05, + "loss": 0.7493, + "step": 7030 + }, + { + "epoch": 19.158038147138964, + "grad_norm": 8.788904190063477, + "learning_rate": 1.8661650982833733e-05, + "loss": 0.6814, + "step": 7031 + }, + { + "epoch": 19.160762942779293, + "grad_norm": 8.584736824035645, + "learning_rate": 1.866120991538366e-05, + "loss": 0.8593, + "step": 7032 + }, + { + "epoch": 19.16348773841962, + "grad_norm": 10.5648832321167, + "learning_rate": 1.8660768780480364e-05, + "loss": 0.6584, + "step": 7033 + }, + { + "epoch": 19.166212534059945, + "grad_norm": 10.726306915283203, + "learning_rate": 1.866032757812728e-05, + "loss": 0.7759, + "step": 7034 + }, + { + "epoch": 19.168937329700274, + "grad_norm": 7.508849620819092, + "learning_rate": 1.8659886308327842e-05, + "loss": 0.6902, + "step": 7035 + }, + { + "epoch": 19.1716621253406, + "grad_norm": 9.58052921295166, + "learning_rate": 1.865944497108549e-05, + "loss": 0.8102, + "step": 7036 + }, + { + "epoch": 19.174386920980925, + "grad_norm": 15.089922904968262, + "learning_rate": 1.8659003566403658e-05, + "loss": 0.8425, + "step": 7037 + }, + { + "epoch": 19.177111716621255, + "grad_norm": 9.278483390808105, + "learning_rate": 1.8658562094285786e-05, + "loss": 0.7423, + "step": 7038 + }, + { + "epoch": 19.17983651226158, + "grad_norm": 7.667381763458252, + "learning_rate": 1.865812055473531e-05, + "loss": 0.7751, + "step": 7039 + }, + { + "epoch": 19.182561307901906, + "grad_norm": 8.727204322814941, + "learning_rate": 1.865767894775567e-05, + "loss": 0.9486, + "step": 7040 + }, + { + "epoch": 19.185286103542236, + "grad_norm": 8.394052505493164, + "learning_rate": 1.8657237273350305e-05, + "loss": 1.0408, + "step": 7041 + }, + { + "epoch": 19.18801089918256, + "grad_norm": 7.457240104675293, + "learning_rate": 1.8656795531522655e-05, + "loss": 0.6155, + "step": 7042 + }, + { + "epoch": 19.190735694822887, + "grad_norm": 11.908757209777832, + "learning_rate": 1.865635372227616e-05, + "loss": 0.9937, + "step": 7043 + }, + { + "epoch": 19.193460490463217, + "grad_norm": 9.040936470031738, + "learning_rate": 1.865591184561426e-05, + "loss": 0.7816, + "step": 7044 + }, + { + "epoch": 19.196185286103542, + "grad_norm": 6.818192958831787, + "learning_rate": 1.8655469901540398e-05, + "loss": 0.7806, + "step": 7045 + }, + { + "epoch": 19.19891008174387, + "grad_norm": 8.640161514282227, + "learning_rate": 1.8655027890058014e-05, + "loss": 0.7217, + "step": 7046 + }, + { + "epoch": 19.201634877384198, + "grad_norm": 9.699905395507812, + "learning_rate": 1.8654585811170553e-05, + "loss": 0.8181, + "step": 7047 + }, + { + "epoch": 19.204359673024523, + "grad_norm": 8.94979190826416, + "learning_rate": 1.8654143664881455e-05, + "loss": 0.9097, + "step": 7048 + }, + { + "epoch": 19.20708446866485, + "grad_norm": 7.599967956542969, + "learning_rate": 1.8653701451194166e-05, + "loss": 0.8625, + "step": 7049 + }, + { + "epoch": 19.20980926430518, + "grad_norm": 7.219893932342529, + "learning_rate": 1.8653259170112128e-05, + "loss": 0.8013, + "step": 7050 + }, + { + "epoch": 19.212534059945504, + "grad_norm": 9.76356029510498, + "learning_rate": 1.8652816821638783e-05, + "loss": 0.8273, + "step": 7051 + }, + { + "epoch": 19.21525885558583, + "grad_norm": 9.20617961883545, + "learning_rate": 1.8652374405777584e-05, + "loss": 0.8942, + "step": 7052 + }, + { + "epoch": 19.21798365122616, + "grad_norm": 8.287347793579102, + "learning_rate": 1.865193192253197e-05, + "loss": 0.7924, + "step": 7053 + }, + { + "epoch": 19.220708446866485, + "grad_norm": 6.710139751434326, + "learning_rate": 1.8651489371905386e-05, + "loss": 0.6537, + "step": 7054 + }, + { + "epoch": 19.22343324250681, + "grad_norm": 9.382214546203613, + "learning_rate": 1.8651046753901286e-05, + "loss": 0.8285, + "step": 7055 + }, + { + "epoch": 19.22615803814714, + "grad_norm": 7.651352882385254, + "learning_rate": 1.8650604068523107e-05, + "loss": 0.8624, + "step": 7056 + }, + { + "epoch": 19.228882833787466, + "grad_norm": 7.876631736755371, + "learning_rate": 1.8650161315774306e-05, + "loss": 0.8689, + "step": 7057 + }, + { + "epoch": 19.231607629427792, + "grad_norm": 8.066032409667969, + "learning_rate": 1.8649718495658325e-05, + "loss": 0.9088, + "step": 7058 + }, + { + "epoch": 19.23433242506812, + "grad_norm": 8.066088676452637, + "learning_rate": 1.8649275608178617e-05, + "loss": 0.8839, + "step": 7059 + }, + { + "epoch": 19.237057220708447, + "grad_norm": 7.8374481201171875, + "learning_rate": 1.8648832653338628e-05, + "loss": 0.9174, + "step": 7060 + }, + { + "epoch": 19.239782016348773, + "grad_norm": 9.005922317504883, + "learning_rate": 1.864838963114181e-05, + "loss": 0.7836, + "step": 7061 + }, + { + "epoch": 19.242506811989102, + "grad_norm": 8.517781257629395, + "learning_rate": 1.8647946541591607e-05, + "loss": 0.9065, + "step": 7062 + }, + { + "epoch": 19.245231607629428, + "grad_norm": 7.555675506591797, + "learning_rate": 1.8647503384691477e-05, + "loss": 0.6729, + "step": 7063 + }, + { + "epoch": 19.247956403269754, + "grad_norm": 10.002867698669434, + "learning_rate": 1.864706016044487e-05, + "loss": 0.8395, + "step": 7064 + }, + { + "epoch": 19.250681198910083, + "grad_norm": 8.23402214050293, + "learning_rate": 1.8646616868855236e-05, + "loss": 0.7773, + "step": 7065 + }, + { + "epoch": 19.25340599455041, + "grad_norm": 7.119266510009766, + "learning_rate": 1.864617350992603e-05, + "loss": 0.7239, + "step": 7066 + }, + { + "epoch": 19.256130790190735, + "grad_norm": 10.741050720214844, + "learning_rate": 1.86457300836607e-05, + "loss": 0.7881, + "step": 7067 + }, + { + "epoch": 19.258855585831064, + "grad_norm": 8.45600414276123, + "learning_rate": 1.8645286590062705e-05, + "loss": 0.6841, + "step": 7068 + }, + { + "epoch": 19.26158038147139, + "grad_norm": 8.414836883544922, + "learning_rate": 1.8644843029135496e-05, + "loss": 0.7979, + "step": 7069 + }, + { + "epoch": 19.264305177111716, + "grad_norm": 9.2487154006958, + "learning_rate": 1.8644399400882525e-05, + "loss": 0.7239, + "step": 7070 + }, + { + "epoch": 19.267029972752045, + "grad_norm": 9.046351432800293, + "learning_rate": 1.8643955705307252e-05, + "loss": 0.7223, + "step": 7071 + }, + { + "epoch": 19.26975476839237, + "grad_norm": 12.175895690917969, + "learning_rate": 1.864351194241313e-05, + "loss": 0.9025, + "step": 7072 + }, + { + "epoch": 19.272479564032697, + "grad_norm": 8.9979248046875, + "learning_rate": 1.8643068112203612e-05, + "loss": 0.8207, + "step": 7073 + }, + { + "epoch": 19.275204359673026, + "grad_norm": 13.657709121704102, + "learning_rate": 1.864262421468216e-05, + "loss": 0.8423, + "step": 7074 + }, + { + "epoch": 19.277929155313352, + "grad_norm": 14.252540588378906, + "learning_rate": 1.864218024985223e-05, + "loss": 0.8728, + "step": 7075 + }, + { + "epoch": 19.280653950953678, + "grad_norm": 11.971515655517578, + "learning_rate": 1.864173621771728e-05, + "loss": 0.7352, + "step": 7076 + }, + { + "epoch": 19.283378746594007, + "grad_norm": 9.648859024047852, + "learning_rate": 1.8641292118280764e-05, + "loss": 0.8773, + "step": 7077 + }, + { + "epoch": 19.286103542234333, + "grad_norm": 11.207634925842285, + "learning_rate": 1.8640847951546145e-05, + "loss": 0.8191, + "step": 7078 + }, + { + "epoch": 19.28882833787466, + "grad_norm": 9.115625381469727, + "learning_rate": 1.8640403717516877e-05, + "loss": 0.7565, + "step": 7079 + }, + { + "epoch": 19.291553133514988, + "grad_norm": 8.175503730773926, + "learning_rate": 1.8639959416196424e-05, + "loss": 0.7382, + "step": 7080 + }, + { + "epoch": 19.294277929155314, + "grad_norm": 8.28620719909668, + "learning_rate": 1.8639515047588247e-05, + "loss": 0.689, + "step": 7081 + }, + { + "epoch": 19.29700272479564, + "grad_norm": 10.554699897766113, + "learning_rate": 1.86390706116958e-05, + "loss": 0.7982, + "step": 7082 + }, + { + "epoch": 19.29972752043597, + "grad_norm": 12.142552375793457, + "learning_rate": 1.863862610852255e-05, + "loss": 0.9542, + "step": 7083 + }, + { + "epoch": 19.302452316076295, + "grad_norm": 9.547401428222656, + "learning_rate": 1.8638181538071966e-05, + "loss": 0.7208, + "step": 7084 + }, + { + "epoch": 19.30517711171662, + "grad_norm": 9.361517906188965, + "learning_rate": 1.8637736900347496e-05, + "loss": 0.861, + "step": 7085 + }, + { + "epoch": 19.30790190735695, + "grad_norm": 8.348713874816895, + "learning_rate": 1.863729219535261e-05, + "loss": 0.9124, + "step": 7086 + }, + { + "epoch": 19.310626702997276, + "grad_norm": 7.464922904968262, + "learning_rate": 1.8636847423090768e-05, + "loss": 0.8086, + "step": 7087 + }, + { + "epoch": 19.3133514986376, + "grad_norm": 9.388986587524414, + "learning_rate": 1.863640258356544e-05, + "loss": 0.8484, + "step": 7088 + }, + { + "epoch": 19.31607629427793, + "grad_norm": 12.31118106842041, + "learning_rate": 1.8635957676780085e-05, + "loss": 0.8545, + "step": 7089 + }, + { + "epoch": 19.318801089918257, + "grad_norm": 7.389854431152344, + "learning_rate": 1.8635512702738168e-05, + "loss": 0.8845, + "step": 7090 + }, + { + "epoch": 19.321525885558582, + "grad_norm": 9.636378288269043, + "learning_rate": 1.8635067661443157e-05, + "loss": 0.858, + "step": 7091 + }, + { + "epoch": 19.32425068119891, + "grad_norm": 12.663843154907227, + "learning_rate": 1.8634622552898516e-05, + "loss": 1.1116, + "step": 7092 + }, + { + "epoch": 19.326975476839237, + "grad_norm": 8.857486724853516, + "learning_rate": 1.8634177377107717e-05, + "loss": 0.8301, + "step": 7093 + }, + { + "epoch": 19.329700272479563, + "grad_norm": 7.673715591430664, + "learning_rate": 1.863373213407422e-05, + "loss": 0.6119, + "step": 7094 + }, + { + "epoch": 19.332425068119893, + "grad_norm": 8.896916389465332, + "learning_rate": 1.8633286823801495e-05, + "loss": 0.869, + "step": 7095 + }, + { + "epoch": 19.33514986376022, + "grad_norm": 7.086410045623779, + "learning_rate": 1.8632841446293008e-05, + "loss": 0.8376, + "step": 7096 + }, + { + "epoch": 19.337874659400544, + "grad_norm": 8.21198558807373, + "learning_rate": 1.8632396001552232e-05, + "loss": 0.741, + "step": 7097 + }, + { + "epoch": 19.340599455040874, + "grad_norm": 11.218838691711426, + "learning_rate": 1.863195048958263e-05, + "loss": 0.9675, + "step": 7098 + }, + { + "epoch": 19.3433242506812, + "grad_norm": 14.552414894104004, + "learning_rate": 1.863150491038768e-05, + "loss": 0.848, + "step": 7099 + }, + { + "epoch": 19.346049046321525, + "grad_norm": 8.315683364868164, + "learning_rate": 1.863105926397085e-05, + "loss": 0.8341, + "step": 7100 + }, + { + "epoch": 19.348773841961854, + "grad_norm": 8.802910804748535, + "learning_rate": 1.86306135503356e-05, + "loss": 0.7502, + "step": 7101 + }, + { + "epoch": 19.35149863760218, + "grad_norm": 9.626164436340332, + "learning_rate": 1.8630167769485417e-05, + "loss": 0.8588, + "step": 7102 + }, + { + "epoch": 19.354223433242506, + "grad_norm": 7.273528099060059, + "learning_rate": 1.862972192142376e-05, + "loss": 0.8357, + "step": 7103 + }, + { + "epoch": 19.356948228882835, + "grad_norm": 12.616958618164062, + "learning_rate": 1.862927600615411e-05, + "loss": 0.8398, + "step": 7104 + }, + { + "epoch": 19.35967302452316, + "grad_norm": 8.385083198547363, + "learning_rate": 1.862883002367993e-05, + "loss": 0.7583, + "step": 7105 + }, + { + "epoch": 19.362397820163487, + "grad_norm": 7.05576229095459, + "learning_rate": 1.8628383974004707e-05, + "loss": 0.8187, + "step": 7106 + }, + { + "epoch": 19.365122615803816, + "grad_norm": 10.724347114562988, + "learning_rate": 1.8627937857131904e-05, + "loss": 0.8776, + "step": 7107 + }, + { + "epoch": 19.367847411444142, + "grad_norm": 8.391908645629883, + "learning_rate": 1.8627491673065e-05, + "loss": 0.8613, + "step": 7108 + }, + { + "epoch": 19.370572207084468, + "grad_norm": 8.110748291015625, + "learning_rate": 1.8627045421807466e-05, + "loss": 0.8065, + "step": 7109 + }, + { + "epoch": 19.373297002724797, + "grad_norm": 8.11498737335205, + "learning_rate": 1.8626599103362783e-05, + "loss": 0.719, + "step": 7110 + }, + { + "epoch": 19.376021798365123, + "grad_norm": 9.259939193725586, + "learning_rate": 1.862615271773442e-05, + "loss": 0.7861, + "step": 7111 + }, + { + "epoch": 19.37874659400545, + "grad_norm": 7.308506965637207, + "learning_rate": 1.862570626492586e-05, + "loss": 0.653, + "step": 7112 + }, + { + "epoch": 19.381471389645778, + "grad_norm": 6.963586807250977, + "learning_rate": 1.8625259744940578e-05, + "loss": 0.8174, + "step": 7113 + }, + { + "epoch": 19.384196185286104, + "grad_norm": 8.394465446472168, + "learning_rate": 1.862481315778205e-05, + "loss": 0.8184, + "step": 7114 + }, + { + "epoch": 19.38692098092643, + "grad_norm": 8.269073486328125, + "learning_rate": 1.8624366503453752e-05, + "loss": 0.9324, + "step": 7115 + }, + { + "epoch": 19.38964577656676, + "grad_norm": 9.482769966125488, + "learning_rate": 1.862391978195917e-05, + "loss": 0.8301, + "step": 7116 + }, + { + "epoch": 19.392370572207085, + "grad_norm": 10.183133125305176, + "learning_rate": 1.8623472993301774e-05, + "loss": 0.7036, + "step": 7117 + }, + { + "epoch": 19.39509536784741, + "grad_norm": 8.745038986206055, + "learning_rate": 1.8623026137485047e-05, + "loss": 0.9237, + "step": 7118 + }, + { + "epoch": 19.39782016348774, + "grad_norm": 12.041457176208496, + "learning_rate": 1.8622579214512476e-05, + "loss": 0.8619, + "step": 7119 + }, + { + "epoch": 19.400544959128066, + "grad_norm": 8.609764099121094, + "learning_rate": 1.862213222438753e-05, + "loss": 0.8923, + "step": 7120 + }, + { + "epoch": 19.40326975476839, + "grad_norm": 9.28745174407959, + "learning_rate": 1.86216851671137e-05, + "loss": 0.745, + "step": 7121 + }, + { + "epoch": 19.40599455040872, + "grad_norm": 11.696236610412598, + "learning_rate": 1.862123804269446e-05, + "loss": 0.8381, + "step": 7122 + }, + { + "epoch": 19.408719346049047, + "grad_norm": 10.133161544799805, + "learning_rate": 1.8620790851133294e-05, + "loss": 1.0443, + "step": 7123 + }, + { + "epoch": 19.411444141689373, + "grad_norm": 10.21315860748291, + "learning_rate": 1.862034359243369e-05, + "loss": 0.9352, + "step": 7124 + }, + { + "epoch": 19.414168937329702, + "grad_norm": 8.50641918182373, + "learning_rate": 1.8619896266599128e-05, + "loss": 0.8772, + "step": 7125 + }, + { + "epoch": 19.416893732970028, + "grad_norm": 9.827706336975098, + "learning_rate": 1.861944887363309e-05, + "loss": 0.7192, + "step": 7126 + }, + { + "epoch": 19.419618528610354, + "grad_norm": 10.437112808227539, + "learning_rate": 1.861900141353906e-05, + "loss": 0.7804, + "step": 7127 + }, + { + "epoch": 19.422343324250683, + "grad_norm": 11.694056510925293, + "learning_rate": 1.8618553886320527e-05, + "loss": 0.858, + "step": 7128 + }, + { + "epoch": 19.42506811989101, + "grad_norm": 9.052674293518066, + "learning_rate": 1.861810629198097e-05, + "loss": 0.9775, + "step": 7129 + }, + { + "epoch": 19.427792915531334, + "grad_norm": 8.512746810913086, + "learning_rate": 1.8617658630523884e-05, + "loss": 1.0008, + "step": 7130 + }, + { + "epoch": 19.430517711171664, + "grad_norm": 9.113412857055664, + "learning_rate": 1.8617210901952747e-05, + "loss": 0.849, + "step": 7131 + }, + { + "epoch": 19.43324250681199, + "grad_norm": 7.726861476898193, + "learning_rate": 1.861676310627105e-05, + "loss": 0.7202, + "step": 7132 + }, + { + "epoch": 19.435967302452315, + "grad_norm": 9.574609756469727, + "learning_rate": 1.8616315243482278e-05, + "loss": 0.8007, + "step": 7133 + }, + { + "epoch": 19.438692098092645, + "grad_norm": 8.07555866241455, + "learning_rate": 1.861586731358992e-05, + "loss": 0.8369, + "step": 7134 + }, + { + "epoch": 19.44141689373297, + "grad_norm": 8.209267616271973, + "learning_rate": 1.8615419316597466e-05, + "loss": 0.9718, + "step": 7135 + }, + { + "epoch": 19.444141689373296, + "grad_norm": 8.566980361938477, + "learning_rate": 1.8614971252508404e-05, + "loss": 0.7947, + "step": 7136 + }, + { + "epoch": 19.446866485013626, + "grad_norm": 8.924108505249023, + "learning_rate": 1.861452312132622e-05, + "loss": 0.7556, + "step": 7137 + }, + { + "epoch": 19.44959128065395, + "grad_norm": 7.728081703186035, + "learning_rate": 1.861407492305441e-05, + "loss": 0.8705, + "step": 7138 + }, + { + "epoch": 19.452316076294277, + "grad_norm": 9.532186508178711, + "learning_rate": 1.861362665769646e-05, + "loss": 0.7142, + "step": 7139 + }, + { + "epoch": 19.455040871934607, + "grad_norm": 10.082612991333008, + "learning_rate": 1.8613178325255864e-05, + "loss": 0.8036, + "step": 7140 + }, + { + "epoch": 19.457765667574932, + "grad_norm": 7.684032917022705, + "learning_rate": 1.861272992573611e-05, + "loss": 0.7967, + "step": 7141 + }, + { + "epoch": 19.460490463215258, + "grad_norm": 9.457315444946289, + "learning_rate": 1.8612281459140697e-05, + "loss": 0.9214, + "step": 7142 + }, + { + "epoch": 19.463215258855588, + "grad_norm": 10.618170738220215, + "learning_rate": 1.861183292547311e-05, + "loss": 0.7838, + "step": 7143 + }, + { + "epoch": 19.465940054495913, + "grad_norm": 8.46899700164795, + "learning_rate": 1.8611384324736846e-05, + "loss": 0.8322, + "step": 7144 + }, + { + "epoch": 19.46866485013624, + "grad_norm": 14.252891540527344, + "learning_rate": 1.8610935656935397e-05, + "loss": 0.7529, + "step": 7145 + }, + { + "epoch": 19.47138964577657, + "grad_norm": 8.75171947479248, + "learning_rate": 1.8610486922072263e-05, + "loss": 0.9302, + "step": 7146 + }, + { + "epoch": 19.474114441416894, + "grad_norm": 9.981742858886719, + "learning_rate": 1.861003812015093e-05, + "loss": 0.8142, + "step": 7147 + }, + { + "epoch": 19.47683923705722, + "grad_norm": 8.651573181152344, + "learning_rate": 1.8609589251174897e-05, + "loss": 0.7855, + "step": 7148 + }, + { + "epoch": 19.479564032697546, + "grad_norm": 8.043776512145996, + "learning_rate": 1.860914031514766e-05, + "loss": 0.8999, + "step": 7149 + }, + { + "epoch": 19.482288828337875, + "grad_norm": 8.118514060974121, + "learning_rate": 1.8608691312072714e-05, + "loss": 0.696, + "step": 7150 + }, + { + "epoch": 19.4850136239782, + "grad_norm": 9.851868629455566, + "learning_rate": 1.8608242241953563e-05, + "loss": 0.8085, + "step": 7151 + }, + { + "epoch": 19.48773841961853, + "grad_norm": 9.400286674499512, + "learning_rate": 1.8607793104793696e-05, + "loss": 0.9197, + "step": 7152 + }, + { + "epoch": 19.490463215258856, + "grad_norm": 10.697088241577148, + "learning_rate": 1.8607343900596612e-05, + "loss": 0.8051, + "step": 7153 + }, + { + "epoch": 19.493188010899182, + "grad_norm": 8.79265022277832, + "learning_rate": 1.860689462936581e-05, + "loss": 0.9979, + "step": 7154 + }, + { + "epoch": 19.495912806539508, + "grad_norm": 10.787165641784668, + "learning_rate": 1.860644529110479e-05, + "loss": 0.9614, + "step": 7155 + }, + { + "epoch": 19.498637602179837, + "grad_norm": 15.625445365905762, + "learning_rate": 1.860599588581705e-05, + "loss": 0.9706, + "step": 7156 + }, + { + "epoch": 19.501362397820163, + "grad_norm": 8.949894905090332, + "learning_rate": 1.8605546413506092e-05, + "loss": 0.7184, + "step": 7157 + }, + { + "epoch": 19.504087193460492, + "grad_norm": 10.700446128845215, + "learning_rate": 1.8605096874175418e-05, + "loss": 0.7781, + "step": 7158 + }, + { + "epoch": 19.506811989100818, + "grad_norm": 10.570991516113281, + "learning_rate": 1.860464726782852e-05, + "loss": 0.8612, + "step": 7159 + }, + { + "epoch": 19.509536784741144, + "grad_norm": 6.78163480758667, + "learning_rate": 1.860419759446891e-05, + "loss": 0.7797, + "step": 7160 + }, + { + "epoch": 19.51226158038147, + "grad_norm": 7.994595527648926, + "learning_rate": 1.860374785410009e-05, + "loss": 0.8046, + "step": 7161 + }, + { + "epoch": 19.5149863760218, + "grad_norm": 7.7101616859436035, + "learning_rate": 1.8603298046725556e-05, + "loss": 0.7093, + "step": 7162 + }, + { + "epoch": 19.517711171662125, + "grad_norm": 8.135588645935059, + "learning_rate": 1.860284817234881e-05, + "loss": 0.9785, + "step": 7163 + }, + { + "epoch": 19.520435967302454, + "grad_norm": 8.23460578918457, + "learning_rate": 1.8602398230973363e-05, + "loss": 0.8845, + "step": 7164 + }, + { + "epoch": 19.52316076294278, + "grad_norm": 8.690340995788574, + "learning_rate": 1.8601948222602715e-05, + "loss": 0.782, + "step": 7165 + }, + { + "epoch": 19.525885558583106, + "grad_norm": 8.22935962677002, + "learning_rate": 1.860149814724037e-05, + "loss": 0.7798, + "step": 7166 + }, + { + "epoch": 19.52861035422343, + "grad_norm": 8.305482864379883, + "learning_rate": 1.8601048004889835e-05, + "loss": 0.9558, + "step": 7167 + }, + { + "epoch": 19.53133514986376, + "grad_norm": 8.000179290771484, + "learning_rate": 1.8600597795554613e-05, + "loss": 0.8922, + "step": 7168 + }, + { + "epoch": 19.534059945504087, + "grad_norm": 7.575944900512695, + "learning_rate": 1.8600147519238217e-05, + "loss": 0.5796, + "step": 7169 + }, + { + "epoch": 19.536784741144416, + "grad_norm": 7.775625228881836, + "learning_rate": 1.8599697175944145e-05, + "loss": 0.6722, + "step": 7170 + }, + { + "epoch": 19.539509536784742, + "grad_norm": 13.651352882385254, + "learning_rate": 1.859924676567591e-05, + "loss": 0.8679, + "step": 7171 + }, + { + "epoch": 19.542234332425068, + "grad_norm": 8.39905071258545, + "learning_rate": 1.8598796288437017e-05, + "loss": 0.991, + "step": 7172 + }, + { + "epoch": 19.544959128065393, + "grad_norm": 7.791860580444336, + "learning_rate": 1.8598345744230975e-05, + "loss": 0.6833, + "step": 7173 + }, + { + "epoch": 19.547683923705723, + "grad_norm": 9.090578079223633, + "learning_rate": 1.8597895133061293e-05, + "loss": 0.6956, + "step": 7174 + }, + { + "epoch": 19.55040871934605, + "grad_norm": 9.28824234008789, + "learning_rate": 1.859744445493148e-05, + "loss": 1.0017, + "step": 7175 + }, + { + "epoch": 19.553133514986374, + "grad_norm": 8.328651428222656, + "learning_rate": 1.8596993709845047e-05, + "loss": 0.817, + "step": 7176 + }, + { + "epoch": 19.555858310626704, + "grad_norm": 9.966940879821777, + "learning_rate": 1.8596542897805504e-05, + "loss": 0.9116, + "step": 7177 + }, + { + "epoch": 19.55858310626703, + "grad_norm": 8.67443561553955, + "learning_rate": 1.8596092018816364e-05, + "loss": 0.824, + "step": 7178 + }, + { + "epoch": 19.561307901907355, + "grad_norm": 8.581880569458008, + "learning_rate": 1.859564107288113e-05, + "loss": 0.7651, + "step": 7179 + }, + { + "epoch": 19.564032697547685, + "grad_norm": 6.821385383605957, + "learning_rate": 1.8595190060003327e-05, + "loss": 0.8549, + "step": 7180 + }, + { + "epoch": 19.56675749318801, + "grad_norm": 7.707915306091309, + "learning_rate": 1.8594738980186456e-05, + "loss": 0.7549, + "step": 7181 + }, + { + "epoch": 19.569482288828336, + "grad_norm": 9.711687088012695, + "learning_rate": 1.8594287833434033e-05, + "loss": 0.7441, + "step": 7182 + }, + { + "epoch": 19.572207084468666, + "grad_norm": 6.779923439025879, + "learning_rate": 1.8593836619749576e-05, + "loss": 0.9248, + "step": 7183 + }, + { + "epoch": 19.57493188010899, + "grad_norm": 8.128297805786133, + "learning_rate": 1.8593385339136596e-05, + "loss": 1.0179, + "step": 7184 + }, + { + "epoch": 19.577656675749317, + "grad_norm": 7.063774108886719, + "learning_rate": 1.8592933991598605e-05, + "loss": 0.7955, + "step": 7185 + }, + { + "epoch": 19.580381471389646, + "grad_norm": 8.919217109680176, + "learning_rate": 1.8592482577139125e-05, + "loss": 0.8444, + "step": 7186 + }, + { + "epoch": 19.583106267029972, + "grad_norm": 8.478561401367188, + "learning_rate": 1.8592031095761665e-05, + "loss": 0.7125, + "step": 7187 + }, + { + "epoch": 19.585831062670298, + "grad_norm": 8.336913108825684, + "learning_rate": 1.8591579547469743e-05, + "loss": 0.8051, + "step": 7188 + }, + { + "epoch": 19.588555858310627, + "grad_norm": 8.41412353515625, + "learning_rate": 1.8591127932266874e-05, + "loss": 0.7394, + "step": 7189 + }, + { + "epoch": 19.591280653950953, + "grad_norm": 9.4815034866333, + "learning_rate": 1.859067625015658e-05, + "loss": 0.85, + "step": 7190 + }, + { + "epoch": 19.59400544959128, + "grad_norm": 9.293360710144043, + "learning_rate": 1.8590224501142377e-05, + "loss": 0.832, + "step": 7191 + }, + { + "epoch": 19.59673024523161, + "grad_norm": 8.675623893737793, + "learning_rate": 1.8589772685227777e-05, + "loss": 1.0309, + "step": 7192 + }, + { + "epoch": 19.599455040871934, + "grad_norm": 7.507985591888428, + "learning_rate": 1.858932080241631e-05, + "loss": 0.6049, + "step": 7193 + }, + { + "epoch": 19.60217983651226, + "grad_norm": 9.1579008102417, + "learning_rate": 1.8588868852711487e-05, + "loss": 0.7317, + "step": 7194 + }, + { + "epoch": 19.60490463215259, + "grad_norm": 9.267694473266602, + "learning_rate": 1.8588416836116824e-05, + "loss": 0.9226, + "step": 7195 + }, + { + "epoch": 19.607629427792915, + "grad_norm": 8.240072250366211, + "learning_rate": 1.8587964752635856e-05, + "loss": 0.684, + "step": 7196 + }, + { + "epoch": 19.61035422343324, + "grad_norm": 7.696627616882324, + "learning_rate": 1.8587512602272088e-05, + "loss": 0.8578, + "step": 7197 + }, + { + "epoch": 19.61307901907357, + "grad_norm": 8.939593315124512, + "learning_rate": 1.8587060385029052e-05, + "loss": 0.8292, + "step": 7198 + }, + { + "epoch": 19.615803814713896, + "grad_norm": 8.204903602600098, + "learning_rate": 1.8586608100910265e-05, + "loss": 0.7584, + "step": 7199 + }, + { + "epoch": 19.618528610354222, + "grad_norm": 7.829612731933594, + "learning_rate": 1.858615574991925e-05, + "loss": 0.7552, + "step": 7200 + }, + { + "epoch": 19.62125340599455, + "grad_norm": 9.322164535522461, + "learning_rate": 1.858570333205953e-05, + "loss": 0.8754, + "step": 7201 + }, + { + "epoch": 19.623978201634877, + "grad_norm": 7.925443172454834, + "learning_rate": 1.858525084733463e-05, + "loss": 0.7184, + "step": 7202 + }, + { + "epoch": 19.626702997275203, + "grad_norm": 7.421473979949951, + "learning_rate": 1.8584798295748072e-05, + "loss": 0.8631, + "step": 7203 + }, + { + "epoch": 19.629427792915532, + "grad_norm": 8.25426197052002, + "learning_rate": 1.8584345677303385e-05, + "loss": 0.8169, + "step": 7204 + }, + { + "epoch": 19.632152588555858, + "grad_norm": 9.868017196655273, + "learning_rate": 1.8583892992004084e-05, + "loss": 0.7183, + "step": 7205 + }, + { + "epoch": 19.634877384196184, + "grad_norm": 11.133771896362305, + "learning_rate": 1.8583440239853705e-05, + "loss": 0.797, + "step": 7206 + }, + { + "epoch": 19.637602179836513, + "grad_norm": 7.968581676483154, + "learning_rate": 1.8582987420855766e-05, + "loss": 0.9005, + "step": 7207 + }, + { + "epoch": 19.64032697547684, + "grad_norm": 8.879183769226074, + "learning_rate": 1.8582534535013802e-05, + "loss": 0.8459, + "step": 7208 + }, + { + "epoch": 19.643051771117165, + "grad_norm": 9.460929870605469, + "learning_rate": 1.858208158233133e-05, + "loss": 0.8223, + "step": 7209 + }, + { + "epoch": 19.645776566757494, + "grad_norm": 10.924003601074219, + "learning_rate": 1.8581628562811887e-05, + "loss": 1.0322, + "step": 7210 + }, + { + "epoch": 19.64850136239782, + "grad_norm": 9.068217277526855, + "learning_rate": 1.8581175476458993e-05, + "loss": 0.9371, + "step": 7211 + }, + { + "epoch": 19.651226158038146, + "grad_norm": 8.336944580078125, + "learning_rate": 1.8580722323276186e-05, + "loss": 0.8612, + "step": 7212 + }, + { + "epoch": 19.653950953678475, + "grad_norm": 7.832804203033447, + "learning_rate": 1.8580269103266985e-05, + "loss": 0.7006, + "step": 7213 + }, + { + "epoch": 19.6566757493188, + "grad_norm": 11.483506202697754, + "learning_rate": 1.8579815816434928e-05, + "loss": 0.962, + "step": 7214 + }, + { + "epoch": 19.659400544959126, + "grad_norm": 9.328773498535156, + "learning_rate": 1.857936246278354e-05, + "loss": 0.7187, + "step": 7215 + }, + { + "epoch": 19.662125340599456, + "grad_norm": 9.086725234985352, + "learning_rate": 1.857890904231635e-05, + "loss": 0.8785, + "step": 7216 + }, + { + "epoch": 19.66485013623978, + "grad_norm": 8.559444427490234, + "learning_rate": 1.8578455555036898e-05, + "loss": 0.9489, + "step": 7217 + }, + { + "epoch": 19.667574931880107, + "grad_norm": 11.644548416137695, + "learning_rate": 1.8578002000948707e-05, + "loss": 0.9829, + "step": 7218 + }, + { + "epoch": 19.670299727520437, + "grad_norm": 8.787369728088379, + "learning_rate": 1.8577548380055312e-05, + "loss": 0.7469, + "step": 7219 + }, + { + "epoch": 19.673024523160763, + "grad_norm": 9.432893753051758, + "learning_rate": 1.8577094692360248e-05, + "loss": 0.8535, + "step": 7220 + }, + { + "epoch": 19.67574931880109, + "grad_norm": 8.616509437561035, + "learning_rate": 1.8576640937867047e-05, + "loss": 0.7623, + "step": 7221 + }, + { + "epoch": 19.678474114441418, + "grad_norm": 10.964095115661621, + "learning_rate": 1.857618711657924e-05, + "loss": 0.7573, + "step": 7222 + }, + { + "epoch": 19.681198910081743, + "grad_norm": 8.31070327758789, + "learning_rate": 1.8575733228500364e-05, + "loss": 0.8906, + "step": 7223 + }, + { + "epoch": 19.68392370572207, + "grad_norm": 7.251931667327881, + "learning_rate": 1.8575279273633957e-05, + "loss": 0.8314, + "step": 7224 + }, + { + "epoch": 19.6866485013624, + "grad_norm": 10.5338134765625, + "learning_rate": 1.857482525198355e-05, + "loss": 0.9138, + "step": 7225 + }, + { + "epoch": 19.689373297002724, + "grad_norm": 8.392162322998047, + "learning_rate": 1.8574371163552677e-05, + "loss": 0.6933, + "step": 7226 + }, + { + "epoch": 19.69209809264305, + "grad_norm": 9.30006217956543, + "learning_rate": 1.857391700834488e-05, + "loss": 0.824, + "step": 7227 + }, + { + "epoch": 19.69482288828338, + "grad_norm": 8.00703239440918, + "learning_rate": 1.857346278636369e-05, + "loss": 0.8078, + "step": 7228 + }, + { + "epoch": 19.697547683923705, + "grad_norm": 8.627029418945312, + "learning_rate": 1.857300849761265e-05, + "loss": 0.7823, + "step": 7229 + }, + { + "epoch": 19.70027247956403, + "grad_norm": 8.846247673034668, + "learning_rate": 1.8572554142095296e-05, + "loss": 0.8359, + "step": 7230 + }, + { + "epoch": 19.70299727520436, + "grad_norm": 9.047361373901367, + "learning_rate": 1.8572099719815167e-05, + "loss": 0.749, + "step": 7231 + }, + { + "epoch": 19.705722070844686, + "grad_norm": 7.625607490539551, + "learning_rate": 1.85716452307758e-05, + "loss": 0.8597, + "step": 7232 + }, + { + "epoch": 19.708446866485012, + "grad_norm": 9.168447494506836, + "learning_rate": 1.8571190674980734e-05, + "loss": 0.8319, + "step": 7233 + }, + { + "epoch": 19.71117166212534, + "grad_norm": 8.939648628234863, + "learning_rate": 1.8570736052433515e-05, + "loss": 0.7706, + "step": 7234 + }, + { + "epoch": 19.713896457765667, + "grad_norm": 9.04534912109375, + "learning_rate": 1.8570281363137677e-05, + "loss": 0.86, + "step": 7235 + }, + { + "epoch": 19.716621253405993, + "grad_norm": 9.590156555175781, + "learning_rate": 1.8569826607096764e-05, + "loss": 0.8484, + "step": 7236 + }, + { + "epoch": 19.719346049046322, + "grad_norm": 8.071600914001465, + "learning_rate": 1.8569371784314318e-05, + "loss": 0.7587, + "step": 7237 + }, + { + "epoch": 19.722070844686648, + "grad_norm": 7.5778703689575195, + "learning_rate": 1.856891689479388e-05, + "loss": 0.9353, + "step": 7238 + }, + { + "epoch": 19.724795640326974, + "grad_norm": 8.062702178955078, + "learning_rate": 1.8568461938538994e-05, + "loss": 0.7383, + "step": 7239 + }, + { + "epoch": 19.727520435967303, + "grad_norm": 8.187978744506836, + "learning_rate": 1.8568006915553202e-05, + "loss": 0.774, + "step": 7240 + }, + { + "epoch": 19.73024523160763, + "grad_norm": 7.880321502685547, + "learning_rate": 1.856755182584004e-05, + "loss": 0.6434, + "step": 7241 + }, + { + "epoch": 19.732970027247955, + "grad_norm": 8.603689193725586, + "learning_rate": 1.856709666940307e-05, + "loss": 0.9297, + "step": 7242 + }, + { + "epoch": 19.735694822888284, + "grad_norm": 8.921660423278809, + "learning_rate": 1.8566641446245825e-05, + "loss": 0.9548, + "step": 7243 + }, + { + "epoch": 19.73841961852861, + "grad_norm": 8.69922924041748, + "learning_rate": 1.856618615637185e-05, + "loss": 0.9243, + "step": 7244 + }, + { + "epoch": 19.741144414168936, + "grad_norm": 8.331897735595703, + "learning_rate": 1.8565730799784693e-05, + "loss": 0.8177, + "step": 7245 + }, + { + "epoch": 19.743869209809265, + "grad_norm": 8.047229766845703, + "learning_rate": 1.85652753764879e-05, + "loss": 0.7662, + "step": 7246 + }, + { + "epoch": 19.74659400544959, + "grad_norm": 11.7498140335083, + "learning_rate": 1.856481988648502e-05, + "loss": 0.77, + "step": 7247 + }, + { + "epoch": 19.749318801089917, + "grad_norm": 7.757480144500732, + "learning_rate": 1.85643643297796e-05, + "loss": 0.9216, + "step": 7248 + }, + { + "epoch": 19.752043596730246, + "grad_norm": 8.10046672821045, + "learning_rate": 1.8563908706375183e-05, + "loss": 0.916, + "step": 7249 + }, + { + "epoch": 19.754768392370572, + "grad_norm": 7.660522937774658, + "learning_rate": 1.8563453016275322e-05, + "loss": 0.7997, + "step": 7250 + }, + { + "epoch": 19.757493188010898, + "grad_norm": 8.821773529052734, + "learning_rate": 1.8562997259483563e-05, + "loss": 0.947, + "step": 7251 + }, + { + "epoch": 19.760217983651227, + "grad_norm": 7.833026885986328, + "learning_rate": 1.856254143600346e-05, + "loss": 1.0444, + "step": 7252 + }, + { + "epoch": 19.762942779291553, + "grad_norm": 9.46402359008789, + "learning_rate": 1.8562085545838557e-05, + "loss": 0.8815, + "step": 7253 + }, + { + "epoch": 19.76566757493188, + "grad_norm": 10.266973495483398, + "learning_rate": 1.8561629588992405e-05, + "loss": 0.7732, + "step": 7254 + }, + { + "epoch": 19.768392370572208, + "grad_norm": 8.80599594116211, + "learning_rate": 1.856117356546856e-05, + "loss": 0.7681, + "step": 7255 + }, + { + "epoch": 19.771117166212534, + "grad_norm": 8.57168197631836, + "learning_rate": 1.8560717475270573e-05, + "loss": 0.7834, + "step": 7256 + }, + { + "epoch": 19.77384196185286, + "grad_norm": 7.505406379699707, + "learning_rate": 1.856026131840199e-05, + "loss": 0.7225, + "step": 7257 + }, + { + "epoch": 19.77656675749319, + "grad_norm": 7.946703910827637, + "learning_rate": 1.855980509486637e-05, + "loss": 0.8301, + "step": 7258 + }, + { + "epoch": 19.779291553133515, + "grad_norm": 10.383882522583008, + "learning_rate": 1.8559348804667265e-05, + "loss": 0.7971, + "step": 7259 + }, + { + "epoch": 19.78201634877384, + "grad_norm": 7.882511615753174, + "learning_rate": 1.8558892447808224e-05, + "loss": 0.8564, + "step": 7260 + }, + { + "epoch": 19.78474114441417, + "grad_norm": 11.38111400604248, + "learning_rate": 1.8558436024292803e-05, + "loss": 0.9023, + "step": 7261 + }, + { + "epoch": 19.787465940054496, + "grad_norm": 7.0735249519348145, + "learning_rate": 1.855797953412456e-05, + "loss": 0.7559, + "step": 7262 + }, + { + "epoch": 19.79019073569482, + "grad_norm": 9.781344413757324, + "learning_rate": 1.8557522977307045e-05, + "loss": 0.8533, + "step": 7263 + }, + { + "epoch": 19.79291553133515, + "grad_norm": 8.610528945922852, + "learning_rate": 1.8557066353843822e-05, + "loss": 0.6511, + "step": 7264 + }, + { + "epoch": 19.795640326975477, + "grad_norm": 8.943483352661133, + "learning_rate": 1.8556609663738435e-05, + "loss": 0.9783, + "step": 7265 + }, + { + "epoch": 19.798365122615802, + "grad_norm": 8.305816650390625, + "learning_rate": 1.8556152906994453e-05, + "loss": 0.892, + "step": 7266 + }, + { + "epoch": 19.80108991825613, + "grad_norm": 7.825862407684326, + "learning_rate": 1.8555696083615425e-05, + "loss": 0.8247, + "step": 7267 + }, + { + "epoch": 19.803814713896458, + "grad_norm": 7.026774883270264, + "learning_rate": 1.8555239193604913e-05, + "loss": 0.7625, + "step": 7268 + }, + { + "epoch": 19.806539509536783, + "grad_norm": 10.513520240783691, + "learning_rate": 1.855478223696647e-05, + "loss": 0.8748, + "step": 7269 + }, + { + "epoch": 19.809264305177113, + "grad_norm": 8.773707389831543, + "learning_rate": 1.8554325213703663e-05, + "loss": 0.813, + "step": 7270 + }, + { + "epoch": 19.81198910081744, + "grad_norm": 46.05637741088867, + "learning_rate": 1.8553868123820043e-05, + "loss": 0.8654, + "step": 7271 + }, + { + "epoch": 19.814713896457764, + "grad_norm": 9.854783058166504, + "learning_rate": 1.8553410967319173e-05, + "loss": 1.0159, + "step": 7272 + }, + { + "epoch": 19.817438692098094, + "grad_norm": 7.48112678527832, + "learning_rate": 1.8552953744204613e-05, + "loss": 0.818, + "step": 7273 + }, + { + "epoch": 19.82016348773842, + "grad_norm": 8.394046783447266, + "learning_rate": 1.855249645447993e-05, + "loss": 0.8461, + "step": 7274 + }, + { + "epoch": 19.822888283378745, + "grad_norm": 8.375469207763672, + "learning_rate": 1.8552039098148677e-05, + "loss": 0.8241, + "step": 7275 + }, + { + "epoch": 19.825613079019075, + "grad_norm": 8.33053970336914, + "learning_rate": 1.8551581675214416e-05, + "loss": 0.8422, + "step": 7276 + }, + { + "epoch": 19.8283378746594, + "grad_norm": 9.191420555114746, + "learning_rate": 1.8551124185680716e-05, + "loss": 0.7114, + "step": 7277 + }, + { + "epoch": 19.831062670299726, + "grad_norm": 9.85604476928711, + "learning_rate": 1.855066662955113e-05, + "loss": 0.8715, + "step": 7278 + }, + { + "epoch": 19.833787465940055, + "grad_norm": 7.668471813201904, + "learning_rate": 1.8550209006829236e-05, + "loss": 1.1304, + "step": 7279 + }, + { + "epoch": 19.83651226158038, + "grad_norm": 9.162517547607422, + "learning_rate": 1.8549751317518583e-05, + "loss": 0.9307, + "step": 7280 + }, + { + "epoch": 19.839237057220707, + "grad_norm": 7.64418888092041, + "learning_rate": 1.8549293561622742e-05, + "loss": 0.7964, + "step": 7281 + }, + { + "epoch": 19.841961852861036, + "grad_norm": 10.020888328552246, + "learning_rate": 1.854883573914528e-05, + "loss": 0.8617, + "step": 7282 + }, + { + "epoch": 19.844686648501362, + "grad_norm": 8.746636390686035, + "learning_rate": 1.8548377850089764e-05, + "loss": 0.7571, + "step": 7283 + }, + { + "epoch": 19.847411444141688, + "grad_norm": 8.420528411865234, + "learning_rate": 1.8547919894459753e-05, + "loss": 0.7667, + "step": 7284 + }, + { + "epoch": 19.850136239782017, + "grad_norm": 10.011277198791504, + "learning_rate": 1.8547461872258816e-05, + "loss": 0.8011, + "step": 7285 + }, + { + "epoch": 19.852861035422343, + "grad_norm": 10.89472484588623, + "learning_rate": 1.854700378349052e-05, + "loss": 1.0264, + "step": 7286 + }, + { + "epoch": 19.85558583106267, + "grad_norm": 9.870013236999512, + "learning_rate": 1.854654562815844e-05, + "loss": 0.9823, + "step": 7287 + }, + { + "epoch": 19.858310626703, + "grad_norm": 24.940608978271484, + "learning_rate": 1.854608740626613e-05, + "loss": 1.1353, + "step": 7288 + }, + { + "epoch": 19.861035422343324, + "grad_norm": 6.848790168762207, + "learning_rate": 1.854562911781717e-05, + "loss": 0.7698, + "step": 7289 + }, + { + "epoch": 19.86376021798365, + "grad_norm": 9.606679916381836, + "learning_rate": 1.8545170762815122e-05, + "loss": 0.9084, + "step": 7290 + }, + { + "epoch": 19.86648501362398, + "grad_norm": 12.181947708129883, + "learning_rate": 1.8544712341263566e-05, + "loss": 0.9169, + "step": 7291 + }, + { + "epoch": 19.869209809264305, + "grad_norm": 8.039779663085938, + "learning_rate": 1.854425385316606e-05, + "loss": 1.0466, + "step": 7292 + }, + { + "epoch": 19.87193460490463, + "grad_norm": 8.474559783935547, + "learning_rate": 1.854379529852618e-05, + "loss": 0.912, + "step": 7293 + }, + { + "epoch": 19.87465940054496, + "grad_norm": 7.942590713500977, + "learning_rate": 1.85433366773475e-05, + "loss": 0.8755, + "step": 7294 + }, + { + "epoch": 19.877384196185286, + "grad_norm": 9.164682388305664, + "learning_rate": 1.854287798963359e-05, + "loss": 0.8634, + "step": 7295 + }, + { + "epoch": 19.88010899182561, + "grad_norm": 7.278963088989258, + "learning_rate": 1.8542419235388016e-05, + "loss": 0.8492, + "step": 7296 + }, + { + "epoch": 19.88283378746594, + "grad_norm": 9.253836631774902, + "learning_rate": 1.854196041461436e-05, + "loss": 1.0032, + "step": 7297 + }, + { + "epoch": 19.885558583106267, + "grad_norm": 10.022604942321777, + "learning_rate": 1.854150152731619e-05, + "loss": 0.7737, + "step": 7298 + }, + { + "epoch": 19.888283378746593, + "grad_norm": 6.893654823303223, + "learning_rate": 1.854104257349708e-05, + "loss": 0.8645, + "step": 7299 + }, + { + "epoch": 19.891008174386922, + "grad_norm": 6.988736152648926, + "learning_rate": 1.8540583553160606e-05, + "loss": 0.8486, + "step": 7300 + }, + { + "epoch": 19.893732970027248, + "grad_norm": 9.518927574157715, + "learning_rate": 1.8540124466310345e-05, + "loss": 0.8699, + "step": 7301 + }, + { + "epoch": 19.896457765667574, + "grad_norm": 13.948290824890137, + "learning_rate": 1.8539665312949864e-05, + "loss": 0.9276, + "step": 7302 + }, + { + "epoch": 19.899182561307903, + "grad_norm": 8.599923133850098, + "learning_rate": 1.8539206093082748e-05, + "loss": 0.7977, + "step": 7303 + }, + { + "epoch": 19.90190735694823, + "grad_norm": 10.82606029510498, + "learning_rate": 1.8538746806712568e-05, + "loss": 0.767, + "step": 7304 + }, + { + "epoch": 19.904632152588555, + "grad_norm": 9.037323951721191, + "learning_rate": 1.8538287453842906e-05, + "loss": 0.9191, + "step": 7305 + }, + { + "epoch": 19.907356948228884, + "grad_norm": 7.831912994384766, + "learning_rate": 1.853782803447733e-05, + "loss": 0.7819, + "step": 7306 + }, + { + "epoch": 19.91008174386921, + "grad_norm": 10.063775062561035, + "learning_rate": 1.853736854861943e-05, + "loss": 0.8586, + "step": 7307 + }, + { + "epoch": 19.912806539509535, + "grad_norm": 8.359786033630371, + "learning_rate": 1.8536908996272777e-05, + "loss": 0.8816, + "step": 7308 + }, + { + "epoch": 19.915531335149865, + "grad_norm": 7.736542701721191, + "learning_rate": 1.853644937744095e-05, + "loss": 0.7466, + "step": 7309 + }, + { + "epoch": 19.91825613079019, + "grad_norm": 7.516117095947266, + "learning_rate": 1.853598969212753e-05, + "loss": 0.9105, + "step": 7310 + }, + { + "epoch": 19.920980926430516, + "grad_norm": 10.034730911254883, + "learning_rate": 1.8535529940336098e-05, + "loss": 0.8567, + "step": 7311 + }, + { + "epoch": 19.923705722070846, + "grad_norm": 7.54212760925293, + "learning_rate": 1.8535070122070237e-05, + "loss": 0.7722, + "step": 7312 + }, + { + "epoch": 19.92643051771117, + "grad_norm": 7.285183429718018, + "learning_rate": 1.853461023733352e-05, + "loss": 0.7952, + "step": 7313 + }, + { + "epoch": 19.929155313351497, + "grad_norm": 7.934067726135254, + "learning_rate": 1.853415028612953e-05, + "loss": 0.7682, + "step": 7314 + }, + { + "epoch": 19.931880108991827, + "grad_norm": 9.840912818908691, + "learning_rate": 1.8533690268461862e-05, + "loss": 0.8525, + "step": 7315 + }, + { + "epoch": 19.934604904632153, + "grad_norm": 9.348376274108887, + "learning_rate": 1.853323018433408e-05, + "loss": 0.9363, + "step": 7316 + }, + { + "epoch": 19.93732970027248, + "grad_norm": 8.461465835571289, + "learning_rate": 1.853277003374978e-05, + "loss": 0.8999, + "step": 7317 + }, + { + "epoch": 19.940054495912808, + "grad_norm": 8.06180191040039, + "learning_rate": 1.8532309816712542e-05, + "loss": 0.7518, + "step": 7318 + }, + { + "epoch": 19.942779291553133, + "grad_norm": 9.115461349487305, + "learning_rate": 1.8531849533225948e-05, + "loss": 0.9355, + "step": 7319 + }, + { + "epoch": 19.94550408719346, + "grad_norm": 9.954212188720703, + "learning_rate": 1.8531389183293583e-05, + "loss": 0.8217, + "step": 7320 + }, + { + "epoch": 19.94822888283379, + "grad_norm": 8.282428741455078, + "learning_rate": 1.853092876691904e-05, + "loss": 1.0406, + "step": 7321 + }, + { + "epoch": 19.950953678474114, + "grad_norm": 8.437095642089844, + "learning_rate": 1.853046828410589e-05, + "loss": 0.8442, + "step": 7322 + }, + { + "epoch": 19.95367847411444, + "grad_norm": 7.819126129150391, + "learning_rate": 1.8530007734857734e-05, + "loss": 0.7717, + "step": 7323 + }, + { + "epoch": 19.95640326975477, + "grad_norm": 8.74654483795166, + "learning_rate": 1.852954711917815e-05, + "loss": 0.817, + "step": 7324 + }, + { + "epoch": 19.959128065395095, + "grad_norm": 8.207504272460938, + "learning_rate": 1.8529086437070726e-05, + "loss": 0.8737, + "step": 7325 + }, + { + "epoch": 19.96185286103542, + "grad_norm": 9.41775131225586, + "learning_rate": 1.8528625688539055e-05, + "loss": 0.9446, + "step": 7326 + }, + { + "epoch": 19.96457765667575, + "grad_norm": 9.330113410949707, + "learning_rate": 1.8528164873586717e-05, + "loss": 0.8481, + "step": 7327 + }, + { + "epoch": 19.967302452316076, + "grad_norm": 8.378766059875488, + "learning_rate": 1.852770399221731e-05, + "loss": 0.9222, + "step": 7328 + }, + { + "epoch": 19.970027247956402, + "grad_norm": 11.528024673461914, + "learning_rate": 1.8527243044434415e-05, + "loss": 0.7509, + "step": 7329 + }, + { + "epoch": 19.97275204359673, + "grad_norm": 7.323259353637695, + "learning_rate": 1.852678203024163e-05, + "loss": 0.9354, + "step": 7330 + }, + { + "epoch": 19.975476839237057, + "grad_norm": 7.935391902923584, + "learning_rate": 1.8526320949642536e-05, + "loss": 0.9752, + "step": 7331 + }, + { + "epoch": 19.978201634877383, + "grad_norm": 7.215292930603027, + "learning_rate": 1.8525859802640733e-05, + "loss": 0.7661, + "step": 7332 + }, + { + "epoch": 19.980926430517712, + "grad_norm": 7.696983814239502, + "learning_rate": 1.8525398589239803e-05, + "loss": 0.9115, + "step": 7333 + }, + { + "epoch": 19.983651226158038, + "grad_norm": 10.614715576171875, + "learning_rate": 1.8524937309443346e-05, + "loss": 0.6874, + "step": 7334 + }, + { + "epoch": 19.986376021798364, + "grad_norm": 9.582474708557129, + "learning_rate": 1.8524475963254955e-05, + "loss": 0.939, + "step": 7335 + }, + { + "epoch": 19.989100817438693, + "grad_norm": 7.234864711761475, + "learning_rate": 1.8524014550678212e-05, + "loss": 0.7971, + "step": 7336 + }, + { + "epoch": 19.99182561307902, + "grad_norm": 8.474017143249512, + "learning_rate": 1.8523553071716726e-05, + "loss": 0.7489, + "step": 7337 + }, + { + "epoch": 19.994550408719345, + "grad_norm": 8.070943832397461, + "learning_rate": 1.852309152637408e-05, + "loss": 0.8862, + "step": 7338 + }, + { + "epoch": 19.997275204359674, + "grad_norm": 8.766613006591797, + "learning_rate": 1.852262991465387e-05, + "loss": 0.8653, + "step": 7339 + }, + { + "epoch": 20.0, + "grad_norm": 8.434788703918457, + "learning_rate": 1.8522168236559693e-05, + "loss": 0.7374, + "step": 7340 + }, + { + "epoch": 20.002724795640326, + "grad_norm": 10.932939529418945, + "learning_rate": 1.8521706492095147e-05, + "loss": 0.8364, + "step": 7341 + }, + { + "epoch": 20.005449591280655, + "grad_norm": 7.836805820465088, + "learning_rate": 1.852124468126382e-05, + "loss": 0.8916, + "step": 7342 + }, + { + "epoch": 20.00817438692098, + "grad_norm": 7.299636363983154, + "learning_rate": 1.8520782804069317e-05, + "loss": 0.619, + "step": 7343 + }, + { + "epoch": 20.010899182561307, + "grad_norm": 6.49599027633667, + "learning_rate": 1.8520320860515233e-05, + "loss": 0.745, + "step": 7344 + }, + { + "epoch": 20.013623978201636, + "grad_norm": 7.857719421386719, + "learning_rate": 1.851985885060516e-05, + "loss": 0.7843, + "step": 7345 + }, + { + "epoch": 20.016348773841962, + "grad_norm": 6.397619247436523, + "learning_rate": 1.8519396774342707e-05, + "loss": 0.6598, + "step": 7346 + }, + { + "epoch": 20.019073569482288, + "grad_norm": 6.885274410247803, + "learning_rate": 1.8518934631731463e-05, + "loss": 0.8165, + "step": 7347 + }, + { + "epoch": 20.021798365122617, + "grad_norm": 10.903122901916504, + "learning_rate": 1.8518472422775027e-05, + "loss": 0.7291, + "step": 7348 + }, + { + "epoch": 20.024523160762943, + "grad_norm": 7.2153425216674805, + "learning_rate": 1.8518010147477007e-05, + "loss": 0.8179, + "step": 7349 + }, + { + "epoch": 20.02724795640327, + "grad_norm": 12.313626289367676, + "learning_rate": 1.8517547805840995e-05, + "loss": 0.9888, + "step": 7350 + }, + { + "epoch": 20.029972752043598, + "grad_norm": 7.701757431030273, + "learning_rate": 1.8517085397870594e-05, + "loss": 0.7278, + "step": 7351 + }, + { + "epoch": 20.032697547683924, + "grad_norm": 7.067673206329346, + "learning_rate": 1.8516622923569406e-05, + "loss": 0.7112, + "step": 7352 + }, + { + "epoch": 20.03542234332425, + "grad_norm": 16.146074295043945, + "learning_rate": 1.8516160382941035e-05, + "loss": 0.8728, + "step": 7353 + }, + { + "epoch": 20.03814713896458, + "grad_norm": 9.322784423828125, + "learning_rate": 1.851569777598908e-05, + "loss": 0.6955, + "step": 7354 + }, + { + "epoch": 20.040871934604905, + "grad_norm": 7.918156147003174, + "learning_rate": 1.8515235102717145e-05, + "loss": 0.7109, + "step": 7355 + }, + { + "epoch": 20.04359673024523, + "grad_norm": 7.2958574295043945, + "learning_rate": 1.8514772363128833e-05, + "loss": 0.8171, + "step": 7356 + }, + { + "epoch": 20.04632152588556, + "grad_norm": 7.862805366516113, + "learning_rate": 1.851430955722775e-05, + "loss": 0.5814, + "step": 7357 + }, + { + "epoch": 20.049046321525886, + "grad_norm": 7.682487964630127, + "learning_rate": 1.8513846685017498e-05, + "loss": 0.7802, + "step": 7358 + }, + { + "epoch": 20.05177111716621, + "grad_norm": 8.207341194152832, + "learning_rate": 1.8513383746501678e-05, + "loss": 0.8322, + "step": 7359 + }, + { + "epoch": 20.05449591280654, + "grad_norm": 8.06595230102539, + "learning_rate": 1.85129207416839e-05, + "loss": 0.7709, + "step": 7360 + }, + { + "epoch": 20.057220708446867, + "grad_norm": 7.644371032714844, + "learning_rate": 1.8512457670567773e-05, + "loss": 0.7821, + "step": 7361 + }, + { + "epoch": 20.059945504087192, + "grad_norm": 8.130538940429688, + "learning_rate": 1.8511994533156898e-05, + "loss": 0.8824, + "step": 7362 + }, + { + "epoch": 20.06267029972752, + "grad_norm": 8.64433479309082, + "learning_rate": 1.8511531329454883e-05, + "loss": 0.7031, + "step": 7363 + }, + { + "epoch": 20.065395095367847, + "grad_norm": 8.260018348693848, + "learning_rate": 1.8511068059465334e-05, + "loss": 0.7408, + "step": 7364 + }, + { + "epoch": 20.068119891008173, + "grad_norm": 8.091988563537598, + "learning_rate": 1.8510604723191865e-05, + "loss": 0.7526, + "step": 7365 + }, + { + "epoch": 20.070844686648503, + "grad_norm": 8.094756126403809, + "learning_rate": 1.8510141320638078e-05, + "loss": 0.7114, + "step": 7366 + }, + { + "epoch": 20.07356948228883, + "grad_norm": 10.249007225036621, + "learning_rate": 1.8509677851807584e-05, + "loss": 0.8809, + "step": 7367 + }, + { + "epoch": 20.076294277929154, + "grad_norm": 7.930947303771973, + "learning_rate": 1.8509214316703993e-05, + "loss": 0.8882, + "step": 7368 + }, + { + "epoch": 20.079019073569484, + "grad_norm": 8.538778305053711, + "learning_rate": 1.8508750715330913e-05, + "loss": 0.6705, + "step": 7369 + }, + { + "epoch": 20.08174386920981, + "grad_norm": 7.569141864776611, + "learning_rate": 1.850828704769196e-05, + "loss": 0.7793, + "step": 7370 + }, + { + "epoch": 20.084468664850135, + "grad_norm": 11.548090934753418, + "learning_rate": 1.850782331379074e-05, + "loss": 0.8179, + "step": 7371 + }, + { + "epoch": 20.087193460490465, + "grad_norm": 7.210183143615723, + "learning_rate": 1.8507359513630865e-05, + "loss": 0.7361, + "step": 7372 + }, + { + "epoch": 20.08991825613079, + "grad_norm": 7.356325149536133, + "learning_rate": 1.850689564721595e-05, + "loss": 0.7419, + "step": 7373 + }, + { + "epoch": 20.092643051771116, + "grad_norm": 8.463406562805176, + "learning_rate": 1.8506431714549606e-05, + "loss": 0.9131, + "step": 7374 + }, + { + "epoch": 20.095367847411445, + "grad_norm": 11.675747871398926, + "learning_rate": 1.850596771563544e-05, + "loss": 0.8203, + "step": 7375 + }, + { + "epoch": 20.09809264305177, + "grad_norm": 7.034526348114014, + "learning_rate": 1.8505503650477074e-05, + "loss": 0.7858, + "step": 7376 + }, + { + "epoch": 20.100817438692097, + "grad_norm": 7.410828113555908, + "learning_rate": 1.850503951907812e-05, + "loss": 0.8191, + "step": 7377 + }, + { + "epoch": 20.103542234332426, + "grad_norm": 8.026698112487793, + "learning_rate": 1.8504575321442194e-05, + "loss": 0.7474, + "step": 7378 + }, + { + "epoch": 20.106267029972752, + "grad_norm": 7.907639503479004, + "learning_rate": 1.8504111057572905e-05, + "loss": 0.7725, + "step": 7379 + }, + { + "epoch": 20.108991825613078, + "grad_norm": 6.920834064483643, + "learning_rate": 1.8503646727473877e-05, + "loss": 0.7247, + "step": 7380 + }, + { + "epoch": 20.111716621253407, + "grad_norm": 7.789642810821533, + "learning_rate": 1.850318233114872e-05, + "loss": 0.6345, + "step": 7381 + }, + { + "epoch": 20.114441416893733, + "grad_norm": 7.425340175628662, + "learning_rate": 1.8502717868601054e-05, + "loss": 0.6998, + "step": 7382 + }, + { + "epoch": 20.11716621253406, + "grad_norm": 8.662664413452148, + "learning_rate": 1.850225333983449e-05, + "loss": 0.795, + "step": 7383 + }, + { + "epoch": 20.11989100817439, + "grad_norm": 7.657357215881348, + "learning_rate": 1.8501788744852652e-05, + "loss": 0.7484, + "step": 7384 + }, + { + "epoch": 20.122615803814714, + "grad_norm": 7.295523643493652, + "learning_rate": 1.850132408365916e-05, + "loss": 0.624, + "step": 7385 + }, + { + "epoch": 20.12534059945504, + "grad_norm": 8.386079788208008, + "learning_rate": 1.850085935625763e-05, + "loss": 0.8629, + "step": 7386 + }, + { + "epoch": 20.12806539509537, + "grad_norm": 9.70673942565918, + "learning_rate": 1.850039456265168e-05, + "loss": 0.9041, + "step": 7387 + }, + { + "epoch": 20.130790190735695, + "grad_norm": 7.998185157775879, + "learning_rate": 1.8499929702844932e-05, + "loss": 0.7749, + "step": 7388 + }, + { + "epoch": 20.13351498637602, + "grad_norm": 7.6672444343566895, + "learning_rate": 1.8499464776841e-05, + "loss": 0.7769, + "step": 7389 + }, + { + "epoch": 20.13623978201635, + "grad_norm": 9.27935791015625, + "learning_rate": 1.8498999784643517e-05, + "loss": 0.8093, + "step": 7390 + }, + { + "epoch": 20.138964577656676, + "grad_norm": 7.795583724975586, + "learning_rate": 1.8498534726256094e-05, + "loss": 0.8046, + "step": 7391 + }, + { + "epoch": 20.141689373297, + "grad_norm": 7.7575273513793945, + "learning_rate": 1.8498069601682353e-05, + "loss": 0.7775, + "step": 7392 + }, + { + "epoch": 20.14441416893733, + "grad_norm": 8.204751968383789, + "learning_rate": 1.8497604410925923e-05, + "loss": 0.741, + "step": 7393 + }, + { + "epoch": 20.147138964577657, + "grad_norm": 7.928032875061035, + "learning_rate": 1.849713915399042e-05, + "loss": 0.8253, + "step": 7394 + }, + { + "epoch": 20.149863760217983, + "grad_norm": 8.550969123840332, + "learning_rate": 1.8496673830879475e-05, + "loss": 0.6736, + "step": 7395 + }, + { + "epoch": 20.152588555858312, + "grad_norm": 6.771650791168213, + "learning_rate": 1.8496208441596706e-05, + "loss": 0.7365, + "step": 7396 + }, + { + "epoch": 20.155313351498638, + "grad_norm": 8.69344425201416, + "learning_rate": 1.8495742986145737e-05, + "loss": 0.6356, + "step": 7397 + }, + { + "epoch": 20.158038147138964, + "grad_norm": 8.5400390625, + "learning_rate": 1.8495277464530198e-05, + "loss": 0.7332, + "step": 7398 + }, + { + "epoch": 20.160762942779293, + "grad_norm": 8.132911682128906, + "learning_rate": 1.8494811876753712e-05, + "loss": 0.7512, + "step": 7399 + }, + { + "epoch": 20.16348773841962, + "grad_norm": 7.471899032592773, + "learning_rate": 1.84943462228199e-05, + "loss": 0.7015, + "step": 7400 + }, + { + "epoch": 20.166212534059945, + "grad_norm": 7.605429649353027, + "learning_rate": 1.84938805027324e-05, + "loss": 0.7745, + "step": 7401 + }, + { + "epoch": 20.168937329700274, + "grad_norm": 8.774757385253906, + "learning_rate": 1.8493414716494826e-05, + "loss": 0.7217, + "step": 7402 + }, + { + "epoch": 20.1716621253406, + "grad_norm": 7.752110481262207, + "learning_rate": 1.849294886411081e-05, + "loss": 0.675, + "step": 7403 + }, + { + "epoch": 20.174386920980925, + "grad_norm": 7.987790107727051, + "learning_rate": 1.849248294558399e-05, + "loss": 0.7279, + "step": 7404 + }, + { + "epoch": 20.177111716621255, + "grad_norm": 7.009028434753418, + "learning_rate": 1.849201696091798e-05, + "loss": 0.6802, + "step": 7405 + }, + { + "epoch": 20.17983651226158, + "grad_norm": 7.810697078704834, + "learning_rate": 1.8491550910116415e-05, + "loss": 0.8302, + "step": 7406 + }, + { + "epoch": 20.182561307901906, + "grad_norm": 9.02009105682373, + "learning_rate": 1.8491084793182925e-05, + "loss": 0.8419, + "step": 7407 + }, + { + "epoch": 20.185286103542236, + "grad_norm": 9.22038459777832, + "learning_rate": 1.8490618610121144e-05, + "loss": 0.6157, + "step": 7408 + }, + { + "epoch": 20.18801089918256, + "grad_norm": 6.129733562469482, + "learning_rate": 1.8490152360934695e-05, + "loss": 0.6604, + "step": 7409 + }, + { + "epoch": 20.190735694822887, + "grad_norm": 6.585142612457275, + "learning_rate": 1.848968604562721e-05, + "loss": 0.7493, + "step": 7410 + }, + { + "epoch": 20.193460490463217, + "grad_norm": 13.595898628234863, + "learning_rate": 1.848921966420233e-05, + "loss": 0.7126, + "step": 7411 + }, + { + "epoch": 20.196185286103542, + "grad_norm": 9.962562561035156, + "learning_rate": 1.8488753216663675e-05, + "loss": 0.826, + "step": 7412 + }, + { + "epoch": 20.19891008174387, + "grad_norm": 8.39643383026123, + "learning_rate": 1.848828670301489e-05, + "loss": 0.6631, + "step": 7413 + }, + { + "epoch": 20.201634877384198, + "grad_norm": 8.44212532043457, + "learning_rate": 1.8487820123259595e-05, + "loss": 0.6271, + "step": 7414 + }, + { + "epoch": 20.204359673024523, + "grad_norm": 7.178295135498047, + "learning_rate": 1.848735347740143e-05, + "loss": 0.8287, + "step": 7415 + }, + { + "epoch": 20.20708446866485, + "grad_norm": 14.088622093200684, + "learning_rate": 1.848688676544403e-05, + "loss": 0.9037, + "step": 7416 + }, + { + "epoch": 20.20980926430518, + "grad_norm": 9.695867538452148, + "learning_rate": 1.848641998739103e-05, + "loss": 0.8507, + "step": 7417 + }, + { + "epoch": 20.212534059945504, + "grad_norm": 8.77767276763916, + "learning_rate": 1.8485953143246065e-05, + "loss": 0.6851, + "step": 7418 + }, + { + "epoch": 20.21525885558583, + "grad_norm": 7.242414474487305, + "learning_rate": 1.848548623301277e-05, + "loss": 0.6465, + "step": 7419 + }, + { + "epoch": 20.21798365122616, + "grad_norm": 11.707669258117676, + "learning_rate": 1.848501925669478e-05, + "loss": 0.7872, + "step": 7420 + }, + { + "epoch": 20.220708446866485, + "grad_norm": 8.391408920288086, + "learning_rate": 1.8484552214295735e-05, + "loss": 0.6744, + "step": 7421 + }, + { + "epoch": 20.22343324250681, + "grad_norm": 7.5969767570495605, + "learning_rate": 1.8484085105819267e-05, + "loss": 0.7931, + "step": 7422 + }, + { + "epoch": 20.22615803814714, + "grad_norm": 8.797009468078613, + "learning_rate": 1.8483617931269022e-05, + "loss": 0.7268, + "step": 7423 + }, + { + "epoch": 20.228882833787466, + "grad_norm": 8.09107780456543, + "learning_rate": 1.848315069064863e-05, + "loss": 0.7107, + "step": 7424 + }, + { + "epoch": 20.231607629427792, + "grad_norm": 10.13934326171875, + "learning_rate": 1.8482683383961734e-05, + "loss": 0.6779, + "step": 7425 + }, + { + "epoch": 20.23433242506812, + "grad_norm": 7.996647834777832, + "learning_rate": 1.8482216011211976e-05, + "loss": 0.7646, + "step": 7426 + }, + { + "epoch": 20.237057220708447, + "grad_norm": 7.624180793762207, + "learning_rate": 1.8481748572402986e-05, + "loss": 0.7559, + "step": 7427 + }, + { + "epoch": 20.239782016348773, + "grad_norm": 11.821518898010254, + "learning_rate": 1.8481281067538416e-05, + "loss": 0.7444, + "step": 7428 + }, + { + "epoch": 20.242506811989102, + "grad_norm": 9.72706413269043, + "learning_rate": 1.8480813496621902e-05, + "loss": 0.833, + "step": 7429 + }, + { + "epoch": 20.245231607629428, + "grad_norm": 13.47059154510498, + "learning_rate": 1.8480345859657085e-05, + "loss": 0.8408, + "step": 7430 + }, + { + "epoch": 20.247956403269754, + "grad_norm": 8.498688697814941, + "learning_rate": 1.8479878156647606e-05, + "loss": 0.7551, + "step": 7431 + }, + { + "epoch": 20.250681198910083, + "grad_norm": 7.454466342926025, + "learning_rate": 1.847941038759711e-05, + "loss": 0.8337, + "step": 7432 + }, + { + "epoch": 20.25340599455041, + "grad_norm": 7.318837642669678, + "learning_rate": 1.847894255250924e-05, + "loss": 0.6942, + "step": 7433 + }, + { + "epoch": 20.256130790190735, + "grad_norm": 8.633078575134277, + "learning_rate": 1.8478474651387633e-05, + "loss": 0.774, + "step": 7434 + }, + { + "epoch": 20.258855585831064, + "grad_norm": 17.29705238342285, + "learning_rate": 1.8478006684235944e-05, + "loss": 0.826, + "step": 7435 + }, + { + "epoch": 20.26158038147139, + "grad_norm": 7.4252848625183105, + "learning_rate": 1.8477538651057812e-05, + "loss": 0.6229, + "step": 7436 + }, + { + "epoch": 20.264305177111716, + "grad_norm": 7.693795680999756, + "learning_rate": 1.847707055185688e-05, + "loss": 0.6783, + "step": 7437 + }, + { + "epoch": 20.267029972752045, + "grad_norm": 10.12563705444336, + "learning_rate": 1.8476602386636795e-05, + "loss": 0.7482, + "step": 7438 + }, + { + "epoch": 20.26975476839237, + "grad_norm": 7.601416110992432, + "learning_rate": 1.8476134155401202e-05, + "loss": 0.6664, + "step": 7439 + }, + { + "epoch": 20.272479564032697, + "grad_norm": 8.094047546386719, + "learning_rate": 1.8475665858153752e-05, + "loss": 0.734, + "step": 7440 + }, + { + "epoch": 20.275204359673026, + "grad_norm": 6.953584671020508, + "learning_rate": 1.847519749489809e-05, + "loss": 0.7358, + "step": 7441 + }, + { + "epoch": 20.277929155313352, + "grad_norm": 8.376222610473633, + "learning_rate": 1.8474729065637858e-05, + "loss": 0.8031, + "step": 7442 + }, + { + "epoch": 20.280653950953678, + "grad_norm": 10.219070434570312, + "learning_rate": 1.847426057037671e-05, + "loss": 0.8011, + "step": 7443 + }, + { + "epoch": 20.283378746594007, + "grad_norm": 10.703056335449219, + "learning_rate": 1.8473792009118297e-05, + "loss": 0.7283, + "step": 7444 + }, + { + "epoch": 20.286103542234333, + "grad_norm": 8.556020736694336, + "learning_rate": 1.8473323381866262e-05, + "loss": 0.7957, + "step": 7445 + }, + { + "epoch": 20.28882833787466, + "grad_norm": 9.588483810424805, + "learning_rate": 1.8472854688624255e-05, + "loss": 0.6652, + "step": 7446 + }, + { + "epoch": 20.291553133514988, + "grad_norm": 7.484055042266846, + "learning_rate": 1.847238592939593e-05, + "loss": 0.7836, + "step": 7447 + }, + { + "epoch": 20.294277929155314, + "grad_norm": 7.0402421951293945, + "learning_rate": 1.847191710418494e-05, + "loss": 0.7645, + "step": 7448 + }, + { + "epoch": 20.29700272479564, + "grad_norm": 7.735825061798096, + "learning_rate": 1.8471448212994927e-05, + "loss": 0.7928, + "step": 7449 + }, + { + "epoch": 20.29972752043597, + "grad_norm": 8.195221900939941, + "learning_rate": 1.847097925582955e-05, + "loss": 0.8018, + "step": 7450 + }, + { + "epoch": 20.302452316076295, + "grad_norm": 8.101825714111328, + "learning_rate": 1.847051023269246e-05, + "loss": 0.6886, + "step": 7451 + }, + { + "epoch": 20.30517711171662, + "grad_norm": 9.327179908752441, + "learning_rate": 1.8470041143587307e-05, + "loss": 0.9258, + "step": 7452 + }, + { + "epoch": 20.30790190735695, + "grad_norm": 8.218055725097656, + "learning_rate": 1.846957198851775e-05, + "loss": 0.8246, + "step": 7453 + }, + { + "epoch": 20.310626702997276, + "grad_norm": 6.9764580726623535, + "learning_rate": 1.8469102767487434e-05, + "loss": 0.7168, + "step": 7454 + }, + { + "epoch": 20.3133514986376, + "grad_norm": 9.409618377685547, + "learning_rate": 1.8468633480500024e-05, + "loss": 0.8809, + "step": 7455 + }, + { + "epoch": 20.31607629427793, + "grad_norm": 7.560911178588867, + "learning_rate": 1.8468164127559162e-05, + "loss": 0.7257, + "step": 7456 + }, + { + "epoch": 20.318801089918257, + "grad_norm": 7.362529277801514, + "learning_rate": 1.8467694708668516e-05, + "loss": 0.8376, + "step": 7457 + }, + { + "epoch": 20.321525885558582, + "grad_norm": 8.374099731445312, + "learning_rate": 1.8467225223831733e-05, + "loss": 0.7881, + "step": 7458 + }, + { + "epoch": 20.32425068119891, + "grad_norm": 9.146530151367188, + "learning_rate": 1.8466755673052472e-05, + "loss": 0.781, + "step": 7459 + }, + { + "epoch": 20.326975476839237, + "grad_norm": 8.215435981750488, + "learning_rate": 1.8466286056334394e-05, + "loss": 0.9, + "step": 7460 + }, + { + "epoch": 20.329700272479563, + "grad_norm": 8.195052146911621, + "learning_rate": 1.846581637368115e-05, + "loss": 0.7197, + "step": 7461 + }, + { + "epoch": 20.332425068119893, + "grad_norm": 8.552736282348633, + "learning_rate": 1.84653466250964e-05, + "loss": 0.7437, + "step": 7462 + }, + { + "epoch": 20.33514986376022, + "grad_norm": 7.810488224029541, + "learning_rate": 1.8464876810583806e-05, + "loss": 0.7225, + "step": 7463 + }, + { + "epoch": 20.337874659400544, + "grad_norm": 9.693074226379395, + "learning_rate": 1.846440693014702e-05, + "loss": 0.9473, + "step": 7464 + }, + { + "epoch": 20.340599455040874, + "grad_norm": 8.138737678527832, + "learning_rate": 1.8463936983789706e-05, + "loss": 0.8163, + "step": 7465 + }, + { + "epoch": 20.3433242506812, + "grad_norm": 9.098084449768066, + "learning_rate": 1.8463466971515525e-05, + "loss": 0.7632, + "step": 7466 + }, + { + "epoch": 20.346049046321525, + "grad_norm": 8.016382217407227, + "learning_rate": 1.8462996893328134e-05, + "loss": 0.7781, + "step": 7467 + }, + { + "epoch": 20.348773841961854, + "grad_norm": 9.49134349822998, + "learning_rate": 1.84625267492312e-05, + "loss": 0.8644, + "step": 7468 + }, + { + "epoch": 20.35149863760218, + "grad_norm": 7.997730255126953, + "learning_rate": 1.8462056539228378e-05, + "loss": 0.7477, + "step": 7469 + }, + { + "epoch": 20.354223433242506, + "grad_norm": 7.561858177185059, + "learning_rate": 1.8461586263323327e-05, + "loss": 0.876, + "step": 7470 + }, + { + "epoch": 20.356948228882835, + "grad_norm": 9.587177276611328, + "learning_rate": 1.846111592151972e-05, + "loss": 0.5931, + "step": 7471 + }, + { + "epoch": 20.35967302452316, + "grad_norm": 10.550204277038574, + "learning_rate": 1.846064551382121e-05, + "loss": 0.9094, + "step": 7472 + }, + { + "epoch": 20.362397820163487, + "grad_norm": 9.21194839477539, + "learning_rate": 1.8460175040231468e-05, + "loss": 0.8365, + "step": 7473 + }, + { + "epoch": 20.365122615803816, + "grad_norm": 8.397749900817871, + "learning_rate": 1.8459704500754155e-05, + "loss": 0.7267, + "step": 7474 + }, + { + "epoch": 20.367847411444142, + "grad_norm": 8.124926567077637, + "learning_rate": 1.8459233895392933e-05, + "loss": 0.7791, + "step": 7475 + }, + { + "epoch": 20.370572207084468, + "grad_norm": 7.280975341796875, + "learning_rate": 1.8458763224151476e-05, + "loss": 1.043, + "step": 7476 + }, + { + "epoch": 20.373297002724797, + "grad_norm": 8.212790489196777, + "learning_rate": 1.845829248703344e-05, + "loss": 0.7695, + "step": 7477 + }, + { + "epoch": 20.376021798365123, + "grad_norm": 8.955096244812012, + "learning_rate": 1.8457821684042492e-05, + "loss": 0.8295, + "step": 7478 + }, + { + "epoch": 20.37874659400545, + "grad_norm": 8.780290603637695, + "learning_rate": 1.8457350815182303e-05, + "loss": 0.7451, + "step": 7479 + }, + { + "epoch": 20.381471389645778, + "grad_norm": 7.5337090492248535, + "learning_rate": 1.8456879880456537e-05, + "loss": 0.7841, + "step": 7480 + }, + { + "epoch": 20.384196185286104, + "grad_norm": 8.871101379394531, + "learning_rate": 1.8456408879868864e-05, + "loss": 0.8707, + "step": 7481 + }, + { + "epoch": 20.38692098092643, + "grad_norm": 16.11921501159668, + "learning_rate": 1.845593781342295e-05, + "loss": 0.6917, + "step": 7482 + }, + { + "epoch": 20.38964577656676, + "grad_norm": 8.842729568481445, + "learning_rate": 1.8455466681122463e-05, + "loss": 0.785, + "step": 7483 + }, + { + "epoch": 20.392370572207085, + "grad_norm": 8.087883949279785, + "learning_rate": 1.8454995482971077e-05, + "loss": 0.8903, + "step": 7484 + }, + { + "epoch": 20.39509536784741, + "grad_norm": 8.730992317199707, + "learning_rate": 1.8454524218972457e-05, + "loss": 0.8339, + "step": 7485 + }, + { + "epoch": 20.39782016348774, + "grad_norm": 8.91746997833252, + "learning_rate": 1.8454052889130273e-05, + "loss": 0.8063, + "step": 7486 + }, + { + "epoch": 20.400544959128066, + "grad_norm": 9.099474906921387, + "learning_rate": 1.84535814934482e-05, + "loss": 0.787, + "step": 7487 + }, + { + "epoch": 20.40326975476839, + "grad_norm": 10.209683418273926, + "learning_rate": 1.84531100319299e-05, + "loss": 0.9791, + "step": 7488 + }, + { + "epoch": 20.40599455040872, + "grad_norm": 7.775052070617676, + "learning_rate": 1.8452638504579056e-05, + "loss": 0.6804, + "step": 7489 + }, + { + "epoch": 20.408719346049047, + "grad_norm": 9.734155654907227, + "learning_rate": 1.8452166911399336e-05, + "loss": 0.7009, + "step": 7490 + }, + { + "epoch": 20.411444141689373, + "grad_norm": 7.811398506164551, + "learning_rate": 1.8451695252394413e-05, + "loss": 0.8672, + "step": 7491 + }, + { + "epoch": 20.414168937329702, + "grad_norm": 9.408904075622559, + "learning_rate": 1.8451223527567956e-05, + "loss": 0.9297, + "step": 7492 + }, + { + "epoch": 20.416893732970028, + "grad_norm": 12.2958402633667, + "learning_rate": 1.8450751736923644e-05, + "loss": 0.8146, + "step": 7493 + }, + { + "epoch": 20.419618528610354, + "grad_norm": 8.134531021118164, + "learning_rate": 1.845027988046515e-05, + "loss": 0.8298, + "step": 7494 + }, + { + "epoch": 20.422343324250683, + "grad_norm": 11.866950035095215, + "learning_rate": 1.844980795819615e-05, + "loss": 0.9991, + "step": 7495 + }, + { + "epoch": 20.42506811989101, + "grad_norm": 9.131204605102539, + "learning_rate": 1.844933597012031e-05, + "loss": 0.8635, + "step": 7496 + }, + { + "epoch": 20.427792915531334, + "grad_norm": 7.015655040740967, + "learning_rate": 1.8448863916241324e-05, + "loss": 0.6737, + "step": 7497 + }, + { + "epoch": 20.430517711171664, + "grad_norm": 8.82425308227539, + "learning_rate": 1.844839179656285e-05, + "loss": 0.7856, + "step": 7498 + }, + { + "epoch": 20.43324250681199, + "grad_norm": 8.597686767578125, + "learning_rate": 1.8447919611088574e-05, + "loss": 0.8732, + "step": 7499 + }, + { + "epoch": 20.435967302452315, + "grad_norm": 8.5596342086792, + "learning_rate": 1.8447447359822172e-05, + "loss": 0.7124, + "step": 7500 + }, + { + "epoch": 20.438692098092645, + "grad_norm": 10.065719604492188, + "learning_rate": 1.844697504276732e-05, + "loss": 0.8853, + "step": 7501 + }, + { + "epoch": 20.44141689373297, + "grad_norm": 7.822795867919922, + "learning_rate": 1.8446502659927702e-05, + "loss": 0.7365, + "step": 7502 + }, + { + "epoch": 20.444141689373296, + "grad_norm": 9.746071815490723, + "learning_rate": 1.8446030211306993e-05, + "loss": 0.6361, + "step": 7503 + }, + { + "epoch": 20.446866485013626, + "grad_norm": 8.904976844787598, + "learning_rate": 1.8445557696908874e-05, + "loss": 0.8429, + "step": 7504 + }, + { + "epoch": 20.44959128065395, + "grad_norm": 14.334179878234863, + "learning_rate": 1.844508511673702e-05, + "loss": 0.7555, + "step": 7505 + }, + { + "epoch": 20.452316076294277, + "grad_norm": 8.744474411010742, + "learning_rate": 1.8444612470795114e-05, + "loss": 0.8788, + "step": 7506 + }, + { + "epoch": 20.455040871934607, + "grad_norm": 8.65246295928955, + "learning_rate": 1.844413975908684e-05, + "loss": 0.7695, + "step": 7507 + }, + { + "epoch": 20.457765667574932, + "grad_norm": 8.80207633972168, + "learning_rate": 1.844366698161588e-05, + "loss": 0.6603, + "step": 7508 + }, + { + "epoch": 20.460490463215258, + "grad_norm": 8.420857429504395, + "learning_rate": 1.844319413838591e-05, + "loss": 0.8613, + "step": 7509 + }, + { + "epoch": 20.463215258855588, + "grad_norm": 9.497468948364258, + "learning_rate": 1.8442721229400615e-05, + "loss": 0.7391, + "step": 7510 + }, + { + "epoch": 20.465940054495913, + "grad_norm": 16.942873001098633, + "learning_rate": 1.844224825466368e-05, + "loss": 0.8069, + "step": 7511 + }, + { + "epoch": 20.46866485013624, + "grad_norm": 9.093857765197754, + "learning_rate": 1.8441775214178784e-05, + "loss": 0.7908, + "step": 7512 + }, + { + "epoch": 20.47138964577657, + "grad_norm": 8.484370231628418, + "learning_rate": 1.844130210794962e-05, + "loss": 0.8571, + "step": 7513 + }, + { + "epoch": 20.474114441416894, + "grad_norm": 7.775330066680908, + "learning_rate": 1.8440828935979865e-05, + "loss": 0.795, + "step": 7514 + }, + { + "epoch": 20.47683923705722, + "grad_norm": 10.508936882019043, + "learning_rate": 1.8440355698273203e-05, + "loss": 0.8212, + "step": 7515 + }, + { + "epoch": 20.479564032697546, + "grad_norm": 9.015315055847168, + "learning_rate": 1.843988239483333e-05, + "loss": 0.6935, + "step": 7516 + }, + { + "epoch": 20.482288828337875, + "grad_norm": 9.50527286529541, + "learning_rate": 1.8439409025663915e-05, + "loss": 0.8352, + "step": 7517 + }, + { + "epoch": 20.4850136239782, + "grad_norm": 10.273641586303711, + "learning_rate": 1.8438935590768658e-05, + "loss": 0.8578, + "step": 7518 + }, + { + "epoch": 20.48773841961853, + "grad_norm": 7.911138534545898, + "learning_rate": 1.8438462090151247e-05, + "loss": 0.8323, + "step": 7519 + }, + { + "epoch": 20.490463215258856, + "grad_norm": 8.356745719909668, + "learning_rate": 1.843798852381536e-05, + "loss": 0.7462, + "step": 7520 + }, + { + "epoch": 20.493188010899182, + "grad_norm": 9.9681978225708, + "learning_rate": 1.843751489176469e-05, + "loss": 0.7948, + "step": 7521 + }, + { + "epoch": 20.495912806539508, + "grad_norm": 8.1953763961792, + "learning_rate": 1.8437041194002924e-05, + "loss": 0.6564, + "step": 7522 + }, + { + "epoch": 20.498637602179837, + "grad_norm": 10.268936157226562, + "learning_rate": 1.8436567430533757e-05, + "loss": 0.8291, + "step": 7523 + }, + { + "epoch": 20.501362397820163, + "grad_norm": 11.004013061523438, + "learning_rate": 1.8436093601360872e-05, + "loss": 0.9343, + "step": 7524 + }, + { + "epoch": 20.504087193460492, + "grad_norm": 10.917760848999023, + "learning_rate": 1.843561970648796e-05, + "loss": 0.7391, + "step": 7525 + }, + { + "epoch": 20.506811989100818, + "grad_norm": 11.350653648376465, + "learning_rate": 1.8435145745918713e-05, + "loss": 0.6913, + "step": 7526 + }, + { + "epoch": 20.509536784741144, + "grad_norm": 10.579289436340332, + "learning_rate": 1.8434671719656826e-05, + "loss": 0.7494, + "step": 7527 + }, + { + "epoch": 20.51226158038147, + "grad_norm": 11.816920280456543, + "learning_rate": 1.843419762770599e-05, + "loss": 1.0459, + "step": 7528 + }, + { + "epoch": 20.5149863760218, + "grad_norm": 11.840269088745117, + "learning_rate": 1.8433723470069888e-05, + "loss": 0.8867, + "step": 7529 + }, + { + "epoch": 20.517711171662125, + "grad_norm": 8.952495574951172, + "learning_rate": 1.843324924675222e-05, + "loss": 0.7943, + "step": 7530 + }, + { + "epoch": 20.520435967302454, + "grad_norm": 9.813703536987305, + "learning_rate": 1.8432774957756677e-05, + "loss": 0.797, + "step": 7531 + }, + { + "epoch": 20.52316076294278, + "grad_norm": 16.976900100708008, + "learning_rate": 1.8432300603086957e-05, + "loss": 0.9147, + "step": 7532 + }, + { + "epoch": 20.525885558583106, + "grad_norm": 9.287324905395508, + "learning_rate": 1.843182618274675e-05, + "loss": 0.8871, + "step": 7533 + }, + { + "epoch": 20.52861035422343, + "grad_norm": 13.709163665771484, + "learning_rate": 1.8431351696739755e-05, + "loss": 0.7975, + "step": 7534 + }, + { + "epoch": 20.53133514986376, + "grad_norm": 9.606921195983887, + "learning_rate": 1.843087714506966e-05, + "loss": 0.8434, + "step": 7535 + }, + { + "epoch": 20.534059945504087, + "grad_norm": 12.49398422241211, + "learning_rate": 1.843040252774017e-05, + "loss": 0.7167, + "step": 7536 + }, + { + "epoch": 20.536784741144416, + "grad_norm": 7.58212423324585, + "learning_rate": 1.8429927844754972e-05, + "loss": 0.8987, + "step": 7537 + }, + { + "epoch": 20.539509536784742, + "grad_norm": 12.724702835083008, + "learning_rate": 1.842945309611777e-05, + "loss": 0.8319, + "step": 7538 + }, + { + "epoch": 20.542234332425068, + "grad_norm": 8.409048080444336, + "learning_rate": 1.8428978281832255e-05, + "loss": 0.7396, + "step": 7539 + }, + { + "epoch": 20.544959128065393, + "grad_norm": 9.053321838378906, + "learning_rate": 1.842850340190213e-05, + "loss": 0.8324, + "step": 7540 + }, + { + "epoch": 20.547683923705723, + "grad_norm": 7.629400730133057, + "learning_rate": 1.8428028456331093e-05, + "loss": 0.6138, + "step": 7541 + }, + { + "epoch": 20.55040871934605, + "grad_norm": 12.569177627563477, + "learning_rate": 1.8427553445122842e-05, + "loss": 0.7177, + "step": 7542 + }, + { + "epoch": 20.553133514986374, + "grad_norm": 7.9694132804870605, + "learning_rate": 1.8427078368281077e-05, + "loss": 0.8976, + "step": 7543 + }, + { + "epoch": 20.555858310626704, + "grad_norm": 8.255053520202637, + "learning_rate": 1.8426603225809493e-05, + "loss": 0.8405, + "step": 7544 + }, + { + "epoch": 20.55858310626703, + "grad_norm": 8.747611999511719, + "learning_rate": 1.8426128017711797e-05, + "loss": 0.9238, + "step": 7545 + }, + { + "epoch": 20.561307901907355, + "grad_norm": 10.35474681854248, + "learning_rate": 1.8425652743991688e-05, + "loss": 0.7651, + "step": 7546 + }, + { + "epoch": 20.564032697547685, + "grad_norm": 8.243481636047363, + "learning_rate": 1.8425177404652865e-05, + "loss": 0.7662, + "step": 7547 + }, + { + "epoch": 20.56675749318801, + "grad_norm": 10.073675155639648, + "learning_rate": 1.842470199969903e-05, + "loss": 0.6719, + "step": 7548 + }, + { + "epoch": 20.569482288828336, + "grad_norm": 7.270785808563232, + "learning_rate": 1.842422652913389e-05, + "loss": 0.6927, + "step": 7549 + }, + { + "epoch": 20.572207084468666, + "grad_norm": 11.287145614624023, + "learning_rate": 1.8423750992961143e-05, + "loss": 0.8513, + "step": 7550 + }, + { + "epoch": 20.57493188010899, + "grad_norm": 8.997488021850586, + "learning_rate": 1.8423275391184496e-05, + "loss": 0.795, + "step": 7551 + }, + { + "epoch": 20.577656675749317, + "grad_norm": 11.46519660949707, + "learning_rate": 1.842279972380765e-05, + "loss": 0.7411, + "step": 7552 + }, + { + "epoch": 20.580381471389646, + "grad_norm": 9.471609115600586, + "learning_rate": 1.842232399083431e-05, + "loss": 0.812, + "step": 7553 + }, + { + "epoch": 20.583106267029972, + "grad_norm": 9.562443733215332, + "learning_rate": 1.8421848192268187e-05, + "loss": 0.743, + "step": 7554 + }, + { + "epoch": 20.585831062670298, + "grad_norm": 8.251599311828613, + "learning_rate": 1.8421372328112974e-05, + "loss": 0.7606, + "step": 7555 + }, + { + "epoch": 20.588555858310627, + "grad_norm": 8.16517162322998, + "learning_rate": 1.842089639837239e-05, + "loss": 0.8248, + "step": 7556 + }, + { + "epoch": 20.591280653950953, + "grad_norm": 8.494513511657715, + "learning_rate": 1.8420420403050134e-05, + "loss": 0.7952, + "step": 7557 + }, + { + "epoch": 20.59400544959128, + "grad_norm": 9.98038387298584, + "learning_rate": 1.8419944342149913e-05, + "loss": 0.8759, + "step": 7558 + }, + { + "epoch": 20.59673024523161, + "grad_norm": 10.59455680847168, + "learning_rate": 1.8419468215675437e-05, + "loss": 0.962, + "step": 7559 + }, + { + "epoch": 20.599455040871934, + "grad_norm": 10.139543533325195, + "learning_rate": 1.8418992023630416e-05, + "loss": 0.778, + "step": 7560 + }, + { + "epoch": 20.60217983651226, + "grad_norm": 8.193345069885254, + "learning_rate": 1.8418515766018553e-05, + "loss": 0.6841, + "step": 7561 + }, + { + "epoch": 20.60490463215259, + "grad_norm": 8.825242042541504, + "learning_rate": 1.8418039442843562e-05, + "loss": 0.8464, + "step": 7562 + }, + { + "epoch": 20.607629427792915, + "grad_norm": 9.617834091186523, + "learning_rate": 1.8417563054109153e-05, + "loss": 0.7627, + "step": 7563 + }, + { + "epoch": 20.61035422343324, + "grad_norm": 12.968689918518066, + "learning_rate": 1.8417086599819028e-05, + "loss": 0.847, + "step": 7564 + }, + { + "epoch": 20.61307901907357, + "grad_norm": 7.965363025665283, + "learning_rate": 1.841661007997691e-05, + "loss": 0.7997, + "step": 7565 + }, + { + "epoch": 20.615803814713896, + "grad_norm": 8.659131050109863, + "learning_rate": 1.84161334945865e-05, + "loss": 0.745, + "step": 7566 + }, + { + "epoch": 20.618528610354222, + "grad_norm": 11.7770357131958, + "learning_rate": 1.8415656843651514e-05, + "loss": 0.6655, + "step": 7567 + }, + { + "epoch": 20.62125340599455, + "grad_norm": 8.190646171569824, + "learning_rate": 1.841518012717566e-05, + "loss": 0.8326, + "step": 7568 + }, + { + "epoch": 20.623978201634877, + "grad_norm": 6.952454090118408, + "learning_rate": 1.8414703345162656e-05, + "loss": 0.765, + "step": 7569 + }, + { + "epoch": 20.626702997275203, + "grad_norm": 8.603614807128906, + "learning_rate": 1.8414226497616215e-05, + "loss": 0.7329, + "step": 7570 + }, + { + "epoch": 20.629427792915532, + "grad_norm": 11.186273574829102, + "learning_rate": 1.841374958454005e-05, + "loss": 0.9298, + "step": 7571 + }, + { + "epoch": 20.632152588555858, + "grad_norm": 15.902365684509277, + "learning_rate": 1.8413272605937872e-05, + "loss": 0.9056, + "step": 7572 + }, + { + "epoch": 20.634877384196184, + "grad_norm": 9.482760429382324, + "learning_rate": 1.8412795561813397e-05, + "loss": 0.7537, + "step": 7573 + }, + { + "epoch": 20.637602179836513, + "grad_norm": 7.537638187408447, + "learning_rate": 1.8412318452170344e-05, + "loss": 0.7407, + "step": 7574 + }, + { + "epoch": 20.64032697547684, + "grad_norm": 8.906112670898438, + "learning_rate": 1.8411841277012423e-05, + "loss": 0.8531, + "step": 7575 + }, + { + "epoch": 20.643051771117165, + "grad_norm": 9.597343444824219, + "learning_rate": 1.841136403634335e-05, + "loss": 0.7976, + "step": 7576 + }, + { + "epoch": 20.645776566757494, + "grad_norm": 8.042146682739258, + "learning_rate": 1.8410886730166848e-05, + "loss": 0.7957, + "step": 7577 + }, + { + "epoch": 20.64850136239782, + "grad_norm": 10.171354293823242, + "learning_rate": 1.841040935848663e-05, + "loss": 0.7577, + "step": 7578 + }, + { + "epoch": 20.651226158038146, + "grad_norm": 9.854966163635254, + "learning_rate": 1.840993192130642e-05, + "loss": 0.6897, + "step": 7579 + }, + { + "epoch": 20.653950953678475, + "grad_norm": 9.036667823791504, + "learning_rate": 1.8409454418629925e-05, + "loss": 0.6295, + "step": 7580 + }, + { + "epoch": 20.6566757493188, + "grad_norm": 13.81934642791748, + "learning_rate": 1.840897685046087e-05, + "loss": 0.8835, + "step": 7581 + }, + { + "epoch": 20.659400544959126, + "grad_norm": 12.976028442382812, + "learning_rate": 1.8408499216802974e-05, + "loss": 0.8418, + "step": 7582 + }, + { + "epoch": 20.662125340599456, + "grad_norm": 9.331933975219727, + "learning_rate": 1.840802151765996e-05, + "loss": 0.6176, + "step": 7583 + }, + { + "epoch": 20.66485013623978, + "grad_norm": 10.498309135437012, + "learning_rate": 1.840754375303554e-05, + "loss": 0.8578, + "step": 7584 + }, + { + "epoch": 20.667574931880107, + "grad_norm": 9.227131843566895, + "learning_rate": 1.840706592293344e-05, + "loss": 0.848, + "step": 7585 + }, + { + "epoch": 20.670299727520437, + "grad_norm": 9.691853523254395, + "learning_rate": 1.8406588027357383e-05, + "loss": 0.9496, + "step": 7586 + }, + { + "epoch": 20.673024523160763, + "grad_norm": 8.21297550201416, + "learning_rate": 1.8406110066311093e-05, + "loss": 0.835, + "step": 7587 + }, + { + "epoch": 20.67574931880109, + "grad_norm": 8.179823875427246, + "learning_rate": 1.8405632039798283e-05, + "loss": 0.892, + "step": 7588 + }, + { + "epoch": 20.678474114441418, + "grad_norm": 12.935137748718262, + "learning_rate": 1.840515394782268e-05, + "loss": 0.8531, + "step": 7589 + }, + { + "epoch": 20.681198910081743, + "grad_norm": 11.246734619140625, + "learning_rate": 1.8404675790388017e-05, + "loss": 1.0269, + "step": 7590 + }, + { + "epoch": 20.68392370572207, + "grad_norm": 9.77748966217041, + "learning_rate": 1.8404197567498e-05, + "loss": 0.9647, + "step": 7591 + }, + { + "epoch": 20.6866485013624, + "grad_norm": 9.248991966247559, + "learning_rate": 1.840371927915637e-05, + "loss": 0.7554, + "step": 7592 + }, + { + "epoch": 20.689373297002724, + "grad_norm": 10.35046100616455, + "learning_rate": 1.8403240925366842e-05, + "loss": 0.7442, + "step": 7593 + }, + { + "epoch": 20.69209809264305, + "grad_norm": 8.65871524810791, + "learning_rate": 1.8402762506133145e-05, + "loss": 0.7538, + "step": 7594 + }, + { + "epoch": 20.69482288828338, + "grad_norm": 13.182056427001953, + "learning_rate": 1.8402284021459e-05, + "loss": 0.7523, + "step": 7595 + }, + { + "epoch": 20.697547683923705, + "grad_norm": 9.477316856384277, + "learning_rate": 1.840180547134814e-05, + "loss": 0.864, + "step": 7596 + }, + { + "epoch": 20.70027247956403, + "grad_norm": 9.479179382324219, + "learning_rate": 1.8401326855804293e-05, + "loss": 0.7625, + "step": 7597 + }, + { + "epoch": 20.70299727520436, + "grad_norm": 10.778131484985352, + "learning_rate": 1.8400848174831178e-05, + "loss": 0.7231, + "step": 7598 + }, + { + "epoch": 20.705722070844686, + "grad_norm": 9.457087516784668, + "learning_rate": 1.840036942843253e-05, + "loss": 0.9269, + "step": 7599 + }, + { + "epoch": 20.708446866485012, + "grad_norm": 8.120590209960938, + "learning_rate": 1.8399890616612073e-05, + "loss": 0.8187, + "step": 7600 + }, + { + "epoch": 20.71117166212534, + "grad_norm": 9.013141632080078, + "learning_rate": 1.839941173937354e-05, + "loss": 0.7363, + "step": 7601 + }, + { + "epoch": 20.713896457765667, + "grad_norm": 11.750839233398438, + "learning_rate": 1.839893279672066e-05, + "loss": 0.8936, + "step": 7602 + }, + { + "epoch": 20.716621253405993, + "grad_norm": 8.871647834777832, + "learning_rate": 1.839845378865716e-05, + "loss": 0.9536, + "step": 7603 + }, + { + "epoch": 20.719346049046322, + "grad_norm": 8.749375343322754, + "learning_rate": 1.839797471518677e-05, + "loss": 0.9968, + "step": 7604 + }, + { + "epoch": 20.722070844686648, + "grad_norm": 10.805994987487793, + "learning_rate": 1.8397495576313226e-05, + "loss": 0.8442, + "step": 7605 + }, + { + "epoch": 20.724795640326974, + "grad_norm": 11.166732788085938, + "learning_rate": 1.8397016372040256e-05, + "loss": 0.7979, + "step": 7606 + }, + { + "epoch": 20.727520435967303, + "grad_norm": 7.917816638946533, + "learning_rate": 1.8396537102371593e-05, + "loss": 0.6642, + "step": 7607 + }, + { + "epoch": 20.73024523160763, + "grad_norm": 8.999839782714844, + "learning_rate": 1.839605776731097e-05, + "loss": 0.8108, + "step": 7608 + }, + { + "epoch": 20.732970027247955, + "grad_norm": 11.270936965942383, + "learning_rate": 1.839557836686212e-05, + "loss": 0.8053, + "step": 7609 + }, + { + "epoch": 20.735694822888284, + "grad_norm": 8.101061820983887, + "learning_rate": 1.8395098901028774e-05, + "loss": 0.7604, + "step": 7610 + }, + { + "epoch": 20.73841961852861, + "grad_norm": 9.721184730529785, + "learning_rate": 1.8394619369814666e-05, + "loss": 0.9728, + "step": 7611 + }, + { + "epoch": 20.741144414168936, + "grad_norm": 8.81428337097168, + "learning_rate": 1.8394139773223537e-05, + "loss": 0.8023, + "step": 7612 + }, + { + "epoch": 20.743869209809265, + "grad_norm": 9.245955467224121, + "learning_rate": 1.8393660111259116e-05, + "loss": 0.8396, + "step": 7613 + }, + { + "epoch": 20.74659400544959, + "grad_norm": 15.609857559204102, + "learning_rate": 1.839318038392514e-05, + "loss": 0.9071, + "step": 7614 + }, + { + "epoch": 20.749318801089917, + "grad_norm": 7.997469902038574, + "learning_rate": 1.8392700591225346e-05, + "loss": 0.8051, + "step": 7615 + }, + { + "epoch": 20.752043596730246, + "grad_norm": 7.729000091552734, + "learning_rate": 1.8392220733163467e-05, + "loss": 0.7467, + "step": 7616 + }, + { + "epoch": 20.754768392370572, + "grad_norm": 7.590522766113281, + "learning_rate": 1.8391740809743245e-05, + "loss": 0.8373, + "step": 7617 + }, + { + "epoch": 20.757493188010898, + "grad_norm": 8.049286842346191, + "learning_rate": 1.8391260820968417e-05, + "loss": 0.7924, + "step": 7618 + }, + { + "epoch": 20.760217983651227, + "grad_norm": 8.123289108276367, + "learning_rate": 1.8390780766842717e-05, + "loss": 0.8227, + "step": 7619 + }, + { + "epoch": 20.762942779291553, + "grad_norm": 8.064492225646973, + "learning_rate": 1.839030064736989e-05, + "loss": 0.7632, + "step": 7620 + }, + { + "epoch": 20.76566757493188, + "grad_norm": 11.855932235717773, + "learning_rate": 1.838982046255367e-05, + "loss": 0.6485, + "step": 7621 + }, + { + "epoch": 20.768392370572208, + "grad_norm": 8.009469032287598, + "learning_rate": 1.8389340212397797e-05, + "loss": 0.6338, + "step": 7622 + }, + { + "epoch": 20.771117166212534, + "grad_norm": 8.831151008605957, + "learning_rate": 1.8388859896906014e-05, + "loss": 0.6919, + "step": 7623 + }, + { + "epoch": 20.77384196185286, + "grad_norm": 7.897984504699707, + "learning_rate": 1.838837951608206e-05, + "loss": 0.8043, + "step": 7624 + }, + { + "epoch": 20.77656675749319, + "grad_norm": 7.134253025054932, + "learning_rate": 1.8387899069929673e-05, + "loss": 0.8281, + "step": 7625 + }, + { + "epoch": 20.779291553133515, + "grad_norm": 8.043962478637695, + "learning_rate": 1.8387418558452602e-05, + "loss": 1.0161, + "step": 7626 + }, + { + "epoch": 20.78201634877384, + "grad_norm": 9.967580795288086, + "learning_rate": 1.8386937981654583e-05, + "loss": 0.7574, + "step": 7627 + }, + { + "epoch": 20.78474114441417, + "grad_norm": 9.644227981567383, + "learning_rate": 1.8386457339539364e-05, + "loss": 0.6687, + "step": 7628 + }, + { + "epoch": 20.787465940054496, + "grad_norm": 8.344680786132812, + "learning_rate": 1.8385976632110684e-05, + "loss": 0.7148, + "step": 7629 + }, + { + "epoch": 20.79019073569482, + "grad_norm": 9.260910034179688, + "learning_rate": 1.8385495859372288e-05, + "loss": 0.9921, + "step": 7630 + }, + { + "epoch": 20.79291553133515, + "grad_norm": 6.6078314781188965, + "learning_rate": 1.8385015021327916e-05, + "loss": 0.9178, + "step": 7631 + }, + { + "epoch": 20.795640326975477, + "grad_norm": 10.556445121765137, + "learning_rate": 1.838453411798132e-05, + "loss": 0.8213, + "step": 7632 + }, + { + "epoch": 20.798365122615802, + "grad_norm": 8.5899019241333, + "learning_rate": 1.8384053149336243e-05, + "loss": 0.6635, + "step": 7633 + }, + { + "epoch": 20.80108991825613, + "grad_norm": 7.8474650382995605, + "learning_rate": 1.838357211539643e-05, + "loss": 0.7745, + "step": 7634 + }, + { + "epoch": 20.803814713896458, + "grad_norm": 7.122204303741455, + "learning_rate": 1.8383091016165626e-05, + "loss": 0.7743, + "step": 7635 + }, + { + "epoch": 20.806539509536783, + "grad_norm": 9.272528648376465, + "learning_rate": 1.838260985164758e-05, + "loss": 0.8671, + "step": 7636 + }, + { + "epoch": 20.809264305177113, + "grad_norm": 7.35139274597168, + "learning_rate": 1.8382128621846034e-05, + "loss": 0.9444, + "step": 7637 + }, + { + "epoch": 20.81198910081744, + "grad_norm": 9.256814956665039, + "learning_rate": 1.8381647326764744e-05, + "loss": 0.651, + "step": 7638 + }, + { + "epoch": 20.814713896457764, + "grad_norm": 8.758612632751465, + "learning_rate": 1.8381165966407456e-05, + "loss": 0.7474, + "step": 7639 + }, + { + "epoch": 20.817438692098094, + "grad_norm": 8.256421089172363, + "learning_rate": 1.8380684540777914e-05, + "loss": 0.6742, + "step": 7640 + }, + { + "epoch": 20.82016348773842, + "grad_norm": 7.075945854187012, + "learning_rate": 1.8380203049879872e-05, + "loss": 0.8121, + "step": 7641 + }, + { + "epoch": 20.822888283378745, + "grad_norm": 7.424861431121826, + "learning_rate": 1.8379721493717077e-05, + "loss": 0.7523, + "step": 7642 + }, + { + "epoch": 20.825613079019075, + "grad_norm": 8.83095932006836, + "learning_rate": 1.837923987229328e-05, + "loss": 0.8737, + "step": 7643 + }, + { + "epoch": 20.8283378746594, + "grad_norm": 9.214203834533691, + "learning_rate": 1.8378758185612237e-05, + "loss": 0.8524, + "step": 7644 + }, + { + "epoch": 20.831062670299726, + "grad_norm": 8.21826457977295, + "learning_rate": 1.8378276433677692e-05, + "loss": 0.7117, + "step": 7645 + }, + { + "epoch": 20.833787465940055, + "grad_norm": 8.080403327941895, + "learning_rate": 1.83777946164934e-05, + "loss": 0.7695, + "step": 7646 + }, + { + "epoch": 20.83651226158038, + "grad_norm": 7.988407611846924, + "learning_rate": 1.8377312734063113e-05, + "loss": 0.7418, + "step": 7647 + }, + { + "epoch": 20.839237057220707, + "grad_norm": 9.077837944030762, + "learning_rate": 1.8376830786390584e-05, + "loss": 0.6626, + "step": 7648 + }, + { + "epoch": 20.841961852861036, + "grad_norm": 8.081254959106445, + "learning_rate": 1.8376348773479568e-05, + "loss": 0.8218, + "step": 7649 + }, + { + "epoch": 20.844686648501362, + "grad_norm": 7.435146331787109, + "learning_rate": 1.8375866695333814e-05, + "loss": 0.9399, + "step": 7650 + }, + { + "epoch": 20.847411444141688, + "grad_norm": 7.113531112670898, + "learning_rate": 1.8375384551957084e-05, + "loss": 0.8247, + "step": 7651 + }, + { + "epoch": 20.850136239782017, + "grad_norm": 7.996152400970459, + "learning_rate": 1.8374902343353124e-05, + "loss": 0.5957, + "step": 7652 + }, + { + "epoch": 20.852861035422343, + "grad_norm": 8.345686912536621, + "learning_rate": 1.8374420069525697e-05, + "loss": 0.7369, + "step": 7653 + }, + { + "epoch": 20.85558583106267, + "grad_norm": 9.157774925231934, + "learning_rate": 1.8373937730478556e-05, + "loss": 0.8046, + "step": 7654 + }, + { + "epoch": 20.858310626703, + "grad_norm": 8.734550476074219, + "learning_rate": 1.8373455326215458e-05, + "loss": 0.8349, + "step": 7655 + }, + { + "epoch": 20.861035422343324, + "grad_norm": 9.237524032592773, + "learning_rate": 1.8372972856740157e-05, + "loss": 0.7737, + "step": 7656 + }, + { + "epoch": 20.86376021798365, + "grad_norm": 7.846309661865234, + "learning_rate": 1.8372490322056414e-05, + "loss": 0.7671, + "step": 7657 + }, + { + "epoch": 20.86648501362398, + "grad_norm": 7.726889610290527, + "learning_rate": 1.8372007722167987e-05, + "loss": 0.8007, + "step": 7658 + }, + { + "epoch": 20.869209809264305, + "grad_norm": 7.21893310546875, + "learning_rate": 1.8371525057078633e-05, + "loss": 0.7676, + "step": 7659 + }, + { + "epoch": 20.87193460490463, + "grad_norm": 7.970730304718018, + "learning_rate": 1.837104232679211e-05, + "loss": 0.8494, + "step": 7660 + }, + { + "epoch": 20.87465940054496, + "grad_norm": 6.842720031738281, + "learning_rate": 1.837055953131218e-05, + "loss": 0.9396, + "step": 7661 + }, + { + "epoch": 20.877384196185286, + "grad_norm": 8.219659805297852, + "learning_rate": 1.83700766706426e-05, + "loss": 0.9392, + "step": 7662 + }, + { + "epoch": 20.88010899182561, + "grad_norm": 7.09730863571167, + "learning_rate": 1.8369593744787135e-05, + "loss": 0.7419, + "step": 7663 + }, + { + "epoch": 20.88283378746594, + "grad_norm": 7.974386215209961, + "learning_rate": 1.836911075374954e-05, + "loss": 0.7454, + "step": 7664 + }, + { + "epoch": 20.885558583106267, + "grad_norm": 7.594198226928711, + "learning_rate": 1.8368627697533583e-05, + "loss": 0.7988, + "step": 7665 + }, + { + "epoch": 20.888283378746593, + "grad_norm": 8.172731399536133, + "learning_rate": 1.836814457614302e-05, + "loss": 0.9724, + "step": 7666 + }, + { + "epoch": 20.891008174386922, + "grad_norm": 9.023299217224121, + "learning_rate": 1.836766138958162e-05, + "loss": 0.7821, + "step": 7667 + }, + { + "epoch": 20.893732970027248, + "grad_norm": 9.135993957519531, + "learning_rate": 1.836717813785314e-05, + "loss": 0.7178, + "step": 7668 + }, + { + "epoch": 20.896457765667574, + "grad_norm": 8.075799942016602, + "learning_rate": 1.8366694820961346e-05, + "loss": 0.9333, + "step": 7669 + }, + { + "epoch": 20.899182561307903, + "grad_norm": 8.042290687561035, + "learning_rate": 1.8366211438910004e-05, + "loss": 0.9171, + "step": 7670 + }, + { + "epoch": 20.90190735694823, + "grad_norm": 8.95767593383789, + "learning_rate": 1.8365727991702874e-05, + "loss": 0.7039, + "step": 7671 + }, + { + "epoch": 20.904632152588555, + "grad_norm": 10.070302963256836, + "learning_rate": 1.8365244479343723e-05, + "loss": 0.8101, + "step": 7672 + }, + { + "epoch": 20.907356948228884, + "grad_norm": 7.303725719451904, + "learning_rate": 1.836476090183632e-05, + "loss": 0.8423, + "step": 7673 + }, + { + "epoch": 20.91008174386921, + "grad_norm": 8.69246768951416, + "learning_rate": 1.8364277259184428e-05, + "loss": 0.7401, + "step": 7674 + }, + { + "epoch": 20.912806539509535, + "grad_norm": 9.71865463256836, + "learning_rate": 1.8363793551391814e-05, + "loss": 0.881, + "step": 7675 + }, + { + "epoch": 20.915531335149865, + "grad_norm": 8.502640724182129, + "learning_rate": 1.836330977846224e-05, + "loss": 0.5955, + "step": 7676 + }, + { + "epoch": 20.91825613079019, + "grad_norm": 9.499765396118164, + "learning_rate": 1.8362825940399483e-05, + "loss": 0.7382, + "step": 7677 + }, + { + "epoch": 20.920980926430516, + "grad_norm": 8.114084243774414, + "learning_rate": 1.8362342037207308e-05, + "loss": 0.9603, + "step": 7678 + }, + { + "epoch": 20.923705722070846, + "grad_norm": 10.1805419921875, + "learning_rate": 1.836185806888948e-05, + "loss": 0.8999, + "step": 7679 + }, + { + "epoch": 20.92643051771117, + "grad_norm": 7.986012935638428, + "learning_rate": 1.836137403544977e-05, + "loss": 0.8367, + "step": 7680 + }, + { + "epoch": 20.929155313351497, + "grad_norm": 9.502193450927734, + "learning_rate": 1.836088993689195e-05, + "loss": 0.6833, + "step": 7681 + }, + { + "epoch": 20.931880108991827, + "grad_norm": 8.042461395263672, + "learning_rate": 1.836040577321979e-05, + "loss": 0.7908, + "step": 7682 + }, + { + "epoch": 20.934604904632153, + "grad_norm": 8.619714736938477, + "learning_rate": 1.8359921544437055e-05, + "loss": 0.7698, + "step": 7683 + }, + { + "epoch": 20.93732970027248, + "grad_norm": 7.86964750289917, + "learning_rate": 1.835943725054752e-05, + "loss": 0.8191, + "step": 7684 + }, + { + "epoch": 20.940054495912808, + "grad_norm": 8.827571868896484, + "learning_rate": 1.835895289155496e-05, + "loss": 0.8391, + "step": 7685 + }, + { + "epoch": 20.942779291553133, + "grad_norm": 8.40529727935791, + "learning_rate": 1.835846846746314e-05, + "loss": 0.7603, + "step": 7686 + }, + { + "epoch": 20.94550408719346, + "grad_norm": 8.676128387451172, + "learning_rate": 1.835798397827584e-05, + "loss": 0.7245, + "step": 7687 + }, + { + "epoch": 20.94822888283379, + "grad_norm": 9.562548637390137, + "learning_rate": 1.835749942399683e-05, + "loss": 0.7974, + "step": 7688 + }, + { + "epoch": 20.950953678474114, + "grad_norm": 8.225702285766602, + "learning_rate": 1.835701480462988e-05, + "loss": 0.7402, + "step": 7689 + }, + { + "epoch": 20.95367847411444, + "grad_norm": 6.749309062957764, + "learning_rate": 1.8356530120178767e-05, + "loss": 0.7914, + "step": 7690 + }, + { + "epoch": 20.95640326975477, + "grad_norm": 8.198533058166504, + "learning_rate": 1.835604537064727e-05, + "loss": 0.8502, + "step": 7691 + }, + { + "epoch": 20.959128065395095, + "grad_norm": 6.520903587341309, + "learning_rate": 1.8355560556039164e-05, + "loss": 0.6687, + "step": 7692 + }, + { + "epoch": 20.96185286103542, + "grad_norm": 8.739531517028809, + "learning_rate": 1.8355075676358215e-05, + "loss": 0.9065, + "step": 7693 + }, + { + "epoch": 20.96457765667575, + "grad_norm": 7.634159564971924, + "learning_rate": 1.835459073160821e-05, + "loss": 0.6198, + "step": 7694 + }, + { + "epoch": 20.967302452316076, + "grad_norm": 9.236230850219727, + "learning_rate": 1.8354105721792917e-05, + "loss": 0.8596, + "step": 7695 + }, + { + "epoch": 20.970027247956402, + "grad_norm": 7.2085113525390625, + "learning_rate": 1.8353620646916116e-05, + "loss": 0.8096, + "step": 7696 + }, + { + "epoch": 20.97275204359673, + "grad_norm": 7.414519786834717, + "learning_rate": 1.835313550698159e-05, + "loss": 0.8225, + "step": 7697 + }, + { + "epoch": 20.975476839237057, + "grad_norm": 8.842377662658691, + "learning_rate": 1.8352650301993112e-05, + "loss": 0.6714, + "step": 7698 + }, + { + "epoch": 20.978201634877383, + "grad_norm": 8.369305610656738, + "learning_rate": 1.8352165031954468e-05, + "loss": 0.7489, + "step": 7699 + }, + { + "epoch": 20.980926430517712, + "grad_norm": 11.194235801696777, + "learning_rate": 1.8351679696869427e-05, + "loss": 0.8214, + "step": 7700 + }, + { + "epoch": 20.983651226158038, + "grad_norm": 7.6760663986206055, + "learning_rate": 1.835119429674177e-05, + "loss": 0.734, + "step": 7701 + }, + { + "epoch": 20.986376021798364, + "grad_norm": 8.03299331665039, + "learning_rate": 1.8350708831575286e-05, + "loss": 0.8882, + "step": 7702 + }, + { + "epoch": 20.989100817438693, + "grad_norm": 8.684178352355957, + "learning_rate": 1.835022330137375e-05, + "loss": 0.7222, + "step": 7703 + }, + { + "epoch": 20.99182561307902, + "grad_norm": 11.191232681274414, + "learning_rate": 1.834973770614094e-05, + "loss": 0.9777, + "step": 7704 + }, + { + "epoch": 20.994550408719345, + "grad_norm": 7.9103007316589355, + "learning_rate": 1.834925204588064e-05, + "loss": 0.649, + "step": 7705 + }, + { + "epoch": 20.997275204359674, + "grad_norm": 8.560781478881836, + "learning_rate": 1.8348766320596638e-05, + "loss": 0.8652, + "step": 7706 + }, + { + "epoch": 21.0, + "grad_norm": 7.691993236541748, + "learning_rate": 1.8348280530292712e-05, + "loss": 0.7366, + "step": 7707 + }, + { + "epoch": 21.002724795640326, + "grad_norm": 7.323371410369873, + "learning_rate": 1.834779467497265e-05, + "loss": 0.6414, + "step": 7708 + }, + { + "epoch": 21.005449591280655, + "grad_norm": 8.487759590148926, + "learning_rate": 1.834730875464022e-05, + "loss": 0.7064, + "step": 7709 + }, + { + "epoch": 21.00817438692098, + "grad_norm": 7.555262088775635, + "learning_rate": 1.834682276929923e-05, + "loss": 0.9084, + "step": 7710 + }, + { + "epoch": 21.010899182561307, + "grad_norm": 7.268922805786133, + "learning_rate": 1.8346336718953447e-05, + "loss": 0.6943, + "step": 7711 + }, + { + "epoch": 21.013623978201636, + "grad_norm": 6.138815402984619, + "learning_rate": 1.8345850603606666e-05, + "loss": 0.7697, + "step": 7712 + }, + { + "epoch": 21.016348773841962, + "grad_norm": 7.12817907333374, + "learning_rate": 1.8345364423262666e-05, + "loss": 0.6686, + "step": 7713 + }, + { + "epoch": 21.019073569482288, + "grad_norm": 6.738901615142822, + "learning_rate": 1.8344878177925238e-05, + "loss": 0.6882, + "step": 7714 + }, + { + "epoch": 21.021798365122617, + "grad_norm": 7.405285358428955, + "learning_rate": 1.8344391867598164e-05, + "loss": 0.6643, + "step": 7715 + }, + { + "epoch": 21.024523160762943, + "grad_norm": 8.851975440979004, + "learning_rate": 1.8343905492285238e-05, + "loss": 0.7656, + "step": 7716 + }, + { + "epoch": 21.02724795640327, + "grad_norm": 8.151577949523926, + "learning_rate": 1.8343419051990245e-05, + "loss": 0.7937, + "step": 7717 + }, + { + "epoch": 21.029972752043598, + "grad_norm": 7.610278606414795, + "learning_rate": 1.8342932546716973e-05, + "loss": 0.6821, + "step": 7718 + }, + { + "epoch": 21.032697547683924, + "grad_norm": 49.263816833496094, + "learning_rate": 1.8342445976469206e-05, + "loss": 0.7039, + "step": 7719 + }, + { + "epoch": 21.03542234332425, + "grad_norm": 6.417880058288574, + "learning_rate": 1.8341959341250743e-05, + "loss": 0.6281, + "step": 7720 + }, + { + "epoch": 21.03814713896458, + "grad_norm": 7.054736614227295, + "learning_rate": 1.834147264106537e-05, + "loss": 0.6315, + "step": 7721 + }, + { + "epoch": 21.040871934604905, + "grad_norm": 7.179330825805664, + "learning_rate": 1.8340985875916874e-05, + "loss": 0.6987, + "step": 7722 + }, + { + "epoch": 21.04359673024523, + "grad_norm": 8.369280815124512, + "learning_rate": 1.834049904580905e-05, + "loss": 0.8383, + "step": 7723 + }, + { + "epoch": 21.04632152588556, + "grad_norm": 8.203306198120117, + "learning_rate": 1.8340012150745685e-05, + "loss": 0.6147, + "step": 7724 + }, + { + "epoch": 21.049046321525886, + "grad_norm": 8.10911750793457, + "learning_rate": 1.8339525190730577e-05, + "loss": 0.8666, + "step": 7725 + }, + { + "epoch": 21.05177111716621, + "grad_norm": 8.598569869995117, + "learning_rate": 1.833903816576751e-05, + "loss": 0.6295, + "step": 7726 + }, + { + "epoch": 21.05449591280654, + "grad_norm": 8.309627532958984, + "learning_rate": 1.8338551075860288e-05, + "loss": 0.6552, + "step": 7727 + }, + { + "epoch": 21.057220708446867, + "grad_norm": 7.313740253448486, + "learning_rate": 1.83380639210127e-05, + "loss": 0.7542, + "step": 7728 + }, + { + "epoch": 21.059945504087192, + "grad_norm": 7.313722133636475, + "learning_rate": 1.833757670122853e-05, + "loss": 0.647, + "step": 7729 + }, + { + "epoch": 21.06267029972752, + "grad_norm": 7.183590412139893, + "learning_rate": 1.833708941651159e-05, + "loss": 0.7993, + "step": 7730 + }, + { + "epoch": 21.065395095367847, + "grad_norm": 20.81493377685547, + "learning_rate": 1.833660206686566e-05, + "loss": 0.8202, + "step": 7731 + }, + { + "epoch": 21.068119891008173, + "grad_norm": 8.982355117797852, + "learning_rate": 1.8336114652294547e-05, + "loss": 0.7061, + "step": 7732 + }, + { + "epoch": 21.070844686648503, + "grad_norm": 8.355277061462402, + "learning_rate": 1.8335627172802034e-05, + "loss": 0.7621, + "step": 7733 + }, + { + "epoch": 21.07356948228883, + "grad_norm": 11.035460472106934, + "learning_rate": 1.833513962839193e-05, + "loss": 0.6851, + "step": 7734 + }, + { + "epoch": 21.076294277929154, + "grad_norm": 10.80052375793457, + "learning_rate": 1.8334652019068024e-05, + "loss": 0.7092, + "step": 7735 + }, + { + "epoch": 21.079019073569484, + "grad_norm": 8.625014305114746, + "learning_rate": 1.833416434483412e-05, + "loss": 0.707, + "step": 7736 + }, + { + "epoch": 21.08174386920981, + "grad_norm": 9.866307258605957, + "learning_rate": 1.833367660569401e-05, + "loss": 0.8092, + "step": 7737 + }, + { + "epoch": 21.084468664850135, + "grad_norm": 7.818713188171387, + "learning_rate": 1.8333188801651497e-05, + "loss": 0.8223, + "step": 7738 + }, + { + "epoch": 21.087193460490465, + "grad_norm": 6.951756954193115, + "learning_rate": 1.8332700932710375e-05, + "loss": 0.6738, + "step": 7739 + }, + { + "epoch": 21.08991825613079, + "grad_norm": 8.046797752380371, + "learning_rate": 1.8332212998874445e-05, + "loss": 0.7175, + "step": 7740 + }, + { + "epoch": 21.092643051771116, + "grad_norm": 7.292179107666016, + "learning_rate": 1.833172500014751e-05, + "loss": 0.6885, + "step": 7741 + }, + { + "epoch": 21.095367847411445, + "grad_norm": 7.999224662780762, + "learning_rate": 1.8331236936533372e-05, + "loss": 0.6877, + "step": 7742 + }, + { + "epoch": 21.09809264305177, + "grad_norm": 7.979372501373291, + "learning_rate": 1.8330748808035827e-05, + "loss": 0.6896, + "step": 7743 + }, + { + "epoch": 21.100817438692097, + "grad_norm": 8.748741149902344, + "learning_rate": 1.8330260614658674e-05, + "loss": 0.7583, + "step": 7744 + }, + { + "epoch": 21.103542234332426, + "grad_norm": 6.686682224273682, + "learning_rate": 1.8329772356405723e-05, + "loss": 0.906, + "step": 7745 + }, + { + "epoch": 21.106267029972752, + "grad_norm": 6.980701923370361, + "learning_rate": 1.8329284033280775e-05, + "loss": 0.523, + "step": 7746 + }, + { + "epoch": 21.108991825613078, + "grad_norm": 11.001998901367188, + "learning_rate": 1.832879564528763e-05, + "loss": 0.8516, + "step": 7747 + }, + { + "epoch": 21.111716621253407, + "grad_norm": 8.298548698425293, + "learning_rate": 1.832830719243009e-05, + "loss": 0.6667, + "step": 7748 + }, + { + "epoch": 21.114441416893733, + "grad_norm": 11.617433547973633, + "learning_rate": 1.8327818674711965e-05, + "loss": 0.7035, + "step": 7749 + }, + { + "epoch": 21.11716621253406, + "grad_norm": 6.781091213226318, + "learning_rate": 1.832733009213705e-05, + "loss": 0.7485, + "step": 7750 + }, + { + "epoch": 21.11989100817439, + "grad_norm": 8.314715385437012, + "learning_rate": 1.832684144470916e-05, + "loss": 0.8, + "step": 7751 + }, + { + "epoch": 21.122615803814714, + "grad_norm": 7.875467300415039, + "learning_rate": 1.8326352732432103e-05, + "loss": 0.6787, + "step": 7752 + }, + { + "epoch": 21.12534059945504, + "grad_norm": 12.015420913696289, + "learning_rate": 1.8325863955309673e-05, + "loss": 0.7911, + "step": 7753 + }, + { + "epoch": 21.12806539509537, + "grad_norm": 8.246016502380371, + "learning_rate": 1.8325375113345684e-05, + "loss": 0.7249, + "step": 7754 + }, + { + "epoch": 21.130790190735695, + "grad_norm": 7.11991024017334, + "learning_rate": 1.832488620654394e-05, + "loss": 0.7421, + "step": 7755 + }, + { + "epoch": 21.13351498637602, + "grad_norm": 9.072060585021973, + "learning_rate": 1.8324397234908252e-05, + "loss": 0.8292, + "step": 7756 + }, + { + "epoch": 21.13623978201635, + "grad_norm": 10.79595947265625, + "learning_rate": 1.8323908198442423e-05, + "loss": 0.7333, + "step": 7757 + }, + { + "epoch": 21.138964577656676, + "grad_norm": 9.850205421447754, + "learning_rate": 1.8323419097150264e-05, + "loss": 0.786, + "step": 7758 + }, + { + "epoch": 21.141689373297, + "grad_norm": 8.980114936828613, + "learning_rate": 1.832292993103559e-05, + "loss": 0.675, + "step": 7759 + }, + { + "epoch": 21.14441416893733, + "grad_norm": 6.9589009284973145, + "learning_rate": 1.8322440700102203e-05, + "loss": 0.7552, + "step": 7760 + }, + { + "epoch": 21.147138964577657, + "grad_norm": 9.685104370117188, + "learning_rate": 1.8321951404353916e-05, + "loss": 0.7158, + "step": 7761 + }, + { + "epoch": 21.149863760217983, + "grad_norm": 7.686063289642334, + "learning_rate": 1.8321462043794538e-05, + "loss": 0.9153, + "step": 7762 + }, + { + "epoch": 21.152588555858312, + "grad_norm": 7.35426664352417, + "learning_rate": 1.8320972618427885e-05, + "loss": 0.7068, + "step": 7763 + }, + { + "epoch": 21.155313351498638, + "grad_norm": 8.867984771728516, + "learning_rate": 1.832048312825776e-05, + "loss": 0.8534, + "step": 7764 + }, + { + "epoch": 21.158038147138964, + "grad_norm": 7.1844096183776855, + "learning_rate": 1.8319993573287984e-05, + "loss": 0.9589, + "step": 7765 + }, + { + "epoch": 21.160762942779293, + "grad_norm": 8.416938781738281, + "learning_rate": 1.8319503953522368e-05, + "loss": 0.6345, + "step": 7766 + }, + { + "epoch": 21.16348773841962, + "grad_norm": 7.446508407592773, + "learning_rate": 1.8319014268964718e-05, + "loss": 0.667, + "step": 7767 + }, + { + "epoch": 21.166212534059945, + "grad_norm": 8.560457229614258, + "learning_rate": 1.8318524519618853e-05, + "loss": 0.6437, + "step": 7768 + }, + { + "epoch": 21.168937329700274, + "grad_norm": 7.70897102355957, + "learning_rate": 1.831803470548859e-05, + "loss": 0.5842, + "step": 7769 + }, + { + "epoch": 21.1716621253406, + "grad_norm": 7.899026393890381, + "learning_rate": 1.8317544826577738e-05, + "loss": 0.7852, + "step": 7770 + }, + { + "epoch": 21.174386920980925, + "grad_norm": 7.9237823486328125, + "learning_rate": 1.8317054882890114e-05, + "loss": 0.7289, + "step": 7771 + }, + { + "epoch": 21.177111716621255, + "grad_norm": 8.078022956848145, + "learning_rate": 1.8316564874429535e-05, + "loss": 0.7711, + "step": 7772 + }, + { + "epoch": 21.17983651226158, + "grad_norm": 6.839797019958496, + "learning_rate": 1.831607480119982e-05, + "loss": 0.5835, + "step": 7773 + }, + { + "epoch": 21.182561307901906, + "grad_norm": 8.098297119140625, + "learning_rate": 1.8315584663204776e-05, + "loss": 0.7346, + "step": 7774 + }, + { + "epoch": 21.185286103542236, + "grad_norm": 7.693576812744141, + "learning_rate": 1.8315094460448232e-05, + "loss": 0.6617, + "step": 7775 + }, + { + "epoch": 21.18801089918256, + "grad_norm": 8.116175651550293, + "learning_rate": 1.8314604192933997e-05, + "loss": 0.7086, + "step": 7776 + }, + { + "epoch": 21.190735694822887, + "grad_norm": 8.301321983337402, + "learning_rate": 1.8314113860665892e-05, + "loss": 0.8246, + "step": 7777 + }, + { + "epoch": 21.193460490463217, + "grad_norm": 12.183932304382324, + "learning_rate": 1.8313623463647736e-05, + "loss": 0.77, + "step": 7778 + }, + { + "epoch": 21.196185286103542, + "grad_norm": 7.684350490570068, + "learning_rate": 1.831313300188335e-05, + "loss": 0.7761, + "step": 7779 + }, + { + "epoch": 21.19891008174387, + "grad_norm": 8.239131927490234, + "learning_rate": 1.8312642475376547e-05, + "loss": 0.7188, + "step": 7780 + }, + { + "epoch": 21.201634877384198, + "grad_norm": 9.018391609191895, + "learning_rate": 1.8312151884131157e-05, + "loss": 0.7761, + "step": 7781 + }, + { + "epoch": 21.204359673024523, + "grad_norm": 8.890396118164062, + "learning_rate": 1.8311661228150994e-05, + "loss": 0.6096, + "step": 7782 + }, + { + "epoch": 21.20708446866485, + "grad_norm": 7.6317548751831055, + "learning_rate": 1.8311170507439878e-05, + "loss": 0.8057, + "step": 7783 + }, + { + "epoch": 21.20980926430518, + "grad_norm": 7.228536128997803, + "learning_rate": 1.8310679722001638e-05, + "loss": 0.6051, + "step": 7784 + }, + { + "epoch": 21.212534059945504, + "grad_norm": 9.289490699768066, + "learning_rate": 1.831018887184009e-05, + "loss": 0.8712, + "step": 7785 + }, + { + "epoch": 21.21525885558583, + "grad_norm": 8.295319557189941, + "learning_rate": 1.8309697956959057e-05, + "loss": 0.6566, + "step": 7786 + }, + { + "epoch": 21.21798365122616, + "grad_norm": 9.994537353515625, + "learning_rate": 1.8309206977362367e-05, + "loss": 1.0121, + "step": 7787 + }, + { + "epoch": 21.220708446866485, + "grad_norm": 9.828986167907715, + "learning_rate": 1.8308715933053836e-05, + "loss": 0.6002, + "step": 7788 + }, + { + "epoch": 21.22343324250681, + "grad_norm": 8.134908676147461, + "learning_rate": 1.8308224824037295e-05, + "loss": 0.8085, + "step": 7789 + }, + { + "epoch": 21.22615803814714, + "grad_norm": 8.998791694641113, + "learning_rate": 1.8307733650316567e-05, + "loss": 0.6447, + "step": 7790 + }, + { + "epoch": 21.228882833787466, + "grad_norm": 6.333938121795654, + "learning_rate": 1.8307242411895478e-05, + "loss": 0.8348, + "step": 7791 + }, + { + "epoch": 21.231607629427792, + "grad_norm": 6.362037658691406, + "learning_rate": 1.8306751108777853e-05, + "loss": 0.6097, + "step": 7792 + }, + { + "epoch": 21.23433242506812, + "grad_norm": 6.66240930557251, + "learning_rate": 1.8306259740967515e-05, + "loss": 0.6624, + "step": 7793 + }, + { + "epoch": 21.237057220708447, + "grad_norm": 9.169851303100586, + "learning_rate": 1.8305768308468294e-05, + "loss": 0.7953, + "step": 7794 + }, + { + "epoch": 21.239782016348773, + "grad_norm": 8.247089385986328, + "learning_rate": 1.8305276811284013e-05, + "loss": 0.6312, + "step": 7795 + }, + { + "epoch": 21.242506811989102, + "grad_norm": 7.682947158813477, + "learning_rate": 1.8304785249418508e-05, + "loss": 0.7508, + "step": 7796 + }, + { + "epoch": 21.245231607629428, + "grad_norm": 7.679996013641357, + "learning_rate": 1.8304293622875603e-05, + "loss": 0.6304, + "step": 7797 + }, + { + "epoch": 21.247956403269754, + "grad_norm": 7.897690773010254, + "learning_rate": 1.8303801931659127e-05, + "loss": 0.9888, + "step": 7798 + }, + { + "epoch": 21.250681198910083, + "grad_norm": 7.268885612487793, + "learning_rate": 1.8303310175772905e-05, + "loss": 0.7899, + "step": 7799 + }, + { + "epoch": 21.25340599455041, + "grad_norm": 7.545280456542969, + "learning_rate": 1.8302818355220776e-05, + "loss": 0.6075, + "step": 7800 + }, + { + "epoch": 21.256130790190735, + "grad_norm": 7.544144630432129, + "learning_rate": 1.8302326470006562e-05, + "loss": 0.8575, + "step": 7801 + }, + { + "epoch": 21.258855585831064, + "grad_norm": 6.4075164794921875, + "learning_rate": 1.8301834520134098e-05, + "loss": 0.7751, + "step": 7802 + }, + { + "epoch": 21.26158038147139, + "grad_norm": 7.582212448120117, + "learning_rate": 1.830134250560721e-05, + "loss": 0.6442, + "step": 7803 + }, + { + "epoch": 21.264305177111716, + "grad_norm": 9.166476249694824, + "learning_rate": 1.8300850426429738e-05, + "loss": 0.7045, + "step": 7804 + }, + { + "epoch": 21.267029972752045, + "grad_norm": 8.270711898803711, + "learning_rate": 1.830035828260551e-05, + "loss": 0.5986, + "step": 7805 + }, + { + "epoch": 21.26975476839237, + "grad_norm": 8.354194641113281, + "learning_rate": 1.8299866074138356e-05, + "loss": 0.672, + "step": 7806 + }, + { + "epoch": 21.272479564032697, + "grad_norm": 7.5973896980285645, + "learning_rate": 1.829937380103211e-05, + "loss": 0.6956, + "step": 7807 + }, + { + "epoch": 21.275204359673026, + "grad_norm": 9.056324005126953, + "learning_rate": 1.8298881463290613e-05, + "loss": 0.8167, + "step": 7808 + }, + { + "epoch": 21.277929155313352, + "grad_norm": 8.447535514831543, + "learning_rate": 1.8298389060917696e-05, + "loss": 0.6823, + "step": 7809 + }, + { + "epoch": 21.280653950953678, + "grad_norm": 6.850573539733887, + "learning_rate": 1.8297896593917187e-05, + "loss": 0.6815, + "step": 7810 + }, + { + "epoch": 21.283378746594007, + "grad_norm": 9.523035049438477, + "learning_rate": 1.8297404062292927e-05, + "loss": 0.6124, + "step": 7811 + }, + { + "epoch": 21.286103542234333, + "grad_norm": 8.456561088562012, + "learning_rate": 1.8296911466048754e-05, + "loss": 0.7413, + "step": 7812 + }, + { + "epoch": 21.28882833787466, + "grad_norm": 6.094063758850098, + "learning_rate": 1.82964188051885e-05, + "loss": 0.6749, + "step": 7813 + }, + { + "epoch": 21.291553133514988, + "grad_norm": 7.415526866912842, + "learning_rate": 1.8295926079716002e-05, + "loss": 0.7262, + "step": 7814 + }, + { + "epoch": 21.294277929155314, + "grad_norm": 6.7150654792785645, + "learning_rate": 1.82954332896351e-05, + "loss": 0.6599, + "step": 7815 + }, + { + "epoch": 21.29700272479564, + "grad_norm": 8.221084594726562, + "learning_rate": 1.829494043494963e-05, + "loss": 0.7855, + "step": 7816 + }, + { + "epoch": 21.29972752043597, + "grad_norm": 7.059593200683594, + "learning_rate": 1.829444751566343e-05, + "loss": 0.7522, + "step": 7817 + }, + { + "epoch": 21.302452316076295, + "grad_norm": 8.087608337402344, + "learning_rate": 1.829395453178034e-05, + "loss": 0.6614, + "step": 7818 + }, + { + "epoch": 21.30517711171662, + "grad_norm": 7.509298801422119, + "learning_rate": 1.8293461483304203e-05, + "loss": 0.8376, + "step": 7819 + }, + { + "epoch": 21.30790190735695, + "grad_norm": 8.698942184448242, + "learning_rate": 1.8292968370238852e-05, + "loss": 0.6471, + "step": 7820 + }, + { + "epoch": 21.310626702997276, + "grad_norm": 7.400518417358398, + "learning_rate": 1.829247519258813e-05, + "loss": 0.7327, + "step": 7821 + }, + { + "epoch": 21.3133514986376, + "grad_norm": 7.770204067230225, + "learning_rate": 1.8291981950355878e-05, + "loss": 0.7166, + "step": 7822 + }, + { + "epoch": 21.31607629427793, + "grad_norm": 9.752872467041016, + "learning_rate": 1.829148864354594e-05, + "loss": 0.6592, + "step": 7823 + }, + { + "epoch": 21.318801089918257, + "grad_norm": 8.794660568237305, + "learning_rate": 1.829099527216215e-05, + "loss": 0.6592, + "step": 7824 + }, + { + "epoch": 21.321525885558582, + "grad_norm": 8.04993724822998, + "learning_rate": 1.8290501836208357e-05, + "loss": 0.7495, + "step": 7825 + }, + { + "epoch": 21.32425068119891, + "grad_norm": 9.428915023803711, + "learning_rate": 1.8290008335688404e-05, + "loss": 0.7839, + "step": 7826 + }, + { + "epoch": 21.326975476839237, + "grad_norm": 8.758989334106445, + "learning_rate": 1.8289514770606133e-05, + "loss": 0.7225, + "step": 7827 + }, + { + "epoch": 21.329700272479563, + "grad_norm": 7.357696056365967, + "learning_rate": 1.828902114096539e-05, + "loss": 0.7797, + "step": 7828 + }, + { + "epoch": 21.332425068119893, + "grad_norm": 7.127198696136475, + "learning_rate": 1.8288527446770015e-05, + "loss": 0.6018, + "step": 7829 + }, + { + "epoch": 21.33514986376022, + "grad_norm": 8.083072662353516, + "learning_rate": 1.8288033688023855e-05, + "loss": 0.7021, + "step": 7830 + }, + { + "epoch": 21.337874659400544, + "grad_norm": 39.04533767700195, + "learning_rate": 1.8287539864730756e-05, + "loss": 0.6806, + "step": 7831 + }, + { + "epoch": 21.340599455040874, + "grad_norm": 7.802813529968262, + "learning_rate": 1.8287045976894563e-05, + "loss": 0.7299, + "step": 7832 + }, + { + "epoch": 21.3433242506812, + "grad_norm": 7.451691627502441, + "learning_rate": 1.828655202451912e-05, + "loss": 0.7479, + "step": 7833 + }, + { + "epoch": 21.346049046321525, + "grad_norm": 8.16508960723877, + "learning_rate": 1.828605800760828e-05, + "loss": 0.6664, + "step": 7834 + }, + { + "epoch": 21.348773841961854, + "grad_norm": 8.571643829345703, + "learning_rate": 1.8285563926165884e-05, + "loss": 0.7836, + "step": 7835 + }, + { + "epoch": 21.35149863760218, + "grad_norm": 8.905378341674805, + "learning_rate": 1.8285069780195787e-05, + "loss": 0.7247, + "step": 7836 + }, + { + "epoch": 21.354223433242506, + "grad_norm": 8.476143836975098, + "learning_rate": 1.828457556970183e-05, + "loss": 0.9014, + "step": 7837 + }, + { + "epoch": 21.356948228882835, + "grad_norm": 9.995495796203613, + "learning_rate": 1.8284081294687866e-05, + "loss": 0.7649, + "step": 7838 + }, + { + "epoch": 21.35967302452316, + "grad_norm": 7.34924840927124, + "learning_rate": 1.8283586955157744e-05, + "loss": 0.6138, + "step": 7839 + }, + { + "epoch": 21.362397820163487, + "grad_norm": 8.554211616516113, + "learning_rate": 1.8283092551115312e-05, + "loss": 0.6246, + "step": 7840 + }, + { + "epoch": 21.365122615803816, + "grad_norm": 9.853658676147461, + "learning_rate": 1.8282598082564423e-05, + "loss": 0.6639, + "step": 7841 + }, + { + "epoch": 21.367847411444142, + "grad_norm": 9.210776329040527, + "learning_rate": 1.828210354950893e-05, + "loss": 0.7076, + "step": 7842 + }, + { + "epoch": 21.370572207084468, + "grad_norm": 10.371861457824707, + "learning_rate": 1.8281608951952675e-05, + "loss": 0.7557, + "step": 7843 + }, + { + "epoch": 21.373297002724797, + "grad_norm": 9.623146057128906, + "learning_rate": 1.8281114289899515e-05, + "loss": 0.8533, + "step": 7844 + }, + { + "epoch": 21.376021798365123, + "grad_norm": 14.123766899108887, + "learning_rate": 1.8280619563353307e-05, + "loss": 0.7615, + "step": 7845 + }, + { + "epoch": 21.37874659400545, + "grad_norm": 8.241548538208008, + "learning_rate": 1.8280124772317903e-05, + "loss": 0.7469, + "step": 7846 + }, + { + "epoch": 21.381471389645778, + "grad_norm": 9.194026947021484, + "learning_rate": 1.827962991679715e-05, + "loss": 0.8611, + "step": 7847 + }, + { + "epoch": 21.384196185286104, + "grad_norm": 9.951804161071777, + "learning_rate": 1.8279134996794904e-05, + "loss": 0.7452, + "step": 7848 + }, + { + "epoch": 21.38692098092643, + "grad_norm": 9.589630126953125, + "learning_rate": 1.8278640012315026e-05, + "loss": 0.8759, + "step": 7849 + }, + { + "epoch": 21.38964577656676, + "grad_norm": 8.136022567749023, + "learning_rate": 1.8278144963361363e-05, + "loss": 0.8513, + "step": 7850 + }, + { + "epoch": 21.392370572207085, + "grad_norm": 7.128570079803467, + "learning_rate": 1.8277649849937776e-05, + "loss": 0.601, + "step": 7851 + }, + { + "epoch": 21.39509536784741, + "grad_norm": 8.721702575683594, + "learning_rate": 1.8277154672048117e-05, + "loss": 0.8491, + "step": 7852 + }, + { + "epoch": 21.39782016348774, + "grad_norm": 10.861640930175781, + "learning_rate": 1.827665942969624e-05, + "loss": 0.8474, + "step": 7853 + }, + { + "epoch": 21.400544959128066, + "grad_norm": 9.07026195526123, + "learning_rate": 1.827616412288601e-05, + "loss": 0.7765, + "step": 7854 + }, + { + "epoch": 21.40326975476839, + "grad_norm": 10.966297149658203, + "learning_rate": 1.827566875162128e-05, + "loss": 0.7677, + "step": 7855 + }, + { + "epoch": 21.40599455040872, + "grad_norm": 7.402095317840576, + "learning_rate": 1.827517331590591e-05, + "loss": 0.6769, + "step": 7856 + }, + { + "epoch": 21.408719346049047, + "grad_norm": 9.250561714172363, + "learning_rate": 1.827467781574375e-05, + "loss": 0.7842, + "step": 7857 + }, + { + "epoch": 21.411444141689373, + "grad_norm": 8.343886375427246, + "learning_rate": 1.827418225113867e-05, + "loss": 0.7271, + "step": 7858 + }, + { + "epoch": 21.414168937329702, + "grad_norm": 9.130738258361816, + "learning_rate": 1.8273686622094528e-05, + "loss": 0.9478, + "step": 7859 + }, + { + "epoch": 21.416893732970028, + "grad_norm": 8.603825569152832, + "learning_rate": 1.8273190928615175e-05, + "loss": 0.723, + "step": 7860 + }, + { + "epoch": 21.419618528610354, + "grad_norm": 8.468642234802246, + "learning_rate": 1.827269517070448e-05, + "loss": 0.8052, + "step": 7861 + }, + { + "epoch": 21.422343324250683, + "grad_norm": 9.678513526916504, + "learning_rate": 1.82721993483663e-05, + "loss": 0.7749, + "step": 7862 + }, + { + "epoch": 21.42506811989101, + "grad_norm": 8.318564414978027, + "learning_rate": 1.82717034616045e-05, + "loss": 0.8833, + "step": 7863 + }, + { + "epoch": 21.427792915531334, + "grad_norm": 9.165751457214355, + "learning_rate": 1.8271207510422936e-05, + "loss": 0.6578, + "step": 7864 + }, + { + "epoch": 21.430517711171664, + "grad_norm": 9.25309944152832, + "learning_rate": 1.827071149482548e-05, + "loss": 0.8782, + "step": 7865 + }, + { + "epoch": 21.43324250681199, + "grad_norm": 7.358325481414795, + "learning_rate": 1.8270215414815983e-05, + "loss": 0.7503, + "step": 7866 + }, + { + "epoch": 21.435967302452315, + "grad_norm": 10.131277084350586, + "learning_rate": 1.826971927039832e-05, + "loss": 0.8035, + "step": 7867 + }, + { + "epoch": 21.438692098092645, + "grad_norm": 6.802368640899658, + "learning_rate": 1.8269223061576345e-05, + "loss": 0.5909, + "step": 7868 + }, + { + "epoch": 21.44141689373297, + "grad_norm": 7.230935573577881, + "learning_rate": 1.8268726788353928e-05, + "loss": 0.6816, + "step": 7869 + }, + { + "epoch": 21.444141689373296, + "grad_norm": 8.83212947845459, + "learning_rate": 1.8268230450734933e-05, + "loss": 0.7934, + "step": 7870 + }, + { + "epoch": 21.446866485013626, + "grad_norm": 10.197222709655762, + "learning_rate": 1.8267734048723227e-05, + "loss": 0.7797, + "step": 7871 + }, + { + "epoch": 21.44959128065395, + "grad_norm": 7.890384197235107, + "learning_rate": 1.826723758232267e-05, + "loss": 0.7396, + "step": 7872 + }, + { + "epoch": 21.452316076294277, + "grad_norm": 22.438573837280273, + "learning_rate": 1.8266741051537138e-05, + "loss": 0.7768, + "step": 7873 + }, + { + "epoch": 21.455040871934607, + "grad_norm": 8.331838607788086, + "learning_rate": 1.826624445637049e-05, + "loss": 0.7235, + "step": 7874 + }, + { + "epoch": 21.457765667574932, + "grad_norm": 8.330008506774902, + "learning_rate": 1.82657477968266e-05, + "loss": 0.794, + "step": 7875 + }, + { + "epoch": 21.460490463215258, + "grad_norm": 8.820117950439453, + "learning_rate": 1.8265251072909325e-05, + "loss": 0.726, + "step": 7876 + }, + { + "epoch": 21.463215258855588, + "grad_norm": 8.135759353637695, + "learning_rate": 1.8264754284622544e-05, + "loss": 0.7684, + "step": 7877 + }, + { + "epoch": 21.465940054495913, + "grad_norm": 8.72147274017334, + "learning_rate": 1.8264257431970126e-05, + "loss": 0.6674, + "step": 7878 + }, + { + "epoch": 21.46866485013624, + "grad_norm": 9.059609413146973, + "learning_rate": 1.8263760514955934e-05, + "loss": 0.6546, + "step": 7879 + }, + { + "epoch": 21.47138964577657, + "grad_norm": 8.65694522857666, + "learning_rate": 1.826326353358384e-05, + "loss": 0.6604, + "step": 7880 + }, + { + "epoch": 21.474114441416894, + "grad_norm": 16.3781795501709, + "learning_rate": 1.826276648785772e-05, + "loss": 0.79, + "step": 7881 + }, + { + "epoch": 21.47683923705722, + "grad_norm": 8.262587547302246, + "learning_rate": 1.8262269377781433e-05, + "loss": 0.8599, + "step": 7882 + }, + { + "epoch": 21.479564032697546, + "grad_norm": 10.127559661865234, + "learning_rate": 1.8261772203358864e-05, + "loss": 0.806, + "step": 7883 + }, + { + "epoch": 21.482288828337875, + "grad_norm": 8.68094253540039, + "learning_rate": 1.826127496459388e-05, + "loss": 0.8834, + "step": 7884 + }, + { + "epoch": 21.4850136239782, + "grad_norm": 10.492690086364746, + "learning_rate": 1.8260777661490346e-05, + "loss": 0.8959, + "step": 7885 + }, + { + "epoch": 21.48773841961853, + "grad_norm": 9.7289457321167, + "learning_rate": 1.8260280294052147e-05, + "loss": 0.6808, + "step": 7886 + }, + { + "epoch": 21.490463215258856, + "grad_norm": 8.183979988098145, + "learning_rate": 1.825978286228315e-05, + "loss": 0.6351, + "step": 7887 + }, + { + "epoch": 21.493188010899182, + "grad_norm": 7.9571452140808105, + "learning_rate": 1.825928536618723e-05, + "loss": 0.884, + "step": 7888 + }, + { + "epoch": 21.495912806539508, + "grad_norm": 7.1114678382873535, + "learning_rate": 1.825878780576826e-05, + "loss": 0.7722, + "step": 7889 + }, + { + "epoch": 21.498637602179837, + "grad_norm": 9.125557899475098, + "learning_rate": 1.8258290181030118e-05, + "loss": 0.7119, + "step": 7890 + }, + { + "epoch": 21.501362397820163, + "grad_norm": 8.275768280029297, + "learning_rate": 1.8257792491976676e-05, + "loss": 0.7316, + "step": 7891 + }, + { + "epoch": 21.504087193460492, + "grad_norm": 6.560149669647217, + "learning_rate": 1.8257294738611814e-05, + "loss": 0.6208, + "step": 7892 + }, + { + "epoch": 21.506811989100818, + "grad_norm": 11.462034225463867, + "learning_rate": 1.8256796920939405e-05, + "loss": 0.6605, + "step": 7893 + }, + { + "epoch": 21.509536784741144, + "grad_norm": 9.567168235778809, + "learning_rate": 1.8256299038963326e-05, + "loss": 0.7499, + "step": 7894 + }, + { + "epoch": 21.51226158038147, + "grad_norm": 8.80770492553711, + "learning_rate": 1.8255801092687456e-05, + "loss": 0.6636, + "step": 7895 + }, + { + "epoch": 21.5149863760218, + "grad_norm": 7.371953010559082, + "learning_rate": 1.8255303082115676e-05, + "loss": 0.666, + "step": 7896 + }, + { + "epoch": 21.517711171662125, + "grad_norm": 9.620489120483398, + "learning_rate": 1.825480500725186e-05, + "loss": 0.9453, + "step": 7897 + }, + { + "epoch": 21.520435967302454, + "grad_norm": 10.59334945678711, + "learning_rate": 1.8254306868099885e-05, + "loss": 0.9546, + "step": 7898 + }, + { + "epoch": 21.52316076294278, + "grad_norm": 8.24769115447998, + "learning_rate": 1.8253808664663636e-05, + "loss": 0.582, + "step": 7899 + }, + { + "epoch": 21.525885558583106, + "grad_norm": 8.952377319335938, + "learning_rate": 1.8253310396946992e-05, + "loss": 0.7687, + "step": 7900 + }, + { + "epoch": 21.52861035422343, + "grad_norm": 8.575875282287598, + "learning_rate": 1.8252812064953832e-05, + "loss": 0.7123, + "step": 7901 + }, + { + "epoch": 21.53133514986376, + "grad_norm": 8.191732406616211, + "learning_rate": 1.8252313668688036e-05, + "loss": 0.7455, + "step": 7902 + }, + { + "epoch": 21.534059945504087, + "grad_norm": 8.31759262084961, + "learning_rate": 1.825181520815349e-05, + "loss": 0.7352, + "step": 7903 + }, + { + "epoch": 21.536784741144416, + "grad_norm": 7.698764324188232, + "learning_rate": 1.825131668335407e-05, + "loss": 0.6262, + "step": 7904 + }, + { + "epoch": 21.539509536784742, + "grad_norm": 8.273205757141113, + "learning_rate": 1.825081809429366e-05, + "loss": 0.6234, + "step": 7905 + }, + { + "epoch": 21.542234332425068, + "grad_norm": 8.954992294311523, + "learning_rate": 1.8250319440976146e-05, + "loss": 0.6729, + "step": 7906 + }, + { + "epoch": 21.544959128065393, + "grad_norm": 6.745213985443115, + "learning_rate": 1.824982072340541e-05, + "loss": 0.6978, + "step": 7907 + }, + { + "epoch": 21.547683923705723, + "grad_norm": 10.402472496032715, + "learning_rate": 1.8249321941585333e-05, + "loss": 0.6672, + "step": 7908 + }, + { + "epoch": 21.55040871934605, + "grad_norm": 11.216215133666992, + "learning_rate": 1.8248823095519804e-05, + "loss": 0.9177, + "step": 7909 + }, + { + "epoch": 21.553133514986374, + "grad_norm": 8.769536018371582, + "learning_rate": 1.824832418521271e-05, + "loss": 0.812, + "step": 7910 + }, + { + "epoch": 21.555858310626704, + "grad_norm": 8.631336212158203, + "learning_rate": 1.8247825210667926e-05, + "loss": 0.772, + "step": 7911 + }, + { + "epoch": 21.55858310626703, + "grad_norm": 10.451501846313477, + "learning_rate": 1.8247326171889346e-05, + "loss": 0.7401, + "step": 7912 + }, + { + "epoch": 21.561307901907355, + "grad_norm": 7.815615653991699, + "learning_rate": 1.824682706888086e-05, + "loss": 0.7202, + "step": 7913 + }, + { + "epoch": 21.564032697547685, + "grad_norm": 7.0563740730285645, + "learning_rate": 1.8246327901646344e-05, + "loss": 0.8525, + "step": 7914 + }, + { + "epoch": 21.56675749318801, + "grad_norm": 8.432811737060547, + "learning_rate": 1.8245828670189697e-05, + "loss": 0.6382, + "step": 7915 + }, + { + "epoch": 21.569482288828336, + "grad_norm": 10.904496192932129, + "learning_rate": 1.8245329374514803e-05, + "loss": 0.6903, + "step": 7916 + }, + { + "epoch": 21.572207084468666, + "grad_norm": 7.396626949310303, + "learning_rate": 1.8244830014625546e-05, + "loss": 0.6741, + "step": 7917 + }, + { + "epoch": 21.57493188010899, + "grad_norm": 7.294145584106445, + "learning_rate": 1.8244330590525817e-05, + "loss": 0.6677, + "step": 7918 + }, + { + "epoch": 21.577656675749317, + "grad_norm": 8.535848617553711, + "learning_rate": 1.8243831102219507e-05, + "loss": 0.871, + "step": 7919 + }, + { + "epoch": 21.580381471389646, + "grad_norm": 8.005303382873535, + "learning_rate": 1.8243331549710505e-05, + "loss": 0.5657, + "step": 7920 + }, + { + "epoch": 21.583106267029972, + "grad_norm": 10.448698997497559, + "learning_rate": 1.8242831933002704e-05, + "loss": 0.5724, + "step": 7921 + }, + { + "epoch": 21.585831062670298, + "grad_norm": 8.847328186035156, + "learning_rate": 1.8242332252099994e-05, + "loss": 0.8586, + "step": 7922 + }, + { + "epoch": 21.588555858310627, + "grad_norm": 8.258277893066406, + "learning_rate": 1.8241832507006265e-05, + "loss": 0.718, + "step": 7923 + }, + { + "epoch": 21.591280653950953, + "grad_norm": 9.496620178222656, + "learning_rate": 1.824133269772541e-05, + "loss": 0.8494, + "step": 7924 + }, + { + "epoch": 21.59400544959128, + "grad_norm": 14.107674598693848, + "learning_rate": 1.824083282426132e-05, + "loss": 0.6569, + "step": 7925 + }, + { + "epoch": 21.59673024523161, + "grad_norm": 9.128961563110352, + "learning_rate": 1.824033288661789e-05, + "loss": 0.7015, + "step": 7926 + }, + { + "epoch": 21.599455040871934, + "grad_norm": 10.131857872009277, + "learning_rate": 1.823983288479901e-05, + "loss": 0.6528, + "step": 7927 + }, + { + "epoch": 21.60217983651226, + "grad_norm": 9.59658145904541, + "learning_rate": 1.823933281880858e-05, + "loss": 0.8142, + "step": 7928 + }, + { + "epoch": 21.60490463215259, + "grad_norm": 8.79918098449707, + "learning_rate": 1.823883268865049e-05, + "loss": 0.7122, + "step": 7929 + }, + { + "epoch": 21.607629427792915, + "grad_norm": 7.878252029418945, + "learning_rate": 1.823833249432864e-05, + "loss": 0.7546, + "step": 7930 + }, + { + "epoch": 21.61035422343324, + "grad_norm": 9.626506805419922, + "learning_rate": 1.8237832235846916e-05, + "loss": 0.7728, + "step": 7931 + }, + { + "epoch": 21.61307901907357, + "grad_norm": 9.732280731201172, + "learning_rate": 1.8237331913209223e-05, + "loss": 0.7407, + "step": 7932 + }, + { + "epoch": 21.615803814713896, + "grad_norm": 7.609302997589111, + "learning_rate": 1.8236831526419453e-05, + "loss": 0.5814, + "step": 7933 + }, + { + "epoch": 21.618528610354222, + "grad_norm": 9.080131530761719, + "learning_rate": 1.8236331075481503e-05, + "loss": 0.6292, + "step": 7934 + }, + { + "epoch": 21.62125340599455, + "grad_norm": 9.119004249572754, + "learning_rate": 1.8235830560399273e-05, + "loss": 0.6587, + "step": 7935 + }, + { + "epoch": 21.623978201634877, + "grad_norm": 9.003334999084473, + "learning_rate": 1.823532998117666e-05, + "loss": 0.7407, + "step": 7936 + }, + { + "epoch": 21.626702997275203, + "grad_norm": 11.348891258239746, + "learning_rate": 1.8234829337817562e-05, + "loss": 0.739, + "step": 7937 + }, + { + "epoch": 21.629427792915532, + "grad_norm": 7.240442752838135, + "learning_rate": 1.8234328630325876e-05, + "loss": 0.8259, + "step": 7938 + }, + { + "epoch": 21.632152588555858, + "grad_norm": 12.556734085083008, + "learning_rate": 1.8233827858705507e-05, + "loss": 0.8721, + "step": 7939 + }, + { + "epoch": 21.634877384196184, + "grad_norm": 8.399681091308594, + "learning_rate": 1.823332702296035e-05, + "loss": 0.7849, + "step": 7940 + }, + { + "epoch": 21.637602179836513, + "grad_norm": 9.10388469696045, + "learning_rate": 1.8232826123094308e-05, + "loss": 0.6383, + "step": 7941 + }, + { + "epoch": 21.64032697547684, + "grad_norm": 7.981561183929443, + "learning_rate": 1.823232515911128e-05, + "loss": 0.8083, + "step": 7942 + }, + { + "epoch": 21.643051771117165, + "grad_norm": 7.688388347625732, + "learning_rate": 1.8231824131015166e-05, + "loss": 0.5851, + "step": 7943 + }, + { + "epoch": 21.645776566757494, + "grad_norm": 7.962990760803223, + "learning_rate": 1.823132303880988e-05, + "loss": 0.6984, + "step": 7944 + }, + { + "epoch": 21.64850136239782, + "grad_norm": 8.506324768066406, + "learning_rate": 1.8230821882499307e-05, + "loss": 0.8352, + "step": 7945 + }, + { + "epoch": 21.651226158038146, + "grad_norm": 9.10961627960205, + "learning_rate": 1.823032066208736e-05, + "loss": 0.8057, + "step": 7946 + }, + { + "epoch": 21.653950953678475, + "grad_norm": 8.348368644714355, + "learning_rate": 1.8229819377577938e-05, + "loss": 0.6708, + "step": 7947 + }, + { + "epoch": 21.6566757493188, + "grad_norm": 7.474180698394775, + "learning_rate": 1.822931802897495e-05, + "loss": 0.6534, + "step": 7948 + }, + { + "epoch": 21.659400544959126, + "grad_norm": 11.66097640991211, + "learning_rate": 1.8228816616282298e-05, + "loss": 0.7632, + "step": 7949 + }, + { + "epoch": 21.662125340599456, + "grad_norm": 14.725122451782227, + "learning_rate": 1.822831513950389e-05, + "loss": 0.8108, + "step": 7950 + }, + { + "epoch": 21.66485013623978, + "grad_norm": 7.565695285797119, + "learning_rate": 1.8227813598643623e-05, + "loss": 0.6025, + "step": 7951 + }, + { + "epoch": 21.667574931880107, + "grad_norm": 11.076896667480469, + "learning_rate": 1.822731199370541e-05, + "loss": 0.7438, + "step": 7952 + }, + { + "epoch": 21.670299727520437, + "grad_norm": 10.393583297729492, + "learning_rate": 1.822681032469316e-05, + "loss": 0.7128, + "step": 7953 + }, + { + "epoch": 21.673024523160763, + "grad_norm": 7.5954694747924805, + "learning_rate": 1.8226308591610772e-05, + "loss": 0.6598, + "step": 7954 + }, + { + "epoch": 21.67574931880109, + "grad_norm": 7.7545623779296875, + "learning_rate": 1.8225806794462156e-05, + "loss": 0.8911, + "step": 7955 + }, + { + "epoch": 21.678474114441418, + "grad_norm": 15.038293838500977, + "learning_rate": 1.8225304933251226e-05, + "loss": 0.743, + "step": 7956 + }, + { + "epoch": 21.681198910081743, + "grad_norm": 8.431268692016602, + "learning_rate": 1.8224803007981883e-05, + "loss": 0.6809, + "step": 7957 + }, + { + "epoch": 21.68392370572207, + "grad_norm": 8.869983673095703, + "learning_rate": 1.8224301018658042e-05, + "loss": 0.5802, + "step": 7958 + }, + { + "epoch": 21.6866485013624, + "grad_norm": 7.820289611816406, + "learning_rate": 1.8223798965283606e-05, + "loss": 0.8416, + "step": 7959 + }, + { + "epoch": 21.689373297002724, + "grad_norm": 9.78795051574707, + "learning_rate": 1.8223296847862492e-05, + "loss": 0.8647, + "step": 7960 + }, + { + "epoch": 21.69209809264305, + "grad_norm": 9.411185264587402, + "learning_rate": 1.8222794666398602e-05, + "loss": 0.7452, + "step": 7961 + }, + { + "epoch": 21.69482288828338, + "grad_norm": 8.101469039916992, + "learning_rate": 1.8222292420895857e-05, + "loss": 0.7953, + "step": 7962 + }, + { + "epoch": 21.697547683923705, + "grad_norm": 8.729936599731445, + "learning_rate": 1.8221790111358156e-05, + "loss": 0.7415, + "step": 7963 + }, + { + "epoch": 21.70027247956403, + "grad_norm": 6.6953511238098145, + "learning_rate": 1.8221287737789423e-05, + "loss": 0.7032, + "step": 7964 + }, + { + "epoch": 21.70299727520436, + "grad_norm": 6.772510051727295, + "learning_rate": 1.8220785300193565e-05, + "loss": 0.7838, + "step": 7965 + }, + { + "epoch": 21.705722070844686, + "grad_norm": 8.998079299926758, + "learning_rate": 1.8220282798574497e-05, + "loss": 0.8809, + "step": 7966 + }, + { + "epoch": 21.708446866485012, + "grad_norm": 10.296906471252441, + "learning_rate": 1.821978023293613e-05, + "loss": 0.6854, + "step": 7967 + }, + { + "epoch": 21.71117166212534, + "grad_norm": 7.554832458496094, + "learning_rate": 1.8219277603282378e-05, + "loss": 0.9015, + "step": 7968 + }, + { + "epoch": 21.713896457765667, + "grad_norm": 8.607104301452637, + "learning_rate": 1.8218774909617157e-05, + "loss": 0.947, + "step": 7969 + }, + { + "epoch": 21.716621253405993, + "grad_norm": 8.692824363708496, + "learning_rate": 1.8218272151944383e-05, + "loss": 0.8123, + "step": 7970 + }, + { + "epoch": 21.719346049046322, + "grad_norm": 5.778202056884766, + "learning_rate": 1.821776933026797e-05, + "loss": 0.7533, + "step": 7971 + }, + { + "epoch": 21.722070844686648, + "grad_norm": 40.46097183227539, + "learning_rate": 1.8217266444591835e-05, + "loss": 0.6561, + "step": 7972 + }, + { + "epoch": 21.724795640326974, + "grad_norm": 9.413145065307617, + "learning_rate": 1.8216763494919888e-05, + "loss": 0.8752, + "step": 7973 + }, + { + "epoch": 21.727520435967303, + "grad_norm": 9.560535430908203, + "learning_rate": 1.8216260481256058e-05, + "loss": 0.7362, + "step": 7974 + }, + { + "epoch": 21.73024523160763, + "grad_norm": 8.597753524780273, + "learning_rate": 1.8215757403604252e-05, + "loss": 0.7456, + "step": 7975 + }, + { + "epoch": 21.732970027247955, + "grad_norm": 8.375833511352539, + "learning_rate": 1.821525426196839e-05, + "loss": 0.8604, + "step": 7976 + }, + { + "epoch": 21.735694822888284, + "grad_norm": 8.554570198059082, + "learning_rate": 1.8214751056352397e-05, + "loss": 0.652, + "step": 7977 + }, + { + "epoch": 21.73841961852861, + "grad_norm": 9.537891387939453, + "learning_rate": 1.8214247786760184e-05, + "loss": 0.7294, + "step": 7978 + }, + { + "epoch": 21.741144414168936, + "grad_norm": 14.614935874938965, + "learning_rate": 1.8213744453195676e-05, + "loss": 0.9902, + "step": 7979 + }, + { + "epoch": 21.743869209809265, + "grad_norm": 9.442888259887695, + "learning_rate": 1.8213241055662786e-05, + "loss": 0.7906, + "step": 7980 + }, + { + "epoch": 21.74659400544959, + "grad_norm": 8.972207069396973, + "learning_rate": 1.8212737594165444e-05, + "loss": 0.7928, + "step": 7981 + }, + { + "epoch": 21.749318801089917, + "grad_norm": 11.947616577148438, + "learning_rate": 1.8212234068707563e-05, + "loss": 0.8579, + "step": 7982 + }, + { + "epoch": 21.752043596730246, + "grad_norm": 8.358003616333008, + "learning_rate": 1.8211730479293067e-05, + "loss": 0.712, + "step": 7983 + }, + { + "epoch": 21.754768392370572, + "grad_norm": 7.6386613845825195, + "learning_rate": 1.8211226825925883e-05, + "loss": 0.6794, + "step": 7984 + }, + { + "epoch": 21.757493188010898, + "grad_norm": 12.572188377380371, + "learning_rate": 1.8210723108609923e-05, + "loss": 0.7697, + "step": 7985 + }, + { + "epoch": 21.760217983651227, + "grad_norm": 10.8894624710083, + "learning_rate": 1.8210219327349122e-05, + "loss": 0.787, + "step": 7986 + }, + { + "epoch": 21.762942779291553, + "grad_norm": 8.683341026306152, + "learning_rate": 1.8209715482147393e-05, + "loss": 0.619, + "step": 7987 + }, + { + "epoch": 21.76566757493188, + "grad_norm": 9.78201961517334, + "learning_rate": 1.8209211573008663e-05, + "loss": 0.9135, + "step": 7988 + }, + { + "epoch": 21.768392370572208, + "grad_norm": 8.886528968811035, + "learning_rate": 1.8208707599936858e-05, + "loss": 0.8416, + "step": 7989 + }, + { + "epoch": 21.771117166212534, + "grad_norm": 8.137007713317871, + "learning_rate": 1.8208203562935902e-05, + "loss": 0.7484, + "step": 7990 + }, + { + "epoch": 21.77384196185286, + "grad_norm": 8.364813804626465, + "learning_rate": 1.8207699462009722e-05, + "loss": 0.6542, + "step": 7991 + }, + { + "epoch": 21.77656675749319, + "grad_norm": 8.100030899047852, + "learning_rate": 1.8207195297162245e-05, + "loss": 0.6743, + "step": 7992 + }, + { + "epoch": 21.779291553133515, + "grad_norm": 7.499617576599121, + "learning_rate": 1.820669106839739e-05, + "loss": 0.7401, + "step": 7993 + }, + { + "epoch": 21.78201634877384, + "grad_norm": 9.239191055297852, + "learning_rate": 1.8206186775719096e-05, + "loss": 0.7218, + "step": 7994 + }, + { + "epoch": 21.78474114441417, + "grad_norm": 8.191755294799805, + "learning_rate": 1.8205682419131277e-05, + "loss": 0.7122, + "step": 7995 + }, + { + "epoch": 21.787465940054496, + "grad_norm": 17.269739151000977, + "learning_rate": 1.8205177998637872e-05, + "loss": 0.8901, + "step": 7996 + }, + { + "epoch": 21.79019073569482, + "grad_norm": 10.68104076385498, + "learning_rate": 1.8204673514242804e-05, + "loss": 0.8568, + "step": 7997 + }, + { + "epoch": 21.79291553133515, + "grad_norm": 10.695720672607422, + "learning_rate": 1.820416896595e-05, + "loss": 0.8121, + "step": 7998 + }, + { + "epoch": 21.795640326975477, + "grad_norm": 9.297723770141602, + "learning_rate": 1.8203664353763393e-05, + "loss": 0.6395, + "step": 7999 + }, + { + "epoch": 21.798365122615802, + "grad_norm": 8.26783561706543, + "learning_rate": 1.8203159677686914e-05, + "loss": 0.6795, + "step": 8000 + }, + { + "epoch": 21.80108991825613, + "grad_norm": 8.635510444641113, + "learning_rate": 1.820265493772449e-05, + "loss": 0.5949, + "step": 8001 + }, + { + "epoch": 21.803814713896458, + "grad_norm": 9.092911720275879, + "learning_rate": 1.8202150133880052e-05, + "loss": 0.7261, + "step": 8002 + }, + { + "epoch": 21.806539509536783, + "grad_norm": 8.284882545471191, + "learning_rate": 1.8201645266157534e-05, + "loss": 0.7927, + "step": 8003 + }, + { + "epoch": 21.809264305177113, + "grad_norm": 7.807535171508789, + "learning_rate": 1.8201140334560867e-05, + "loss": 0.7951, + "step": 8004 + }, + { + "epoch": 21.81198910081744, + "grad_norm": 12.532002449035645, + "learning_rate": 1.8200635339093983e-05, + "loss": 0.7982, + "step": 8005 + }, + { + "epoch": 21.814713896457764, + "grad_norm": 8.454265594482422, + "learning_rate": 1.8200130279760814e-05, + "loss": 0.7979, + "step": 8006 + }, + { + "epoch": 21.817438692098094, + "grad_norm": 9.2294340133667, + "learning_rate": 1.8199625156565295e-05, + "loss": 0.8566, + "step": 8007 + }, + { + "epoch": 21.82016348773842, + "grad_norm": 9.567198753356934, + "learning_rate": 1.8199119969511362e-05, + "loss": 0.6354, + "step": 8008 + }, + { + "epoch": 21.822888283378745, + "grad_norm": 9.14952564239502, + "learning_rate": 1.8198614718602943e-05, + "loss": 0.7948, + "step": 8009 + }, + { + "epoch": 21.825613079019075, + "grad_norm": 17.607019424438477, + "learning_rate": 1.8198109403843977e-05, + "loss": 0.7565, + "step": 8010 + }, + { + "epoch": 21.8283378746594, + "grad_norm": 14.952523231506348, + "learning_rate": 1.8197604025238398e-05, + "loss": 0.8657, + "step": 8011 + }, + { + "epoch": 21.831062670299726, + "grad_norm": 13.148463249206543, + "learning_rate": 1.8197098582790144e-05, + "loss": 0.7017, + "step": 8012 + }, + { + "epoch": 21.833787465940055, + "grad_norm": 8.732821464538574, + "learning_rate": 1.819659307650315e-05, + "loss": 0.8524, + "step": 8013 + }, + { + "epoch": 21.83651226158038, + "grad_norm": 14.557068824768066, + "learning_rate": 1.8196087506381356e-05, + "loss": 0.8275, + "step": 8014 + }, + { + "epoch": 21.839237057220707, + "grad_norm": 10.754493713378906, + "learning_rate": 1.8195581872428693e-05, + "loss": 0.7708, + "step": 8015 + }, + { + "epoch": 21.841961852861036, + "grad_norm": 9.273686408996582, + "learning_rate": 1.81950761746491e-05, + "loss": 0.7947, + "step": 8016 + }, + { + "epoch": 21.844686648501362, + "grad_norm": 10.021817207336426, + "learning_rate": 1.819457041304652e-05, + "loss": 0.7877, + "step": 8017 + }, + { + "epoch": 21.847411444141688, + "grad_norm": 7.916262149810791, + "learning_rate": 1.819406458762489e-05, + "loss": 0.7999, + "step": 8018 + }, + { + "epoch": 21.850136239782017, + "grad_norm": 10.504857063293457, + "learning_rate": 1.8193558698388148e-05, + "loss": 0.7526, + "step": 8019 + }, + { + "epoch": 21.852861035422343, + "grad_norm": 7.127544403076172, + "learning_rate": 1.819305274534023e-05, + "loss": 0.7443, + "step": 8020 + }, + { + "epoch": 21.85558583106267, + "grad_norm": 9.729533195495605, + "learning_rate": 1.8192546728485087e-05, + "loss": 0.7009, + "step": 8021 + }, + { + "epoch": 21.858310626703, + "grad_norm": 11.557148933410645, + "learning_rate": 1.8192040647826652e-05, + "loss": 0.9875, + "step": 8022 + }, + { + "epoch": 21.861035422343324, + "grad_norm": 9.22014331817627, + "learning_rate": 1.819153450336887e-05, + "loss": 0.6754, + "step": 8023 + }, + { + "epoch": 21.86376021798365, + "grad_norm": 9.431036949157715, + "learning_rate": 1.819102829511568e-05, + "loss": 0.6737, + "step": 8024 + }, + { + "epoch": 21.86648501362398, + "grad_norm": 8.149208068847656, + "learning_rate": 1.819052202307102e-05, + "loss": 0.7744, + "step": 8025 + }, + { + "epoch": 21.869209809264305, + "grad_norm": 7.808688163757324, + "learning_rate": 1.8190015687238848e-05, + "loss": 0.8295, + "step": 8026 + }, + { + "epoch": 21.87193460490463, + "grad_norm": 8.341070175170898, + "learning_rate": 1.818950928762309e-05, + "loss": 0.7428, + "step": 8027 + }, + { + "epoch": 21.87465940054496, + "grad_norm": 10.882519721984863, + "learning_rate": 1.81890028242277e-05, + "loss": 0.7593, + "step": 8028 + }, + { + "epoch": 21.877384196185286, + "grad_norm": 11.259774208068848, + "learning_rate": 1.8188496297056616e-05, + "loss": 0.7113, + "step": 8029 + }, + { + "epoch": 21.88010899182561, + "grad_norm": 10.727615356445312, + "learning_rate": 1.818798970611379e-05, + "loss": 0.9111, + "step": 8030 + }, + { + "epoch": 21.88283378746594, + "grad_norm": 16.16585350036621, + "learning_rate": 1.8187483051403162e-05, + "loss": 0.9004, + "step": 8031 + }, + { + "epoch": 21.885558583106267, + "grad_norm": 9.897339820861816, + "learning_rate": 1.818697633292868e-05, + "loss": 0.7002, + "step": 8032 + }, + { + "epoch": 21.888283378746593, + "grad_norm": 7.668357849121094, + "learning_rate": 1.818646955069429e-05, + "loss": 0.8422, + "step": 8033 + }, + { + "epoch": 21.891008174386922, + "grad_norm": 9.614480018615723, + "learning_rate": 1.8185962704703942e-05, + "loss": 0.6727, + "step": 8034 + }, + { + "epoch": 21.893732970027248, + "grad_norm": 7.975518226623535, + "learning_rate": 1.8185455794961574e-05, + "loss": 0.8705, + "step": 8035 + }, + { + "epoch": 21.896457765667574, + "grad_norm": 8.036733627319336, + "learning_rate": 1.8184948821471144e-05, + "loss": 0.7402, + "step": 8036 + }, + { + "epoch": 21.899182561307903, + "grad_norm": 10.84546947479248, + "learning_rate": 1.8184441784236595e-05, + "loss": 0.8982, + "step": 8037 + }, + { + "epoch": 21.90190735694823, + "grad_norm": 10.531929016113281, + "learning_rate": 1.8183934683261875e-05, + "loss": 0.8087, + "step": 8038 + }, + { + "epoch": 21.904632152588555, + "grad_norm": 7.393584728240967, + "learning_rate": 1.8183427518550934e-05, + "loss": 0.7101, + "step": 8039 + }, + { + "epoch": 21.907356948228884, + "grad_norm": 7.93975305557251, + "learning_rate": 1.8182920290107727e-05, + "loss": 0.8103, + "step": 8040 + }, + { + "epoch": 21.91008174386921, + "grad_norm": 7.738041400909424, + "learning_rate": 1.8182412997936197e-05, + "loss": 0.9581, + "step": 8041 + }, + { + "epoch": 21.912806539509535, + "grad_norm": 10.444761276245117, + "learning_rate": 1.8181905642040298e-05, + "loss": 0.7683, + "step": 8042 + }, + { + "epoch": 21.915531335149865, + "grad_norm": 9.234233856201172, + "learning_rate": 1.8181398222423984e-05, + "loss": 0.7468, + "step": 8043 + }, + { + "epoch": 21.91825613079019, + "grad_norm": 9.53412914276123, + "learning_rate": 1.8180890739091205e-05, + "loss": 0.6504, + "step": 8044 + }, + { + "epoch": 21.920980926430516, + "grad_norm": 9.891529083251953, + "learning_rate": 1.8180383192045906e-05, + "loss": 0.7048, + "step": 8045 + }, + { + "epoch": 21.923705722070846, + "grad_norm": 10.515586853027344, + "learning_rate": 1.817987558129205e-05, + "loss": 0.8552, + "step": 8046 + }, + { + "epoch": 21.92643051771117, + "grad_norm": 11.16555404663086, + "learning_rate": 1.8179367906833586e-05, + "loss": 0.7252, + "step": 8047 + }, + { + "epoch": 21.929155313351497, + "grad_norm": 9.70915412902832, + "learning_rate": 1.817886016867447e-05, + "loss": 0.6676, + "step": 8048 + }, + { + "epoch": 21.931880108991827, + "grad_norm": 27.498109817504883, + "learning_rate": 1.817835236681865e-05, + "loss": 0.7378, + "step": 8049 + }, + { + "epoch": 21.934604904632153, + "grad_norm": 14.925739288330078, + "learning_rate": 1.8177844501270088e-05, + "loss": 0.8044, + "step": 8050 + }, + { + "epoch": 21.93732970027248, + "grad_norm": 8.186935424804688, + "learning_rate": 1.817733657203273e-05, + "loss": 0.8361, + "step": 8051 + }, + { + "epoch": 21.940054495912808, + "grad_norm": 7.971308708190918, + "learning_rate": 1.817682857911055e-05, + "loss": 0.7766, + "step": 8052 + }, + { + "epoch": 21.942779291553133, + "grad_norm": 8.413043975830078, + "learning_rate": 1.8176320522507485e-05, + "loss": 0.7009, + "step": 8053 + }, + { + "epoch": 21.94550408719346, + "grad_norm": 7.476767063140869, + "learning_rate": 1.81758124022275e-05, + "loss": 0.6925, + "step": 8054 + }, + { + "epoch": 21.94822888283379, + "grad_norm": 8.602943420410156, + "learning_rate": 1.817530421827455e-05, + "loss": 0.8936, + "step": 8055 + }, + { + "epoch": 21.950953678474114, + "grad_norm": 12.193194389343262, + "learning_rate": 1.8174795970652592e-05, + "loss": 0.8, + "step": 8056 + }, + { + "epoch": 21.95367847411444, + "grad_norm": 9.034198760986328, + "learning_rate": 1.817428765936559e-05, + "loss": 0.8422, + "step": 8057 + }, + { + "epoch": 21.95640326975477, + "grad_norm": 34.969703674316406, + "learning_rate": 1.8173779284417497e-05, + "loss": 0.9277, + "step": 8058 + }, + { + "epoch": 21.959128065395095, + "grad_norm": 10.297454833984375, + "learning_rate": 1.8173270845812273e-05, + "loss": 0.746, + "step": 8059 + }, + { + "epoch": 21.96185286103542, + "grad_norm": 9.3963041305542, + "learning_rate": 1.8172762343553883e-05, + "loss": 0.8197, + "step": 8060 + }, + { + "epoch": 21.96457765667575, + "grad_norm": 8.728163719177246, + "learning_rate": 1.817225377764628e-05, + "loss": 0.7479, + "step": 8061 + }, + { + "epoch": 21.967302452316076, + "grad_norm": 9.23142147064209, + "learning_rate": 1.8171745148093425e-05, + "loss": 0.703, + "step": 8062 + }, + { + "epoch": 21.970027247956402, + "grad_norm": 24.890634536743164, + "learning_rate": 1.8171236454899283e-05, + "loss": 0.8262, + "step": 8063 + }, + { + "epoch": 21.97275204359673, + "grad_norm": 8.38480281829834, + "learning_rate": 1.8170727698067817e-05, + "loss": 0.8821, + "step": 8064 + }, + { + "epoch": 21.975476839237057, + "grad_norm": 10.035608291625977, + "learning_rate": 1.8170218877602987e-05, + "loss": 0.8413, + "step": 8065 + }, + { + "epoch": 21.978201634877383, + "grad_norm": 9.714282989501953, + "learning_rate": 1.816970999350875e-05, + "loss": 0.7596, + "step": 8066 + }, + { + "epoch": 21.980926430517712, + "grad_norm": 8.85979175567627, + "learning_rate": 1.816920104578908e-05, + "loss": 0.7859, + "step": 8067 + }, + { + "epoch": 21.983651226158038, + "grad_norm": 8.130599975585938, + "learning_rate": 1.816869203444793e-05, + "loss": 0.8478, + "step": 8068 + }, + { + "epoch": 21.986376021798364, + "grad_norm": 9.997649192810059, + "learning_rate": 1.8168182959489277e-05, + "loss": 0.7366, + "step": 8069 + }, + { + "epoch": 21.989100817438693, + "grad_norm": 7.8750505447387695, + "learning_rate": 1.8167673820917073e-05, + "loss": 0.7366, + "step": 8070 + }, + { + "epoch": 21.99182561307902, + "grad_norm": 8.245959281921387, + "learning_rate": 1.816716461873529e-05, + "loss": 0.8219, + "step": 8071 + }, + { + "epoch": 21.994550408719345, + "grad_norm": 9.712108612060547, + "learning_rate": 1.816665535294789e-05, + "loss": 0.7715, + "step": 8072 + }, + { + "epoch": 21.997275204359674, + "grad_norm": 11.4086332321167, + "learning_rate": 1.816614602355884e-05, + "loss": 0.8273, + "step": 8073 + }, + { + "epoch": 22.0, + "grad_norm": 8.965995788574219, + "learning_rate": 1.816563663057211e-05, + "loss": 0.6558, + "step": 8074 + }, + { + "epoch": 22.002724795640326, + "grad_norm": 10.172837257385254, + "learning_rate": 1.8165127173991667e-05, + "loss": 0.6926, + "step": 8075 + }, + { + "epoch": 22.005449591280655, + "grad_norm": 8.559929847717285, + "learning_rate": 1.816461765382147e-05, + "loss": 0.7812, + "step": 8076 + }, + { + "epoch": 22.00817438692098, + "grad_norm": 7.295583724975586, + "learning_rate": 1.8164108070065498e-05, + "loss": 0.494, + "step": 8077 + }, + { + "epoch": 22.010899182561307, + "grad_norm": 8.792229652404785, + "learning_rate": 1.8163598422727714e-05, + "loss": 0.7005, + "step": 8078 + }, + { + "epoch": 22.013623978201636, + "grad_norm": 7.681225776672363, + "learning_rate": 1.816308871181209e-05, + "loss": 0.5142, + "step": 8079 + }, + { + "epoch": 22.016348773841962, + "grad_norm": 7.9823198318481445, + "learning_rate": 1.816257893732259e-05, + "loss": 0.7559, + "step": 8080 + }, + { + "epoch": 22.019073569482288, + "grad_norm": 8.489956855773926, + "learning_rate": 1.816206909926319e-05, + "loss": 0.5811, + "step": 8081 + }, + { + "epoch": 22.021798365122617, + "grad_norm": 8.067201614379883, + "learning_rate": 1.816155919763786e-05, + "loss": 0.8422, + "step": 8082 + }, + { + "epoch": 22.024523160762943, + "grad_norm": 15.2614107131958, + "learning_rate": 1.8161049232450566e-05, + "loss": 0.7727, + "step": 8083 + }, + { + "epoch": 22.02724795640327, + "grad_norm": 9.465600967407227, + "learning_rate": 1.8160539203705285e-05, + "loss": 0.6544, + "step": 8084 + }, + { + "epoch": 22.029972752043598, + "grad_norm": 24.28710174560547, + "learning_rate": 1.8160029111405986e-05, + "loss": 0.78, + "step": 8085 + }, + { + "epoch": 22.032697547683924, + "grad_norm": 9.697113990783691, + "learning_rate": 1.815951895555665e-05, + "loss": 0.6359, + "step": 8086 + }, + { + "epoch": 22.03542234332425, + "grad_norm": 8.137419700622559, + "learning_rate": 1.8159008736161236e-05, + "loss": 0.6996, + "step": 8087 + }, + { + "epoch": 22.03814713896458, + "grad_norm": 8.577265739440918, + "learning_rate": 1.815849845322373e-05, + "loss": 0.6985, + "step": 8088 + }, + { + "epoch": 22.040871934604905, + "grad_norm": 10.814737319946289, + "learning_rate": 1.815798810674809e-05, + "loss": 0.5823, + "step": 8089 + }, + { + "epoch": 22.04359673024523, + "grad_norm": 9.610568046569824, + "learning_rate": 1.8157477696738312e-05, + "loss": 0.8083, + "step": 8090 + }, + { + "epoch": 22.04632152588556, + "grad_norm": 10.783349990844727, + "learning_rate": 1.8156967223198358e-05, + "loss": 0.7408, + "step": 8091 + }, + { + "epoch": 22.049046321525886, + "grad_norm": 8.860383987426758, + "learning_rate": 1.81564566861322e-05, + "loss": 0.6569, + "step": 8092 + }, + { + "epoch": 22.05177111716621, + "grad_norm": 10.234100341796875, + "learning_rate": 1.8155946085543825e-05, + "loss": 0.6267, + "step": 8093 + }, + { + "epoch": 22.05449591280654, + "grad_norm": 9.198258399963379, + "learning_rate": 1.8155435421437202e-05, + "loss": 0.7501, + "step": 8094 + }, + { + "epoch": 22.057220708446867, + "grad_norm": 8.372624397277832, + "learning_rate": 1.8154924693816312e-05, + "loss": 0.783, + "step": 8095 + }, + { + "epoch": 22.059945504087192, + "grad_norm": 10.100859642028809, + "learning_rate": 1.8154413902685132e-05, + "loss": 0.6799, + "step": 8096 + }, + { + "epoch": 22.06267029972752, + "grad_norm": 8.656736373901367, + "learning_rate": 1.8153903048047636e-05, + "loss": 0.5563, + "step": 8097 + }, + { + "epoch": 22.065395095367847, + "grad_norm": 7.222809314727783, + "learning_rate": 1.815339212990781e-05, + "loss": 0.6029, + "step": 8098 + }, + { + "epoch": 22.068119891008173, + "grad_norm": 8.096519470214844, + "learning_rate": 1.8152881148269626e-05, + "loss": 0.7532, + "step": 8099 + }, + { + "epoch": 22.070844686648503, + "grad_norm": 8.562289237976074, + "learning_rate": 1.8152370103137063e-05, + "loss": 0.6422, + "step": 8100 + }, + { + "epoch": 22.07356948228883, + "grad_norm": 7.9341654777526855, + "learning_rate": 1.815185899451411e-05, + "loss": 0.876, + "step": 8101 + }, + { + "epoch": 22.076294277929154, + "grad_norm": 7.58868408203125, + "learning_rate": 1.8151347822404735e-05, + "loss": 0.6191, + "step": 8102 + }, + { + "epoch": 22.079019073569484, + "grad_norm": 10.293460845947266, + "learning_rate": 1.8150836586812927e-05, + "loss": 0.6768, + "step": 8103 + }, + { + "epoch": 22.08174386920981, + "grad_norm": 7.736724376678467, + "learning_rate": 1.815032528774267e-05, + "loss": 0.9154, + "step": 8104 + }, + { + "epoch": 22.084468664850135, + "grad_norm": 8.748819351196289, + "learning_rate": 1.814981392519794e-05, + "loss": 0.6484, + "step": 8105 + }, + { + "epoch": 22.087193460490465, + "grad_norm": 8.212860107421875, + "learning_rate": 1.814930249918272e-05, + "loss": 0.6599, + "step": 8106 + }, + { + "epoch": 22.08991825613079, + "grad_norm": 8.72126579284668, + "learning_rate": 1.8148791009700994e-05, + "loss": 0.6707, + "step": 8107 + }, + { + "epoch": 22.092643051771116, + "grad_norm": 8.394826889038086, + "learning_rate": 1.814827945675675e-05, + "loss": 0.6061, + "step": 8108 + }, + { + "epoch": 22.095367847411445, + "grad_norm": 7.980009078979492, + "learning_rate": 1.8147767840353966e-05, + "loss": 0.7402, + "step": 8109 + }, + { + "epoch": 22.09809264305177, + "grad_norm": 9.812178611755371, + "learning_rate": 1.8147256160496627e-05, + "loss": 0.7423, + "step": 8110 + }, + { + "epoch": 22.100817438692097, + "grad_norm": 8.119328498840332, + "learning_rate": 1.814674441718872e-05, + "loss": 0.5847, + "step": 8111 + }, + { + "epoch": 22.103542234332426, + "grad_norm": 9.668068885803223, + "learning_rate": 1.814623261043423e-05, + "loss": 0.717, + "step": 8112 + }, + { + "epoch": 22.106267029972752, + "grad_norm": 9.752023696899414, + "learning_rate": 1.8145720740237142e-05, + "loss": 0.6893, + "step": 8113 + }, + { + "epoch": 22.108991825613078, + "grad_norm": 9.450759887695312, + "learning_rate": 1.814520880660144e-05, + "loss": 0.7324, + "step": 8114 + }, + { + "epoch": 22.111716621253407, + "grad_norm": 10.053879737854004, + "learning_rate": 1.8144696809531117e-05, + "loss": 0.6709, + "step": 8115 + }, + { + "epoch": 22.114441416893733, + "grad_norm": 11.055795669555664, + "learning_rate": 1.814418474903016e-05, + "loss": 0.6781, + "step": 8116 + }, + { + "epoch": 22.11716621253406, + "grad_norm": 9.688031196594238, + "learning_rate": 1.814367262510255e-05, + "loss": 0.7238, + "step": 8117 + }, + { + "epoch": 22.11989100817439, + "grad_norm": 9.846515655517578, + "learning_rate": 1.8143160437752282e-05, + "loss": 0.661, + "step": 8118 + }, + { + "epoch": 22.122615803814714, + "grad_norm": 8.671991348266602, + "learning_rate": 1.8142648186983342e-05, + "loss": 0.6635, + "step": 8119 + }, + { + "epoch": 22.12534059945504, + "grad_norm": 7.699706554412842, + "learning_rate": 1.814213587279972e-05, + "loss": 0.4941, + "step": 8120 + }, + { + "epoch": 22.12806539509537, + "grad_norm": 10.536995887756348, + "learning_rate": 1.8141623495205407e-05, + "loss": 0.6252, + "step": 8121 + }, + { + "epoch": 22.130790190735695, + "grad_norm": 9.968353271484375, + "learning_rate": 1.814111105420439e-05, + "loss": 0.7587, + "step": 8122 + }, + { + "epoch": 22.13351498637602, + "grad_norm": 15.113749504089355, + "learning_rate": 1.8140598549800665e-05, + "loss": 0.7292, + "step": 8123 + }, + { + "epoch": 22.13623978201635, + "grad_norm": 10.22586727142334, + "learning_rate": 1.8140085981998217e-05, + "loss": 0.9756, + "step": 8124 + }, + { + "epoch": 22.138964577656676, + "grad_norm": 13.87658405303955, + "learning_rate": 1.8139573350801044e-05, + "loss": 0.6628, + "step": 8125 + }, + { + "epoch": 22.141689373297, + "grad_norm": 18.155254364013672, + "learning_rate": 1.8139060656213136e-05, + "loss": 0.7733, + "step": 8126 + }, + { + "epoch": 22.14441416893733, + "grad_norm": 7.1122636795043945, + "learning_rate": 1.8138547898238482e-05, + "loss": 0.7997, + "step": 8127 + }, + { + "epoch": 22.147138964577657, + "grad_norm": 7.740839004516602, + "learning_rate": 1.813803507688108e-05, + "loss": 0.688, + "step": 8128 + }, + { + "epoch": 22.149863760217983, + "grad_norm": 7.7154974937438965, + "learning_rate": 1.813752219214493e-05, + "loss": 0.5564, + "step": 8129 + }, + { + "epoch": 22.152588555858312, + "grad_norm": 15.014013290405273, + "learning_rate": 1.813700924403401e-05, + "loss": 0.8921, + "step": 8130 + }, + { + "epoch": 22.155313351498638, + "grad_norm": 6.617035388946533, + "learning_rate": 1.8136496232552327e-05, + "loss": 0.4835, + "step": 8131 + }, + { + "epoch": 22.158038147138964, + "grad_norm": 9.0719633102417, + "learning_rate": 1.8135983157703875e-05, + "loss": 0.5991, + "step": 8132 + }, + { + "epoch": 22.160762942779293, + "grad_norm": 8.152012825012207, + "learning_rate": 1.8135470019492645e-05, + "loss": 0.5002, + "step": 8133 + }, + { + "epoch": 22.16348773841962, + "grad_norm": 8.208850860595703, + "learning_rate": 1.813495681792264e-05, + "loss": 0.5294, + "step": 8134 + }, + { + "epoch": 22.166212534059945, + "grad_norm": 10.276405334472656, + "learning_rate": 1.8134443552997848e-05, + "loss": 0.5847, + "step": 8135 + }, + { + "epoch": 22.168937329700274, + "grad_norm": 9.390474319458008, + "learning_rate": 1.8133930224722274e-05, + "loss": 0.7382, + "step": 8136 + }, + { + "epoch": 22.1716621253406, + "grad_norm": 10.195333480834961, + "learning_rate": 1.813341683309991e-05, + "loss": 0.6446, + "step": 8137 + }, + { + "epoch": 22.174386920980925, + "grad_norm": 10.102724075317383, + "learning_rate": 1.8132903378134764e-05, + "loss": 0.693, + "step": 8138 + }, + { + "epoch": 22.177111716621255, + "grad_norm": 11.12580394744873, + "learning_rate": 1.8132389859830825e-05, + "loss": 0.7888, + "step": 8139 + }, + { + "epoch": 22.17983651226158, + "grad_norm": 8.86587142944336, + "learning_rate": 1.8131876278192097e-05, + "loss": 0.6686, + "step": 8140 + }, + { + "epoch": 22.182561307901906, + "grad_norm": 9.61230754852295, + "learning_rate": 1.8131362633222577e-05, + "loss": 0.7871, + "step": 8141 + }, + { + "epoch": 22.185286103542236, + "grad_norm": 8.075401306152344, + "learning_rate": 1.8130848924926264e-05, + "loss": 0.7047, + "step": 8142 + }, + { + "epoch": 22.18801089918256, + "grad_norm": 13.674467086791992, + "learning_rate": 1.8130335153307167e-05, + "loss": 0.6346, + "step": 8143 + }, + { + "epoch": 22.190735694822887, + "grad_norm": 7.627383708953857, + "learning_rate": 1.8129821318369278e-05, + "loss": 0.5735, + "step": 8144 + }, + { + "epoch": 22.193460490463217, + "grad_norm": 9.116448402404785, + "learning_rate": 1.81293074201166e-05, + "loss": 0.6015, + "step": 8145 + }, + { + "epoch": 22.196185286103542, + "grad_norm": 10.330015182495117, + "learning_rate": 1.812879345855314e-05, + "loss": 0.6343, + "step": 8146 + }, + { + "epoch": 22.19891008174387, + "grad_norm": 12.202704429626465, + "learning_rate": 1.8128279433682898e-05, + "loss": 0.6803, + "step": 8147 + }, + { + "epoch": 22.201634877384198, + "grad_norm": 9.495345115661621, + "learning_rate": 1.812776534550988e-05, + "loss": 0.7317, + "step": 8148 + }, + { + "epoch": 22.204359673024523, + "grad_norm": 10.337039947509766, + "learning_rate": 1.812725119403808e-05, + "loss": 0.7294, + "step": 8149 + }, + { + "epoch": 22.20708446866485, + "grad_norm": 9.894977569580078, + "learning_rate": 1.8126736979271516e-05, + "loss": 0.7222, + "step": 8150 + }, + { + "epoch": 22.20980926430518, + "grad_norm": 8.29999828338623, + "learning_rate": 1.8126222701214185e-05, + "loss": 0.7822, + "step": 8151 + }, + { + "epoch": 22.212534059945504, + "grad_norm": 8.871851921081543, + "learning_rate": 1.812570835987009e-05, + "loss": 0.7723, + "step": 8152 + }, + { + "epoch": 22.21525885558583, + "grad_norm": 10.580748558044434, + "learning_rate": 1.8125193955243244e-05, + "loss": 0.8129, + "step": 8153 + }, + { + "epoch": 22.21798365122616, + "grad_norm": 11.675036430358887, + "learning_rate": 1.8124679487337647e-05, + "loss": 0.782, + "step": 8154 + }, + { + "epoch": 22.220708446866485, + "grad_norm": 8.933625221252441, + "learning_rate": 1.8124164956157306e-05, + "loss": 0.5898, + "step": 8155 + }, + { + "epoch": 22.22343324250681, + "grad_norm": 7.400137901306152, + "learning_rate": 1.8123650361706234e-05, + "loss": 0.5396, + "step": 8156 + }, + { + "epoch": 22.22615803814714, + "grad_norm": 9.74735164642334, + "learning_rate": 1.812313570398843e-05, + "loss": 0.8325, + "step": 8157 + }, + { + "epoch": 22.228882833787466, + "grad_norm": 7.880486011505127, + "learning_rate": 1.8122620983007908e-05, + "loss": 0.6642, + "step": 8158 + }, + { + "epoch": 22.231607629427792, + "grad_norm": 12.720961570739746, + "learning_rate": 1.8122106198768675e-05, + "loss": 0.6642, + "step": 8159 + }, + { + "epoch": 22.23433242506812, + "grad_norm": 16.37128448486328, + "learning_rate": 1.8121591351274743e-05, + "loss": 0.6898, + "step": 8160 + }, + { + "epoch": 22.237057220708447, + "grad_norm": 7.74159574508667, + "learning_rate": 1.8121076440530116e-05, + "loss": 0.7014, + "step": 8161 + }, + { + "epoch": 22.239782016348773, + "grad_norm": 10.525813102722168, + "learning_rate": 1.8120561466538806e-05, + "loss": 0.6607, + "step": 8162 + }, + { + "epoch": 22.242506811989102, + "grad_norm": 8.556599617004395, + "learning_rate": 1.8120046429304828e-05, + "loss": 0.6026, + "step": 8163 + }, + { + "epoch": 22.245231607629428, + "grad_norm": 10.699475288391113, + "learning_rate": 1.8119531328832186e-05, + "loss": 0.7379, + "step": 8164 + }, + { + "epoch": 22.247956403269754, + "grad_norm": 10.441765785217285, + "learning_rate": 1.81190161651249e-05, + "loss": 0.6156, + "step": 8165 + }, + { + "epoch": 22.250681198910083, + "grad_norm": 7.536591529846191, + "learning_rate": 1.811850093818697e-05, + "loss": 0.5994, + "step": 8166 + }, + { + "epoch": 22.25340599455041, + "grad_norm": 7.260444164276123, + "learning_rate": 1.811798564802242e-05, + "loss": 0.7764, + "step": 8167 + }, + { + "epoch": 22.256130790190735, + "grad_norm": 8.492497444152832, + "learning_rate": 1.8117470294635263e-05, + "loss": 0.6183, + "step": 8168 + }, + { + "epoch": 22.258855585831064, + "grad_norm": 8.711894035339355, + "learning_rate": 1.8116954878029505e-05, + "loss": 0.748, + "step": 8169 + }, + { + "epoch": 22.26158038147139, + "grad_norm": 12.734328269958496, + "learning_rate": 1.8116439398209164e-05, + "loss": 0.6395, + "step": 8170 + }, + { + "epoch": 22.264305177111716, + "grad_norm": 8.598809242248535, + "learning_rate": 1.8115923855178253e-05, + "loss": 0.5896, + "step": 8171 + }, + { + "epoch": 22.267029972752045, + "grad_norm": 7.421351432800293, + "learning_rate": 1.8115408248940792e-05, + "loss": 0.5556, + "step": 8172 + }, + { + "epoch": 22.26975476839237, + "grad_norm": 14.382796287536621, + "learning_rate": 1.8114892579500792e-05, + "loss": 0.7145, + "step": 8173 + }, + { + "epoch": 22.272479564032697, + "grad_norm": 7.493317127227783, + "learning_rate": 1.811437684686227e-05, + "loss": 0.6122, + "step": 8174 + }, + { + "epoch": 22.275204359673026, + "grad_norm": 10.393016815185547, + "learning_rate": 1.8113861051029235e-05, + "loss": 0.7552, + "step": 8175 + }, + { + "epoch": 22.277929155313352, + "grad_norm": 8.7063570022583, + "learning_rate": 1.8113345192005718e-05, + "loss": 0.6884, + "step": 8176 + }, + { + "epoch": 22.280653950953678, + "grad_norm": 8.036070823669434, + "learning_rate": 1.8112829269795728e-05, + "loss": 0.6925, + "step": 8177 + }, + { + "epoch": 22.283378746594007, + "grad_norm": 8.267637252807617, + "learning_rate": 1.8112313284403287e-05, + "loss": 0.6825, + "step": 8178 + }, + { + "epoch": 22.286103542234333, + "grad_norm": 8.847068786621094, + "learning_rate": 1.8111797235832407e-05, + "loss": 0.584, + "step": 8179 + }, + { + "epoch": 22.28882833787466, + "grad_norm": 8.622603416442871, + "learning_rate": 1.8111281124087113e-05, + "loss": 0.9071, + "step": 8180 + }, + { + "epoch": 22.291553133514988, + "grad_norm": 9.915871620178223, + "learning_rate": 1.8110764949171423e-05, + "loss": 0.7716, + "step": 8181 + }, + { + "epoch": 22.294277929155314, + "grad_norm": 10.577964782714844, + "learning_rate": 1.811024871108936e-05, + "loss": 0.6343, + "step": 8182 + }, + { + "epoch": 22.29700272479564, + "grad_norm": 7.768617153167725, + "learning_rate": 1.8109732409844936e-05, + "loss": 0.787, + "step": 8183 + }, + { + "epoch": 22.29972752043597, + "grad_norm": 7.035017967224121, + "learning_rate": 1.810921604544218e-05, + "loss": 0.6422, + "step": 8184 + }, + { + "epoch": 22.302452316076295, + "grad_norm": 8.015909194946289, + "learning_rate": 1.810869961788511e-05, + "loss": 0.6508, + "step": 8185 + }, + { + "epoch": 22.30517711171662, + "grad_norm": 8.814335823059082, + "learning_rate": 1.810818312717775e-05, + "loss": 0.637, + "step": 8186 + }, + { + "epoch": 22.30790190735695, + "grad_norm": 14.538896560668945, + "learning_rate": 1.8107666573324113e-05, + "loss": 0.9564, + "step": 8187 + }, + { + "epoch": 22.310626702997276, + "grad_norm": 7.954617023468018, + "learning_rate": 1.810714995632824e-05, + "loss": 0.7405, + "step": 8188 + }, + { + "epoch": 22.3133514986376, + "grad_norm": 6.726071834564209, + "learning_rate": 1.8106633276194138e-05, + "loss": 0.5693, + "step": 8189 + }, + { + "epoch": 22.31607629427793, + "grad_norm": 7.355459690093994, + "learning_rate": 1.8106116532925835e-05, + "loss": 0.7271, + "step": 8190 + }, + { + "epoch": 22.318801089918257, + "grad_norm": 6.360330581665039, + "learning_rate": 1.8105599726527364e-05, + "loss": 0.7659, + "step": 8191 + }, + { + "epoch": 22.321525885558582, + "grad_norm": 10.908573150634766, + "learning_rate": 1.810508285700274e-05, + "loss": 0.6515, + "step": 8192 + }, + { + "epoch": 22.32425068119891, + "grad_norm": 9.36457347869873, + "learning_rate": 1.8104565924355987e-05, + "loss": 0.6348, + "step": 8193 + }, + { + "epoch": 22.326975476839237, + "grad_norm": 8.57176685333252, + "learning_rate": 1.810404892859114e-05, + "loss": 0.7372, + "step": 8194 + }, + { + "epoch": 22.329700272479563, + "grad_norm": 8.153583526611328, + "learning_rate": 1.8103531869712222e-05, + "loss": 0.6459, + "step": 8195 + }, + { + "epoch": 22.332425068119893, + "grad_norm": 8.096521377563477, + "learning_rate": 1.8103014747723258e-05, + "loss": 0.7163, + "step": 8196 + }, + { + "epoch": 22.33514986376022, + "grad_norm": 8.034278869628906, + "learning_rate": 1.8102497562628272e-05, + "loss": 0.7621, + "step": 8197 + }, + { + "epoch": 22.337874659400544, + "grad_norm": 10.737513542175293, + "learning_rate": 1.81019803144313e-05, + "loss": 0.7793, + "step": 8198 + }, + { + "epoch": 22.340599455040874, + "grad_norm": 9.598867416381836, + "learning_rate": 1.8101463003136365e-05, + "loss": 0.6896, + "step": 8199 + }, + { + "epoch": 22.3433242506812, + "grad_norm": 8.55178451538086, + "learning_rate": 1.81009456287475e-05, + "loss": 0.6556, + "step": 8200 + }, + { + "epoch": 22.346049046321525, + "grad_norm": 9.146363258361816, + "learning_rate": 1.8100428191268724e-05, + "loss": 0.6005, + "step": 8201 + }, + { + "epoch": 22.348773841961854, + "grad_norm": 7.098503112792969, + "learning_rate": 1.809991069070408e-05, + "loss": 0.8154, + "step": 8202 + }, + { + "epoch": 22.35149863760218, + "grad_norm": 14.414313316345215, + "learning_rate": 1.809939312705759e-05, + "loss": 0.6385, + "step": 8203 + }, + { + "epoch": 22.354223433242506, + "grad_norm": 8.21053409576416, + "learning_rate": 1.8098875500333287e-05, + "loss": 0.8989, + "step": 8204 + }, + { + "epoch": 22.356948228882835, + "grad_norm": 7.663893222808838, + "learning_rate": 1.8098357810535204e-05, + "loss": 0.6729, + "step": 8205 + }, + { + "epoch": 22.35967302452316, + "grad_norm": 7.619863033294678, + "learning_rate": 1.8097840057667366e-05, + "loss": 0.6927, + "step": 8206 + }, + { + "epoch": 22.362397820163487, + "grad_norm": 9.250384330749512, + "learning_rate": 1.8097322241733815e-05, + "loss": 0.5206, + "step": 8207 + }, + { + "epoch": 22.365122615803816, + "grad_norm": 7.354512691497803, + "learning_rate": 1.8096804362738577e-05, + "loss": 0.8595, + "step": 8208 + }, + { + "epoch": 22.367847411444142, + "grad_norm": 7.876550674438477, + "learning_rate": 1.809628642068569e-05, + "loss": 0.7395, + "step": 8209 + }, + { + "epoch": 22.370572207084468, + "grad_norm": 9.378175735473633, + "learning_rate": 1.809576841557918e-05, + "loss": 0.6779, + "step": 8210 + }, + { + "epoch": 22.373297002724797, + "grad_norm": 8.54090404510498, + "learning_rate": 1.809525034742309e-05, + "loss": 0.8472, + "step": 8211 + }, + { + "epoch": 22.376021798365123, + "grad_norm": 9.159504890441895, + "learning_rate": 1.809473221622145e-05, + "loss": 0.7279, + "step": 8212 + }, + { + "epoch": 22.37874659400545, + "grad_norm": 7.7075300216674805, + "learning_rate": 1.8094214021978295e-05, + "loss": 0.598, + "step": 8213 + }, + { + "epoch": 22.381471389645778, + "grad_norm": 12.308601379394531, + "learning_rate": 1.8093695764697664e-05, + "loss": 0.6523, + "step": 8214 + }, + { + "epoch": 22.384196185286104, + "grad_norm": 7.844625949859619, + "learning_rate": 1.8093177444383586e-05, + "loss": 0.9073, + "step": 8215 + }, + { + "epoch": 22.38692098092643, + "grad_norm": 7.515353679656982, + "learning_rate": 1.809265906104011e-05, + "loss": 0.8254, + "step": 8216 + }, + { + "epoch": 22.38964577656676, + "grad_norm": 8.23155403137207, + "learning_rate": 1.809214061467126e-05, + "loss": 0.5969, + "step": 8217 + }, + { + "epoch": 22.392370572207085, + "grad_norm": 8.199894905090332, + "learning_rate": 1.809162210528108e-05, + "loss": 0.7928, + "step": 8218 + }, + { + "epoch": 22.39509536784741, + "grad_norm": 7.663973808288574, + "learning_rate": 1.809110353287361e-05, + "loss": 0.7141, + "step": 8219 + }, + { + "epoch": 22.39782016348774, + "grad_norm": 10.365224838256836, + "learning_rate": 1.8090584897452884e-05, + "loss": 0.6886, + "step": 8220 + }, + { + "epoch": 22.400544959128066, + "grad_norm": 12.609064102172852, + "learning_rate": 1.8090066199022946e-05, + "loss": 0.7184, + "step": 8221 + }, + { + "epoch": 22.40326975476839, + "grad_norm": 7.5562615394592285, + "learning_rate": 1.8089547437587828e-05, + "loss": 0.6334, + "step": 8222 + }, + { + "epoch": 22.40599455040872, + "grad_norm": 7.856863021850586, + "learning_rate": 1.8089028613151578e-05, + "loss": 0.5431, + "step": 8223 + }, + { + "epoch": 22.408719346049047, + "grad_norm": 9.362018585205078, + "learning_rate": 1.808850972571823e-05, + "loss": 0.6707, + "step": 8224 + }, + { + "epoch": 22.411444141689373, + "grad_norm": 7.5704731941223145, + "learning_rate": 1.8087990775291835e-05, + "loss": 0.8016, + "step": 8225 + }, + { + "epoch": 22.414168937329702, + "grad_norm": 14.33726978302002, + "learning_rate": 1.8087471761876425e-05, + "loss": 0.9342, + "step": 8226 + }, + { + "epoch": 22.416893732970028, + "grad_norm": 9.47899341583252, + "learning_rate": 1.8086952685476046e-05, + "loss": 0.6818, + "step": 8227 + }, + { + "epoch": 22.419618528610354, + "grad_norm": 8.469098091125488, + "learning_rate": 1.808643354609474e-05, + "loss": 0.5687, + "step": 8228 + }, + { + "epoch": 22.422343324250683, + "grad_norm": 7.910406589508057, + "learning_rate": 1.8085914343736545e-05, + "loss": 0.696, + "step": 8229 + }, + { + "epoch": 22.42506811989101, + "grad_norm": 8.005192756652832, + "learning_rate": 1.8085395078405514e-05, + "loss": 0.6208, + "step": 8230 + }, + { + "epoch": 22.427792915531334, + "grad_norm": 13.900349617004395, + "learning_rate": 1.8084875750105685e-05, + "loss": 0.6278, + "step": 8231 + }, + { + "epoch": 22.430517711171664, + "grad_norm": 8.031730651855469, + "learning_rate": 1.8084356358841106e-05, + "loss": 0.6943, + "step": 8232 + }, + { + "epoch": 22.43324250681199, + "grad_norm": 8.470152854919434, + "learning_rate": 1.8083836904615815e-05, + "loss": 0.5541, + "step": 8233 + }, + { + "epoch": 22.435967302452315, + "grad_norm": 9.42927074432373, + "learning_rate": 1.8083317387433866e-05, + "loss": 0.5667, + "step": 8234 + }, + { + "epoch": 22.438692098092645, + "grad_norm": 10.382102966308594, + "learning_rate": 1.80827978072993e-05, + "loss": 0.7693, + "step": 8235 + }, + { + "epoch": 22.44141689373297, + "grad_norm": 9.156529426574707, + "learning_rate": 1.8082278164216166e-05, + "loss": 0.875, + "step": 8236 + }, + { + "epoch": 22.444141689373296, + "grad_norm": 9.471755027770996, + "learning_rate": 1.808175845818851e-05, + "loss": 0.8351, + "step": 8237 + }, + { + "epoch": 22.446866485013626, + "grad_norm": 10.10020637512207, + "learning_rate": 1.808123868922038e-05, + "loss": 0.6541, + "step": 8238 + }, + { + "epoch": 22.44959128065395, + "grad_norm": 8.335165977478027, + "learning_rate": 1.808071885731582e-05, + "loss": 0.7588, + "step": 8239 + }, + { + "epoch": 22.452316076294277, + "grad_norm": 7.9259161949157715, + "learning_rate": 1.8080198962478884e-05, + "loss": 0.6415, + "step": 8240 + }, + { + "epoch": 22.455040871934607, + "grad_norm": 20.179035186767578, + "learning_rate": 1.8079679004713618e-05, + "loss": 0.6896, + "step": 8241 + }, + { + "epoch": 22.457765667574932, + "grad_norm": 10.354724884033203, + "learning_rate": 1.8079158984024073e-05, + "loss": 0.7043, + "step": 8242 + }, + { + "epoch": 22.460490463215258, + "grad_norm": 8.078150749206543, + "learning_rate": 1.8078638900414292e-05, + "loss": 0.8281, + "step": 8243 + }, + { + "epoch": 22.463215258855588, + "grad_norm": 10.773573875427246, + "learning_rate": 1.8078118753888337e-05, + "loss": 0.679, + "step": 8244 + }, + { + "epoch": 22.465940054495913, + "grad_norm": 6.376916885375977, + "learning_rate": 1.8077598544450253e-05, + "loss": 0.5781, + "step": 8245 + }, + { + "epoch": 22.46866485013624, + "grad_norm": 7.432671546936035, + "learning_rate": 1.8077078272104093e-05, + "loss": 0.7159, + "step": 8246 + }, + { + "epoch": 22.47138964577657, + "grad_norm": 8.190813064575195, + "learning_rate": 1.8076557936853905e-05, + "loss": 0.6945, + "step": 8247 + }, + { + "epoch": 22.474114441416894, + "grad_norm": 7.159677982330322, + "learning_rate": 1.807603753870374e-05, + "loss": 0.5876, + "step": 8248 + }, + { + "epoch": 22.47683923705722, + "grad_norm": 22.71761131286621, + "learning_rate": 1.807551707765766e-05, + "loss": 0.7416, + "step": 8249 + }, + { + "epoch": 22.479564032697546, + "grad_norm": 9.451669692993164, + "learning_rate": 1.807499655371971e-05, + "loss": 0.6469, + "step": 8250 + }, + { + "epoch": 22.482288828337875, + "grad_norm": 8.264025688171387, + "learning_rate": 1.807447596689395e-05, + "loss": 0.587, + "step": 8251 + }, + { + "epoch": 22.4850136239782, + "grad_norm": 8.693696022033691, + "learning_rate": 1.807395531718443e-05, + "loss": 0.5808, + "step": 8252 + }, + { + "epoch": 22.48773841961853, + "grad_norm": 8.700834274291992, + "learning_rate": 1.8073434604595203e-05, + "loss": 0.7067, + "step": 8253 + }, + { + "epoch": 22.490463215258856, + "grad_norm": 7.785550117492676, + "learning_rate": 1.8072913829130326e-05, + "loss": 0.7192, + "step": 8254 + }, + { + "epoch": 22.493188010899182, + "grad_norm": 8.362305641174316, + "learning_rate": 1.8072392990793864e-05, + "loss": 0.589, + "step": 8255 + }, + { + "epoch": 22.495912806539508, + "grad_norm": 8.484654426574707, + "learning_rate": 1.8071872089589857e-05, + "loss": 0.5781, + "step": 8256 + }, + { + "epoch": 22.498637602179837, + "grad_norm": 10.331132888793945, + "learning_rate": 1.8071351125522372e-05, + "loss": 0.6402, + "step": 8257 + }, + { + "epoch": 22.501362397820163, + "grad_norm": 8.756699562072754, + "learning_rate": 1.8070830098595467e-05, + "loss": 0.5598, + "step": 8258 + }, + { + "epoch": 22.504087193460492, + "grad_norm": 34.18621826171875, + "learning_rate": 1.8070309008813195e-05, + "loss": 0.8003, + "step": 8259 + }, + { + "epoch": 22.506811989100818, + "grad_norm": 8.338065147399902, + "learning_rate": 1.8069787856179618e-05, + "loss": 0.7378, + "step": 8260 + }, + { + "epoch": 22.509536784741144, + "grad_norm": 8.108210563659668, + "learning_rate": 1.806926664069879e-05, + "loss": 0.6598, + "step": 8261 + }, + { + "epoch": 22.51226158038147, + "grad_norm": 8.238025665283203, + "learning_rate": 1.8068745362374774e-05, + "loss": 0.6777, + "step": 8262 + }, + { + "epoch": 22.5149863760218, + "grad_norm": 9.277074813842773, + "learning_rate": 1.806822402121163e-05, + "loss": 0.7857, + "step": 8263 + }, + { + "epoch": 22.517711171662125, + "grad_norm": 8.868127822875977, + "learning_rate": 1.8067702617213415e-05, + "loss": 0.6467, + "step": 8264 + }, + { + "epoch": 22.520435967302454, + "grad_norm": 8.341856956481934, + "learning_rate": 1.8067181150384195e-05, + "loss": 0.7299, + "step": 8265 + }, + { + "epoch": 22.52316076294278, + "grad_norm": 9.665529251098633, + "learning_rate": 1.8066659620728023e-05, + "loss": 0.7332, + "step": 8266 + }, + { + "epoch": 22.525885558583106, + "grad_norm": 9.782292366027832, + "learning_rate": 1.806613802824897e-05, + "loss": 0.6966, + "step": 8267 + }, + { + "epoch": 22.52861035422343, + "grad_norm": 8.606857299804688, + "learning_rate": 1.8065616372951093e-05, + "loss": 0.722, + "step": 8268 + }, + { + "epoch": 22.53133514986376, + "grad_norm": 11.900496482849121, + "learning_rate": 1.8065094654838452e-05, + "loss": 0.8167, + "step": 8269 + }, + { + "epoch": 22.534059945504087, + "grad_norm": 8.272493362426758, + "learning_rate": 1.8064572873915117e-05, + "loss": 0.5896, + "step": 8270 + }, + { + "epoch": 22.536784741144416, + "grad_norm": 8.059184074401855, + "learning_rate": 1.8064051030185145e-05, + "loss": 1.0009, + "step": 8271 + }, + { + "epoch": 22.539509536784742, + "grad_norm": 8.604249000549316, + "learning_rate": 1.8063529123652604e-05, + "loss": 0.662, + "step": 8272 + }, + { + "epoch": 22.542234332425068, + "grad_norm": 7.399803638458252, + "learning_rate": 1.8063007154321558e-05, + "loss": 0.6537, + "step": 8273 + }, + { + "epoch": 22.544959128065393, + "grad_norm": 8.598675727844238, + "learning_rate": 1.8062485122196074e-05, + "loss": 0.7892, + "step": 8274 + }, + { + "epoch": 22.547683923705723, + "grad_norm": 7.8193583488464355, + "learning_rate": 1.806196302728021e-05, + "loss": 0.8136, + "step": 8275 + }, + { + "epoch": 22.55040871934605, + "grad_norm": 9.113085746765137, + "learning_rate": 1.8061440869578043e-05, + "loss": 0.699, + "step": 8276 + }, + { + "epoch": 22.553133514986374, + "grad_norm": 8.494874954223633, + "learning_rate": 1.8060918649093634e-05, + "loss": 0.6088, + "step": 8277 + }, + { + "epoch": 22.555858310626704, + "grad_norm": 8.600625038146973, + "learning_rate": 1.8060396365831046e-05, + "loss": 0.6802, + "step": 8278 + }, + { + "epoch": 22.55858310626703, + "grad_norm": 8.80474853515625, + "learning_rate": 1.8059874019794352e-05, + "loss": 0.6677, + "step": 8279 + }, + { + "epoch": 22.561307901907355, + "grad_norm": 8.594862937927246, + "learning_rate": 1.8059351610987617e-05, + "loss": 0.8966, + "step": 8280 + }, + { + "epoch": 22.564032697547685, + "grad_norm": 9.526464462280273, + "learning_rate": 1.8058829139414915e-05, + "loss": 0.6548, + "step": 8281 + }, + { + "epoch": 22.56675749318801, + "grad_norm": 8.03078842163086, + "learning_rate": 1.805830660508031e-05, + "loss": 0.7498, + "step": 8282 + }, + { + "epoch": 22.569482288828336, + "grad_norm": 9.00503921508789, + "learning_rate": 1.805778400798787e-05, + "loss": 0.7373, + "step": 8283 + }, + { + "epoch": 22.572207084468666, + "grad_norm": 11.846492767333984, + "learning_rate": 1.805726134814167e-05, + "loss": 0.8224, + "step": 8284 + }, + { + "epoch": 22.57493188010899, + "grad_norm": 8.72476577758789, + "learning_rate": 1.8056738625545778e-05, + "loss": 0.6932, + "step": 8285 + }, + { + "epoch": 22.577656675749317, + "grad_norm": 6.827003479003906, + "learning_rate": 1.8056215840204262e-05, + "loss": 0.6933, + "step": 8286 + }, + { + "epoch": 22.580381471389646, + "grad_norm": 7.064388275146484, + "learning_rate": 1.80556929921212e-05, + "loss": 0.6964, + "step": 8287 + }, + { + "epoch": 22.583106267029972, + "grad_norm": 7.903183460235596, + "learning_rate": 1.8055170081300656e-05, + "loss": 0.5508, + "step": 8288 + }, + { + "epoch": 22.585831062670298, + "grad_norm": 9.286689758300781, + "learning_rate": 1.805464710774671e-05, + "loss": 0.8115, + "step": 8289 + }, + { + "epoch": 22.588555858310627, + "grad_norm": 12.02190113067627, + "learning_rate": 1.805412407146343e-05, + "loss": 0.7172, + "step": 8290 + }, + { + "epoch": 22.591280653950953, + "grad_norm": 6.979458332061768, + "learning_rate": 1.805360097245489e-05, + "loss": 0.6827, + "step": 8291 + }, + { + "epoch": 22.59400544959128, + "grad_norm": 8.05056381225586, + "learning_rate": 1.8053077810725167e-05, + "loss": 0.7211, + "step": 8292 + }, + { + "epoch": 22.59673024523161, + "grad_norm": 42.04249954223633, + "learning_rate": 1.8052554586278335e-05, + "loss": 0.6968, + "step": 8293 + }, + { + "epoch": 22.599455040871934, + "grad_norm": 9.809717178344727, + "learning_rate": 1.8052031299118465e-05, + "loss": 0.6751, + "step": 8294 + }, + { + "epoch": 22.60217983651226, + "grad_norm": 10.563461303710938, + "learning_rate": 1.805150794924963e-05, + "loss": 0.8352, + "step": 8295 + }, + { + "epoch": 22.60490463215259, + "grad_norm": 10.033594131469727, + "learning_rate": 1.8050984536675918e-05, + "loss": 0.7987, + "step": 8296 + }, + { + "epoch": 22.607629427792915, + "grad_norm": 8.315168380737305, + "learning_rate": 1.8050461061401394e-05, + "loss": 0.7013, + "step": 8297 + }, + { + "epoch": 22.61035422343324, + "grad_norm": 12.972036361694336, + "learning_rate": 1.8049937523430138e-05, + "loss": 0.7091, + "step": 8298 + }, + { + "epoch": 22.61307901907357, + "grad_norm": 9.643797874450684, + "learning_rate": 1.8049413922766227e-05, + "loss": 0.7911, + "step": 8299 + }, + { + "epoch": 22.615803814713896, + "grad_norm": 9.095795631408691, + "learning_rate": 1.804889025941374e-05, + "loss": 0.6661, + "step": 8300 + }, + { + "epoch": 22.618528610354222, + "grad_norm": 9.258108139038086, + "learning_rate": 1.8048366533376754e-05, + "loss": 0.6235, + "step": 8301 + }, + { + "epoch": 22.62125340599455, + "grad_norm": 9.524581909179688, + "learning_rate": 1.804784274465935e-05, + "loss": 0.8983, + "step": 8302 + }, + { + "epoch": 22.623978201634877, + "grad_norm": 10.910232543945312, + "learning_rate": 1.8047318893265606e-05, + "loss": 0.6393, + "step": 8303 + }, + { + "epoch": 22.626702997275203, + "grad_norm": 11.33791732788086, + "learning_rate": 1.80467949791996e-05, + "loss": 0.7798, + "step": 8304 + }, + { + "epoch": 22.629427792915532, + "grad_norm": 8.183943748474121, + "learning_rate": 1.8046271002465416e-05, + "loss": 0.7988, + "step": 8305 + }, + { + "epoch": 22.632152588555858, + "grad_norm": 9.401528358459473, + "learning_rate": 1.804574696306713e-05, + "loss": 0.7225, + "step": 8306 + }, + { + "epoch": 22.634877384196184, + "grad_norm": 9.101771354675293, + "learning_rate": 1.8045222861008826e-05, + "loss": 0.584, + "step": 8307 + }, + { + "epoch": 22.637602179836513, + "grad_norm": 8.446800231933594, + "learning_rate": 1.8044698696294586e-05, + "loss": 0.6541, + "step": 8308 + }, + { + "epoch": 22.64032697547684, + "grad_norm": 10.920446395874023, + "learning_rate": 1.804417446892849e-05, + "loss": 0.6578, + "step": 8309 + }, + { + "epoch": 22.643051771117165, + "grad_norm": 9.614753723144531, + "learning_rate": 1.8043650178914624e-05, + "loss": 0.7683, + "step": 8310 + }, + { + "epoch": 22.645776566757494, + "grad_norm": 9.82983684539795, + "learning_rate": 1.8043125826257067e-05, + "loss": 0.7668, + "step": 8311 + }, + { + "epoch": 22.64850136239782, + "grad_norm": 8.423670768737793, + "learning_rate": 1.8042601410959907e-05, + "loss": 0.8746, + "step": 8312 + }, + { + "epoch": 22.651226158038146, + "grad_norm": 8.503253936767578, + "learning_rate": 1.8042076933027228e-05, + "loss": 0.6849, + "step": 8313 + }, + { + "epoch": 22.653950953678475, + "grad_norm": 9.42237377166748, + "learning_rate": 1.804155239246311e-05, + "loss": 0.701, + "step": 8314 + }, + { + "epoch": 22.6566757493188, + "grad_norm": 10.920177459716797, + "learning_rate": 1.8041027789271642e-05, + "loss": 0.6328, + "step": 8315 + }, + { + "epoch": 22.659400544959126, + "grad_norm": 7.157051086425781, + "learning_rate": 1.8040503123456905e-05, + "loss": 0.88, + "step": 8316 + }, + { + "epoch": 22.662125340599456, + "grad_norm": 7.44293737411499, + "learning_rate": 1.8039978395022993e-05, + "loss": 0.7865, + "step": 8317 + }, + { + "epoch": 22.66485013623978, + "grad_norm": 10.239413261413574, + "learning_rate": 1.8039453603973984e-05, + "loss": 0.7601, + "step": 8318 + }, + { + "epoch": 22.667574931880107, + "grad_norm": 9.254770278930664, + "learning_rate": 1.803892875031397e-05, + "loss": 0.7531, + "step": 8319 + }, + { + "epoch": 22.670299727520437, + "grad_norm": 8.593079566955566, + "learning_rate": 1.803840383404704e-05, + "loss": 0.7659, + "step": 8320 + }, + { + "epoch": 22.673024523160763, + "grad_norm": 8.502016067504883, + "learning_rate": 1.8037878855177276e-05, + "loss": 0.9703, + "step": 8321 + }, + { + "epoch": 22.67574931880109, + "grad_norm": 9.36688232421875, + "learning_rate": 1.8037353813708773e-05, + "loss": 0.8094, + "step": 8322 + }, + { + "epoch": 22.678474114441418, + "grad_norm": 9.845867156982422, + "learning_rate": 1.8036828709645616e-05, + "loss": 0.6603, + "step": 8323 + }, + { + "epoch": 22.681198910081743, + "grad_norm": 7.752012252807617, + "learning_rate": 1.8036303542991898e-05, + "loss": 0.689, + "step": 8324 + }, + { + "epoch": 22.68392370572207, + "grad_norm": 8.684884071350098, + "learning_rate": 1.8035778313751704e-05, + "loss": 0.7348, + "step": 8325 + }, + { + "epoch": 22.6866485013624, + "grad_norm": 14.845547676086426, + "learning_rate": 1.803525302192913e-05, + "loss": 0.7791, + "step": 8326 + }, + { + "epoch": 22.689373297002724, + "grad_norm": 10.740171432495117, + "learning_rate": 1.803472766752826e-05, + "loss": 0.7183, + "step": 8327 + }, + { + "epoch": 22.69209809264305, + "grad_norm": 9.001082420349121, + "learning_rate": 1.8034202250553193e-05, + "loss": 0.7847, + "step": 8328 + }, + { + "epoch": 22.69482288828338, + "grad_norm": 8.427489280700684, + "learning_rate": 1.8033676771008014e-05, + "loss": 0.7919, + "step": 8329 + }, + { + "epoch": 22.697547683923705, + "grad_norm": 9.384603500366211, + "learning_rate": 1.803315122889682e-05, + "loss": 0.5674, + "step": 8330 + }, + { + "epoch": 22.70027247956403, + "grad_norm": 7.615623950958252, + "learning_rate": 1.8032625624223708e-05, + "loss": 0.7269, + "step": 8331 + }, + { + "epoch": 22.70299727520436, + "grad_norm": 7.652527809143066, + "learning_rate": 1.803209995699276e-05, + "loss": 0.5839, + "step": 8332 + }, + { + "epoch": 22.705722070844686, + "grad_norm": 8.273387908935547, + "learning_rate": 1.8031574227208078e-05, + "loss": 0.611, + "step": 8333 + }, + { + "epoch": 22.708446866485012, + "grad_norm": 9.620495796203613, + "learning_rate": 1.8031048434873754e-05, + "loss": 0.8767, + "step": 8334 + }, + { + "epoch": 22.71117166212534, + "grad_norm": 10.494977951049805, + "learning_rate": 1.8030522579993884e-05, + "loss": 0.6519, + "step": 8335 + }, + { + "epoch": 22.713896457765667, + "grad_norm": 9.045083999633789, + "learning_rate": 1.802999666257256e-05, + "loss": 0.6703, + "step": 8336 + }, + { + "epoch": 22.716621253405993, + "grad_norm": 7.966055393218994, + "learning_rate": 1.8029470682613886e-05, + "loss": 0.8085, + "step": 8337 + }, + { + "epoch": 22.719346049046322, + "grad_norm": 9.901015281677246, + "learning_rate": 1.8028944640121948e-05, + "loss": 0.7672, + "step": 8338 + }, + { + "epoch": 22.722070844686648, + "grad_norm": 11.238534927368164, + "learning_rate": 1.8028418535100848e-05, + "loss": 0.6296, + "step": 8339 + }, + { + "epoch": 22.724795640326974, + "grad_norm": 9.268028259277344, + "learning_rate": 1.8027892367554686e-05, + "loss": 0.6449, + "step": 8340 + }, + { + "epoch": 22.727520435967303, + "grad_norm": 10.056122779846191, + "learning_rate": 1.8027366137487555e-05, + "loss": 0.7068, + "step": 8341 + }, + { + "epoch": 22.73024523160763, + "grad_norm": 8.317461967468262, + "learning_rate": 1.8026839844903552e-05, + "loss": 0.6533, + "step": 8342 + }, + { + "epoch": 22.732970027247955, + "grad_norm": 18.117374420166016, + "learning_rate": 1.8026313489806783e-05, + "loss": 0.6644, + "step": 8343 + }, + { + "epoch": 22.735694822888284, + "grad_norm": 11.009692192077637, + "learning_rate": 1.802578707220134e-05, + "loss": 0.6713, + "step": 8344 + }, + { + "epoch": 22.73841961852861, + "grad_norm": 7.9983367919921875, + "learning_rate": 1.8025260592091326e-05, + "loss": 0.8015, + "step": 8345 + }, + { + "epoch": 22.741144414168936, + "grad_norm": 8.074543952941895, + "learning_rate": 1.8024734049480843e-05, + "loss": 0.7056, + "step": 8346 + }, + { + "epoch": 22.743869209809265, + "grad_norm": 12.755304336547852, + "learning_rate": 1.8024207444373988e-05, + "loss": 0.7308, + "step": 8347 + }, + { + "epoch": 22.74659400544959, + "grad_norm": 8.259418487548828, + "learning_rate": 1.802368077677486e-05, + "loss": 0.6225, + "step": 8348 + }, + { + "epoch": 22.749318801089917, + "grad_norm": 10.191117286682129, + "learning_rate": 1.802315404668757e-05, + "loss": 0.7797, + "step": 8349 + }, + { + "epoch": 22.752043596730246, + "grad_norm": 7.531361103057861, + "learning_rate": 1.802262725411621e-05, + "loss": 0.7404, + "step": 8350 + }, + { + "epoch": 22.754768392370572, + "grad_norm": 8.780338287353516, + "learning_rate": 1.802210039906489e-05, + "loss": 0.7735, + "step": 8351 + }, + { + "epoch": 22.757493188010898, + "grad_norm": 10.208608627319336, + "learning_rate": 1.8021573481537712e-05, + "loss": 0.8137, + "step": 8352 + }, + { + "epoch": 22.760217983651227, + "grad_norm": 11.209440231323242, + "learning_rate": 1.8021046501538774e-05, + "loss": 0.6912, + "step": 8353 + }, + { + "epoch": 22.762942779291553, + "grad_norm": 10.841713905334473, + "learning_rate": 1.8020519459072186e-05, + "loss": 0.7172, + "step": 8354 + }, + { + "epoch": 22.76566757493188, + "grad_norm": 7.741214752197266, + "learning_rate": 1.801999235414205e-05, + "loss": 0.8362, + "step": 8355 + }, + { + "epoch": 22.768392370572208, + "grad_norm": 8.230745315551758, + "learning_rate": 1.801946518675247e-05, + "loss": 0.7798, + "step": 8356 + }, + { + "epoch": 22.771117166212534, + "grad_norm": 9.219021797180176, + "learning_rate": 1.8018937956907556e-05, + "loss": 0.7969, + "step": 8357 + }, + { + "epoch": 22.77384196185286, + "grad_norm": 7.021849632263184, + "learning_rate": 1.8018410664611413e-05, + "loss": 0.8274, + "step": 8358 + }, + { + "epoch": 22.77656675749319, + "grad_norm": 8.705036163330078, + "learning_rate": 1.801788330986814e-05, + "loss": 0.7939, + "step": 8359 + }, + { + "epoch": 22.779291553133515, + "grad_norm": 8.407700538635254, + "learning_rate": 1.8017355892681855e-05, + "loss": 0.6484, + "step": 8360 + }, + { + "epoch": 22.78201634877384, + "grad_norm": 10.441157341003418, + "learning_rate": 1.8016828413056657e-05, + "loss": 0.6018, + "step": 8361 + }, + { + "epoch": 22.78474114441417, + "grad_norm": 15.836782455444336, + "learning_rate": 1.8016300870996657e-05, + "loss": 0.7433, + "step": 8362 + }, + { + "epoch": 22.787465940054496, + "grad_norm": 7.165671348571777, + "learning_rate": 1.8015773266505968e-05, + "loss": 0.6499, + "step": 8363 + }, + { + "epoch": 22.79019073569482, + "grad_norm": 7.884844779968262, + "learning_rate": 1.801524559958869e-05, + "loss": 0.7734, + "step": 8364 + }, + { + "epoch": 22.79291553133515, + "grad_norm": 8.301671028137207, + "learning_rate": 1.801471787024894e-05, + "loss": 0.7458, + "step": 8365 + }, + { + "epoch": 22.795640326975477, + "grad_norm": 8.874147415161133, + "learning_rate": 1.8014190078490827e-05, + "loss": 0.818, + "step": 8366 + }, + { + "epoch": 22.798365122615802, + "grad_norm": 8.567561149597168, + "learning_rate": 1.8013662224318454e-05, + "loss": 0.6621, + "step": 8367 + }, + { + "epoch": 22.80108991825613, + "grad_norm": 8.372900009155273, + "learning_rate": 1.801313430773594e-05, + "loss": 0.7499, + "step": 8368 + }, + { + "epoch": 22.803814713896458, + "grad_norm": 10.487556457519531, + "learning_rate": 1.8012606328747396e-05, + "loss": 0.7626, + "step": 8369 + }, + { + "epoch": 22.806539509536783, + "grad_norm": 8.268380165100098, + "learning_rate": 1.801207828735693e-05, + "loss": 0.6166, + "step": 8370 + }, + { + "epoch": 22.809264305177113, + "grad_norm": 9.076476097106934, + "learning_rate": 1.801155018356866e-05, + "loss": 0.9066, + "step": 8371 + }, + { + "epoch": 22.81198910081744, + "grad_norm": 7.709597110748291, + "learning_rate": 1.801102201738669e-05, + "loss": 0.7554, + "step": 8372 + }, + { + "epoch": 22.814713896457764, + "grad_norm": 7.452513694763184, + "learning_rate": 1.801049378881514e-05, + "loss": 0.8503, + "step": 8373 + }, + { + "epoch": 22.817438692098094, + "grad_norm": 12.326823234558105, + "learning_rate": 1.8009965497858122e-05, + "loss": 0.8734, + "step": 8374 + }, + { + "epoch": 22.82016348773842, + "grad_norm": 8.573702812194824, + "learning_rate": 1.8009437144519754e-05, + "loss": 0.7109, + "step": 8375 + }, + { + "epoch": 22.822888283378745, + "grad_norm": 9.0914306640625, + "learning_rate": 1.800890872880414e-05, + "loss": 0.7036, + "step": 8376 + }, + { + "epoch": 22.825613079019075, + "grad_norm": 7.493348121643066, + "learning_rate": 1.8008380250715407e-05, + "loss": 0.7402, + "step": 8377 + }, + { + "epoch": 22.8283378746594, + "grad_norm": 7.073947906494141, + "learning_rate": 1.8007851710257665e-05, + "loss": 0.7428, + "step": 8378 + }, + { + "epoch": 22.831062670299726, + "grad_norm": 7.560627460479736, + "learning_rate": 1.8007323107435036e-05, + "loss": 0.7723, + "step": 8379 + }, + { + "epoch": 22.833787465940055, + "grad_norm": 11.093255043029785, + "learning_rate": 1.8006794442251628e-05, + "loss": 0.6369, + "step": 8380 + }, + { + "epoch": 22.83651226158038, + "grad_norm": 10.050905227661133, + "learning_rate": 1.8006265714711563e-05, + "loss": 0.7341, + "step": 8381 + }, + { + "epoch": 22.839237057220707, + "grad_norm": 6.6332011222839355, + "learning_rate": 1.800573692481896e-05, + "loss": 0.6653, + "step": 8382 + }, + { + "epoch": 22.841961852861036, + "grad_norm": 10.797080993652344, + "learning_rate": 1.8005208072577934e-05, + "loss": 0.7542, + "step": 8383 + }, + { + "epoch": 22.844686648501362, + "grad_norm": 7.66061544418335, + "learning_rate": 1.8004679157992603e-05, + "loss": 0.6463, + "step": 8384 + }, + { + "epoch": 22.847411444141688, + "grad_norm": 9.29662036895752, + "learning_rate": 1.8004150181067092e-05, + "loss": 0.6167, + "step": 8385 + }, + { + "epoch": 22.850136239782017, + "grad_norm": 8.294990539550781, + "learning_rate": 1.8003621141805515e-05, + "loss": 0.8214, + "step": 8386 + }, + { + "epoch": 22.852861035422343, + "grad_norm": 9.719687461853027, + "learning_rate": 1.8003092040211997e-05, + "loss": 0.7599, + "step": 8387 + }, + { + "epoch": 22.85558583106267, + "grad_norm": 6.939882755279541, + "learning_rate": 1.8002562876290653e-05, + "loss": 0.6698, + "step": 8388 + }, + { + "epoch": 22.858310626703, + "grad_norm": 7.773337364196777, + "learning_rate": 1.8002033650045608e-05, + "loss": 0.7798, + "step": 8389 + }, + { + "epoch": 22.861035422343324, + "grad_norm": 5.989284992218018, + "learning_rate": 1.800150436148098e-05, + "loss": 0.8341, + "step": 8390 + }, + { + "epoch": 22.86376021798365, + "grad_norm": 8.706110000610352, + "learning_rate": 1.8000975010600896e-05, + "loss": 0.6805, + "step": 8391 + }, + { + "epoch": 22.86648501362398, + "grad_norm": 8.234627723693848, + "learning_rate": 1.8000445597409476e-05, + "loss": 0.7802, + "step": 8392 + }, + { + "epoch": 22.869209809264305, + "grad_norm": 8.230191230773926, + "learning_rate": 1.7999916121910844e-05, + "loss": 0.9098, + "step": 8393 + }, + { + "epoch": 22.87193460490463, + "grad_norm": 9.947519302368164, + "learning_rate": 1.799938658410912e-05, + "loss": 0.6981, + "step": 8394 + }, + { + "epoch": 22.87465940054496, + "grad_norm": 8.276824951171875, + "learning_rate": 1.7998856984008435e-05, + "loss": 0.625, + "step": 8395 + }, + { + "epoch": 22.877384196185286, + "grad_norm": 9.143417358398438, + "learning_rate": 1.799832732161291e-05, + "loss": 0.7893, + "step": 8396 + }, + { + "epoch": 22.88010899182561, + "grad_norm": 8.269719123840332, + "learning_rate": 1.7997797596926663e-05, + "loss": 0.6224, + "step": 8397 + }, + { + "epoch": 22.88283378746594, + "grad_norm": 12.5256929397583, + "learning_rate": 1.799726780995383e-05, + "loss": 0.705, + "step": 8398 + }, + { + "epoch": 22.885558583106267, + "grad_norm": 7.561325550079346, + "learning_rate": 1.799673796069853e-05, + "loss": 0.6573, + "step": 8399 + }, + { + "epoch": 22.888283378746593, + "grad_norm": 8.696834564208984, + "learning_rate": 1.7996208049164893e-05, + "loss": 0.8337, + "step": 8400 + }, + { + "epoch": 22.891008174386922, + "grad_norm": 12.15063190460205, + "learning_rate": 1.7995678075357046e-05, + "loss": 0.9536, + "step": 8401 + }, + { + "epoch": 22.893732970027248, + "grad_norm": 11.010416030883789, + "learning_rate": 1.7995148039279114e-05, + "loss": 0.6628, + "step": 8402 + }, + { + "epoch": 22.896457765667574, + "grad_norm": 27.363561630249023, + "learning_rate": 1.799461794093523e-05, + "loss": 0.7762, + "step": 8403 + }, + { + "epoch": 22.899182561307903, + "grad_norm": 9.95945930480957, + "learning_rate": 1.7994087780329515e-05, + "loss": 0.7667, + "step": 8404 + }, + { + "epoch": 22.90190735694823, + "grad_norm": 9.571027755737305, + "learning_rate": 1.79935575574661e-05, + "loss": 0.6774, + "step": 8405 + }, + { + "epoch": 22.904632152588555, + "grad_norm": 6.8465681076049805, + "learning_rate": 1.7993027272349122e-05, + "loss": 0.7532, + "step": 8406 + }, + { + "epoch": 22.907356948228884, + "grad_norm": 7.76675271987915, + "learning_rate": 1.79924969249827e-05, + "loss": 0.6217, + "step": 8407 + }, + { + "epoch": 22.91008174386921, + "grad_norm": 7.14346170425415, + "learning_rate": 1.799196651537097e-05, + "loss": 0.8032, + "step": 8408 + }, + { + "epoch": 22.912806539509535, + "grad_norm": 8.59581470489502, + "learning_rate": 1.7991436043518063e-05, + "loss": 0.7368, + "step": 8409 + }, + { + "epoch": 22.915531335149865, + "grad_norm": 9.888229370117188, + "learning_rate": 1.7990905509428113e-05, + "loss": 0.8506, + "step": 8410 + }, + { + "epoch": 22.91825613079019, + "grad_norm": 8.427626609802246, + "learning_rate": 1.7990374913105243e-05, + "loss": 0.7975, + "step": 8411 + }, + { + "epoch": 22.920980926430516, + "grad_norm": 7.949625015258789, + "learning_rate": 1.798984425455359e-05, + "loss": 0.7159, + "step": 8412 + }, + { + "epoch": 22.923705722070846, + "grad_norm": 12.150747299194336, + "learning_rate": 1.798931353377729e-05, + "loss": 0.6206, + "step": 8413 + }, + { + "epoch": 22.92643051771117, + "grad_norm": 11.340509414672852, + "learning_rate": 1.7988782750780474e-05, + "loss": 0.8069, + "step": 8414 + }, + { + "epoch": 22.929155313351497, + "grad_norm": 8.656377792358398, + "learning_rate": 1.7988251905567272e-05, + "loss": 0.6528, + "step": 8415 + }, + { + "epoch": 22.931880108991827, + "grad_norm": 8.10794448852539, + "learning_rate": 1.798772099814182e-05, + "loss": 0.5533, + "step": 8416 + }, + { + "epoch": 22.934604904632153, + "grad_norm": 6.618900299072266, + "learning_rate": 1.7987190028508258e-05, + "loss": 0.7542, + "step": 8417 + }, + { + "epoch": 22.93732970027248, + "grad_norm": 10.989508628845215, + "learning_rate": 1.7986658996670716e-05, + "loss": 0.6791, + "step": 8418 + }, + { + "epoch": 22.940054495912808, + "grad_norm": 7.508787155151367, + "learning_rate": 1.798612790263333e-05, + "loss": 0.7457, + "step": 8419 + }, + { + "epoch": 22.942779291553133, + "grad_norm": 11.940625190734863, + "learning_rate": 1.7985596746400234e-05, + "loss": 0.7559, + "step": 8420 + }, + { + "epoch": 22.94550408719346, + "grad_norm": 9.415892601013184, + "learning_rate": 1.7985065527975574e-05, + "loss": 0.86, + "step": 8421 + }, + { + "epoch": 22.94822888283379, + "grad_norm": 9.412283897399902, + "learning_rate": 1.798453424736348e-05, + "loss": 0.707, + "step": 8422 + }, + { + "epoch": 22.950953678474114, + "grad_norm": 7.368431568145752, + "learning_rate": 1.7984002904568085e-05, + "loss": 0.5997, + "step": 8423 + }, + { + "epoch": 22.95367847411444, + "grad_norm": 8.547812461853027, + "learning_rate": 1.7983471499593536e-05, + "loss": 0.758, + "step": 8424 + }, + { + "epoch": 22.95640326975477, + "grad_norm": 8.5846586227417, + "learning_rate": 1.7982940032443967e-05, + "loss": 0.7478, + "step": 8425 + }, + { + "epoch": 22.959128065395095, + "grad_norm": 15.388944625854492, + "learning_rate": 1.7982408503123518e-05, + "loss": 0.7078, + "step": 8426 + }, + { + "epoch": 22.96185286103542, + "grad_norm": 7.916131496429443, + "learning_rate": 1.7981876911636325e-05, + "loss": 0.6588, + "step": 8427 + }, + { + "epoch": 22.96457765667575, + "grad_norm": 8.411246299743652, + "learning_rate": 1.7981345257986537e-05, + "loss": 0.7148, + "step": 8428 + }, + { + "epoch": 22.967302452316076, + "grad_norm": 8.674823760986328, + "learning_rate": 1.798081354217829e-05, + "loss": 0.7478, + "step": 8429 + }, + { + "epoch": 22.970027247956402, + "grad_norm": 8.647583961486816, + "learning_rate": 1.7980281764215716e-05, + "loss": 0.7847, + "step": 8430 + }, + { + "epoch": 22.97275204359673, + "grad_norm": 12.102951049804688, + "learning_rate": 1.797974992410297e-05, + "loss": 0.9033, + "step": 8431 + }, + { + "epoch": 22.975476839237057, + "grad_norm": 8.523092269897461, + "learning_rate": 1.797921802184419e-05, + "loss": 0.6737, + "step": 8432 + }, + { + "epoch": 22.978201634877383, + "grad_norm": 9.005290031433105, + "learning_rate": 1.7978686057443514e-05, + "loss": 0.7683, + "step": 8433 + }, + { + "epoch": 22.980926430517712, + "grad_norm": 14.410584449768066, + "learning_rate": 1.797815403090509e-05, + "loss": 0.6978, + "step": 8434 + }, + { + "epoch": 22.983651226158038, + "grad_norm": 8.908540725708008, + "learning_rate": 1.7977621942233057e-05, + "loss": 0.8822, + "step": 8435 + }, + { + "epoch": 22.986376021798364, + "grad_norm": 9.658884048461914, + "learning_rate": 1.797708979143156e-05, + "loss": 0.9028, + "step": 8436 + }, + { + "epoch": 22.989100817438693, + "grad_norm": 9.560940742492676, + "learning_rate": 1.797655757850475e-05, + "loss": 0.733, + "step": 8437 + }, + { + "epoch": 22.99182561307902, + "grad_norm": 8.36474609375, + "learning_rate": 1.797602530345676e-05, + "loss": 0.6675, + "step": 8438 + }, + { + "epoch": 22.994550408719345, + "grad_norm": 7.720761299133301, + "learning_rate": 1.7975492966291743e-05, + "loss": 0.7605, + "step": 8439 + }, + { + "epoch": 22.997275204359674, + "grad_norm": 10.557333946228027, + "learning_rate": 1.7974960567013844e-05, + "loss": 0.8137, + "step": 8440 + }, + { + "epoch": 23.0, + "grad_norm": 7.309525966644287, + "learning_rate": 1.797442810562721e-05, + "loss": 0.5304, + "step": 8441 + }, + { + "epoch": 23.002724795640326, + "grad_norm": 7.120656967163086, + "learning_rate": 1.7973895582135984e-05, + "loss": 0.6416, + "step": 8442 + }, + { + "epoch": 23.005449591280655, + "grad_norm": 7.714159965515137, + "learning_rate": 1.7973362996544318e-05, + "loss": 0.5383, + "step": 8443 + }, + { + "epoch": 23.00817438692098, + "grad_norm": 7.924902439117432, + "learning_rate": 1.7972830348856358e-05, + "loss": 0.6489, + "step": 8444 + }, + { + "epoch": 23.010899182561307, + "grad_norm": 8.31507682800293, + "learning_rate": 1.797229763907625e-05, + "loss": 0.6921, + "step": 8445 + }, + { + "epoch": 23.013623978201636, + "grad_norm": 6.668956756591797, + "learning_rate": 1.797176486720815e-05, + "loss": 0.6844, + "step": 8446 + }, + { + "epoch": 23.016348773841962, + "grad_norm": 7.660555362701416, + "learning_rate": 1.7971232033256197e-05, + "loss": 0.4926, + "step": 8447 + }, + { + "epoch": 23.019073569482288, + "grad_norm": 6.523613929748535, + "learning_rate": 1.7970699137224543e-05, + "loss": 0.6993, + "step": 8448 + }, + { + "epoch": 23.021798365122617, + "grad_norm": 9.737499237060547, + "learning_rate": 1.7970166179117344e-05, + "loss": 0.7983, + "step": 8449 + }, + { + "epoch": 23.024523160762943, + "grad_norm": 7.278012275695801, + "learning_rate": 1.7969633158938745e-05, + "loss": 0.6957, + "step": 8450 + }, + { + "epoch": 23.02724795640327, + "grad_norm": 10.634453773498535, + "learning_rate": 1.79691000766929e-05, + "loss": 0.6973, + "step": 8451 + }, + { + "epoch": 23.029972752043598, + "grad_norm": 8.478558540344238, + "learning_rate": 1.7968566932383968e-05, + "loss": 0.671, + "step": 8452 + }, + { + "epoch": 23.032697547683924, + "grad_norm": 10.252836227416992, + "learning_rate": 1.7968033726016085e-05, + "loss": 0.619, + "step": 8453 + }, + { + "epoch": 23.03542234332425, + "grad_norm": 7.047082424163818, + "learning_rate": 1.7967500457593412e-05, + "loss": 0.6472, + "step": 8454 + }, + { + "epoch": 23.03814713896458, + "grad_norm": 8.522323608398438, + "learning_rate": 1.79669671271201e-05, + "loss": 0.6464, + "step": 8455 + }, + { + "epoch": 23.040871934604905, + "grad_norm": 7.537111759185791, + "learning_rate": 1.796643373460031e-05, + "loss": 0.6147, + "step": 8456 + }, + { + "epoch": 23.04359673024523, + "grad_norm": 7.55095911026001, + "learning_rate": 1.796590028003819e-05, + "loss": 0.6521, + "step": 8457 + }, + { + "epoch": 23.04632152588556, + "grad_norm": 7.395035743713379, + "learning_rate": 1.7965366763437893e-05, + "loss": 0.6871, + "step": 8458 + }, + { + "epoch": 23.049046321525886, + "grad_norm": 8.479537010192871, + "learning_rate": 1.7964833184803576e-05, + "loss": 0.6937, + "step": 8459 + }, + { + "epoch": 23.05177111716621, + "grad_norm": 6.660445690155029, + "learning_rate": 1.7964299544139394e-05, + "loss": 0.5733, + "step": 8460 + }, + { + "epoch": 23.05449591280654, + "grad_norm": 8.537720680236816, + "learning_rate": 1.7963765841449506e-05, + "loss": 0.6393, + "step": 8461 + }, + { + "epoch": 23.057220708446867, + "grad_norm": 9.241690635681152, + "learning_rate": 1.7963232076738063e-05, + "loss": 0.6331, + "step": 8462 + }, + { + "epoch": 23.059945504087192, + "grad_norm": 35.25710678100586, + "learning_rate": 1.7962698250009226e-05, + "loss": 0.646, + "step": 8463 + }, + { + "epoch": 23.06267029972752, + "grad_norm": 7.614792823791504, + "learning_rate": 1.7962164361267152e-05, + "loss": 0.5204, + "step": 8464 + }, + { + "epoch": 23.065395095367847, + "grad_norm": 7.552260398864746, + "learning_rate": 1.7961630410515998e-05, + "loss": 0.5472, + "step": 8465 + }, + { + "epoch": 23.068119891008173, + "grad_norm": 10.231441497802734, + "learning_rate": 1.7961096397759922e-05, + "loss": 0.592, + "step": 8466 + }, + { + "epoch": 23.070844686648503, + "grad_norm": 7.6383843421936035, + "learning_rate": 1.7960562323003087e-05, + "loss": 0.5792, + "step": 8467 + }, + { + "epoch": 23.07356948228883, + "grad_norm": 9.595244407653809, + "learning_rate": 1.7960028186249644e-05, + "loss": 0.693, + "step": 8468 + }, + { + "epoch": 23.076294277929154, + "grad_norm": 9.348398208618164, + "learning_rate": 1.7959493987503757e-05, + "loss": 0.6698, + "step": 8469 + }, + { + "epoch": 23.079019073569484, + "grad_norm": 8.854413032531738, + "learning_rate": 1.795895972676959e-05, + "loss": 0.6348, + "step": 8470 + }, + { + "epoch": 23.08174386920981, + "grad_norm": 8.519789695739746, + "learning_rate": 1.79584254040513e-05, + "loss": 0.5905, + "step": 8471 + }, + { + "epoch": 23.084468664850135, + "grad_norm": 8.251155853271484, + "learning_rate": 1.7957891019353048e-05, + "loss": 0.6971, + "step": 8472 + }, + { + "epoch": 23.087193460490465, + "grad_norm": 9.817055702209473, + "learning_rate": 1.7957356572678998e-05, + "loss": 0.5431, + "step": 8473 + }, + { + "epoch": 23.08991825613079, + "grad_norm": 9.670547485351562, + "learning_rate": 1.7956822064033313e-05, + "loss": 0.6669, + "step": 8474 + }, + { + "epoch": 23.092643051771116, + "grad_norm": 9.475438117980957, + "learning_rate": 1.7956287493420152e-05, + "loss": 0.7317, + "step": 8475 + }, + { + "epoch": 23.095367847411445, + "grad_norm": 8.039822578430176, + "learning_rate": 1.7955752860843678e-05, + "loss": 0.6687, + "step": 8476 + }, + { + "epoch": 23.09809264305177, + "grad_norm": 7.249072074890137, + "learning_rate": 1.795521816630806e-05, + "loss": 0.646, + "step": 8477 + }, + { + "epoch": 23.100817438692097, + "grad_norm": 7.711321830749512, + "learning_rate": 1.7954683409817457e-05, + "loss": 0.5933, + "step": 8478 + }, + { + "epoch": 23.103542234332426, + "grad_norm": 7.8946380615234375, + "learning_rate": 1.7954148591376038e-05, + "loss": 0.6982, + "step": 8479 + }, + { + "epoch": 23.106267029972752, + "grad_norm": 7.7069597244262695, + "learning_rate": 1.7953613710987966e-05, + "loss": 0.5725, + "step": 8480 + }, + { + "epoch": 23.108991825613078, + "grad_norm": 8.600133895874023, + "learning_rate": 1.7953078768657404e-05, + "loss": 0.6288, + "step": 8481 + }, + { + "epoch": 23.111716621253407, + "grad_norm": 7.790313720703125, + "learning_rate": 1.795254376438852e-05, + "loss": 0.6152, + "step": 8482 + }, + { + "epoch": 23.114441416893733, + "grad_norm": 9.687016487121582, + "learning_rate": 1.7952008698185483e-05, + "loss": 0.6984, + "step": 8483 + }, + { + "epoch": 23.11716621253406, + "grad_norm": 8.021065711975098, + "learning_rate": 1.7951473570052457e-05, + "loss": 0.6957, + "step": 8484 + }, + { + "epoch": 23.11989100817439, + "grad_norm": 47.138607025146484, + "learning_rate": 1.795093837999361e-05, + "loss": 0.5585, + "step": 8485 + }, + { + "epoch": 23.122615803814714, + "grad_norm": 8.166311264038086, + "learning_rate": 1.795040312801311e-05, + "loss": 0.5601, + "step": 8486 + }, + { + "epoch": 23.12534059945504, + "grad_norm": 8.451225280761719, + "learning_rate": 1.794986781411513e-05, + "loss": 0.677, + "step": 8487 + }, + { + "epoch": 23.12806539509537, + "grad_norm": 9.893058776855469, + "learning_rate": 1.7949332438303834e-05, + "loss": 0.6196, + "step": 8488 + }, + { + "epoch": 23.130790190735695, + "grad_norm": 7.625050067901611, + "learning_rate": 1.7948797000583394e-05, + "loss": 0.6169, + "step": 8489 + }, + { + "epoch": 23.13351498637602, + "grad_norm": 9.372100830078125, + "learning_rate": 1.7948261500957974e-05, + "loss": 0.6243, + "step": 8490 + }, + { + "epoch": 23.13623978201635, + "grad_norm": 10.169224739074707, + "learning_rate": 1.7947725939431756e-05, + "loss": 0.7031, + "step": 8491 + }, + { + "epoch": 23.138964577656676, + "grad_norm": 8.801020622253418, + "learning_rate": 1.7947190316008896e-05, + "loss": 0.6228, + "step": 8492 + }, + { + "epoch": 23.141689373297, + "grad_norm": 12.136094093322754, + "learning_rate": 1.7946654630693583e-05, + "loss": 0.7136, + "step": 8493 + }, + { + "epoch": 23.14441416893733, + "grad_norm": 7.939266204833984, + "learning_rate": 1.7946118883489974e-05, + "loss": 0.7758, + "step": 8494 + }, + { + "epoch": 23.147138964577657, + "grad_norm": 7.835748195648193, + "learning_rate": 1.7945583074402246e-05, + "loss": 0.6205, + "step": 8495 + }, + { + "epoch": 23.149863760217983, + "grad_norm": 10.074135780334473, + "learning_rate": 1.7945047203434573e-05, + "loss": 0.6698, + "step": 8496 + }, + { + "epoch": 23.152588555858312, + "grad_norm": 9.422436714172363, + "learning_rate": 1.794451127059113e-05, + "loss": 0.79, + "step": 8497 + }, + { + "epoch": 23.155313351498638, + "grad_norm": 8.241384506225586, + "learning_rate": 1.7943975275876088e-05, + "loss": 0.636, + "step": 8498 + }, + { + "epoch": 23.158038147138964, + "grad_norm": 8.339426040649414, + "learning_rate": 1.7943439219293623e-05, + "loss": 0.692, + "step": 8499 + }, + { + "epoch": 23.160762942779293, + "grad_norm": 8.311019897460938, + "learning_rate": 1.794290310084791e-05, + "loss": 0.5696, + "step": 8500 + }, + { + "epoch": 23.16348773841962, + "grad_norm": 8.582189559936523, + "learning_rate": 1.794236692054312e-05, + "loss": 0.5953, + "step": 8501 + }, + { + "epoch": 23.166212534059945, + "grad_norm": 7.771618366241455, + "learning_rate": 1.7941830678383433e-05, + "loss": 0.8604, + "step": 8502 + }, + { + "epoch": 23.168937329700274, + "grad_norm": 10.156007766723633, + "learning_rate": 1.794129437437303e-05, + "loss": 0.6352, + "step": 8503 + }, + { + "epoch": 23.1716621253406, + "grad_norm": 10.292689323425293, + "learning_rate": 1.7940758008516074e-05, + "loss": 0.721, + "step": 8504 + }, + { + "epoch": 23.174386920980925, + "grad_norm": 8.468525886535645, + "learning_rate": 1.7940221580816755e-05, + "loss": 0.5929, + "step": 8505 + }, + { + "epoch": 23.177111716621255, + "grad_norm": 8.367538452148438, + "learning_rate": 1.7939685091279244e-05, + "loss": 0.6339, + "step": 8506 + }, + { + "epoch": 23.17983651226158, + "grad_norm": 9.837169647216797, + "learning_rate": 1.7939148539907722e-05, + "loss": 0.6194, + "step": 8507 + }, + { + "epoch": 23.182561307901906, + "grad_norm": 7.640585422515869, + "learning_rate": 1.7938611926706365e-05, + "loss": 0.5526, + "step": 8508 + }, + { + "epoch": 23.185286103542236, + "grad_norm": 7.256917476654053, + "learning_rate": 1.7938075251679356e-05, + "loss": 0.6492, + "step": 8509 + }, + { + "epoch": 23.18801089918256, + "grad_norm": 6.757735252380371, + "learning_rate": 1.793753851483087e-05, + "loss": 0.5229, + "step": 8510 + }, + { + "epoch": 23.190735694822887, + "grad_norm": 10.572715759277344, + "learning_rate": 1.793700171616509e-05, + "loss": 0.7336, + "step": 8511 + }, + { + "epoch": 23.193460490463217, + "grad_norm": 8.248072624206543, + "learning_rate": 1.7936464855686197e-05, + "loss": 0.6858, + "step": 8512 + }, + { + "epoch": 23.196185286103542, + "grad_norm": 8.662367820739746, + "learning_rate": 1.7935927933398374e-05, + "loss": 0.6094, + "step": 8513 + }, + { + "epoch": 23.19891008174387, + "grad_norm": 6.991458415985107, + "learning_rate": 1.7935390949305796e-05, + "loss": 0.789, + "step": 8514 + }, + { + "epoch": 23.201634877384198, + "grad_norm": 8.048157691955566, + "learning_rate": 1.7934853903412648e-05, + "loss": 0.66, + "step": 8515 + }, + { + "epoch": 23.204359673024523, + "grad_norm": 11.361948013305664, + "learning_rate": 1.7934316795723116e-05, + "loss": 0.675, + "step": 8516 + }, + { + "epoch": 23.20708446866485, + "grad_norm": 19.493915557861328, + "learning_rate": 1.793377962624138e-05, + "loss": 0.6782, + "step": 8517 + }, + { + "epoch": 23.20980926430518, + "grad_norm": 7.957698822021484, + "learning_rate": 1.793324239497162e-05, + "loss": 0.5366, + "step": 8518 + }, + { + "epoch": 23.212534059945504, + "grad_norm": 7.149418354034424, + "learning_rate": 1.7932705101918025e-05, + "loss": 0.7745, + "step": 8519 + }, + { + "epoch": 23.21525885558583, + "grad_norm": 9.753764152526855, + "learning_rate": 1.793216774708478e-05, + "loss": 0.5413, + "step": 8520 + }, + { + "epoch": 23.21798365122616, + "grad_norm": 8.978517532348633, + "learning_rate": 1.7931630330476066e-05, + "loss": 0.7794, + "step": 8521 + }, + { + "epoch": 23.220708446866485, + "grad_norm": 10.788363456726074, + "learning_rate": 1.793109285209607e-05, + "loss": 0.6026, + "step": 8522 + }, + { + "epoch": 23.22343324250681, + "grad_norm": 8.073689460754395, + "learning_rate": 1.793055531194898e-05, + "loss": 0.6669, + "step": 8523 + }, + { + "epoch": 23.22615803814714, + "grad_norm": 7.393884181976318, + "learning_rate": 1.793001771003898e-05, + "loss": 0.6308, + "step": 8524 + }, + { + "epoch": 23.228882833787466, + "grad_norm": 9.178787231445312, + "learning_rate": 1.7929480046370257e-05, + "loss": 0.7239, + "step": 8525 + }, + { + "epoch": 23.231607629427792, + "grad_norm": 8.557303428649902, + "learning_rate": 1.7928942320947e-05, + "loss": 0.8069, + "step": 8526 + }, + { + "epoch": 23.23433242506812, + "grad_norm": 7.862518310546875, + "learning_rate": 1.7928404533773394e-05, + "loss": 0.6935, + "step": 8527 + }, + { + "epoch": 23.237057220708447, + "grad_norm": 7.550032138824463, + "learning_rate": 1.7927866684853628e-05, + "loss": 0.5632, + "step": 8528 + }, + { + "epoch": 23.239782016348773, + "grad_norm": 10.641572952270508, + "learning_rate": 1.792732877419189e-05, + "loss": 0.6713, + "step": 8529 + }, + { + "epoch": 23.242506811989102, + "grad_norm": 11.035921096801758, + "learning_rate": 1.7926790801792374e-05, + "loss": 0.7606, + "step": 8530 + }, + { + "epoch": 23.245231607629428, + "grad_norm": 10.768778800964355, + "learning_rate": 1.7926252767659265e-05, + "loss": 0.6884, + "step": 8531 + }, + { + "epoch": 23.247956403269754, + "grad_norm": 8.348357200622559, + "learning_rate": 1.7925714671796754e-05, + "loss": 0.5798, + "step": 8532 + }, + { + "epoch": 23.250681198910083, + "grad_norm": 8.501439094543457, + "learning_rate": 1.7925176514209033e-05, + "loss": 0.721, + "step": 8533 + }, + { + "epoch": 23.25340599455041, + "grad_norm": 8.829363822937012, + "learning_rate": 1.7924638294900292e-05, + "loss": 0.7488, + "step": 8534 + }, + { + "epoch": 23.256130790190735, + "grad_norm": 7.027775287628174, + "learning_rate": 1.7924100013874725e-05, + "loss": 0.7323, + "step": 8535 + }, + { + "epoch": 23.258855585831064, + "grad_norm": 7.892490863800049, + "learning_rate": 1.792356167113652e-05, + "loss": 0.5483, + "step": 8536 + }, + { + "epoch": 23.26158038147139, + "grad_norm": 7.996335983276367, + "learning_rate": 1.792302326668987e-05, + "loss": 0.5439, + "step": 8537 + }, + { + "epoch": 23.264305177111716, + "grad_norm": 11.164660453796387, + "learning_rate": 1.7922484800538973e-05, + "loss": 0.5655, + "step": 8538 + }, + { + "epoch": 23.267029972752045, + "grad_norm": 7.229864120483398, + "learning_rate": 1.7921946272688018e-05, + "loss": 0.6787, + "step": 8539 + }, + { + "epoch": 23.26975476839237, + "grad_norm": 9.329996109008789, + "learning_rate": 1.79214076831412e-05, + "loss": 0.6082, + "step": 8540 + }, + { + "epoch": 23.272479564032697, + "grad_norm": 7.63694429397583, + "learning_rate": 1.7920869031902715e-05, + "loss": 0.6626, + "step": 8541 + }, + { + "epoch": 23.275204359673026, + "grad_norm": 8.810453414916992, + "learning_rate": 1.792033031897676e-05, + "loss": 0.5375, + "step": 8542 + }, + { + "epoch": 23.277929155313352, + "grad_norm": 8.408686637878418, + "learning_rate": 1.791979154436752e-05, + "loss": 0.74, + "step": 8543 + }, + { + "epoch": 23.280653950953678, + "grad_norm": 8.32150650024414, + "learning_rate": 1.7919252708079203e-05, + "loss": 0.6957, + "step": 8544 + }, + { + "epoch": 23.283378746594007, + "grad_norm": 7.6873040199279785, + "learning_rate": 1.7918713810116e-05, + "loss": 0.6849, + "step": 8545 + }, + { + "epoch": 23.286103542234333, + "grad_norm": 15.796939849853516, + "learning_rate": 1.791817485048211e-05, + "loss": 0.6536, + "step": 8546 + }, + { + "epoch": 23.28882833787466, + "grad_norm": 10.190418243408203, + "learning_rate": 1.7917635829181726e-05, + "loss": 0.6182, + "step": 8547 + }, + { + "epoch": 23.291553133514988, + "grad_norm": 9.241643905639648, + "learning_rate": 1.7917096746219053e-05, + "loss": 0.607, + "step": 8548 + }, + { + "epoch": 23.294277929155314, + "grad_norm": 7.768148422241211, + "learning_rate": 1.7916557601598283e-05, + "loss": 0.679, + "step": 8549 + }, + { + "epoch": 23.29700272479564, + "grad_norm": 9.539830207824707, + "learning_rate": 1.7916018395323614e-05, + "loss": 0.5195, + "step": 8550 + }, + { + "epoch": 23.29972752043597, + "grad_norm": 7.210759162902832, + "learning_rate": 1.7915479127399255e-05, + "loss": 0.6689, + "step": 8551 + }, + { + "epoch": 23.302452316076295, + "grad_norm": 10.108943939208984, + "learning_rate": 1.7914939797829393e-05, + "loss": 0.8805, + "step": 8552 + }, + { + "epoch": 23.30517711171662, + "grad_norm": 8.475149154663086, + "learning_rate": 1.791440040661824e-05, + "loss": 0.6523, + "step": 8553 + }, + { + "epoch": 23.30790190735695, + "grad_norm": 7.329076766967773, + "learning_rate": 1.7913860953769987e-05, + "loss": 0.5496, + "step": 8554 + }, + { + "epoch": 23.310626702997276, + "grad_norm": 7.7415876388549805, + "learning_rate": 1.791332143928884e-05, + "loss": 0.6384, + "step": 8555 + }, + { + "epoch": 23.3133514986376, + "grad_norm": 9.320038795471191, + "learning_rate": 1.7912781863179005e-05, + "loss": 0.6972, + "step": 8556 + }, + { + "epoch": 23.31607629427793, + "grad_norm": 9.999711990356445, + "learning_rate": 1.7912242225444676e-05, + "loss": 0.7368, + "step": 8557 + }, + { + "epoch": 23.318801089918257, + "grad_norm": 10.375534057617188, + "learning_rate": 1.791170252609006e-05, + "loss": 0.681, + "step": 8558 + }, + { + "epoch": 23.321525885558582, + "grad_norm": 9.925941467285156, + "learning_rate": 1.7911162765119357e-05, + "loss": 0.6501, + "step": 8559 + }, + { + "epoch": 23.32425068119891, + "grad_norm": 9.065058708190918, + "learning_rate": 1.7910622942536777e-05, + "loss": 0.7489, + "step": 8560 + }, + { + "epoch": 23.326975476839237, + "grad_norm": 8.21484088897705, + "learning_rate": 1.7910083058346516e-05, + "loss": 0.8214, + "step": 8561 + }, + { + "epoch": 23.329700272479563, + "grad_norm": 7.954100608825684, + "learning_rate": 1.790954311255279e-05, + "loss": 0.5521, + "step": 8562 + }, + { + "epoch": 23.332425068119893, + "grad_norm": 8.682811737060547, + "learning_rate": 1.790900310515979e-05, + "loss": 0.691, + "step": 8563 + }, + { + "epoch": 23.33514986376022, + "grad_norm": 8.368846893310547, + "learning_rate": 1.790846303617173e-05, + "loss": 0.7624, + "step": 8564 + }, + { + "epoch": 23.337874659400544, + "grad_norm": 7.999691963195801, + "learning_rate": 1.7907922905592813e-05, + "loss": 0.6859, + "step": 8565 + }, + { + "epoch": 23.340599455040874, + "grad_norm": 7.746175289154053, + "learning_rate": 1.790738271342725e-05, + "loss": 0.6075, + "step": 8566 + }, + { + "epoch": 23.3433242506812, + "grad_norm": 7.714305400848389, + "learning_rate": 1.7906842459679242e-05, + "loss": 0.7225, + "step": 8567 + }, + { + "epoch": 23.346049046321525, + "grad_norm": 7.813354969024658, + "learning_rate": 1.7906302144353002e-05, + "loss": 0.6647, + "step": 8568 + }, + { + "epoch": 23.348773841961854, + "grad_norm": 23.70584487915039, + "learning_rate": 1.7905761767452735e-05, + "loss": 0.6464, + "step": 8569 + }, + { + "epoch": 23.35149863760218, + "grad_norm": 11.611759185791016, + "learning_rate": 1.7905221328982647e-05, + "loss": 0.7893, + "step": 8570 + }, + { + "epoch": 23.354223433242506, + "grad_norm": 7.760707378387451, + "learning_rate": 1.790468082894695e-05, + "loss": 0.7317, + "step": 8571 + }, + { + "epoch": 23.356948228882835, + "grad_norm": 8.688565254211426, + "learning_rate": 1.7904140267349856e-05, + "loss": 0.5536, + "step": 8572 + }, + { + "epoch": 23.35967302452316, + "grad_norm": 6.916512489318848, + "learning_rate": 1.7903599644195573e-05, + "loss": 0.6938, + "step": 8573 + }, + { + "epoch": 23.362397820163487, + "grad_norm": 9.440940856933594, + "learning_rate": 1.7903058959488307e-05, + "loss": 0.6481, + "step": 8574 + }, + { + "epoch": 23.365122615803816, + "grad_norm": 9.571310997009277, + "learning_rate": 1.7902518213232273e-05, + "loss": 0.718, + "step": 8575 + }, + { + "epoch": 23.367847411444142, + "grad_norm": 8.1104736328125, + "learning_rate": 1.7901977405431683e-05, + "loss": 0.7656, + "step": 8576 + }, + { + "epoch": 23.370572207084468, + "grad_norm": 8.448812484741211, + "learning_rate": 1.7901436536090747e-05, + "loss": 0.7043, + "step": 8577 + }, + { + "epoch": 23.373297002724797, + "grad_norm": 8.477097511291504, + "learning_rate": 1.7900895605213673e-05, + "loss": 0.6609, + "step": 8578 + }, + { + "epoch": 23.376021798365123, + "grad_norm": 8.596450805664062, + "learning_rate": 1.7900354612804685e-05, + "loss": 0.7032, + "step": 8579 + }, + { + "epoch": 23.37874659400545, + "grad_norm": 8.790950775146484, + "learning_rate": 1.7899813558867985e-05, + "loss": 0.7711, + "step": 8580 + }, + { + "epoch": 23.381471389645778, + "grad_norm": 8.57071590423584, + "learning_rate": 1.7899272443407792e-05, + "loss": 0.6788, + "step": 8581 + }, + { + "epoch": 23.384196185286104, + "grad_norm": 8.83356761932373, + "learning_rate": 1.789873126642832e-05, + "loss": 0.8002, + "step": 8582 + }, + { + "epoch": 23.38692098092643, + "grad_norm": 7.473575115203857, + "learning_rate": 1.7898190027933785e-05, + "loss": 0.5423, + "step": 8583 + }, + { + "epoch": 23.38964577656676, + "grad_norm": 9.0474853515625, + "learning_rate": 1.78976487279284e-05, + "loss": 0.62, + "step": 8584 + }, + { + "epoch": 23.392370572207085, + "grad_norm": 7.830740928649902, + "learning_rate": 1.7897107366416378e-05, + "loss": 0.7531, + "step": 8585 + }, + { + "epoch": 23.39509536784741, + "grad_norm": 7.8416290283203125, + "learning_rate": 1.789656594340194e-05, + "loss": 0.6802, + "step": 8586 + }, + { + "epoch": 23.39782016348774, + "grad_norm": 8.996277809143066, + "learning_rate": 1.78960244588893e-05, + "loss": 0.5889, + "step": 8587 + }, + { + "epoch": 23.400544959128066, + "grad_norm": 8.558965682983398, + "learning_rate": 1.7895482912882673e-05, + "loss": 0.6445, + "step": 8588 + }, + { + "epoch": 23.40326975476839, + "grad_norm": 7.307924747467041, + "learning_rate": 1.7894941305386283e-05, + "loss": 0.7791, + "step": 8589 + }, + { + "epoch": 23.40599455040872, + "grad_norm": 10.23050594329834, + "learning_rate": 1.7894399636404344e-05, + "loss": 0.6134, + "step": 8590 + }, + { + "epoch": 23.408719346049047, + "grad_norm": 8.079825401306152, + "learning_rate": 1.7893857905941074e-05, + "loss": 0.7001, + "step": 8591 + }, + { + "epoch": 23.411444141689373, + "grad_norm": 9.503316879272461, + "learning_rate": 1.789331611400069e-05, + "loss": 0.7207, + "step": 8592 + }, + { + "epoch": 23.414168937329702, + "grad_norm": 7.8776021003723145, + "learning_rate": 1.789277426058742e-05, + "loss": 0.5166, + "step": 8593 + }, + { + "epoch": 23.416893732970028, + "grad_norm": 40.536216735839844, + "learning_rate": 1.7892232345705475e-05, + "loss": 0.7108, + "step": 8594 + }, + { + "epoch": 23.419618528610354, + "grad_norm": 7.9806718826293945, + "learning_rate": 1.7891690369359077e-05, + "loss": 0.6958, + "step": 8595 + }, + { + "epoch": 23.422343324250683, + "grad_norm": 8.904545783996582, + "learning_rate": 1.789114833155245e-05, + "loss": 0.8054, + "step": 8596 + }, + { + "epoch": 23.42506811989101, + "grad_norm": 9.127898216247559, + "learning_rate": 1.7890606232289815e-05, + "loss": 0.7883, + "step": 8597 + }, + { + "epoch": 23.427792915531334, + "grad_norm": 9.511321067810059, + "learning_rate": 1.789006407157539e-05, + "loss": 0.7177, + "step": 8598 + }, + { + "epoch": 23.430517711171664, + "grad_norm": 8.270140647888184, + "learning_rate": 1.78895218494134e-05, + "loss": 0.5883, + "step": 8599 + }, + { + "epoch": 23.43324250681199, + "grad_norm": 7.842483043670654, + "learning_rate": 1.788897956580807e-05, + "loss": 0.6144, + "step": 8600 + }, + { + "epoch": 23.435967302452315, + "grad_norm": 9.526908874511719, + "learning_rate": 1.7888437220763618e-05, + "loss": 0.7385, + "step": 8601 + }, + { + "epoch": 23.438692098092645, + "grad_norm": 8.789389610290527, + "learning_rate": 1.7887894814284274e-05, + "loss": 0.5989, + "step": 8602 + }, + { + "epoch": 23.44141689373297, + "grad_norm": 9.479100227355957, + "learning_rate": 1.7887352346374255e-05, + "loss": 0.6363, + "step": 8603 + }, + { + "epoch": 23.444141689373296, + "grad_norm": 8.337409019470215, + "learning_rate": 1.7886809817037797e-05, + "loss": 0.7091, + "step": 8604 + }, + { + "epoch": 23.446866485013626, + "grad_norm": 7.94667911529541, + "learning_rate": 1.7886267226279114e-05, + "loss": 0.714, + "step": 8605 + }, + { + "epoch": 23.44959128065395, + "grad_norm": 9.154091835021973, + "learning_rate": 1.788572457410243e-05, + "loss": 0.6265, + "step": 8606 + }, + { + "epoch": 23.452316076294277, + "grad_norm": 9.223176956176758, + "learning_rate": 1.7885181860511983e-05, + "loss": 0.702, + "step": 8607 + }, + { + "epoch": 23.455040871934607, + "grad_norm": 7.356810092926025, + "learning_rate": 1.7884639085511996e-05, + "loss": 0.6519, + "step": 8608 + }, + { + "epoch": 23.457765667574932, + "grad_norm": 8.943059921264648, + "learning_rate": 1.7884096249106687e-05, + "loss": 0.667, + "step": 8609 + }, + { + "epoch": 23.460490463215258, + "grad_norm": 9.221323013305664, + "learning_rate": 1.7883553351300292e-05, + "loss": 0.7407, + "step": 8610 + }, + { + "epoch": 23.463215258855588, + "grad_norm": 7.710006237030029, + "learning_rate": 1.788301039209704e-05, + "loss": 0.6475, + "step": 8611 + }, + { + "epoch": 23.465940054495913, + "grad_norm": 8.61248779296875, + "learning_rate": 1.7882467371501156e-05, + "loss": 0.6575, + "step": 8612 + }, + { + "epoch": 23.46866485013624, + "grad_norm": 7.137813568115234, + "learning_rate": 1.788192428951687e-05, + "loss": 0.6826, + "step": 8613 + }, + { + "epoch": 23.47138964577657, + "grad_norm": 7.6610212326049805, + "learning_rate": 1.788138114614841e-05, + "loss": 0.7191, + "step": 8614 + }, + { + "epoch": 23.474114441416894, + "grad_norm": 9.8787841796875, + "learning_rate": 1.7880837941400005e-05, + "loss": 0.7482, + "step": 8615 + }, + { + "epoch": 23.47683923705722, + "grad_norm": 6.708698749542236, + "learning_rate": 1.788029467527589e-05, + "loss": 0.7267, + "step": 8616 + }, + { + "epoch": 23.479564032697546, + "grad_norm": 6.205842971801758, + "learning_rate": 1.7879751347780297e-05, + "loss": 0.5804, + "step": 8617 + }, + { + "epoch": 23.482288828337875, + "grad_norm": 7.933350563049316, + "learning_rate": 1.7879207958917447e-05, + "loss": 0.5801, + "step": 8618 + }, + { + "epoch": 23.4850136239782, + "grad_norm": 9.49789047241211, + "learning_rate": 1.7878664508691586e-05, + "loss": 0.5733, + "step": 8619 + }, + { + "epoch": 23.48773841961853, + "grad_norm": 7.27047061920166, + "learning_rate": 1.7878120997106937e-05, + "loss": 0.546, + "step": 8620 + }, + { + "epoch": 23.490463215258856, + "grad_norm": 9.08828067779541, + "learning_rate": 1.7877577424167734e-05, + "loss": 0.5861, + "step": 8621 + }, + { + "epoch": 23.493188010899182, + "grad_norm": 7.885524272918701, + "learning_rate": 1.7877033789878212e-05, + "loss": 0.8145, + "step": 8622 + }, + { + "epoch": 23.495912806539508, + "grad_norm": 7.435037136077881, + "learning_rate": 1.7876490094242604e-05, + "loss": 0.7148, + "step": 8623 + }, + { + "epoch": 23.498637602179837, + "grad_norm": 7.90762996673584, + "learning_rate": 1.7875946337265143e-05, + "loss": 0.6532, + "step": 8624 + }, + { + "epoch": 23.501362397820163, + "grad_norm": 7.87869930267334, + "learning_rate": 1.787540251895007e-05, + "loss": 0.7826, + "step": 8625 + }, + { + "epoch": 23.504087193460492, + "grad_norm": 6.55080509185791, + "learning_rate": 1.7874858639301616e-05, + "loss": 0.6455, + "step": 8626 + }, + { + "epoch": 23.506811989100818, + "grad_norm": 8.975728034973145, + "learning_rate": 1.7874314698324012e-05, + "loss": 0.72, + "step": 8627 + }, + { + "epoch": 23.509536784741144, + "grad_norm": 10.967278480529785, + "learning_rate": 1.78737706960215e-05, + "loss": 0.7908, + "step": 8628 + }, + { + "epoch": 23.51226158038147, + "grad_norm": 8.755050659179688, + "learning_rate": 1.7873226632398317e-05, + "loss": 0.814, + "step": 8629 + }, + { + "epoch": 23.5149863760218, + "grad_norm": 8.059727668762207, + "learning_rate": 1.7872682507458696e-05, + "loss": 0.7316, + "step": 8630 + }, + { + "epoch": 23.517711171662125, + "grad_norm": 12.241052627563477, + "learning_rate": 1.7872138321206876e-05, + "loss": 0.6984, + "step": 8631 + }, + { + "epoch": 23.520435967302454, + "grad_norm": 9.974397659301758, + "learning_rate": 1.78715940736471e-05, + "loss": 0.6152, + "step": 8632 + }, + { + "epoch": 23.52316076294278, + "grad_norm": 8.978565216064453, + "learning_rate": 1.7871049764783598e-05, + "loss": 0.6549, + "step": 8633 + }, + { + "epoch": 23.525885558583106, + "grad_norm": 10.687780380249023, + "learning_rate": 1.7870505394620617e-05, + "loss": 0.6996, + "step": 8634 + }, + { + "epoch": 23.52861035422343, + "grad_norm": 7.585939884185791, + "learning_rate": 1.7869960963162395e-05, + "loss": 0.5245, + "step": 8635 + }, + { + "epoch": 23.53133514986376, + "grad_norm": 8.184713363647461, + "learning_rate": 1.7869416470413167e-05, + "loss": 0.6719, + "step": 8636 + }, + { + "epoch": 23.534059945504087, + "grad_norm": 9.080817222595215, + "learning_rate": 1.7868871916377178e-05, + "loss": 0.7789, + "step": 8637 + }, + { + "epoch": 23.536784741144416, + "grad_norm": 6.877401351928711, + "learning_rate": 1.7868327301058668e-05, + "loss": 0.5884, + "step": 8638 + }, + { + "epoch": 23.539509536784742, + "grad_norm": 7.515068531036377, + "learning_rate": 1.7867782624461877e-05, + "loss": 0.5229, + "step": 8639 + }, + { + "epoch": 23.542234332425068, + "grad_norm": 7.122920513153076, + "learning_rate": 1.786723788659105e-05, + "loss": 0.7167, + "step": 8640 + }, + { + "epoch": 23.544959128065393, + "grad_norm": 8.047174453735352, + "learning_rate": 1.7866693087450426e-05, + "loss": 0.6377, + "step": 8641 + }, + { + "epoch": 23.547683923705723, + "grad_norm": 7.259688377380371, + "learning_rate": 1.786614822704425e-05, + "loss": 0.6741, + "step": 8642 + }, + { + "epoch": 23.55040871934605, + "grad_norm": 7.659267425537109, + "learning_rate": 1.7865603305376765e-05, + "loss": 0.7208, + "step": 8643 + }, + { + "epoch": 23.553133514986374, + "grad_norm": 6.8070173263549805, + "learning_rate": 1.7865058322452214e-05, + "loss": 0.6266, + "step": 8644 + }, + { + "epoch": 23.555858310626704, + "grad_norm": 7.469305515289307, + "learning_rate": 1.7864513278274843e-05, + "loss": 0.7759, + "step": 8645 + }, + { + "epoch": 23.55858310626703, + "grad_norm": 8.908949851989746, + "learning_rate": 1.7863968172848897e-05, + "loss": 0.5837, + "step": 8646 + }, + { + "epoch": 23.561307901907355, + "grad_norm": 7.560341835021973, + "learning_rate": 1.7863423006178616e-05, + "loss": 0.6711, + "step": 8647 + }, + { + "epoch": 23.564032697547685, + "grad_norm": 7.590961933135986, + "learning_rate": 1.786287777826825e-05, + "loss": 0.6345, + "step": 8648 + }, + { + "epoch": 23.56675749318801, + "grad_norm": 8.51723861694336, + "learning_rate": 1.786233248912205e-05, + "loss": 0.5675, + "step": 8649 + }, + { + "epoch": 23.569482288828336, + "grad_norm": 8.561624526977539, + "learning_rate": 1.7861787138744254e-05, + "loss": 0.7284, + "step": 8650 + }, + { + "epoch": 23.572207084468666, + "grad_norm": 8.869158744812012, + "learning_rate": 1.7861241727139113e-05, + "loss": 0.812, + "step": 8651 + }, + { + "epoch": 23.57493188010899, + "grad_norm": 10.612920761108398, + "learning_rate": 1.7860696254310874e-05, + "loss": 0.6151, + "step": 8652 + }, + { + "epoch": 23.577656675749317, + "grad_norm": 8.31689453125, + "learning_rate": 1.7860150720263786e-05, + "loss": 0.601, + "step": 8653 + }, + { + "epoch": 23.580381471389646, + "grad_norm": 8.467896461486816, + "learning_rate": 1.7859605125002098e-05, + "loss": 0.5558, + "step": 8654 + }, + { + "epoch": 23.583106267029972, + "grad_norm": 7.422057628631592, + "learning_rate": 1.7859059468530055e-05, + "loss": 0.5573, + "step": 8655 + }, + { + "epoch": 23.585831062670298, + "grad_norm": 13.866622924804688, + "learning_rate": 1.7858513750851913e-05, + "loss": 0.8096, + "step": 8656 + }, + { + "epoch": 23.588555858310627, + "grad_norm": 8.810937881469727, + "learning_rate": 1.785796797197192e-05, + "loss": 0.6388, + "step": 8657 + }, + { + "epoch": 23.591280653950953, + "grad_norm": 6.7735090255737305, + "learning_rate": 1.7857422131894322e-05, + "loss": 0.7238, + "step": 8658 + }, + { + "epoch": 23.59400544959128, + "grad_norm": 8.533026695251465, + "learning_rate": 1.7856876230623374e-05, + "loss": 0.6313, + "step": 8659 + }, + { + "epoch": 23.59673024523161, + "grad_norm": 7.0363922119140625, + "learning_rate": 1.785633026816333e-05, + "loss": 0.5979, + "step": 8660 + }, + { + "epoch": 23.599455040871934, + "grad_norm": 8.589900970458984, + "learning_rate": 1.7855784244518434e-05, + "loss": 0.5581, + "step": 8661 + }, + { + "epoch": 23.60217983651226, + "grad_norm": 7.23314905166626, + "learning_rate": 1.7855238159692943e-05, + "loss": 0.5594, + "step": 8662 + }, + { + "epoch": 23.60490463215259, + "grad_norm": 6.846451282501221, + "learning_rate": 1.7854692013691114e-05, + "loss": 0.6437, + "step": 8663 + }, + { + "epoch": 23.607629427792915, + "grad_norm": 15.448397636413574, + "learning_rate": 1.7854145806517195e-05, + "loss": 0.6333, + "step": 8664 + }, + { + "epoch": 23.61035422343324, + "grad_norm": 9.071206092834473, + "learning_rate": 1.7853599538175443e-05, + "loss": 0.6938, + "step": 8665 + }, + { + "epoch": 23.61307901907357, + "grad_norm": 9.376893997192383, + "learning_rate": 1.785305320867011e-05, + "loss": 0.6271, + "step": 8666 + }, + { + "epoch": 23.615803814713896, + "grad_norm": 7.037196159362793, + "learning_rate": 1.785250681800545e-05, + "loss": 0.5181, + "step": 8667 + }, + { + "epoch": 23.618528610354222, + "grad_norm": 7.3704376220703125, + "learning_rate": 1.7851960366185718e-05, + "loss": 0.6652, + "step": 8668 + }, + { + "epoch": 23.62125340599455, + "grad_norm": 8.9699125289917, + "learning_rate": 1.7851413853215175e-05, + "loss": 0.7029, + "step": 8669 + }, + { + "epoch": 23.623978201634877, + "grad_norm": 9.074806213378906, + "learning_rate": 1.785086727909807e-05, + "loss": 0.733, + "step": 8670 + }, + { + "epoch": 23.626702997275203, + "grad_norm": 7.657893657684326, + "learning_rate": 1.7850320643838666e-05, + "loss": 0.597, + "step": 8671 + }, + { + "epoch": 23.629427792915532, + "grad_norm": 7.139098167419434, + "learning_rate": 1.7849773947441215e-05, + "loss": 0.6231, + "step": 8672 + }, + { + "epoch": 23.632152588555858, + "grad_norm": 8.690154075622559, + "learning_rate": 1.784922718990998e-05, + "loss": 0.6373, + "step": 8673 + }, + { + "epoch": 23.634877384196184, + "grad_norm": 7.496939182281494, + "learning_rate": 1.7848680371249214e-05, + "loss": 0.6178, + "step": 8674 + }, + { + "epoch": 23.637602179836513, + "grad_norm": 10.386566162109375, + "learning_rate": 1.7848133491463176e-05, + "loss": 0.7594, + "step": 8675 + }, + { + "epoch": 23.64032697547684, + "grad_norm": 7.76467752456665, + "learning_rate": 1.7847586550556132e-05, + "loss": 0.6033, + "step": 8676 + }, + { + "epoch": 23.643051771117165, + "grad_norm": 7.715465068817139, + "learning_rate": 1.7847039548532333e-05, + "loss": 0.7561, + "step": 8677 + }, + { + "epoch": 23.645776566757494, + "grad_norm": 8.637248039245605, + "learning_rate": 1.7846492485396046e-05, + "loss": 0.6965, + "step": 8678 + }, + { + "epoch": 23.64850136239782, + "grad_norm": 8.032029151916504, + "learning_rate": 1.7845945361151526e-05, + "loss": 0.7462, + "step": 8679 + }, + { + "epoch": 23.651226158038146, + "grad_norm": 8.577354431152344, + "learning_rate": 1.7845398175803035e-05, + "loss": 0.792, + "step": 8680 + }, + { + "epoch": 23.653950953678475, + "grad_norm": 8.476625442504883, + "learning_rate": 1.7844850929354835e-05, + "loss": 0.7145, + "step": 8681 + }, + { + "epoch": 23.6566757493188, + "grad_norm": 9.123308181762695, + "learning_rate": 1.784430362181119e-05, + "loss": 0.7391, + "step": 8682 + }, + { + "epoch": 23.659400544959126, + "grad_norm": 8.435811996459961, + "learning_rate": 1.7843756253176362e-05, + "loss": 0.6026, + "step": 8683 + }, + { + "epoch": 23.662125340599456, + "grad_norm": 9.569748878479004, + "learning_rate": 1.784320882345461e-05, + "loss": 0.7577, + "step": 8684 + }, + { + "epoch": 23.66485013623978, + "grad_norm": 7.912408828735352, + "learning_rate": 1.7842661332650202e-05, + "loss": 0.8336, + "step": 8685 + }, + { + "epoch": 23.667574931880107, + "grad_norm": 8.150311470031738, + "learning_rate": 1.78421137807674e-05, + "loss": 0.5372, + "step": 8686 + }, + { + "epoch": 23.670299727520437, + "grad_norm": 6.968649864196777, + "learning_rate": 1.7841566167810467e-05, + "loss": 0.521, + "step": 8687 + }, + { + "epoch": 23.673024523160763, + "grad_norm": 6.817625045776367, + "learning_rate": 1.784101849378367e-05, + "loss": 0.6313, + "step": 8688 + }, + { + "epoch": 23.67574931880109, + "grad_norm": 7.390740871429443, + "learning_rate": 1.7840470758691274e-05, + "loss": 0.6503, + "step": 8689 + }, + { + "epoch": 23.678474114441418, + "grad_norm": 8.48143482208252, + "learning_rate": 1.7839922962537543e-05, + "loss": 0.6953, + "step": 8690 + }, + { + "epoch": 23.681198910081743, + "grad_norm": 9.579242706298828, + "learning_rate": 1.7839375105326743e-05, + "loss": 0.8687, + "step": 8691 + }, + { + "epoch": 23.68392370572207, + "grad_norm": 7.510007381439209, + "learning_rate": 1.7838827187063144e-05, + "loss": 0.6313, + "step": 8692 + }, + { + "epoch": 23.6866485013624, + "grad_norm": 8.059843063354492, + "learning_rate": 1.7838279207751013e-05, + "loss": 0.5894, + "step": 8693 + }, + { + "epoch": 23.689373297002724, + "grad_norm": 7.011054992675781, + "learning_rate": 1.7837731167394614e-05, + "loss": 0.7607, + "step": 8694 + }, + { + "epoch": 23.69209809264305, + "grad_norm": 9.017129898071289, + "learning_rate": 1.7837183065998215e-05, + "loss": 0.6663, + "step": 8695 + }, + { + "epoch": 23.69482288828338, + "grad_norm": 8.130972862243652, + "learning_rate": 1.783663490356609e-05, + "loss": 1.0414, + "step": 8696 + }, + { + "epoch": 23.697547683923705, + "grad_norm": 10.18790340423584, + "learning_rate": 1.78360866801025e-05, + "loss": 0.787, + "step": 8697 + }, + { + "epoch": 23.70027247956403, + "grad_norm": 8.673542976379395, + "learning_rate": 1.783553839561172e-05, + "loss": 0.5428, + "step": 8698 + }, + { + "epoch": 23.70299727520436, + "grad_norm": 8.38430118560791, + "learning_rate": 1.7834990050098025e-05, + "loss": 0.8124, + "step": 8699 + }, + { + "epoch": 23.705722070844686, + "grad_norm": 8.579794883728027, + "learning_rate": 1.7834441643565674e-05, + "loss": 0.5999, + "step": 8700 + }, + { + "epoch": 23.708446866485012, + "grad_norm": 8.432461738586426, + "learning_rate": 1.7833893176018945e-05, + "loss": 0.7352, + "step": 8701 + }, + { + "epoch": 23.71117166212534, + "grad_norm": 10.682052612304688, + "learning_rate": 1.7833344647462106e-05, + "loss": 0.6133, + "step": 8702 + }, + { + "epoch": 23.713896457765667, + "grad_norm": 8.271554946899414, + "learning_rate": 1.7832796057899434e-05, + "loss": 0.6321, + "step": 8703 + }, + { + "epoch": 23.716621253405993, + "grad_norm": 7.847799301147461, + "learning_rate": 1.7832247407335197e-05, + "loss": 0.6888, + "step": 8704 + }, + { + "epoch": 23.719346049046322, + "grad_norm": 7.223616600036621, + "learning_rate": 1.783169869577367e-05, + "loss": 0.6458, + "step": 8705 + }, + { + "epoch": 23.722070844686648, + "grad_norm": 7.0132904052734375, + "learning_rate": 1.7831149923219126e-05, + "loss": 0.7334, + "step": 8706 + }, + { + "epoch": 23.724795640326974, + "grad_norm": 8.604496002197266, + "learning_rate": 1.783060108967584e-05, + "loss": 0.6483, + "step": 8707 + }, + { + "epoch": 23.727520435967303, + "grad_norm": 6.9799652099609375, + "learning_rate": 1.7830052195148083e-05, + "loss": 0.7627, + "step": 8708 + }, + { + "epoch": 23.73024523160763, + "grad_norm": 6.896748065948486, + "learning_rate": 1.782950323964013e-05, + "loss": 0.5499, + "step": 8709 + }, + { + "epoch": 23.732970027247955, + "grad_norm": 9.566889762878418, + "learning_rate": 1.7828954223156257e-05, + "loss": 0.6467, + "step": 8710 + }, + { + "epoch": 23.735694822888284, + "grad_norm": 7.210999965667725, + "learning_rate": 1.7828405145700743e-05, + "loss": 0.6013, + "step": 8711 + }, + { + "epoch": 23.73841961852861, + "grad_norm": 10.314238548278809, + "learning_rate": 1.7827856007277865e-05, + "loss": 0.6503, + "step": 8712 + }, + { + "epoch": 23.741144414168936, + "grad_norm": 9.22961711883545, + "learning_rate": 1.782730680789189e-05, + "loss": 0.7363, + "step": 8713 + }, + { + "epoch": 23.743869209809265, + "grad_norm": 9.406926155090332, + "learning_rate": 1.78267575475471e-05, + "loss": 0.6622, + "step": 8714 + }, + { + "epoch": 23.74659400544959, + "grad_norm": 8.926714897155762, + "learning_rate": 1.7826208226247783e-05, + "loss": 0.6537, + "step": 8715 + }, + { + "epoch": 23.749318801089917, + "grad_norm": 9.726031303405762, + "learning_rate": 1.78256588439982e-05, + "loss": 0.567, + "step": 8716 + }, + { + "epoch": 23.752043596730246, + "grad_norm": 8.517714500427246, + "learning_rate": 1.7825109400802643e-05, + "loss": 0.77, + "step": 8717 + }, + { + "epoch": 23.754768392370572, + "grad_norm": 7.61201286315918, + "learning_rate": 1.7824559896665385e-05, + "loss": 0.6111, + "step": 8718 + }, + { + "epoch": 23.757493188010898, + "grad_norm": 8.55817985534668, + "learning_rate": 1.7824010331590703e-05, + "loss": 0.5581, + "step": 8719 + }, + { + "epoch": 23.760217983651227, + "grad_norm": 8.823881149291992, + "learning_rate": 1.7823460705582884e-05, + "loss": 0.6625, + "step": 8720 + }, + { + "epoch": 23.762942779291553, + "grad_norm": 7.473922252655029, + "learning_rate": 1.7822911018646202e-05, + "loss": 0.5093, + "step": 8721 + }, + { + "epoch": 23.76566757493188, + "grad_norm": 7.682458877563477, + "learning_rate": 1.782236127078494e-05, + "loss": 0.6854, + "step": 8722 + }, + { + "epoch": 23.768392370572208, + "grad_norm": 8.417536735534668, + "learning_rate": 1.7821811462003387e-05, + "loss": 0.6559, + "step": 8723 + }, + { + "epoch": 23.771117166212534, + "grad_norm": 8.51427173614502, + "learning_rate": 1.782126159230581e-05, + "loss": 0.6233, + "step": 8724 + }, + { + "epoch": 23.77384196185286, + "grad_norm": 8.760787963867188, + "learning_rate": 1.7820711661696504e-05, + "loss": 0.7046, + "step": 8725 + }, + { + "epoch": 23.77656675749319, + "grad_norm": 8.030685424804688, + "learning_rate": 1.7820161670179748e-05, + "loss": 0.6956, + "step": 8726 + }, + { + "epoch": 23.779291553133515, + "grad_norm": 8.65029239654541, + "learning_rate": 1.7819611617759826e-05, + "loss": 0.631, + "step": 8727 + }, + { + "epoch": 23.78201634877384, + "grad_norm": 7.661012649536133, + "learning_rate": 1.7819061504441016e-05, + "loss": 0.6351, + "step": 8728 + }, + { + "epoch": 23.78474114441417, + "grad_norm": 7.802098751068115, + "learning_rate": 1.7818511330227604e-05, + "loss": 0.7091, + "step": 8729 + }, + { + "epoch": 23.787465940054496, + "grad_norm": 8.589938163757324, + "learning_rate": 1.7817961095123885e-05, + "loss": 0.7041, + "step": 8730 + }, + { + "epoch": 23.79019073569482, + "grad_norm": 8.099030494689941, + "learning_rate": 1.7817410799134133e-05, + "loss": 0.8079, + "step": 8731 + }, + { + "epoch": 23.79291553133515, + "grad_norm": 10.787029266357422, + "learning_rate": 1.7816860442262637e-05, + "loss": 0.6957, + "step": 8732 + }, + { + "epoch": 23.795640326975477, + "grad_norm": 9.628156661987305, + "learning_rate": 1.781631002451368e-05, + "loss": 0.6896, + "step": 8733 + }, + { + "epoch": 23.798365122615802, + "grad_norm": 8.368080139160156, + "learning_rate": 1.7815759545891556e-05, + "loss": 0.6821, + "step": 8734 + }, + { + "epoch": 23.80108991825613, + "grad_norm": 7.77903938293457, + "learning_rate": 1.781520900640055e-05, + "loss": 0.5994, + "step": 8735 + }, + { + "epoch": 23.803814713896458, + "grad_norm": 8.866826057434082, + "learning_rate": 1.7814658406044948e-05, + "loss": 0.7404, + "step": 8736 + }, + { + "epoch": 23.806539509536783, + "grad_norm": 9.506380081176758, + "learning_rate": 1.7814107744829036e-05, + "loss": 0.7247, + "step": 8737 + }, + { + "epoch": 23.809264305177113, + "grad_norm": 13.592761993408203, + "learning_rate": 1.7813557022757103e-05, + "loss": 0.7326, + "step": 8738 + }, + { + "epoch": 23.81198910081744, + "grad_norm": 9.544055938720703, + "learning_rate": 1.781300623983344e-05, + "loss": 0.5842, + "step": 8739 + }, + { + "epoch": 23.814713896457764, + "grad_norm": 7.893803596496582, + "learning_rate": 1.7812455396062336e-05, + "loss": 0.6718, + "step": 8740 + }, + { + "epoch": 23.817438692098094, + "grad_norm": 8.230522155761719, + "learning_rate": 1.781190449144808e-05, + "loss": 0.6367, + "step": 8741 + }, + { + "epoch": 23.82016348773842, + "grad_norm": 8.57618522644043, + "learning_rate": 1.7811353525994967e-05, + "loss": 0.6167, + "step": 8742 + }, + { + "epoch": 23.822888283378745, + "grad_norm": 9.646374702453613, + "learning_rate": 1.781080249970728e-05, + "loss": 0.7092, + "step": 8743 + }, + { + "epoch": 23.825613079019075, + "grad_norm": 8.21642017364502, + "learning_rate": 1.7810251412589315e-05, + "loss": 0.6303, + "step": 8744 + }, + { + "epoch": 23.8283378746594, + "grad_norm": 8.2904052734375, + "learning_rate": 1.7809700264645365e-05, + "loss": 0.7354, + "step": 8745 + }, + { + "epoch": 23.831062670299726, + "grad_norm": 8.364733695983887, + "learning_rate": 1.780914905587972e-05, + "loss": 0.7319, + "step": 8746 + }, + { + "epoch": 23.833787465940055, + "grad_norm": 8.430075645446777, + "learning_rate": 1.7808597786296673e-05, + "loss": 0.596, + "step": 8747 + }, + { + "epoch": 23.83651226158038, + "grad_norm": 8.242403030395508, + "learning_rate": 1.7808046455900517e-05, + "loss": 0.696, + "step": 8748 + }, + { + "epoch": 23.839237057220707, + "grad_norm": 8.332865715026855, + "learning_rate": 1.780749506469555e-05, + "loss": 0.7371, + "step": 8749 + }, + { + "epoch": 23.841961852861036, + "grad_norm": 7.8866400718688965, + "learning_rate": 1.7806943612686058e-05, + "loss": 0.6669, + "step": 8750 + }, + { + "epoch": 23.844686648501362, + "grad_norm": 6.825740337371826, + "learning_rate": 1.7806392099876343e-05, + "loss": 0.6196, + "step": 8751 + }, + { + "epoch": 23.847411444141688, + "grad_norm": 13.025237083435059, + "learning_rate": 1.78058405262707e-05, + "loss": 0.7921, + "step": 8752 + }, + { + "epoch": 23.850136239782017, + "grad_norm": 6.44904088973999, + "learning_rate": 1.780528889187342e-05, + "loss": 0.7094, + "step": 8753 + }, + { + "epoch": 23.852861035422343, + "grad_norm": 8.157832145690918, + "learning_rate": 1.78047371966888e-05, + "loss": 0.6033, + "step": 8754 + }, + { + "epoch": 23.85558583106267, + "grad_norm": 9.57671070098877, + "learning_rate": 1.7804185440721136e-05, + "loss": 0.5122, + "step": 8755 + }, + { + "epoch": 23.858310626703, + "grad_norm": 9.046643257141113, + "learning_rate": 1.7803633623974732e-05, + "loss": 0.6341, + "step": 8756 + }, + { + "epoch": 23.861035422343324, + "grad_norm": 8.198485374450684, + "learning_rate": 1.7803081746453877e-05, + "loss": 0.5378, + "step": 8757 + }, + { + "epoch": 23.86376021798365, + "grad_norm": 7.1689043045043945, + "learning_rate": 1.7802529808162877e-05, + "loss": 0.6439, + "step": 8758 + }, + { + "epoch": 23.86648501362398, + "grad_norm": 7.593871116638184, + "learning_rate": 1.7801977809106024e-05, + "loss": 0.787, + "step": 8759 + }, + { + "epoch": 23.869209809264305, + "grad_norm": 8.279637336730957, + "learning_rate": 1.7801425749287616e-05, + "loss": 0.7444, + "step": 8760 + }, + { + "epoch": 23.87193460490463, + "grad_norm": 10.108986854553223, + "learning_rate": 1.7800873628711957e-05, + "loss": 0.7656, + "step": 8761 + }, + { + "epoch": 23.87465940054496, + "grad_norm": 14.299032211303711, + "learning_rate": 1.7800321447383345e-05, + "loss": 0.9197, + "step": 8762 + }, + { + "epoch": 23.877384196185286, + "grad_norm": 6.564296722412109, + "learning_rate": 1.7799769205306082e-05, + "loss": 0.7238, + "step": 8763 + }, + { + "epoch": 23.88010899182561, + "grad_norm": 8.50287914276123, + "learning_rate": 1.7799216902484465e-05, + "loss": 0.5895, + "step": 8764 + }, + { + "epoch": 23.88283378746594, + "grad_norm": 7.999722480773926, + "learning_rate": 1.77986645389228e-05, + "loss": 0.5835, + "step": 8765 + }, + { + "epoch": 23.885558583106267, + "grad_norm": 7.00806188583374, + "learning_rate": 1.7798112114625385e-05, + "loss": 0.8248, + "step": 8766 + }, + { + "epoch": 23.888283378746593, + "grad_norm": 8.394281387329102, + "learning_rate": 1.7797559629596525e-05, + "loss": 0.6644, + "step": 8767 + }, + { + "epoch": 23.891008174386922, + "grad_norm": 7.199811935424805, + "learning_rate": 1.7797007083840522e-05, + "loss": 0.7495, + "step": 8768 + }, + { + "epoch": 23.893732970027248, + "grad_norm": 8.760477066040039, + "learning_rate": 1.7796454477361676e-05, + "loss": 0.7896, + "step": 8769 + }, + { + "epoch": 23.896457765667574, + "grad_norm": 7.498642444610596, + "learning_rate": 1.7795901810164296e-05, + "loss": 0.6012, + "step": 8770 + }, + { + "epoch": 23.899182561307903, + "grad_norm": 7.29533052444458, + "learning_rate": 1.7795349082252686e-05, + "loss": 0.6757, + "step": 8771 + }, + { + "epoch": 23.90190735694823, + "grad_norm": 11.376025199890137, + "learning_rate": 1.7794796293631144e-05, + "loss": 0.7375, + "step": 8772 + }, + { + "epoch": 23.904632152588555, + "grad_norm": 9.86885929107666, + "learning_rate": 1.779424344430398e-05, + "loss": 0.653, + "step": 8773 + }, + { + "epoch": 23.907356948228884, + "grad_norm": 7.98117733001709, + "learning_rate": 1.77936905342755e-05, + "loss": 0.6324, + "step": 8774 + }, + { + "epoch": 23.91008174386921, + "grad_norm": 9.175762176513672, + "learning_rate": 1.7793137563550006e-05, + "loss": 0.6484, + "step": 8775 + }, + { + "epoch": 23.912806539509535, + "grad_norm": 9.684450149536133, + "learning_rate": 1.7792584532131813e-05, + "loss": 0.6616, + "step": 8776 + }, + { + "epoch": 23.915531335149865, + "grad_norm": 9.040603637695312, + "learning_rate": 1.779203144002522e-05, + "loss": 0.7095, + "step": 8777 + }, + { + "epoch": 23.91825613079019, + "grad_norm": 8.966569900512695, + "learning_rate": 1.7791478287234534e-05, + "loss": 0.6418, + "step": 8778 + }, + { + "epoch": 23.920980926430516, + "grad_norm": 9.191880226135254, + "learning_rate": 1.779092507376407e-05, + "loss": 0.7317, + "step": 8779 + }, + { + "epoch": 23.923705722070846, + "grad_norm": 6.665855407714844, + "learning_rate": 1.779037179961813e-05, + "loss": 0.678, + "step": 8780 + }, + { + "epoch": 23.92643051771117, + "grad_norm": 10.758771896362305, + "learning_rate": 1.7789818464801025e-05, + "loss": 0.7538, + "step": 8781 + }, + { + "epoch": 23.929155313351497, + "grad_norm": 8.288837432861328, + "learning_rate": 1.7789265069317067e-05, + "loss": 0.649, + "step": 8782 + }, + { + "epoch": 23.931880108991827, + "grad_norm": 8.446208000183105, + "learning_rate": 1.778871161317056e-05, + "loss": 0.6255, + "step": 8783 + }, + { + "epoch": 23.934604904632153, + "grad_norm": 10.18574047088623, + "learning_rate": 1.778815809636582e-05, + "loss": 0.6509, + "step": 8784 + }, + { + "epoch": 23.93732970027248, + "grad_norm": 7.808631420135498, + "learning_rate": 1.7787604518907152e-05, + "loss": 0.8768, + "step": 8785 + }, + { + "epoch": 23.940054495912808, + "grad_norm": 8.451011657714844, + "learning_rate": 1.7787050880798877e-05, + "loss": 0.6985, + "step": 8786 + }, + { + "epoch": 23.942779291553133, + "grad_norm": 10.8347749710083, + "learning_rate": 1.7786497182045295e-05, + "loss": 0.7277, + "step": 8787 + }, + { + "epoch": 23.94550408719346, + "grad_norm": 8.061737060546875, + "learning_rate": 1.7785943422650724e-05, + "loss": 0.5524, + "step": 8788 + }, + { + "epoch": 23.94822888283379, + "grad_norm": 10.186460494995117, + "learning_rate": 1.7785389602619477e-05, + "loss": 0.6448, + "step": 8789 + }, + { + "epoch": 23.950953678474114, + "grad_norm": 9.940427780151367, + "learning_rate": 1.7784835721955866e-05, + "loss": 0.6981, + "step": 8790 + }, + { + "epoch": 23.95367847411444, + "grad_norm": 8.110967636108398, + "learning_rate": 1.778428178066421e-05, + "loss": 0.7357, + "step": 8791 + }, + { + "epoch": 23.95640326975477, + "grad_norm": 8.784134864807129, + "learning_rate": 1.778372777874881e-05, + "loss": 0.6589, + "step": 8792 + }, + { + "epoch": 23.959128065395095, + "grad_norm": 8.895995140075684, + "learning_rate": 1.7783173716213996e-05, + "loss": 0.6352, + "step": 8793 + }, + { + "epoch": 23.96185286103542, + "grad_norm": 8.353736877441406, + "learning_rate": 1.778261959306407e-05, + "loss": 0.7448, + "step": 8794 + }, + { + "epoch": 23.96457765667575, + "grad_norm": 7.859174728393555, + "learning_rate": 1.7782065409303354e-05, + "loss": 0.6858, + "step": 8795 + }, + { + "epoch": 23.967302452316076, + "grad_norm": 6.824813365936279, + "learning_rate": 1.7781511164936166e-05, + "loss": 0.5969, + "step": 8796 + }, + { + "epoch": 23.970027247956402, + "grad_norm": 7.503294467926025, + "learning_rate": 1.7780956859966816e-05, + "loss": 0.5964, + "step": 8797 + }, + { + "epoch": 23.97275204359673, + "grad_norm": 16.265262603759766, + "learning_rate": 1.7780402494399625e-05, + "loss": 0.6479, + "step": 8798 + }, + { + "epoch": 23.975476839237057, + "grad_norm": 10.838225364685059, + "learning_rate": 1.777984806823891e-05, + "loss": 0.9917, + "step": 8799 + }, + { + "epoch": 23.978201634877383, + "grad_norm": 8.561009407043457, + "learning_rate": 1.777929358148899e-05, + "loss": 0.5197, + "step": 8800 + }, + { + "epoch": 23.980926430517712, + "grad_norm": 7.6468000411987305, + "learning_rate": 1.777873903415418e-05, + "loss": 0.6396, + "step": 8801 + }, + { + "epoch": 23.983651226158038, + "grad_norm": 8.598393440246582, + "learning_rate": 1.7778184426238805e-05, + "loss": 0.7515, + "step": 8802 + }, + { + "epoch": 23.986376021798364, + "grad_norm": 8.6475248336792, + "learning_rate": 1.7777629757747177e-05, + "loss": 0.7531, + "step": 8803 + }, + { + "epoch": 23.989100817438693, + "grad_norm": 9.719010353088379, + "learning_rate": 1.7777075028683617e-05, + "loss": 0.5279, + "step": 8804 + }, + { + "epoch": 23.99182561307902, + "grad_norm": 6.662492275238037, + "learning_rate": 1.7776520239052447e-05, + "loss": 0.6635, + "step": 8805 + }, + { + "epoch": 23.994550408719345, + "grad_norm": 9.058082580566406, + "learning_rate": 1.777596538885799e-05, + "loss": 0.7446, + "step": 8806 + }, + { + "epoch": 23.997275204359674, + "grad_norm": 11.454946517944336, + "learning_rate": 1.7775410478104566e-05, + "loss": 0.7344, + "step": 8807 + }, + { + "epoch": 24.0, + "grad_norm": 7.274345397949219, + "learning_rate": 1.7774855506796497e-05, + "loss": 0.6438, + "step": 8808 + }, + { + "epoch": 24.002724795640326, + "grad_norm": 9.180956840515137, + "learning_rate": 1.77743004749381e-05, + "loss": 0.7663, + "step": 8809 + }, + { + "epoch": 24.005449591280655, + "grad_norm": 9.361931800842285, + "learning_rate": 1.77737453825337e-05, + "loss": 0.5725, + "step": 8810 + }, + { + "epoch": 24.00817438692098, + "grad_norm": 13.765742301940918, + "learning_rate": 1.7773190229587624e-05, + "loss": 0.6661, + "step": 8811 + }, + { + "epoch": 24.010899182561307, + "grad_norm": 7.7954325675964355, + "learning_rate": 1.777263501610419e-05, + "loss": 0.5587, + "step": 8812 + }, + { + "epoch": 24.013623978201636, + "grad_norm": 9.439408302307129, + "learning_rate": 1.7772079742087728e-05, + "loss": 0.5846, + "step": 8813 + }, + { + "epoch": 24.016348773841962, + "grad_norm": 8.322379112243652, + "learning_rate": 1.7771524407542557e-05, + "loss": 0.4714, + "step": 8814 + }, + { + "epoch": 24.019073569482288, + "grad_norm": 9.102412223815918, + "learning_rate": 1.7770969012473002e-05, + "loss": 0.5491, + "step": 8815 + }, + { + "epoch": 24.021798365122617, + "grad_norm": 7.189291954040527, + "learning_rate": 1.777041355688339e-05, + "loss": 0.5874, + "step": 8816 + }, + { + "epoch": 24.024523160762943, + "grad_norm": 8.017959594726562, + "learning_rate": 1.7769858040778052e-05, + "loss": 0.5565, + "step": 8817 + }, + { + "epoch": 24.02724795640327, + "grad_norm": 7.578139305114746, + "learning_rate": 1.7769302464161307e-05, + "loss": 0.606, + "step": 8818 + }, + { + "epoch": 24.029972752043598, + "grad_norm": 8.187880516052246, + "learning_rate": 1.7768746827037485e-05, + "loss": 0.8091, + "step": 8819 + }, + { + "epoch": 24.032697547683924, + "grad_norm": 11.661108016967773, + "learning_rate": 1.7768191129410913e-05, + "loss": 0.5452, + "step": 8820 + }, + { + "epoch": 24.03542234332425, + "grad_norm": 7.239599227905273, + "learning_rate": 1.776763537128592e-05, + "loss": 0.7075, + "step": 8821 + }, + { + "epoch": 24.03814713896458, + "grad_norm": 6.680261135101318, + "learning_rate": 1.7767079552666827e-05, + "loss": 0.641, + "step": 8822 + }, + { + "epoch": 24.040871934604905, + "grad_norm": 6.787194728851318, + "learning_rate": 1.7766523673557973e-05, + "loss": 0.5983, + "step": 8823 + }, + { + "epoch": 24.04359673024523, + "grad_norm": 7.517077445983887, + "learning_rate": 1.7765967733963683e-05, + "loss": 0.7063, + "step": 8824 + }, + { + "epoch": 24.04632152588556, + "grad_norm": 7.721282482147217, + "learning_rate": 1.7765411733888286e-05, + "loss": 0.5142, + "step": 8825 + }, + { + "epoch": 24.049046321525886, + "grad_norm": 7.770618438720703, + "learning_rate": 1.776485567333611e-05, + "loss": 0.7643, + "step": 8826 + }, + { + "epoch": 24.05177111716621, + "grad_norm": 10.189929008483887, + "learning_rate": 1.776429955231149e-05, + "loss": 0.5923, + "step": 8827 + }, + { + "epoch": 24.05449591280654, + "grad_norm": 9.526094436645508, + "learning_rate": 1.7763743370818754e-05, + "loss": 0.5329, + "step": 8828 + }, + { + "epoch": 24.057220708446867, + "grad_norm": 7.70242166519165, + "learning_rate": 1.7763187128862237e-05, + "loss": 0.5778, + "step": 8829 + }, + { + "epoch": 24.059945504087192, + "grad_norm": 6.777331829071045, + "learning_rate": 1.7762630826446266e-05, + "loss": 0.5876, + "step": 8830 + }, + { + "epoch": 24.06267029972752, + "grad_norm": 6.557994842529297, + "learning_rate": 1.7762074463575175e-05, + "loss": 0.5725, + "step": 8831 + }, + { + "epoch": 24.065395095367847, + "grad_norm": 8.306127548217773, + "learning_rate": 1.77615180402533e-05, + "loss": 0.5729, + "step": 8832 + }, + { + "epoch": 24.068119891008173, + "grad_norm": 11.447331428527832, + "learning_rate": 1.776096155648497e-05, + "loss": 0.5963, + "step": 8833 + }, + { + "epoch": 24.070844686648503, + "grad_norm": 9.204768180847168, + "learning_rate": 1.7760405012274524e-05, + "loss": 0.7494, + "step": 8834 + }, + { + "epoch": 24.07356948228883, + "grad_norm": 7.9457197189331055, + "learning_rate": 1.775984840762629e-05, + "loss": 0.6118, + "step": 8835 + }, + { + "epoch": 24.076294277929154, + "grad_norm": 8.53819465637207, + "learning_rate": 1.775929174254461e-05, + "loss": 0.5968, + "step": 8836 + }, + { + "epoch": 24.079019073569484, + "grad_norm": 9.084603309631348, + "learning_rate": 1.7758735017033815e-05, + "loss": 0.5464, + "step": 8837 + }, + { + "epoch": 24.08174386920981, + "grad_norm": 8.14167594909668, + "learning_rate": 1.775817823109824e-05, + "loss": 0.5959, + "step": 8838 + }, + { + "epoch": 24.084468664850135, + "grad_norm": 8.741009712219238, + "learning_rate": 1.7757621384742224e-05, + "loss": 0.6049, + "step": 8839 + }, + { + "epoch": 24.087193460490465, + "grad_norm": 8.19509220123291, + "learning_rate": 1.7757064477970102e-05, + "loss": 0.6028, + "step": 8840 + }, + { + "epoch": 24.08991825613079, + "grad_norm": 7.75546932220459, + "learning_rate": 1.775650751078621e-05, + "loss": 0.6354, + "step": 8841 + }, + { + "epoch": 24.092643051771116, + "grad_norm": 6.951767444610596, + "learning_rate": 1.775595048319489e-05, + "loss": 0.4155, + "step": 8842 + }, + { + "epoch": 24.095367847411445, + "grad_norm": 7.5613837242126465, + "learning_rate": 1.7755393395200474e-05, + "loss": 0.5192, + "step": 8843 + }, + { + "epoch": 24.09809264305177, + "grad_norm": 7.482040882110596, + "learning_rate": 1.7754836246807308e-05, + "loss": 0.5631, + "step": 8844 + }, + { + "epoch": 24.100817438692097, + "grad_norm": 6.91545295715332, + "learning_rate": 1.775427903801972e-05, + "loss": 0.774, + "step": 8845 + }, + { + "epoch": 24.103542234332426, + "grad_norm": 6.406805515289307, + "learning_rate": 1.7753721768842062e-05, + "loss": 0.6931, + "step": 8846 + }, + { + "epoch": 24.106267029972752, + "grad_norm": 7.519858360290527, + "learning_rate": 1.775316443927867e-05, + "loss": 0.6432, + "step": 8847 + }, + { + "epoch": 24.108991825613078, + "grad_norm": 7.980284690856934, + "learning_rate": 1.7752607049333878e-05, + "loss": 0.6577, + "step": 8848 + }, + { + "epoch": 24.111716621253407, + "grad_norm": 6.317418575286865, + "learning_rate": 1.7752049599012037e-05, + "loss": 0.6211, + "step": 8849 + }, + { + "epoch": 24.114441416893733, + "grad_norm": 7.740270614624023, + "learning_rate": 1.775149208831748e-05, + "loss": 0.6008, + "step": 8850 + }, + { + "epoch": 24.11716621253406, + "grad_norm": 9.802743911743164, + "learning_rate": 1.775093451725455e-05, + "loss": 0.4851, + "step": 8851 + }, + { + "epoch": 24.11989100817439, + "grad_norm": 9.85669231414795, + "learning_rate": 1.775037688582759e-05, + "loss": 0.5617, + "step": 8852 + }, + { + "epoch": 24.122615803814714, + "grad_norm": 13.62320613861084, + "learning_rate": 1.7749819194040953e-05, + "loss": 0.6625, + "step": 8853 + }, + { + "epoch": 24.12534059945504, + "grad_norm": 8.604169845581055, + "learning_rate": 1.774926144189897e-05, + "loss": 0.5516, + "step": 8854 + }, + { + "epoch": 24.12806539509537, + "grad_norm": 7.5963945388793945, + "learning_rate": 1.7748703629405985e-05, + "loss": 0.6075, + "step": 8855 + }, + { + "epoch": 24.130790190735695, + "grad_norm": 10.069814682006836, + "learning_rate": 1.7748145756566346e-05, + "loss": 0.6424, + "step": 8856 + }, + { + "epoch": 24.13351498637602, + "grad_norm": 9.934816360473633, + "learning_rate": 1.7747587823384398e-05, + "loss": 0.6561, + "step": 8857 + }, + { + "epoch": 24.13623978201635, + "grad_norm": 7.163966178894043, + "learning_rate": 1.7747029829864485e-05, + "loss": 0.5048, + "step": 8858 + }, + { + "epoch": 24.138964577656676, + "grad_norm": 6.831045627593994, + "learning_rate": 1.7746471776010953e-05, + "loss": 0.5886, + "step": 8859 + }, + { + "epoch": 24.141689373297, + "grad_norm": 8.305370330810547, + "learning_rate": 1.7745913661828148e-05, + "loss": 0.6605, + "step": 8860 + }, + { + "epoch": 24.14441416893733, + "grad_norm": 7.8919677734375, + "learning_rate": 1.7745355487320418e-05, + "loss": 0.5443, + "step": 8861 + }, + { + "epoch": 24.147138964577657, + "grad_norm": 8.134822845458984, + "learning_rate": 1.774479725249211e-05, + "loss": 0.4431, + "step": 8862 + }, + { + "epoch": 24.149863760217983, + "grad_norm": 6.560815334320068, + "learning_rate": 1.774423895734757e-05, + "loss": 0.465, + "step": 8863 + }, + { + "epoch": 24.152588555858312, + "grad_norm": 6.805933475494385, + "learning_rate": 1.7743680601891146e-05, + "loss": 0.5242, + "step": 8864 + }, + { + "epoch": 24.155313351498638, + "grad_norm": 12.554423332214355, + "learning_rate": 1.7743122186127186e-05, + "loss": 0.5912, + "step": 8865 + }, + { + "epoch": 24.158038147138964, + "grad_norm": 9.693236351013184, + "learning_rate": 1.7742563710060036e-05, + "loss": 0.7233, + "step": 8866 + }, + { + "epoch": 24.160762942779293, + "grad_norm": 7.917965888977051, + "learning_rate": 1.774200517369405e-05, + "loss": 0.5757, + "step": 8867 + }, + { + "epoch": 24.16348773841962, + "grad_norm": 7.072247505187988, + "learning_rate": 1.7741446577033584e-05, + "loss": 0.6943, + "step": 8868 + }, + { + "epoch": 24.166212534059945, + "grad_norm": 7.145406723022461, + "learning_rate": 1.7740887920082975e-05, + "loss": 0.5609, + "step": 8869 + }, + { + "epoch": 24.168937329700274, + "grad_norm": 7.124011993408203, + "learning_rate": 1.774032920284658e-05, + "loss": 0.5221, + "step": 8870 + }, + { + "epoch": 24.1716621253406, + "grad_norm": 13.629548072814941, + "learning_rate": 1.7739770425328755e-05, + "loss": 0.5374, + "step": 8871 + }, + { + "epoch": 24.174386920980925, + "grad_norm": 8.548341751098633, + "learning_rate": 1.773921158753384e-05, + "loss": 0.5474, + "step": 8872 + }, + { + "epoch": 24.177111716621255, + "grad_norm": 7.261266708374023, + "learning_rate": 1.77386526894662e-05, + "loss": 0.4607, + "step": 8873 + }, + { + "epoch": 24.17983651226158, + "grad_norm": 8.976286888122559, + "learning_rate": 1.773809373113018e-05, + "loss": 0.6172, + "step": 8874 + }, + { + "epoch": 24.182561307901906, + "grad_norm": 8.677587509155273, + "learning_rate": 1.7737534712530133e-05, + "loss": 0.5142, + "step": 8875 + }, + { + "epoch": 24.185286103542236, + "grad_norm": 6.425335884094238, + "learning_rate": 1.7736975633670418e-05, + "loss": 0.6136, + "step": 8876 + }, + { + "epoch": 24.18801089918256, + "grad_norm": 14.822269439697266, + "learning_rate": 1.7736416494555384e-05, + "loss": 0.6446, + "step": 8877 + }, + { + "epoch": 24.190735694822887, + "grad_norm": 7.213735580444336, + "learning_rate": 1.773585729518939e-05, + "loss": 0.5947, + "step": 8878 + }, + { + "epoch": 24.193460490463217, + "grad_norm": 21.222930908203125, + "learning_rate": 1.7735298035576784e-05, + "loss": 0.5765, + "step": 8879 + }, + { + "epoch": 24.196185286103542, + "grad_norm": 9.02164077758789, + "learning_rate": 1.7734738715721928e-05, + "loss": 0.5336, + "step": 8880 + }, + { + "epoch": 24.19891008174387, + "grad_norm": 8.176846504211426, + "learning_rate": 1.7734179335629175e-05, + "loss": 0.7168, + "step": 8881 + }, + { + "epoch": 24.201634877384198, + "grad_norm": 7.966734409332275, + "learning_rate": 1.7733619895302886e-05, + "loss": 0.5344, + "step": 8882 + }, + { + "epoch": 24.204359673024523, + "grad_norm": 7.438953876495361, + "learning_rate": 1.773306039474741e-05, + "loss": 0.5792, + "step": 8883 + }, + { + "epoch": 24.20708446866485, + "grad_norm": 8.2271146774292, + "learning_rate": 1.7732500833967112e-05, + "loss": 0.5456, + "step": 8884 + }, + { + "epoch": 24.20980926430518, + "grad_norm": 9.87670612335205, + "learning_rate": 1.773194121296634e-05, + "loss": 0.5912, + "step": 8885 + }, + { + "epoch": 24.212534059945504, + "grad_norm": 6.806392192840576, + "learning_rate": 1.7731381531749465e-05, + "loss": 0.5977, + "step": 8886 + }, + { + "epoch": 24.21525885558583, + "grad_norm": 9.069767951965332, + "learning_rate": 1.7730821790320836e-05, + "loss": 0.7052, + "step": 8887 + }, + { + "epoch": 24.21798365122616, + "grad_norm": 7.941775798797607, + "learning_rate": 1.7730261988684817e-05, + "loss": 0.4982, + "step": 8888 + }, + { + "epoch": 24.220708446866485, + "grad_norm": 8.840487480163574, + "learning_rate": 1.772970212684577e-05, + "loss": 0.5079, + "step": 8889 + }, + { + "epoch": 24.22343324250681, + "grad_norm": 6.968510627746582, + "learning_rate": 1.7729142204808044e-05, + "loss": 0.8477, + "step": 8890 + }, + { + "epoch": 24.22615803814714, + "grad_norm": 8.35019588470459, + "learning_rate": 1.7728582222576012e-05, + "loss": 0.733, + "step": 8891 + }, + { + "epoch": 24.228882833787466, + "grad_norm": 20.245084762573242, + "learning_rate": 1.7728022180154032e-05, + "loss": 0.648, + "step": 8892 + }, + { + "epoch": 24.231607629427792, + "grad_norm": 6.931366443634033, + "learning_rate": 1.772746207754646e-05, + "loss": 0.5787, + "step": 8893 + }, + { + "epoch": 24.23433242506812, + "grad_norm": 8.669196128845215, + "learning_rate": 1.7726901914757664e-05, + "loss": 0.6771, + "step": 8894 + }, + { + "epoch": 24.237057220708447, + "grad_norm": 8.523401260375977, + "learning_rate": 1.7726341691792007e-05, + "loss": 0.6283, + "step": 8895 + }, + { + "epoch": 24.239782016348773, + "grad_norm": 8.485087394714355, + "learning_rate": 1.7725781408653844e-05, + "loss": 0.4896, + "step": 8896 + }, + { + "epoch": 24.242506811989102, + "grad_norm": 9.202347755432129, + "learning_rate": 1.772522106534755e-05, + "loss": 0.6118, + "step": 8897 + }, + { + "epoch": 24.245231607629428, + "grad_norm": 8.783988952636719, + "learning_rate": 1.7724660661877478e-05, + "loss": 0.5195, + "step": 8898 + }, + { + "epoch": 24.247956403269754, + "grad_norm": 8.67990493774414, + "learning_rate": 1.7724100198248e-05, + "loss": 0.6837, + "step": 8899 + }, + { + "epoch": 24.250681198910083, + "grad_norm": 6.818397521972656, + "learning_rate": 1.7723539674463473e-05, + "loss": 0.7156, + "step": 8900 + }, + { + "epoch": 24.25340599455041, + "grad_norm": 11.372779846191406, + "learning_rate": 1.7722979090528275e-05, + "loss": 0.8043, + "step": 8901 + }, + { + "epoch": 24.256130790190735, + "grad_norm": 7.923463821411133, + "learning_rate": 1.7722418446446764e-05, + "loss": 0.7062, + "step": 8902 + }, + { + "epoch": 24.258855585831064, + "grad_norm": 9.79150104522705, + "learning_rate": 1.7721857742223302e-05, + "loss": 0.5948, + "step": 8903 + }, + { + "epoch": 24.26158038147139, + "grad_norm": 8.668356895446777, + "learning_rate": 1.7721296977862263e-05, + "loss": 0.7242, + "step": 8904 + }, + { + "epoch": 24.264305177111716, + "grad_norm": 7.8720574378967285, + "learning_rate": 1.772073615336801e-05, + "loss": 0.6948, + "step": 8905 + }, + { + "epoch": 24.267029972752045, + "grad_norm": 13.879902839660645, + "learning_rate": 1.7720175268744914e-05, + "loss": 0.6692, + "step": 8906 + }, + { + "epoch": 24.26975476839237, + "grad_norm": 8.270305633544922, + "learning_rate": 1.771961432399734e-05, + "loss": 0.5986, + "step": 8907 + }, + { + "epoch": 24.272479564032697, + "grad_norm": 7.922856330871582, + "learning_rate": 1.771905331912966e-05, + "loss": 0.5305, + "step": 8908 + }, + { + "epoch": 24.275204359673026, + "grad_norm": 8.344463348388672, + "learning_rate": 1.771849225414624e-05, + "loss": 0.6023, + "step": 8909 + }, + { + "epoch": 24.277929155313352, + "grad_norm": 12.2206392288208, + "learning_rate": 1.7717931129051453e-05, + "loss": 0.6153, + "step": 8910 + }, + { + "epoch": 24.280653950953678, + "grad_norm": 8.765689849853516, + "learning_rate": 1.7717369943849666e-05, + "loss": 0.6091, + "step": 8911 + }, + { + "epoch": 24.283378746594007, + "grad_norm": 8.562520027160645, + "learning_rate": 1.771680869854525e-05, + "loss": 0.7114, + "step": 8912 + }, + { + "epoch": 24.286103542234333, + "grad_norm": 7.536573886871338, + "learning_rate": 1.7716247393142574e-05, + "loss": 0.8361, + "step": 8913 + }, + { + "epoch": 24.28882833787466, + "grad_norm": 9.855628967285156, + "learning_rate": 1.7715686027646012e-05, + "loss": 0.7352, + "step": 8914 + }, + { + "epoch": 24.291553133514988, + "grad_norm": 8.171891212463379, + "learning_rate": 1.7715124602059938e-05, + "loss": 0.5229, + "step": 8915 + }, + { + "epoch": 24.294277929155314, + "grad_norm": 8.117642402648926, + "learning_rate": 1.7714563116388717e-05, + "loss": 0.5455, + "step": 8916 + }, + { + "epoch": 24.29700272479564, + "grad_norm": 8.047110557556152, + "learning_rate": 1.771400157063673e-05, + "loss": 0.6682, + "step": 8917 + }, + { + "epoch": 24.29972752043597, + "grad_norm": 6.081267356872559, + "learning_rate": 1.771343996480835e-05, + "loss": 0.4733, + "step": 8918 + }, + { + "epoch": 24.302452316076295, + "grad_norm": 7.226494312286377, + "learning_rate": 1.7712878298907947e-05, + "loss": 0.6339, + "step": 8919 + }, + { + "epoch": 24.30517711171662, + "grad_norm": 7.701619625091553, + "learning_rate": 1.7712316572939893e-05, + "loss": 0.682, + "step": 8920 + }, + { + "epoch": 24.30790190735695, + "grad_norm": 12.228361129760742, + "learning_rate": 1.7711754786908566e-05, + "loss": 0.7488, + "step": 8921 + }, + { + "epoch": 24.310626702997276, + "grad_norm": 7.400647163391113, + "learning_rate": 1.771119294081834e-05, + "loss": 0.5571, + "step": 8922 + }, + { + "epoch": 24.3133514986376, + "grad_norm": 8.388209342956543, + "learning_rate": 1.7710631034673596e-05, + "loss": 0.6585, + "step": 8923 + }, + { + "epoch": 24.31607629427793, + "grad_norm": 11.702413558959961, + "learning_rate": 1.77100690684787e-05, + "loss": 0.6978, + "step": 8924 + }, + { + "epoch": 24.318801089918257, + "grad_norm": 8.448484420776367, + "learning_rate": 1.770950704223804e-05, + "loss": 0.6179, + "step": 8925 + }, + { + "epoch": 24.321525885558582, + "grad_norm": 13.490495681762695, + "learning_rate": 1.7708944955955983e-05, + "loss": 0.5149, + "step": 8926 + }, + { + "epoch": 24.32425068119891, + "grad_norm": 7.025055885314941, + "learning_rate": 1.7708382809636916e-05, + "loss": 0.6355, + "step": 8927 + }, + { + "epoch": 24.326975476839237, + "grad_norm": 9.349492073059082, + "learning_rate": 1.7707820603285205e-05, + "loss": 0.6227, + "step": 8928 + }, + { + "epoch": 24.329700272479563, + "grad_norm": 7.702953338623047, + "learning_rate": 1.770725833690524e-05, + "loss": 0.587, + "step": 8929 + }, + { + "epoch": 24.332425068119893, + "grad_norm": 8.693236351013184, + "learning_rate": 1.7706696010501393e-05, + "loss": 0.6459, + "step": 8930 + }, + { + "epoch": 24.33514986376022, + "grad_norm": 7.2914042472839355, + "learning_rate": 1.7706133624078046e-05, + "loss": 0.6217, + "step": 8931 + }, + { + "epoch": 24.337874659400544, + "grad_norm": 8.049612045288086, + "learning_rate": 1.7705571177639576e-05, + "loss": 0.5838, + "step": 8932 + }, + { + "epoch": 24.340599455040874, + "grad_norm": 6.403984069824219, + "learning_rate": 1.770500867119037e-05, + "loss": 0.636, + "step": 8933 + }, + { + "epoch": 24.3433242506812, + "grad_norm": 8.680638313293457, + "learning_rate": 1.7704446104734803e-05, + "loss": 0.6687, + "step": 8934 + }, + { + "epoch": 24.346049046321525, + "grad_norm": 10.090593338012695, + "learning_rate": 1.7703883478277254e-05, + "loss": 0.5801, + "step": 8935 + }, + { + "epoch": 24.348773841961854, + "grad_norm": 7.0510573387146, + "learning_rate": 1.7703320791822115e-05, + "loss": 0.5844, + "step": 8936 + }, + { + "epoch": 24.35149863760218, + "grad_norm": 7.9243292808532715, + "learning_rate": 1.7702758045373757e-05, + "loss": 0.56, + "step": 8937 + }, + { + "epoch": 24.354223433242506, + "grad_norm": 8.23276138305664, + "learning_rate": 1.7702195238936567e-05, + "loss": 0.5253, + "step": 8938 + }, + { + "epoch": 24.356948228882835, + "grad_norm": 7.644566059112549, + "learning_rate": 1.7701632372514934e-05, + "loss": 0.5872, + "step": 8939 + }, + { + "epoch": 24.35967302452316, + "grad_norm": 7.820858001708984, + "learning_rate": 1.770106944611323e-05, + "loss": 0.5786, + "step": 8940 + }, + { + "epoch": 24.362397820163487, + "grad_norm": 8.273859977722168, + "learning_rate": 1.7700506459735844e-05, + "loss": 0.6094, + "step": 8941 + }, + { + "epoch": 24.365122615803816, + "grad_norm": 8.284680366516113, + "learning_rate": 1.7699943413387166e-05, + "loss": 0.6714, + "step": 8942 + }, + { + "epoch": 24.367847411444142, + "grad_norm": 7.8198981285095215, + "learning_rate": 1.7699380307071575e-05, + "loss": 0.6301, + "step": 8943 + }, + { + "epoch": 24.370572207084468, + "grad_norm": 10.067788124084473, + "learning_rate": 1.7698817140793458e-05, + "loss": 0.5275, + "step": 8944 + }, + { + "epoch": 24.373297002724797, + "grad_norm": 6.036175727844238, + "learning_rate": 1.76982539145572e-05, + "loss": 0.774, + "step": 8945 + }, + { + "epoch": 24.376021798365123, + "grad_norm": 8.07691478729248, + "learning_rate": 1.7697690628367188e-05, + "loss": 0.6495, + "step": 8946 + }, + { + "epoch": 24.37874659400545, + "grad_norm": 7.238626480102539, + "learning_rate": 1.769712728222781e-05, + "loss": 0.6085, + "step": 8947 + }, + { + "epoch": 24.381471389645778, + "grad_norm": 7.894228935241699, + "learning_rate": 1.7696563876143455e-05, + "loss": 0.7269, + "step": 8948 + }, + { + "epoch": 24.384196185286104, + "grad_norm": 8.925589561462402, + "learning_rate": 1.7696000410118504e-05, + "loss": 0.5912, + "step": 8949 + }, + { + "epoch": 24.38692098092643, + "grad_norm": 8.214383125305176, + "learning_rate": 1.7695436884157353e-05, + "loss": 0.6021, + "step": 8950 + }, + { + "epoch": 24.38964577656676, + "grad_norm": 7.753206253051758, + "learning_rate": 1.7694873298264385e-05, + "loss": 0.6138, + "step": 8951 + }, + { + "epoch": 24.392370572207085, + "grad_norm": 7.649204254150391, + "learning_rate": 1.769430965244399e-05, + "loss": 0.6303, + "step": 8952 + }, + { + "epoch": 24.39509536784741, + "grad_norm": 7.90365743637085, + "learning_rate": 1.7693745946700566e-05, + "loss": 0.632, + "step": 8953 + }, + { + "epoch": 24.39782016348774, + "grad_norm": 8.675521850585938, + "learning_rate": 1.769318218103849e-05, + "loss": 0.6139, + "step": 8954 + }, + { + "epoch": 24.400544959128066, + "grad_norm": 9.54442310333252, + "learning_rate": 1.7692618355462157e-05, + "loss": 0.5366, + "step": 8955 + }, + { + "epoch": 24.40326975476839, + "grad_norm": 7.759203910827637, + "learning_rate": 1.7692054469975964e-05, + "loss": 0.4946, + "step": 8956 + }, + { + "epoch": 24.40599455040872, + "grad_norm": 26.981840133666992, + "learning_rate": 1.7691490524584297e-05, + "loss": 0.7293, + "step": 8957 + }, + { + "epoch": 24.408719346049047, + "grad_norm": 9.283357620239258, + "learning_rate": 1.7690926519291548e-05, + "loss": 0.7754, + "step": 8958 + }, + { + "epoch": 24.411444141689373, + "grad_norm": 7.14051628112793, + "learning_rate": 1.7690362454102114e-05, + "loss": 0.5724, + "step": 8959 + }, + { + "epoch": 24.414168937329702, + "grad_norm": 8.556551933288574, + "learning_rate": 1.7689798329020386e-05, + "loss": 0.5964, + "step": 8960 + }, + { + "epoch": 24.416893732970028, + "grad_norm": 7.010879993438721, + "learning_rate": 1.768923414405075e-05, + "loss": 0.54, + "step": 8961 + }, + { + "epoch": 24.419618528610354, + "grad_norm": 7.770777225494385, + "learning_rate": 1.768866989919761e-05, + "loss": 0.5397, + "step": 8962 + }, + { + "epoch": 24.422343324250683, + "grad_norm": 8.03707504272461, + "learning_rate": 1.7688105594465356e-05, + "loss": 0.6537, + "step": 8963 + }, + { + "epoch": 24.42506811989101, + "grad_norm": 8.599611282348633, + "learning_rate": 1.768754122985838e-05, + "loss": 0.6307, + "step": 8964 + }, + { + "epoch": 24.427792915531334, + "grad_norm": 8.289087295532227, + "learning_rate": 1.7686976805381084e-05, + "loss": 0.6356, + "step": 8965 + }, + { + "epoch": 24.430517711171664, + "grad_norm": 7.699691295623779, + "learning_rate": 1.7686412321037857e-05, + "loss": 0.5087, + "step": 8966 + }, + { + "epoch": 24.43324250681199, + "grad_norm": 6.849878311157227, + "learning_rate": 1.76858477768331e-05, + "loss": 0.5422, + "step": 8967 + }, + { + "epoch": 24.435967302452315, + "grad_norm": 7.258474826812744, + "learning_rate": 1.768528317277121e-05, + "loss": 0.4946, + "step": 8968 + }, + { + "epoch": 24.438692098092645, + "grad_norm": 13.755452156066895, + "learning_rate": 1.768471850885658e-05, + "loss": 0.538, + "step": 8969 + }, + { + "epoch": 24.44141689373297, + "grad_norm": 6.409572124481201, + "learning_rate": 1.768415378509361e-05, + "loss": 0.6858, + "step": 8970 + }, + { + "epoch": 24.444141689373296, + "grad_norm": 7.1457014083862305, + "learning_rate": 1.7683589001486696e-05, + "loss": 0.7271, + "step": 8971 + }, + { + "epoch": 24.446866485013626, + "grad_norm": 7.805093765258789, + "learning_rate": 1.768302415804024e-05, + "loss": 0.6566, + "step": 8972 + }, + { + "epoch": 24.44959128065395, + "grad_norm": 9.943085670471191, + "learning_rate": 1.768245925475864e-05, + "loss": 0.6541, + "step": 8973 + }, + { + "epoch": 24.452316076294277, + "grad_norm": 9.868901252746582, + "learning_rate": 1.7681894291646293e-05, + "loss": 0.4976, + "step": 8974 + }, + { + "epoch": 24.455040871934607, + "grad_norm": 9.336941719055176, + "learning_rate": 1.7681329268707598e-05, + "loss": 0.5962, + "step": 8975 + }, + { + "epoch": 24.457765667574932, + "grad_norm": 9.290519714355469, + "learning_rate": 1.768076418594696e-05, + "loss": 0.6821, + "step": 8976 + }, + { + "epoch": 24.460490463215258, + "grad_norm": 8.6582612991333, + "learning_rate": 1.768019904336878e-05, + "loss": 0.6085, + "step": 8977 + }, + { + "epoch": 24.463215258855588, + "grad_norm": 7.847634315490723, + "learning_rate": 1.7679633840977454e-05, + "loss": 0.5726, + "step": 8978 + }, + { + "epoch": 24.465940054495913, + "grad_norm": 8.564176559448242, + "learning_rate": 1.7679068578777387e-05, + "loss": 0.6907, + "step": 8979 + }, + { + "epoch": 24.46866485013624, + "grad_norm": 8.275485038757324, + "learning_rate": 1.7678503256772985e-05, + "loss": 0.6737, + "step": 8980 + }, + { + "epoch": 24.47138964577657, + "grad_norm": 9.92436408996582, + "learning_rate": 1.7677937874968646e-05, + "loss": 0.5356, + "step": 8981 + }, + { + "epoch": 24.474114441416894, + "grad_norm": 7.590448379516602, + "learning_rate": 1.767737243336877e-05, + "loss": 0.6865, + "step": 8982 + }, + { + "epoch": 24.47683923705722, + "grad_norm": 8.421040534973145, + "learning_rate": 1.7676806931977765e-05, + "loss": 0.5803, + "step": 8983 + }, + { + "epoch": 24.479564032697546, + "grad_norm": 9.572787284851074, + "learning_rate": 1.7676241370800037e-05, + "loss": 0.6669, + "step": 8984 + }, + { + "epoch": 24.482288828337875, + "grad_norm": 7.989253520965576, + "learning_rate": 1.7675675749839988e-05, + "loss": 0.5555, + "step": 8985 + }, + { + "epoch": 24.4850136239782, + "grad_norm": 7.294342517852783, + "learning_rate": 1.7675110069102022e-05, + "loss": 0.601, + "step": 8986 + }, + { + "epoch": 24.48773841961853, + "grad_norm": 8.045269012451172, + "learning_rate": 1.7674544328590547e-05, + "loss": 0.5715, + "step": 8987 + }, + { + "epoch": 24.490463215258856, + "grad_norm": 7.78092622756958, + "learning_rate": 1.7673978528309964e-05, + "loss": 0.6519, + "step": 8988 + }, + { + "epoch": 24.493188010899182, + "grad_norm": 8.891827583312988, + "learning_rate": 1.7673412668264687e-05, + "loss": 0.7516, + "step": 8989 + }, + { + "epoch": 24.495912806539508, + "grad_norm": 7.932019233703613, + "learning_rate": 1.767284674845912e-05, + "loss": 0.6261, + "step": 8990 + }, + { + "epoch": 24.498637602179837, + "grad_norm": 8.965381622314453, + "learning_rate": 1.767228076889767e-05, + "loss": 0.6057, + "step": 8991 + }, + { + "epoch": 24.501362397820163, + "grad_norm": 7.663259983062744, + "learning_rate": 1.767171472958474e-05, + "loss": 0.6209, + "step": 8992 + }, + { + "epoch": 24.504087193460492, + "grad_norm": 10.831971168518066, + "learning_rate": 1.7671148630524745e-05, + "loss": 0.5768, + "step": 8993 + }, + { + "epoch": 24.506811989100818, + "grad_norm": 7.278465747833252, + "learning_rate": 1.767058247172209e-05, + "loss": 0.6361, + "step": 8994 + }, + { + "epoch": 24.509536784741144, + "grad_norm": 10.330945014953613, + "learning_rate": 1.767001625318119e-05, + "loss": 0.655, + "step": 8995 + }, + { + "epoch": 24.51226158038147, + "grad_norm": 8.391157150268555, + "learning_rate": 1.7669449974906446e-05, + "loss": 0.6749, + "step": 8996 + }, + { + "epoch": 24.5149863760218, + "grad_norm": 6.680755615234375, + "learning_rate": 1.766888363690227e-05, + "loss": 0.6873, + "step": 8997 + }, + { + "epoch": 24.517711171662125, + "grad_norm": 9.297725677490234, + "learning_rate": 1.766831723917308e-05, + "loss": 0.6774, + "step": 8998 + }, + { + "epoch": 24.520435967302454, + "grad_norm": 7.953189849853516, + "learning_rate": 1.7667750781723282e-05, + "loss": 0.6069, + "step": 8999 + }, + { + "epoch": 24.52316076294278, + "grad_norm": 7.478446006774902, + "learning_rate": 1.7667184264557286e-05, + "loss": 0.6924, + "step": 9000 + }, + { + "epoch": 24.525885558583106, + "grad_norm": 7.651972770690918, + "learning_rate": 1.7666617687679505e-05, + "loss": 0.5371, + "step": 9001 + }, + { + "epoch": 24.52861035422343, + "grad_norm": 7.096588611602783, + "learning_rate": 1.766605105109435e-05, + "loss": 0.6324, + "step": 9002 + }, + { + "epoch": 24.53133514986376, + "grad_norm": 9.0821533203125, + "learning_rate": 1.7665484354806244e-05, + "loss": 0.7375, + "step": 9003 + }, + { + "epoch": 24.534059945504087, + "grad_norm": 6.819845676422119, + "learning_rate": 1.766491759881959e-05, + "loss": 0.5464, + "step": 9004 + }, + { + "epoch": 24.536784741144416, + "grad_norm": 8.515116691589355, + "learning_rate": 1.76643507831388e-05, + "loss": 0.5974, + "step": 9005 + }, + { + "epoch": 24.539509536784742, + "grad_norm": 9.178707122802734, + "learning_rate": 1.7663783907768298e-05, + "loss": 0.775, + "step": 9006 + }, + { + "epoch": 24.542234332425068, + "grad_norm": 7.338752269744873, + "learning_rate": 1.766321697271249e-05, + "loss": 0.6062, + "step": 9007 + }, + { + "epoch": 24.544959128065393, + "grad_norm": 8.074347496032715, + "learning_rate": 1.7662649977975794e-05, + "loss": 0.5342, + "step": 9008 + }, + { + "epoch": 24.547683923705723, + "grad_norm": 9.013470649719238, + "learning_rate": 1.766208292356263e-05, + "loss": 0.5968, + "step": 9009 + }, + { + "epoch": 24.55040871934605, + "grad_norm": 8.02351188659668, + "learning_rate": 1.766151580947741e-05, + "loss": 0.6957, + "step": 9010 + }, + { + "epoch": 24.553133514986374, + "grad_norm": 7.712599277496338, + "learning_rate": 1.766094863572455e-05, + "loss": 0.6971, + "step": 9011 + }, + { + "epoch": 24.555858310626704, + "grad_norm": 9.144669532775879, + "learning_rate": 1.7660381402308465e-05, + "loss": 0.678, + "step": 9012 + }, + { + "epoch": 24.55858310626703, + "grad_norm": 9.957167625427246, + "learning_rate": 1.765981410923358e-05, + "loss": 0.6351, + "step": 9013 + }, + { + "epoch": 24.561307901907355, + "grad_norm": 8.49111270904541, + "learning_rate": 1.7659246756504313e-05, + "loss": 0.577, + "step": 9014 + }, + { + "epoch": 24.564032697547685, + "grad_norm": 8.66234302520752, + "learning_rate": 1.7658679344125075e-05, + "loss": 0.5004, + "step": 9015 + }, + { + "epoch": 24.56675749318801, + "grad_norm": 10.30588436126709, + "learning_rate": 1.7658111872100287e-05, + "loss": 0.4411, + "step": 9016 + }, + { + "epoch": 24.569482288828336, + "grad_norm": 8.420388221740723, + "learning_rate": 1.7657544340434375e-05, + "loss": 0.6025, + "step": 9017 + }, + { + "epoch": 24.572207084468666, + "grad_norm": 8.328437805175781, + "learning_rate": 1.7656976749131753e-05, + "loss": 0.5613, + "step": 9018 + }, + { + "epoch": 24.57493188010899, + "grad_norm": 7.625326633453369, + "learning_rate": 1.765640909819684e-05, + "loss": 0.55, + "step": 9019 + }, + { + "epoch": 24.577656675749317, + "grad_norm": 10.811392784118652, + "learning_rate": 1.7655841387634057e-05, + "loss": 0.9567, + "step": 9020 + }, + { + "epoch": 24.580381471389646, + "grad_norm": 22.325044631958008, + "learning_rate": 1.765527361744783e-05, + "loss": 0.8193, + "step": 9021 + }, + { + "epoch": 24.583106267029972, + "grad_norm": 9.547529220581055, + "learning_rate": 1.765470578764258e-05, + "loss": 0.6692, + "step": 9022 + }, + { + "epoch": 24.585831062670298, + "grad_norm": 9.6989107131958, + "learning_rate": 1.7654137898222728e-05, + "loss": 0.7803, + "step": 9023 + }, + { + "epoch": 24.588555858310627, + "grad_norm": 10.85034465789795, + "learning_rate": 1.7653569949192698e-05, + "loss": 0.4957, + "step": 9024 + }, + { + "epoch": 24.591280653950953, + "grad_norm": 10.391765594482422, + "learning_rate": 1.765300194055691e-05, + "loss": 0.6892, + "step": 9025 + }, + { + "epoch": 24.59400544959128, + "grad_norm": 7.947431564331055, + "learning_rate": 1.7652433872319785e-05, + "loss": 0.6081, + "step": 9026 + }, + { + "epoch": 24.59673024523161, + "grad_norm": 7.657660961151123, + "learning_rate": 1.7651865744485755e-05, + "loss": 0.608, + "step": 9027 + }, + { + "epoch": 24.599455040871934, + "grad_norm": 12.64451789855957, + "learning_rate": 1.765129755705924e-05, + "loss": 0.6497, + "step": 9028 + }, + { + "epoch": 24.60217983651226, + "grad_norm": 7.720130443572998, + "learning_rate": 1.7650729310044667e-05, + "loss": 0.6349, + "step": 9029 + }, + { + "epoch": 24.60490463215259, + "grad_norm": 6.875460147857666, + "learning_rate": 1.765016100344646e-05, + "loss": 0.6453, + "step": 9030 + }, + { + "epoch": 24.607629427792915, + "grad_norm": 9.920437812805176, + "learning_rate": 1.7649592637269045e-05, + "loss": 0.6627, + "step": 9031 + }, + { + "epoch": 24.61035422343324, + "grad_norm": 7.393453598022461, + "learning_rate": 1.7649024211516848e-05, + "loss": 0.534, + "step": 9032 + }, + { + "epoch": 24.61307901907357, + "grad_norm": 8.168704986572266, + "learning_rate": 1.76484557261943e-05, + "loss": 0.5313, + "step": 9033 + }, + { + "epoch": 24.615803814713896, + "grad_norm": 8.419522285461426, + "learning_rate": 1.7647887181305822e-05, + "loss": 0.7209, + "step": 9034 + }, + { + "epoch": 24.618528610354222, + "grad_norm": 8.104192733764648, + "learning_rate": 1.7647318576855843e-05, + "loss": 0.6615, + "step": 9035 + }, + { + "epoch": 24.62125340599455, + "grad_norm": 7.3158488273620605, + "learning_rate": 1.7646749912848795e-05, + "loss": 0.6165, + "step": 9036 + }, + { + "epoch": 24.623978201634877, + "grad_norm": 8.528558731079102, + "learning_rate": 1.7646181189289108e-05, + "loss": 0.6068, + "step": 9037 + }, + { + "epoch": 24.626702997275203, + "grad_norm": 11.592710494995117, + "learning_rate": 1.7645612406181204e-05, + "loss": 0.6259, + "step": 9038 + }, + { + "epoch": 24.629427792915532, + "grad_norm": 7.119830131530762, + "learning_rate": 1.7645043563529518e-05, + "loss": 0.5124, + "step": 9039 + }, + { + "epoch": 24.632152588555858, + "grad_norm": 9.007055282592773, + "learning_rate": 1.764447466133848e-05, + "loss": 0.7422, + "step": 9040 + }, + { + "epoch": 24.634877384196184, + "grad_norm": 7.347967624664307, + "learning_rate": 1.7643905699612513e-05, + "loss": 0.5612, + "step": 9041 + }, + { + "epoch": 24.637602179836513, + "grad_norm": 8.965445518493652, + "learning_rate": 1.7643336678356063e-05, + "loss": 0.7264, + "step": 9042 + }, + { + "epoch": 24.64032697547684, + "grad_norm": 10.226734161376953, + "learning_rate": 1.7642767597573548e-05, + "loss": 0.6119, + "step": 9043 + }, + { + "epoch": 24.643051771117165, + "grad_norm": 7.831031799316406, + "learning_rate": 1.7642198457269405e-05, + "loss": 0.5123, + "step": 9044 + }, + { + "epoch": 24.645776566757494, + "grad_norm": 7.503066062927246, + "learning_rate": 1.7641629257448068e-05, + "loss": 0.5405, + "step": 9045 + }, + { + "epoch": 24.64850136239782, + "grad_norm": 15.644835472106934, + "learning_rate": 1.7641059998113966e-05, + "loss": 0.6517, + "step": 9046 + }, + { + "epoch": 24.651226158038146, + "grad_norm": 8.321699142456055, + "learning_rate": 1.7640490679271537e-05, + "loss": 0.7328, + "step": 9047 + }, + { + "epoch": 24.653950953678475, + "grad_norm": 11.984652519226074, + "learning_rate": 1.7639921300925213e-05, + "loss": 0.6308, + "step": 9048 + }, + { + "epoch": 24.6566757493188, + "grad_norm": 7.8258748054504395, + "learning_rate": 1.7639351863079426e-05, + "loss": 0.6423, + "step": 9049 + }, + { + "epoch": 24.659400544959126, + "grad_norm": 6.94466495513916, + "learning_rate": 1.7638782365738613e-05, + "loss": 0.6277, + "step": 9050 + }, + { + "epoch": 24.662125340599456, + "grad_norm": 6.627162456512451, + "learning_rate": 1.763821280890721e-05, + "loss": 0.7846, + "step": 9051 + }, + { + "epoch": 24.66485013623978, + "grad_norm": 10.093145370483398, + "learning_rate": 1.763764319258965e-05, + "loss": 0.6024, + "step": 9052 + }, + { + "epoch": 24.667574931880107, + "grad_norm": 10.328065872192383, + "learning_rate": 1.7637073516790373e-05, + "loss": 0.6041, + "step": 9053 + }, + { + "epoch": 24.670299727520437, + "grad_norm": 8.410794258117676, + "learning_rate": 1.7636503781513808e-05, + "loss": 0.7278, + "step": 9054 + }, + { + "epoch": 24.673024523160763, + "grad_norm": 7.4909348487854, + "learning_rate": 1.7635933986764403e-05, + "loss": 0.575, + "step": 9055 + }, + { + "epoch": 24.67574931880109, + "grad_norm": 10.587180137634277, + "learning_rate": 1.7635364132546587e-05, + "loss": 0.4573, + "step": 9056 + }, + { + "epoch": 24.678474114441418, + "grad_norm": 10.027560234069824, + "learning_rate": 1.7634794218864802e-05, + "loss": 0.7155, + "step": 9057 + }, + { + "epoch": 24.681198910081743, + "grad_norm": 8.658035278320312, + "learning_rate": 1.7634224245723482e-05, + "loss": 0.6944, + "step": 9058 + }, + { + "epoch": 24.68392370572207, + "grad_norm": 7.574838161468506, + "learning_rate": 1.7633654213127074e-05, + "loss": 0.5848, + "step": 9059 + }, + { + "epoch": 24.6866485013624, + "grad_norm": 15.168315887451172, + "learning_rate": 1.763308412108001e-05, + "loss": 0.8035, + "step": 9060 + }, + { + "epoch": 24.689373297002724, + "grad_norm": 13.63664722442627, + "learning_rate": 1.7632513969586736e-05, + "loss": 0.5897, + "step": 9061 + }, + { + "epoch": 24.69209809264305, + "grad_norm": 8.766971588134766, + "learning_rate": 1.7631943758651687e-05, + "loss": 0.5793, + "step": 9062 + }, + { + "epoch": 24.69482288828338, + "grad_norm": 8.28712272644043, + "learning_rate": 1.7631373488279303e-05, + "loss": 0.749, + "step": 9063 + }, + { + "epoch": 24.697547683923705, + "grad_norm": 7.610118865966797, + "learning_rate": 1.763080315847403e-05, + "loss": 0.6459, + "step": 9064 + }, + { + "epoch": 24.70027247956403, + "grad_norm": 11.615033149719238, + "learning_rate": 1.7630232769240307e-05, + "loss": 0.5387, + "step": 9065 + }, + { + "epoch": 24.70299727520436, + "grad_norm": 8.760119438171387, + "learning_rate": 1.7629662320582578e-05, + "loss": 0.7877, + "step": 9066 + }, + { + "epoch": 24.705722070844686, + "grad_norm": 7.303828239440918, + "learning_rate": 1.7629091812505285e-05, + "loss": 0.7491, + "step": 9067 + }, + { + "epoch": 24.708446866485012, + "grad_norm": 9.286757469177246, + "learning_rate": 1.762852124501287e-05, + "loss": 0.7002, + "step": 9068 + }, + { + "epoch": 24.71117166212534, + "grad_norm": 7.101996898651123, + "learning_rate": 1.7627950618109775e-05, + "loss": 0.6022, + "step": 9069 + }, + { + "epoch": 24.713896457765667, + "grad_norm": 8.550169944763184, + "learning_rate": 1.7627379931800446e-05, + "loss": 0.6114, + "step": 9070 + }, + { + "epoch": 24.716621253405993, + "grad_norm": 9.084425926208496, + "learning_rate": 1.762680918608933e-05, + "loss": 0.6962, + "step": 9071 + }, + { + "epoch": 24.719346049046322, + "grad_norm": 8.570323944091797, + "learning_rate": 1.7626238380980866e-05, + "loss": 0.7131, + "step": 9072 + }, + { + "epoch": 24.722070844686648, + "grad_norm": 8.048595428466797, + "learning_rate": 1.7625667516479508e-05, + "loss": 0.7187, + "step": 9073 + }, + { + "epoch": 24.724795640326974, + "grad_norm": 8.957825660705566, + "learning_rate": 1.7625096592589692e-05, + "loss": 0.7624, + "step": 9074 + }, + { + "epoch": 24.727520435967303, + "grad_norm": 9.336494445800781, + "learning_rate": 1.7624525609315873e-05, + "loss": 0.6737, + "step": 9075 + }, + { + "epoch": 24.73024523160763, + "grad_norm": 14.707310676574707, + "learning_rate": 1.762395456666249e-05, + "loss": 0.6622, + "step": 9076 + }, + { + "epoch": 24.732970027247955, + "grad_norm": 8.099577903747559, + "learning_rate": 1.7623383464633996e-05, + "loss": 0.6689, + "step": 9077 + }, + { + "epoch": 24.735694822888284, + "grad_norm": 7.692896366119385, + "learning_rate": 1.7622812303234837e-05, + "loss": 0.7451, + "step": 9078 + }, + { + "epoch": 24.73841961852861, + "grad_norm": 7.110904216766357, + "learning_rate": 1.7622241082469463e-05, + "loss": 0.8058, + "step": 9079 + }, + { + "epoch": 24.741144414168936, + "grad_norm": 9.915729522705078, + "learning_rate": 1.762166980234232e-05, + "loss": 0.6854, + "step": 9080 + }, + { + "epoch": 24.743869209809265, + "grad_norm": 6.910274982452393, + "learning_rate": 1.762109846285786e-05, + "loss": 0.7994, + "step": 9081 + }, + { + "epoch": 24.74659400544959, + "grad_norm": 8.334527969360352, + "learning_rate": 1.7620527064020524e-05, + "loss": 0.6736, + "step": 9082 + }, + { + "epoch": 24.749318801089917, + "grad_norm": 7.239718437194824, + "learning_rate": 1.761995560583477e-05, + "loss": 0.6385, + "step": 9083 + }, + { + "epoch": 24.752043596730246, + "grad_norm": 9.957289695739746, + "learning_rate": 1.761938408830505e-05, + "loss": 0.6938, + "step": 9084 + }, + { + "epoch": 24.754768392370572, + "grad_norm": 8.416315078735352, + "learning_rate": 1.761881251143581e-05, + "loss": 0.7626, + "step": 9085 + }, + { + "epoch": 24.757493188010898, + "grad_norm": 7.973998069763184, + "learning_rate": 1.7618240875231504e-05, + "loss": 0.6124, + "step": 9086 + }, + { + "epoch": 24.760217983651227, + "grad_norm": 12.216193199157715, + "learning_rate": 1.7617669179696584e-05, + "loss": 0.6934, + "step": 9087 + }, + { + "epoch": 24.762942779291553, + "grad_norm": 8.15843391418457, + "learning_rate": 1.76170974248355e-05, + "loss": 0.5637, + "step": 9088 + }, + { + "epoch": 24.76566757493188, + "grad_norm": 9.592131614685059, + "learning_rate": 1.761652561065271e-05, + "loss": 0.5842, + "step": 9089 + }, + { + "epoch": 24.768392370572208, + "grad_norm": 8.345134735107422, + "learning_rate": 1.7615953737152662e-05, + "loss": 0.6991, + "step": 9090 + }, + { + "epoch": 24.771117166212534, + "grad_norm": 8.831202507019043, + "learning_rate": 1.7615381804339812e-05, + "loss": 0.5632, + "step": 9091 + }, + { + "epoch": 24.77384196185286, + "grad_norm": 6.586507320404053, + "learning_rate": 1.761480981221861e-05, + "loss": 0.712, + "step": 9092 + }, + { + "epoch": 24.77656675749319, + "grad_norm": 7.661722660064697, + "learning_rate": 1.7614237760793517e-05, + "loss": 0.6247, + "step": 9093 + }, + { + "epoch": 24.779291553133515, + "grad_norm": 11.912310600280762, + "learning_rate": 1.7613665650068986e-05, + "loss": 0.7829, + "step": 9094 + }, + { + "epoch": 24.78201634877384, + "grad_norm": 9.052411079406738, + "learning_rate": 1.7613093480049472e-05, + "loss": 0.6127, + "step": 9095 + }, + { + "epoch": 24.78474114441417, + "grad_norm": 8.426584243774414, + "learning_rate": 1.7612521250739427e-05, + "loss": 0.4929, + "step": 9096 + }, + { + "epoch": 24.787465940054496, + "grad_norm": 8.199124336242676, + "learning_rate": 1.7611948962143317e-05, + "loss": 0.6892, + "step": 9097 + }, + { + "epoch": 24.79019073569482, + "grad_norm": 9.086944580078125, + "learning_rate": 1.7611376614265586e-05, + "loss": 0.656, + "step": 9098 + }, + { + "epoch": 24.79291553133515, + "grad_norm": 11.262910842895508, + "learning_rate": 1.7610804207110708e-05, + "loss": 0.721, + "step": 9099 + }, + { + "epoch": 24.795640326975477, + "grad_norm": 7.025333404541016, + "learning_rate": 1.7610231740683127e-05, + "loss": 0.7167, + "step": 9100 + }, + { + "epoch": 24.798365122615802, + "grad_norm": 7.94744348526001, + "learning_rate": 1.7609659214987306e-05, + "loss": 0.6428, + "step": 9101 + }, + { + "epoch": 24.80108991825613, + "grad_norm": 7.263674736022949, + "learning_rate": 1.7609086630027703e-05, + "loss": 0.619, + "step": 9102 + }, + { + "epoch": 24.803814713896458, + "grad_norm": 6.2140793800354, + "learning_rate": 1.760851398580878e-05, + "loss": 0.6459, + "step": 9103 + }, + { + "epoch": 24.806539509536783, + "grad_norm": 8.475105285644531, + "learning_rate": 1.7607941282334994e-05, + "loss": 0.6431, + "step": 9104 + }, + { + "epoch": 24.809264305177113, + "grad_norm": 9.592691421508789, + "learning_rate": 1.760736851961081e-05, + "loss": 0.7227, + "step": 9105 + }, + { + "epoch": 24.81198910081744, + "grad_norm": 9.697248458862305, + "learning_rate": 1.760679569764068e-05, + "loss": 0.7128, + "step": 9106 + }, + { + "epoch": 24.814713896457764, + "grad_norm": 7.512829303741455, + "learning_rate": 1.7606222816429072e-05, + "loss": 0.5385, + "step": 9107 + }, + { + "epoch": 24.817438692098094, + "grad_norm": 7.659682273864746, + "learning_rate": 1.7605649875980444e-05, + "loss": 0.6131, + "step": 9108 + }, + { + "epoch": 24.82016348773842, + "grad_norm": 9.706716537475586, + "learning_rate": 1.760507687629926e-05, + "loss": 0.6518, + "step": 9109 + }, + { + "epoch": 24.822888283378745, + "grad_norm": 7.4076948165893555, + "learning_rate": 1.7604503817389984e-05, + "loss": 0.6416, + "step": 9110 + }, + { + "epoch": 24.825613079019075, + "grad_norm": 7.795478820800781, + "learning_rate": 1.7603930699257077e-05, + "loss": 0.6566, + "step": 9111 + }, + { + "epoch": 24.8283378746594, + "grad_norm": 8.182226181030273, + "learning_rate": 1.7603357521905002e-05, + "loss": 0.7444, + "step": 9112 + }, + { + "epoch": 24.831062670299726, + "grad_norm": 8.728377342224121, + "learning_rate": 1.760278428533822e-05, + "loss": 0.6691, + "step": 9113 + }, + { + "epoch": 24.833787465940055, + "grad_norm": 13.578832626342773, + "learning_rate": 1.7602210989561202e-05, + "loss": 0.6788, + "step": 9114 + }, + { + "epoch": 24.83651226158038, + "grad_norm": 9.919561386108398, + "learning_rate": 1.760163763457841e-05, + "loss": 0.6063, + "step": 9115 + }, + { + "epoch": 24.839237057220707, + "grad_norm": 7.077985763549805, + "learning_rate": 1.7601064220394305e-05, + "loss": 0.5043, + "step": 9116 + }, + { + "epoch": 24.841961852861036, + "grad_norm": 9.012791633605957, + "learning_rate": 1.760049074701336e-05, + "loss": 0.4412, + "step": 9117 + }, + { + "epoch": 24.844686648501362, + "grad_norm": 7.965156555175781, + "learning_rate": 1.7599917214440035e-05, + "loss": 0.6007, + "step": 9118 + }, + { + "epoch": 24.847411444141688, + "grad_norm": 8.324759483337402, + "learning_rate": 1.7599343622678802e-05, + "loss": 0.5599, + "step": 9119 + }, + { + "epoch": 24.850136239782017, + "grad_norm": 8.590094566345215, + "learning_rate": 1.7598769971734127e-05, + "loss": 0.7472, + "step": 9120 + }, + { + "epoch": 24.852861035422343, + "grad_norm": 8.1151762008667, + "learning_rate": 1.7598196261610476e-05, + "loss": 0.5726, + "step": 9121 + }, + { + "epoch": 24.85558583106267, + "grad_norm": 7.521329402923584, + "learning_rate": 1.7597622492312313e-05, + "loss": 0.5908, + "step": 9122 + }, + { + "epoch": 24.858310626703, + "grad_norm": 9.701559066772461, + "learning_rate": 1.759704866384411e-05, + "loss": 0.5087, + "step": 9123 + }, + { + "epoch": 24.861035422343324, + "grad_norm": 8.193989753723145, + "learning_rate": 1.759647477621034e-05, + "loss": 0.5861, + "step": 9124 + }, + { + "epoch": 24.86376021798365, + "grad_norm": 9.653748512268066, + "learning_rate": 1.759590082941547e-05, + "loss": 0.767, + "step": 9125 + }, + { + "epoch": 24.86648501362398, + "grad_norm": 7.191437244415283, + "learning_rate": 1.7595326823463963e-05, + "loss": 0.5499, + "step": 9126 + }, + { + "epoch": 24.869209809264305, + "grad_norm": 7.461208820343018, + "learning_rate": 1.75947527583603e-05, + "loss": 0.4998, + "step": 9127 + }, + { + "epoch": 24.87193460490463, + "grad_norm": 8.673975944519043, + "learning_rate": 1.7594178634108944e-05, + "loss": 0.6719, + "step": 9128 + }, + { + "epoch": 24.87465940054496, + "grad_norm": 8.278363227844238, + "learning_rate": 1.759360445071437e-05, + "loss": 0.6855, + "step": 9129 + }, + { + "epoch": 24.877384196185286, + "grad_norm": 7.993578910827637, + "learning_rate": 1.7593030208181052e-05, + "loss": 0.6843, + "step": 9130 + }, + { + "epoch": 24.88010899182561, + "grad_norm": 8.322216033935547, + "learning_rate": 1.7592455906513456e-05, + "loss": 0.7618, + "step": 9131 + }, + { + "epoch": 24.88283378746594, + "grad_norm": 10.070342063903809, + "learning_rate": 1.7591881545716058e-05, + "loss": 0.6232, + "step": 9132 + }, + { + "epoch": 24.885558583106267, + "grad_norm": 9.82460880279541, + "learning_rate": 1.7591307125793332e-05, + "loss": 0.587, + "step": 9133 + }, + { + "epoch": 24.888283378746593, + "grad_norm": 7.020534038543701, + "learning_rate": 1.759073264674975e-05, + "loss": 0.7737, + "step": 9134 + }, + { + "epoch": 24.891008174386922, + "grad_norm": 7.385281085968018, + "learning_rate": 1.7590158108589785e-05, + "loss": 0.6512, + "step": 9135 + }, + { + "epoch": 24.893732970027248, + "grad_norm": 7.650609493255615, + "learning_rate": 1.7589583511317915e-05, + "loss": 0.6586, + "step": 9136 + }, + { + "epoch": 24.896457765667574, + "grad_norm": 6.550846099853516, + "learning_rate": 1.7589008854938613e-05, + "loss": 0.5401, + "step": 9137 + }, + { + "epoch": 24.899182561307903, + "grad_norm": 7.285351753234863, + "learning_rate": 1.7588434139456354e-05, + "loss": 0.6038, + "step": 9138 + }, + { + "epoch": 24.90190735694823, + "grad_norm": 7.743149280548096, + "learning_rate": 1.7587859364875613e-05, + "loss": 0.7252, + "step": 9139 + }, + { + "epoch": 24.904632152588555, + "grad_norm": 7.218400478363037, + "learning_rate": 1.7587284531200866e-05, + "loss": 0.4827, + "step": 9140 + }, + { + "epoch": 24.907356948228884, + "grad_norm": 6.358419418334961, + "learning_rate": 1.7586709638436593e-05, + "loss": 0.6794, + "step": 9141 + }, + { + "epoch": 24.91008174386921, + "grad_norm": 7.754582405090332, + "learning_rate": 1.758613468658727e-05, + "loss": 0.5704, + "step": 9142 + }, + { + "epoch": 24.912806539509535, + "grad_norm": 8.69373893737793, + "learning_rate": 1.7585559675657377e-05, + "loss": 0.7025, + "step": 9143 + }, + { + "epoch": 24.915531335149865, + "grad_norm": 8.12856674194336, + "learning_rate": 1.7584984605651385e-05, + "loss": 0.5807, + "step": 9144 + }, + { + "epoch": 24.91825613079019, + "grad_norm": 6.606778621673584, + "learning_rate": 1.758440947657378e-05, + "loss": 0.6108, + "step": 9145 + }, + { + "epoch": 24.920980926430516, + "grad_norm": 8.338944435119629, + "learning_rate": 1.7583834288429032e-05, + "loss": 0.7186, + "step": 9146 + }, + { + "epoch": 24.923705722070846, + "grad_norm": 8.624048233032227, + "learning_rate": 1.7583259041221634e-05, + "loss": 0.5325, + "step": 9147 + }, + { + "epoch": 24.92643051771117, + "grad_norm": 8.943880081176758, + "learning_rate": 1.7582683734956055e-05, + "loss": 0.6185, + "step": 9148 + }, + { + "epoch": 24.929155313351497, + "grad_norm": 8.175042152404785, + "learning_rate": 1.758210836963678e-05, + "loss": 0.7002, + "step": 9149 + }, + { + "epoch": 24.931880108991827, + "grad_norm": 8.36201286315918, + "learning_rate": 1.758153294526829e-05, + "loss": 0.5826, + "step": 9150 + }, + { + "epoch": 24.934604904632153, + "grad_norm": 9.481425285339355, + "learning_rate": 1.7580957461855064e-05, + "loss": 0.7182, + "step": 9151 + }, + { + "epoch": 24.93732970027248, + "grad_norm": 8.212348937988281, + "learning_rate": 1.7580381919401586e-05, + "loss": 0.6982, + "step": 9152 + }, + { + "epoch": 24.940054495912808, + "grad_norm": 7.990788459777832, + "learning_rate": 1.7579806317912336e-05, + "loss": 0.5393, + "step": 9153 + }, + { + "epoch": 24.942779291553133, + "grad_norm": 9.8809175491333, + "learning_rate": 1.7579230657391803e-05, + "loss": 0.5881, + "step": 9154 + }, + { + "epoch": 24.94550408719346, + "grad_norm": 10.29200553894043, + "learning_rate": 1.757865493784446e-05, + "loss": 0.6382, + "step": 9155 + }, + { + "epoch": 24.94822888283379, + "grad_norm": 7.920681953430176, + "learning_rate": 1.7578079159274798e-05, + "loss": 0.7075, + "step": 9156 + }, + { + "epoch": 24.950953678474114, + "grad_norm": 9.220345497131348, + "learning_rate": 1.75775033216873e-05, + "loss": 0.6733, + "step": 9157 + }, + { + "epoch": 24.95367847411444, + "grad_norm": 7.205484867095947, + "learning_rate": 1.757692742508645e-05, + "loss": 0.5162, + "step": 9158 + }, + { + "epoch": 24.95640326975477, + "grad_norm": 7.997858047485352, + "learning_rate": 1.7576351469476735e-05, + "loss": 0.6132, + "step": 9159 + }, + { + "epoch": 24.959128065395095, + "grad_norm": 8.290677070617676, + "learning_rate": 1.7575775454862636e-05, + "loss": 0.6284, + "step": 9160 + }, + { + "epoch": 24.96185286103542, + "grad_norm": 8.271625518798828, + "learning_rate": 1.7575199381248643e-05, + "loss": 0.6142, + "step": 9161 + }, + { + "epoch": 24.96457765667575, + "grad_norm": 7.2044572830200195, + "learning_rate": 1.757462324863924e-05, + "loss": 0.5352, + "step": 9162 + }, + { + "epoch": 24.967302452316076, + "grad_norm": 7.704048156738281, + "learning_rate": 1.7574047057038914e-05, + "loss": 0.6229, + "step": 9163 + }, + { + "epoch": 24.970027247956402, + "grad_norm": 8.477546691894531, + "learning_rate": 1.7573470806452156e-05, + "loss": 0.6918, + "step": 9164 + }, + { + "epoch": 24.97275204359673, + "grad_norm": 9.030668258666992, + "learning_rate": 1.7572894496883448e-05, + "loss": 0.6869, + "step": 9165 + }, + { + "epoch": 24.975476839237057, + "grad_norm": 7.245536804199219, + "learning_rate": 1.7572318128337286e-05, + "loss": 0.5255, + "step": 9166 + }, + { + "epoch": 24.978201634877383, + "grad_norm": 8.229454040527344, + "learning_rate": 1.757174170081815e-05, + "loss": 0.6912, + "step": 9167 + }, + { + "epoch": 24.980926430517712, + "grad_norm": 10.456474304199219, + "learning_rate": 1.7571165214330533e-05, + "loss": 0.5757, + "step": 9168 + }, + { + "epoch": 24.983651226158038, + "grad_norm": 13.14166259765625, + "learning_rate": 1.7570588668878925e-05, + "loss": 0.8313, + "step": 9169 + }, + { + "epoch": 24.986376021798364, + "grad_norm": 9.433475494384766, + "learning_rate": 1.757001206446782e-05, + "loss": 0.6941, + "step": 9170 + }, + { + "epoch": 24.989100817438693, + "grad_norm": 8.512743949890137, + "learning_rate": 1.7569435401101702e-05, + "loss": 0.6174, + "step": 9171 + }, + { + "epoch": 24.99182561307902, + "grad_norm": 8.018141746520996, + "learning_rate": 1.7568858678785067e-05, + "loss": 0.6895, + "step": 9172 + }, + { + "epoch": 24.994550408719345, + "grad_norm": 7.822866439819336, + "learning_rate": 1.75682818975224e-05, + "loss": 0.7471, + "step": 9173 + }, + { + "epoch": 24.997275204359674, + "grad_norm": 8.118390083312988, + "learning_rate": 1.75677050573182e-05, + "loss": 0.5596, + "step": 9174 + }, + { + "epoch": 25.0, + "grad_norm": 7.722609043121338, + "learning_rate": 1.7567128158176955e-05, + "loss": 0.7333, + "step": 9175 + }, + { + "epoch": 25.002724795640326, + "grad_norm": 7.151113510131836, + "learning_rate": 1.756655120010316e-05, + "loss": 0.6569, + "step": 9176 + }, + { + "epoch": 25.005449591280655, + "grad_norm": 7.189694404602051, + "learning_rate": 1.756597418310131e-05, + "loss": 0.4894, + "step": 9177 + }, + { + "epoch": 25.00817438692098, + "grad_norm": 7.096490859985352, + "learning_rate": 1.7565397107175893e-05, + "loss": 0.6046, + "step": 9178 + }, + { + "epoch": 25.010899182561307, + "grad_norm": 8.53683853149414, + "learning_rate": 1.7564819972331408e-05, + "loss": 0.593, + "step": 9179 + }, + { + "epoch": 25.013623978201636, + "grad_norm": 7.668188571929932, + "learning_rate": 1.7564242778572348e-05, + "loss": 0.6535, + "step": 9180 + }, + { + "epoch": 25.016348773841962, + "grad_norm": 7.663745403289795, + "learning_rate": 1.756366552590321e-05, + "loss": 0.4633, + "step": 9181 + }, + { + "epoch": 25.019073569482288, + "grad_norm": 6.856311321258545, + "learning_rate": 1.756308821432849e-05, + "loss": 0.5386, + "step": 9182 + }, + { + "epoch": 25.021798365122617, + "grad_norm": 8.927593231201172, + "learning_rate": 1.7562510843852678e-05, + "loss": 0.5468, + "step": 9183 + }, + { + "epoch": 25.024523160762943, + "grad_norm": 7.710852146148682, + "learning_rate": 1.7561933414480278e-05, + "loss": 0.5551, + "step": 9184 + }, + { + "epoch": 25.02724795640327, + "grad_norm": 7.814901828765869, + "learning_rate": 1.7561355926215784e-05, + "loss": 0.5698, + "step": 9185 + }, + { + "epoch": 25.029972752043598, + "grad_norm": 7.54987907409668, + "learning_rate": 1.7560778379063693e-05, + "loss": 0.5743, + "step": 9186 + }, + { + "epoch": 25.032697547683924, + "grad_norm": 8.966099739074707, + "learning_rate": 1.75602007730285e-05, + "loss": 0.6206, + "step": 9187 + }, + { + "epoch": 25.03542234332425, + "grad_norm": 9.749812126159668, + "learning_rate": 1.7559623108114713e-05, + "loss": 0.5268, + "step": 9188 + }, + { + "epoch": 25.03814713896458, + "grad_norm": 7.751905918121338, + "learning_rate": 1.755904538432682e-05, + "loss": 0.7687, + "step": 9189 + }, + { + "epoch": 25.040871934604905, + "grad_norm": 6.137204170227051, + "learning_rate": 1.7558467601669326e-05, + "loss": 0.6042, + "step": 9190 + }, + { + "epoch": 25.04359673024523, + "grad_norm": 9.052706718444824, + "learning_rate": 1.755788976014673e-05, + "loss": 0.6306, + "step": 9191 + }, + { + "epoch": 25.04632152588556, + "grad_norm": 7.87229585647583, + "learning_rate": 1.755731185976353e-05, + "loss": 0.4666, + "step": 9192 + }, + { + "epoch": 25.049046321525886, + "grad_norm": 12.386114120483398, + "learning_rate": 1.755673390052423e-05, + "loss": 0.4894, + "step": 9193 + }, + { + "epoch": 25.05177111716621, + "grad_norm": 7.40094518661499, + "learning_rate": 1.755615588243333e-05, + "loss": 0.4758, + "step": 9194 + }, + { + "epoch": 25.05449591280654, + "grad_norm": 9.998497009277344, + "learning_rate": 1.755557780549533e-05, + "loss": 0.5323, + "step": 9195 + }, + { + "epoch": 25.057220708446867, + "grad_norm": 7.588438034057617, + "learning_rate": 1.7554999669714736e-05, + "loss": 0.6864, + "step": 9196 + }, + { + "epoch": 25.059945504087192, + "grad_norm": 7.710918426513672, + "learning_rate": 1.7554421475096047e-05, + "loss": 0.5907, + "step": 9197 + }, + { + "epoch": 25.06267029972752, + "grad_norm": 7.103505611419678, + "learning_rate": 1.7553843221643764e-05, + "loss": 0.5072, + "step": 9198 + }, + { + "epoch": 25.065395095367847, + "grad_norm": 7.364475727081299, + "learning_rate": 1.7553264909362397e-05, + "loss": 0.6147, + "step": 9199 + }, + { + "epoch": 25.068119891008173, + "grad_norm": 6.914089679718018, + "learning_rate": 1.755268653825644e-05, + "loss": 0.7128, + "step": 9200 + }, + { + "epoch": 25.070844686648503, + "grad_norm": 6.164554595947266, + "learning_rate": 1.7552108108330407e-05, + "loss": 0.5146, + "step": 9201 + }, + { + "epoch": 25.07356948228883, + "grad_norm": 7.43580961227417, + "learning_rate": 1.75515296195888e-05, + "loss": 0.4504, + "step": 9202 + }, + { + "epoch": 25.076294277929154, + "grad_norm": 6.554437637329102, + "learning_rate": 1.755095107203612e-05, + "loss": 0.6844, + "step": 9203 + }, + { + "epoch": 25.079019073569484, + "grad_norm": 8.390671730041504, + "learning_rate": 1.755037246567688e-05, + "loss": 0.6544, + "step": 9204 + }, + { + "epoch": 25.08174386920981, + "grad_norm": 9.178902626037598, + "learning_rate": 1.754979380051558e-05, + "loss": 0.5558, + "step": 9205 + }, + { + "epoch": 25.084468664850135, + "grad_norm": 6.180863380432129, + "learning_rate": 1.754921507655673e-05, + "loss": 0.6732, + "step": 9206 + }, + { + "epoch": 25.087193460490465, + "grad_norm": 6.8885674476623535, + "learning_rate": 1.7548636293804838e-05, + "loss": 0.7445, + "step": 9207 + }, + { + "epoch": 25.08991825613079, + "grad_norm": 9.175154685974121, + "learning_rate": 1.7548057452264404e-05, + "loss": 0.6847, + "step": 9208 + }, + { + "epoch": 25.092643051771116, + "grad_norm": 7.723278999328613, + "learning_rate": 1.7547478551939944e-05, + "loss": 0.5176, + "step": 9209 + }, + { + "epoch": 25.095367847411445, + "grad_norm": 9.161273956298828, + "learning_rate": 1.7546899592835968e-05, + "loss": 0.5295, + "step": 9210 + }, + { + "epoch": 25.09809264305177, + "grad_norm": 7.03291654586792, + "learning_rate": 1.7546320574956976e-05, + "loss": 0.5646, + "step": 9211 + }, + { + "epoch": 25.100817438692097, + "grad_norm": 7.496363162994385, + "learning_rate": 1.7545741498307483e-05, + "loss": 0.5092, + "step": 9212 + }, + { + "epoch": 25.103542234332426, + "grad_norm": 9.686806678771973, + "learning_rate": 1.7545162362891997e-05, + "loss": 0.4745, + "step": 9213 + }, + { + "epoch": 25.106267029972752, + "grad_norm": 8.231841087341309, + "learning_rate": 1.754458316871503e-05, + "loss": 0.5324, + "step": 9214 + }, + { + "epoch": 25.108991825613078, + "grad_norm": 8.02005386352539, + "learning_rate": 1.7544003915781097e-05, + "loss": 0.6253, + "step": 9215 + }, + { + "epoch": 25.111716621253407, + "grad_norm": 6.017721652984619, + "learning_rate": 1.7543424604094697e-05, + "loss": 0.5031, + "step": 9216 + }, + { + "epoch": 25.114441416893733, + "grad_norm": 8.045443534851074, + "learning_rate": 1.754284523366035e-05, + "loss": 0.6282, + "step": 9217 + }, + { + "epoch": 25.11716621253406, + "grad_norm": 6.175623893737793, + "learning_rate": 1.7542265804482573e-05, + "loss": 0.6051, + "step": 9218 + }, + { + "epoch": 25.11989100817439, + "grad_norm": 7.03268575668335, + "learning_rate": 1.754168631656587e-05, + "loss": 0.5444, + "step": 9219 + }, + { + "epoch": 25.122615803814714, + "grad_norm": 9.013124465942383, + "learning_rate": 1.754110676991475e-05, + "loss": 0.5907, + "step": 9220 + }, + { + "epoch": 25.12534059945504, + "grad_norm": 7.212218284606934, + "learning_rate": 1.7540527164533744e-05, + "loss": 0.6246, + "step": 9221 + }, + { + "epoch": 25.12806539509537, + "grad_norm": 7.503476142883301, + "learning_rate": 1.7539947500427346e-05, + "loss": 0.5248, + "step": 9222 + }, + { + "epoch": 25.130790190735695, + "grad_norm": 7.938776969909668, + "learning_rate": 1.7539367777600088e-05, + "loss": 0.5154, + "step": 9223 + }, + { + "epoch": 25.13351498637602, + "grad_norm": 7.27805757522583, + "learning_rate": 1.753878799605647e-05, + "loss": 0.6232, + "step": 9224 + }, + { + "epoch": 25.13623978201635, + "grad_norm": 7.290003776550293, + "learning_rate": 1.7538208155801014e-05, + "loss": 0.5217, + "step": 9225 + }, + { + "epoch": 25.138964577656676, + "grad_norm": 7.449812412261963, + "learning_rate": 1.7537628256838238e-05, + "loss": 0.5759, + "step": 9226 + }, + { + "epoch": 25.141689373297, + "grad_norm": 9.210305213928223, + "learning_rate": 1.7537048299172657e-05, + "loss": 0.541, + "step": 9227 + }, + { + "epoch": 25.14441416893733, + "grad_norm": 8.278675079345703, + "learning_rate": 1.7536468282808787e-05, + "loss": 0.5414, + "step": 9228 + }, + { + "epoch": 25.147138964577657, + "grad_norm": 8.17081356048584, + "learning_rate": 1.753588820775114e-05, + "loss": 0.6001, + "step": 9229 + }, + { + "epoch": 25.149863760217983, + "grad_norm": 7.017838478088379, + "learning_rate": 1.7535308074004242e-05, + "loss": 0.5342, + "step": 9230 + }, + { + "epoch": 25.152588555858312, + "grad_norm": 7.229761600494385, + "learning_rate": 1.7534727881572603e-05, + "loss": 0.5457, + "step": 9231 + }, + { + "epoch": 25.155313351498638, + "grad_norm": 7.093820095062256, + "learning_rate": 1.753414763046075e-05, + "loss": 0.5176, + "step": 9232 + }, + { + "epoch": 25.158038147138964, + "grad_norm": 7.416743755340576, + "learning_rate": 1.7533567320673197e-05, + "loss": 0.5902, + "step": 9233 + }, + { + "epoch": 25.160762942779293, + "grad_norm": 7.925085544586182, + "learning_rate": 1.7532986952214458e-05, + "loss": 0.5453, + "step": 9234 + }, + { + "epoch": 25.16348773841962, + "grad_norm": 7.787499904632568, + "learning_rate": 1.7532406525089065e-05, + "loss": 0.4775, + "step": 9235 + }, + { + "epoch": 25.166212534059945, + "grad_norm": 8.381814956665039, + "learning_rate": 1.7531826039301534e-05, + "loss": 0.6014, + "step": 9236 + }, + { + "epoch": 25.168937329700274, + "grad_norm": 10.34481430053711, + "learning_rate": 1.7531245494856383e-05, + "loss": 0.6141, + "step": 9237 + }, + { + "epoch": 25.1716621253406, + "grad_norm": 6.762233734130859, + "learning_rate": 1.753066489175813e-05, + "loss": 0.6984, + "step": 9238 + }, + { + "epoch": 25.174386920980925, + "grad_norm": 8.525280952453613, + "learning_rate": 1.7530084230011305e-05, + "loss": 0.5868, + "step": 9239 + }, + { + "epoch": 25.177111716621255, + "grad_norm": 8.026586532592773, + "learning_rate": 1.7529503509620426e-05, + "loss": 0.4789, + "step": 9240 + }, + { + "epoch": 25.17983651226158, + "grad_norm": 7.491539478302002, + "learning_rate": 1.7528922730590014e-05, + "loss": 0.5432, + "step": 9241 + }, + { + "epoch": 25.182561307901906, + "grad_norm": 7.025993824005127, + "learning_rate": 1.7528341892924598e-05, + "loss": 0.53, + "step": 9242 + }, + { + "epoch": 25.185286103542236, + "grad_norm": 8.817523956298828, + "learning_rate": 1.7527760996628695e-05, + "loss": 0.677, + "step": 9243 + }, + { + "epoch": 25.18801089918256, + "grad_norm": 7.676280975341797, + "learning_rate": 1.7527180041706834e-05, + "loss": 0.5723, + "step": 9244 + }, + { + "epoch": 25.190735694822887, + "grad_norm": 7.347946643829346, + "learning_rate": 1.7526599028163534e-05, + "loss": 0.6664, + "step": 9245 + }, + { + "epoch": 25.193460490463217, + "grad_norm": 8.0401029586792, + "learning_rate": 1.7526017956003324e-05, + "loss": 0.5846, + "step": 9246 + }, + { + "epoch": 25.196185286103542, + "grad_norm": 6.611307144165039, + "learning_rate": 1.7525436825230728e-05, + "loss": 0.3984, + "step": 9247 + }, + { + "epoch": 25.19891008174387, + "grad_norm": 8.031599998474121, + "learning_rate": 1.7524855635850272e-05, + "loss": 0.5362, + "step": 9248 + }, + { + "epoch": 25.201634877384198, + "grad_norm": 7.952152252197266, + "learning_rate": 1.7524274387866483e-05, + "loss": 0.625, + "step": 9249 + }, + { + "epoch": 25.204359673024523, + "grad_norm": 9.92528247833252, + "learning_rate": 1.752369308128389e-05, + "loss": 0.446, + "step": 9250 + }, + { + "epoch": 25.20708446866485, + "grad_norm": 8.438230514526367, + "learning_rate": 1.7523111716107016e-05, + "loss": 0.5319, + "step": 9251 + }, + { + "epoch": 25.20980926430518, + "grad_norm": 6.178292274475098, + "learning_rate": 1.7522530292340387e-05, + "loss": 0.5495, + "step": 9252 + }, + { + "epoch": 25.212534059945504, + "grad_norm": 7.064868450164795, + "learning_rate": 1.7521948809988538e-05, + "loss": 0.6548, + "step": 9253 + }, + { + "epoch": 25.21525885558583, + "grad_norm": 9.970439910888672, + "learning_rate": 1.752136726905599e-05, + "loss": 0.6219, + "step": 9254 + }, + { + "epoch": 25.21798365122616, + "grad_norm": 6.916043758392334, + "learning_rate": 1.752078566954728e-05, + "loss": 0.5088, + "step": 9255 + }, + { + "epoch": 25.220708446866485, + "grad_norm": 7.9270195960998535, + "learning_rate": 1.752020401146693e-05, + "loss": 0.6082, + "step": 9256 + }, + { + "epoch": 25.22343324250681, + "grad_norm": 7.422311305999756, + "learning_rate": 1.7519622294819474e-05, + "loss": 0.509, + "step": 9257 + }, + { + "epoch": 25.22615803814714, + "grad_norm": 8.811856269836426, + "learning_rate": 1.7519040519609443e-05, + "loss": 0.6207, + "step": 9258 + }, + { + "epoch": 25.228882833787466, + "grad_norm": 12.191774368286133, + "learning_rate": 1.751845868584136e-05, + "loss": 0.4642, + "step": 9259 + }, + { + "epoch": 25.231607629427792, + "grad_norm": 6.951323986053467, + "learning_rate": 1.7517876793519772e-05, + "loss": 0.7046, + "step": 9260 + }, + { + "epoch": 25.23433242506812, + "grad_norm": 9.310023307800293, + "learning_rate": 1.75172948426492e-05, + "loss": 0.531, + "step": 9261 + }, + { + "epoch": 25.237057220708447, + "grad_norm": 11.55679988861084, + "learning_rate": 1.751671283323417e-05, + "loss": 0.5942, + "step": 9262 + }, + { + "epoch": 25.239782016348773, + "grad_norm": 6.232604026794434, + "learning_rate": 1.751613076527923e-05, + "loss": 0.6099, + "step": 9263 + }, + { + "epoch": 25.242506811989102, + "grad_norm": 10.137306213378906, + "learning_rate": 1.7515548638788904e-05, + "loss": 0.6305, + "step": 9264 + }, + { + "epoch": 25.245231607629428, + "grad_norm": 7.340976238250732, + "learning_rate": 1.7514966453767725e-05, + "loss": 0.5643, + "step": 9265 + }, + { + "epoch": 25.247956403269754, + "grad_norm": 6.675346851348877, + "learning_rate": 1.751438421022023e-05, + "loss": 0.6963, + "step": 9266 + }, + { + "epoch": 25.250681198910083, + "grad_norm": 9.164529800415039, + "learning_rate": 1.7513801908150953e-05, + "loss": 0.634, + "step": 9267 + }, + { + "epoch": 25.25340599455041, + "grad_norm": 7.60259485244751, + "learning_rate": 1.7513219547564427e-05, + "loss": 0.4993, + "step": 9268 + }, + { + "epoch": 25.256130790190735, + "grad_norm": 7.457983016967773, + "learning_rate": 1.7512637128465195e-05, + "loss": 0.5522, + "step": 9269 + }, + { + "epoch": 25.258855585831064, + "grad_norm": 7.982919216156006, + "learning_rate": 1.751205465085778e-05, + "loss": 0.5412, + "step": 9270 + }, + { + "epoch": 25.26158038147139, + "grad_norm": 6.639307022094727, + "learning_rate": 1.7511472114746727e-05, + "loss": 0.6172, + "step": 9271 + }, + { + "epoch": 25.264305177111716, + "grad_norm": 9.026050567626953, + "learning_rate": 1.7510889520136572e-05, + "loss": 0.516, + "step": 9272 + }, + { + "epoch": 25.267029972752045, + "grad_norm": 11.0486478805542, + "learning_rate": 1.751030686703185e-05, + "loss": 0.5549, + "step": 9273 + }, + { + "epoch": 25.26975476839237, + "grad_norm": 6.79197359085083, + "learning_rate": 1.7509724155437104e-05, + "loss": 0.5136, + "step": 9274 + }, + { + "epoch": 25.272479564032697, + "grad_norm": 9.363343238830566, + "learning_rate": 1.750914138535686e-05, + "loss": 0.4385, + "step": 9275 + }, + { + "epoch": 25.275204359673026, + "grad_norm": 8.308867454528809, + "learning_rate": 1.750855855679567e-05, + "loss": 0.5222, + "step": 9276 + }, + { + "epoch": 25.277929155313352, + "grad_norm": 7.330071926116943, + "learning_rate": 1.750797566975807e-05, + "loss": 0.5204, + "step": 9277 + }, + { + "epoch": 25.280653950953678, + "grad_norm": 7.579598426818848, + "learning_rate": 1.7507392724248592e-05, + "loss": 0.5756, + "step": 9278 + }, + { + "epoch": 25.283378746594007, + "grad_norm": 7.826560020446777, + "learning_rate": 1.750680972027178e-05, + "loss": 0.5952, + "step": 9279 + }, + { + "epoch": 25.286103542234333, + "grad_norm": 7.135838031768799, + "learning_rate": 1.750622665783218e-05, + "loss": 0.6481, + "step": 9280 + }, + { + "epoch": 25.28882833787466, + "grad_norm": 14.81757640838623, + "learning_rate": 1.7505643536934326e-05, + "loss": 0.7836, + "step": 9281 + }, + { + "epoch": 25.291553133514988, + "grad_norm": 7.334166526794434, + "learning_rate": 1.750506035758276e-05, + "loss": 0.546, + "step": 9282 + }, + { + "epoch": 25.294277929155314, + "grad_norm": 7.982358455657959, + "learning_rate": 1.750447711978203e-05, + "loss": 0.5037, + "step": 9283 + }, + { + "epoch": 25.29700272479564, + "grad_norm": 9.636107444763184, + "learning_rate": 1.7503893823536675e-05, + "loss": 0.5786, + "step": 9284 + }, + { + "epoch": 25.29972752043597, + "grad_norm": 8.395858764648438, + "learning_rate": 1.7503310468851232e-05, + "loss": 0.5997, + "step": 9285 + }, + { + "epoch": 25.302452316076295, + "grad_norm": 9.377330780029297, + "learning_rate": 1.750272705573025e-05, + "loss": 0.4741, + "step": 9286 + }, + { + "epoch": 25.30517711171662, + "grad_norm": 7.8394951820373535, + "learning_rate": 1.750214358417827e-05, + "loss": 0.5222, + "step": 9287 + }, + { + "epoch": 25.30790190735695, + "grad_norm": 10.575955390930176, + "learning_rate": 1.750156005419984e-05, + "loss": 0.6584, + "step": 9288 + }, + { + "epoch": 25.310626702997276, + "grad_norm": 8.982266426086426, + "learning_rate": 1.7500976465799496e-05, + "loss": 0.8733, + "step": 9289 + }, + { + "epoch": 25.3133514986376, + "grad_norm": 10.613094329833984, + "learning_rate": 1.7500392818981792e-05, + "loss": 0.5869, + "step": 9290 + }, + { + "epoch": 25.31607629427793, + "grad_norm": 7.434613227844238, + "learning_rate": 1.749980911375127e-05, + "loss": 0.5545, + "step": 9291 + }, + { + "epoch": 25.318801089918257, + "grad_norm": 6.9735565185546875, + "learning_rate": 1.7499225350112475e-05, + "loss": 0.5378, + "step": 9292 + }, + { + "epoch": 25.321525885558582, + "grad_norm": 8.49386215209961, + "learning_rate": 1.7498641528069956e-05, + "loss": 0.5077, + "step": 9293 + }, + { + "epoch": 25.32425068119891, + "grad_norm": 9.577007293701172, + "learning_rate": 1.749805764762826e-05, + "loss": 0.6476, + "step": 9294 + }, + { + "epoch": 25.326975476839237, + "grad_norm": 7.3503265380859375, + "learning_rate": 1.749747370879193e-05, + "loss": 0.5378, + "step": 9295 + }, + { + "epoch": 25.329700272479563, + "grad_norm": 7.510955810546875, + "learning_rate": 1.7496889711565516e-05, + "loss": 0.6151, + "step": 9296 + }, + { + "epoch": 25.332425068119893, + "grad_norm": 8.559822082519531, + "learning_rate": 1.7496305655953567e-05, + "loss": 0.4661, + "step": 9297 + }, + { + "epoch": 25.33514986376022, + "grad_norm": 7.167689800262451, + "learning_rate": 1.749572154196063e-05, + "loss": 0.5245, + "step": 9298 + }, + { + "epoch": 25.337874659400544, + "grad_norm": 8.277609825134277, + "learning_rate": 1.749513736959126e-05, + "loss": 0.7338, + "step": 9299 + }, + { + "epoch": 25.340599455040874, + "grad_norm": 7.558475971221924, + "learning_rate": 1.7494553138849993e-05, + "loss": 0.5319, + "step": 9300 + }, + { + "epoch": 25.3433242506812, + "grad_norm": 12.541115760803223, + "learning_rate": 1.749396884974139e-05, + "loss": 0.6882, + "step": 9301 + }, + { + "epoch": 25.346049046321525, + "grad_norm": 9.739608764648438, + "learning_rate": 1.7493384502270003e-05, + "loss": 0.6673, + "step": 9302 + }, + { + "epoch": 25.348773841961854, + "grad_norm": 8.39655590057373, + "learning_rate": 1.7492800096440376e-05, + "loss": 0.482, + "step": 9303 + }, + { + "epoch": 25.35149863760218, + "grad_norm": 11.642461776733398, + "learning_rate": 1.749221563225706e-05, + "loss": 0.5998, + "step": 9304 + }, + { + "epoch": 25.354223433242506, + "grad_norm": 9.626822471618652, + "learning_rate": 1.7491631109724613e-05, + "loss": 0.7056, + "step": 9305 + }, + { + "epoch": 25.356948228882835, + "grad_norm": 7.723657131195068, + "learning_rate": 1.7491046528847584e-05, + "loss": 0.5672, + "step": 9306 + }, + { + "epoch": 25.35967302452316, + "grad_norm": 8.35869026184082, + "learning_rate": 1.7490461889630523e-05, + "loss": 0.5688, + "step": 9307 + }, + { + "epoch": 25.362397820163487, + "grad_norm": 7.555449485778809, + "learning_rate": 1.748987719207799e-05, + "loss": 0.5198, + "step": 9308 + }, + { + "epoch": 25.365122615803816, + "grad_norm": 8.054333686828613, + "learning_rate": 1.748929243619453e-05, + "loss": 0.6856, + "step": 9309 + }, + { + "epoch": 25.367847411444142, + "grad_norm": 9.204339027404785, + "learning_rate": 1.7488707621984702e-05, + "loss": 0.5024, + "step": 9310 + }, + { + "epoch": 25.370572207084468, + "grad_norm": 7.36260461807251, + "learning_rate": 1.7488122749453067e-05, + "loss": 0.6157, + "step": 9311 + }, + { + "epoch": 25.373297002724797, + "grad_norm": 7.929131031036377, + "learning_rate": 1.7487537818604166e-05, + "loss": 0.6201, + "step": 9312 + }, + { + "epoch": 25.376021798365123, + "grad_norm": 6.746554374694824, + "learning_rate": 1.7486952829442562e-05, + "loss": 0.5786, + "step": 9313 + }, + { + "epoch": 25.37874659400545, + "grad_norm": 8.873085021972656, + "learning_rate": 1.7486367781972813e-05, + "loss": 0.6929, + "step": 9314 + }, + { + "epoch": 25.381471389645778, + "grad_norm": 8.892407417297363, + "learning_rate": 1.7485782676199475e-05, + "loss": 0.5998, + "step": 9315 + }, + { + "epoch": 25.384196185286104, + "grad_norm": 11.712400436401367, + "learning_rate": 1.7485197512127096e-05, + "loss": 0.4626, + "step": 9316 + }, + { + "epoch": 25.38692098092643, + "grad_norm": 8.752985000610352, + "learning_rate": 1.7484612289760242e-05, + "loss": 0.5222, + "step": 9317 + }, + { + "epoch": 25.38964577656676, + "grad_norm": 7.0970377922058105, + "learning_rate": 1.748402700910347e-05, + "loss": 0.6296, + "step": 9318 + }, + { + "epoch": 25.392370572207085, + "grad_norm": 8.385693550109863, + "learning_rate": 1.7483441670161336e-05, + "loss": 0.538, + "step": 9319 + }, + { + "epoch": 25.39509536784741, + "grad_norm": 8.93567943572998, + "learning_rate": 1.7482856272938398e-05, + "loss": 0.5391, + "step": 9320 + }, + { + "epoch": 25.39782016348774, + "grad_norm": 7.765710830688477, + "learning_rate": 1.7482270817439217e-05, + "loss": 0.7386, + "step": 9321 + }, + { + "epoch": 25.400544959128066, + "grad_norm": 9.23783016204834, + "learning_rate": 1.7481685303668353e-05, + "loss": 0.5933, + "step": 9322 + }, + { + "epoch": 25.40326975476839, + "grad_norm": 8.068859100341797, + "learning_rate": 1.7481099731630365e-05, + "loss": 0.5716, + "step": 9323 + }, + { + "epoch": 25.40599455040872, + "grad_norm": 6.749257564544678, + "learning_rate": 1.7480514101329808e-05, + "loss": 0.5922, + "step": 9324 + }, + { + "epoch": 25.408719346049047, + "grad_norm": 17.23390007019043, + "learning_rate": 1.7479928412771253e-05, + "loss": 0.5787, + "step": 9325 + }, + { + "epoch": 25.411444141689373, + "grad_norm": 7.998206615447998, + "learning_rate": 1.7479342665959254e-05, + "loss": 0.5224, + "step": 9326 + }, + { + "epoch": 25.414168937329702, + "grad_norm": 8.28626823425293, + "learning_rate": 1.7478756860898378e-05, + "loss": 0.6528, + "step": 9327 + }, + { + "epoch": 25.416893732970028, + "grad_norm": 8.12370491027832, + "learning_rate": 1.747817099759318e-05, + "loss": 0.5311, + "step": 9328 + }, + { + "epoch": 25.419618528610354, + "grad_norm": 9.191961288452148, + "learning_rate": 1.747758507604823e-05, + "loss": 0.6464, + "step": 9329 + }, + { + "epoch": 25.422343324250683, + "grad_norm": 7.370696544647217, + "learning_rate": 1.7476999096268086e-05, + "loss": 0.3813, + "step": 9330 + }, + { + "epoch": 25.42506811989101, + "grad_norm": 7.346981048583984, + "learning_rate": 1.7476413058257313e-05, + "loss": 0.6216, + "step": 9331 + }, + { + "epoch": 25.427792915531334, + "grad_norm": 7.545352458953857, + "learning_rate": 1.7475826962020476e-05, + "loss": 0.642, + "step": 9332 + }, + { + "epoch": 25.430517711171664, + "grad_norm": 9.863822937011719, + "learning_rate": 1.747524080756214e-05, + "loss": 0.7235, + "step": 9333 + }, + { + "epoch": 25.43324250681199, + "grad_norm": 8.380276679992676, + "learning_rate": 1.7474654594886873e-05, + "loss": 0.4589, + "step": 9334 + }, + { + "epoch": 25.435967302452315, + "grad_norm": 8.475086212158203, + "learning_rate": 1.7474068323999232e-05, + "loss": 0.4783, + "step": 9335 + }, + { + "epoch": 25.438692098092645, + "grad_norm": 7.905653953552246, + "learning_rate": 1.7473481994903788e-05, + "loss": 0.52, + "step": 9336 + }, + { + "epoch": 25.44141689373297, + "grad_norm": 8.372299194335938, + "learning_rate": 1.747289560760511e-05, + "loss": 0.5763, + "step": 9337 + }, + { + "epoch": 25.444141689373296, + "grad_norm": 8.619787216186523, + "learning_rate": 1.7472309162107757e-05, + "loss": 0.5384, + "step": 9338 + }, + { + "epoch": 25.446866485013626, + "grad_norm": 9.927772521972656, + "learning_rate": 1.7471722658416302e-05, + "loss": 0.4372, + "step": 9339 + }, + { + "epoch": 25.44959128065395, + "grad_norm": 9.848402976989746, + "learning_rate": 1.7471136096535316e-05, + "loss": 0.7333, + "step": 9340 + }, + { + "epoch": 25.452316076294277, + "grad_norm": 9.86668872833252, + "learning_rate": 1.7470549476469357e-05, + "loss": 0.6058, + "step": 9341 + }, + { + "epoch": 25.455040871934607, + "grad_norm": 8.02867603302002, + "learning_rate": 1.7469962798223e-05, + "loss": 0.6613, + "step": 9342 + }, + { + "epoch": 25.457765667574932, + "grad_norm": 9.436712265014648, + "learning_rate": 1.7469376061800815e-05, + "loss": 0.5602, + "step": 9343 + }, + { + "epoch": 25.460490463215258, + "grad_norm": 8.04949951171875, + "learning_rate": 1.746878926720737e-05, + "loss": 0.6345, + "step": 9344 + }, + { + "epoch": 25.463215258855588, + "grad_norm": 7.776516437530518, + "learning_rate": 1.746820241444723e-05, + "loss": 0.566, + "step": 9345 + }, + { + "epoch": 25.465940054495913, + "grad_norm": 9.003487586975098, + "learning_rate": 1.7467615503524973e-05, + "loss": 0.6335, + "step": 9346 + }, + { + "epoch": 25.46866485013624, + "grad_norm": 7.916099548339844, + "learning_rate": 1.7467028534445166e-05, + "loss": 0.5493, + "step": 9347 + }, + { + "epoch": 25.47138964577657, + "grad_norm": 7.610687255859375, + "learning_rate": 1.7466441507212383e-05, + "loss": 0.4928, + "step": 9348 + }, + { + "epoch": 25.474114441416894, + "grad_norm": 7.990988731384277, + "learning_rate": 1.7465854421831192e-05, + "loss": 0.5379, + "step": 9349 + }, + { + "epoch": 25.47683923705722, + "grad_norm": 6.85425329208374, + "learning_rate": 1.746526727830617e-05, + "loss": 0.5766, + "step": 9350 + }, + { + "epoch": 25.479564032697546, + "grad_norm": 7.345608234405518, + "learning_rate": 1.7464680076641883e-05, + "loss": 0.6484, + "step": 9351 + }, + { + "epoch": 25.482288828337875, + "grad_norm": 6.640669345855713, + "learning_rate": 1.746409281684291e-05, + "loss": 0.5922, + "step": 9352 + }, + { + "epoch": 25.4850136239782, + "grad_norm": 7.6144633293151855, + "learning_rate": 1.746350549891382e-05, + "loss": 0.4883, + "step": 9353 + }, + { + "epoch": 25.48773841961853, + "grad_norm": 8.312814712524414, + "learning_rate": 1.7462918122859193e-05, + "loss": 0.5203, + "step": 9354 + }, + { + "epoch": 25.490463215258856, + "grad_norm": 8.035418510437012, + "learning_rate": 1.7462330688683596e-05, + "loss": 0.7047, + "step": 9355 + }, + { + "epoch": 25.493188010899182, + "grad_norm": 6.685522556304932, + "learning_rate": 1.7461743196391613e-05, + "loss": 0.8011, + "step": 9356 + }, + { + "epoch": 25.495912806539508, + "grad_norm": 7.33150577545166, + "learning_rate": 1.746115564598781e-05, + "loss": 0.5392, + "step": 9357 + }, + { + "epoch": 25.498637602179837, + "grad_norm": 7.050995349884033, + "learning_rate": 1.746056803747677e-05, + "loss": 0.5724, + "step": 9358 + }, + { + "epoch": 25.501362397820163, + "grad_norm": 7.876449108123779, + "learning_rate": 1.7459980370863063e-05, + "loss": 0.6718, + "step": 9359 + }, + { + "epoch": 25.504087193460492, + "grad_norm": 6.868752479553223, + "learning_rate": 1.7459392646151266e-05, + "loss": 0.5359, + "step": 9360 + }, + { + "epoch": 25.506811989100818, + "grad_norm": 7.423297882080078, + "learning_rate": 1.7458804863345966e-05, + "loss": 0.5386, + "step": 9361 + }, + { + "epoch": 25.509536784741144, + "grad_norm": 8.611160278320312, + "learning_rate": 1.745821702245173e-05, + "loss": 0.4833, + "step": 9362 + }, + { + "epoch": 25.51226158038147, + "grad_norm": 7.3242998123168945, + "learning_rate": 1.7457629123473144e-05, + "loss": 0.5158, + "step": 9363 + }, + { + "epoch": 25.5149863760218, + "grad_norm": 8.992837905883789, + "learning_rate": 1.745704116641478e-05, + "loss": 0.6549, + "step": 9364 + }, + { + "epoch": 25.517711171662125, + "grad_norm": 7.9097208976745605, + "learning_rate": 1.7456453151281215e-05, + "loss": 0.4332, + "step": 9365 + }, + { + "epoch": 25.520435967302454, + "grad_norm": 8.41103458404541, + "learning_rate": 1.7455865078077038e-05, + "loss": 0.6543, + "step": 9366 + }, + { + "epoch": 25.52316076294278, + "grad_norm": 7.673321723937988, + "learning_rate": 1.745527694680682e-05, + "loss": 0.6619, + "step": 9367 + }, + { + "epoch": 25.525885558583106, + "grad_norm": 6.998402118682861, + "learning_rate": 1.745468875747515e-05, + "loss": 0.5494, + "step": 9368 + }, + { + "epoch": 25.52861035422343, + "grad_norm": 6.4210686683654785, + "learning_rate": 1.74541005100866e-05, + "loss": 0.5988, + "step": 9369 + }, + { + "epoch": 25.53133514986376, + "grad_norm": 7.388408184051514, + "learning_rate": 1.7453512204645756e-05, + "loss": 0.6859, + "step": 9370 + }, + { + "epoch": 25.534059945504087, + "grad_norm": 7.578431606292725, + "learning_rate": 1.7452923841157198e-05, + "loss": 0.4578, + "step": 9371 + }, + { + "epoch": 25.536784741144416, + "grad_norm": 7.251674175262451, + "learning_rate": 1.7452335419625514e-05, + "loss": 0.631, + "step": 9372 + }, + { + "epoch": 25.539509536784742, + "grad_norm": 9.027373313903809, + "learning_rate": 1.7451746940055278e-05, + "loss": 0.5519, + "step": 9373 + }, + { + "epoch": 25.542234332425068, + "grad_norm": 8.505552291870117, + "learning_rate": 1.7451158402451078e-05, + "loss": 0.5848, + "step": 9374 + }, + { + "epoch": 25.544959128065393, + "grad_norm": 7.444201469421387, + "learning_rate": 1.7450569806817494e-05, + "loss": 0.5968, + "step": 9375 + }, + { + "epoch": 25.547683923705723, + "grad_norm": 7.371540546417236, + "learning_rate": 1.744998115315911e-05, + "loss": 0.658, + "step": 9376 + }, + { + "epoch": 25.55040871934605, + "grad_norm": 8.483649253845215, + "learning_rate": 1.744939244148052e-05, + "loss": 0.5031, + "step": 9377 + }, + { + "epoch": 25.553133514986374, + "grad_norm": 25.00672149658203, + "learning_rate": 1.7448803671786292e-05, + "loss": 0.6876, + "step": 9378 + }, + { + "epoch": 25.555858310626704, + "grad_norm": 7.475778102874756, + "learning_rate": 1.7448214844081026e-05, + "loss": 0.6038, + "step": 9379 + }, + { + "epoch": 25.55858310626703, + "grad_norm": 8.381858825683594, + "learning_rate": 1.7447625958369303e-05, + "loss": 0.6476, + "step": 9380 + }, + { + "epoch": 25.561307901907355, + "grad_norm": 8.840806007385254, + "learning_rate": 1.744703701465571e-05, + "loss": 0.5338, + "step": 9381 + }, + { + "epoch": 25.564032697547685, + "grad_norm": 7.5802764892578125, + "learning_rate": 1.744644801294483e-05, + "loss": 0.6526, + "step": 9382 + }, + { + "epoch": 25.56675749318801, + "grad_norm": 8.006721496582031, + "learning_rate": 1.744585895324125e-05, + "loss": 0.4777, + "step": 9383 + }, + { + "epoch": 25.569482288828336, + "grad_norm": 8.405454635620117, + "learning_rate": 1.7445269835549565e-05, + "loss": 0.7128, + "step": 9384 + }, + { + "epoch": 25.572207084468666, + "grad_norm": 12.386618614196777, + "learning_rate": 1.7444680659874354e-05, + "loss": 0.5532, + "step": 9385 + }, + { + "epoch": 25.57493188010899, + "grad_norm": 8.866639137268066, + "learning_rate": 1.744409142622021e-05, + "loss": 0.5941, + "step": 9386 + }, + { + "epoch": 25.577656675749317, + "grad_norm": 10.208216667175293, + "learning_rate": 1.7443502134591725e-05, + "loss": 0.4695, + "step": 9387 + }, + { + "epoch": 25.580381471389646, + "grad_norm": 8.157602310180664, + "learning_rate": 1.744291278499348e-05, + "loss": 0.5888, + "step": 9388 + }, + { + "epoch": 25.583106267029972, + "grad_norm": 15.60487174987793, + "learning_rate": 1.744232337743008e-05, + "loss": 0.6458, + "step": 9389 + }, + { + "epoch": 25.585831062670298, + "grad_norm": 9.842437744140625, + "learning_rate": 1.7441733911906092e-05, + "loss": 0.5865, + "step": 9390 + }, + { + "epoch": 25.588555858310627, + "grad_norm": 11.806042671203613, + "learning_rate": 1.7441144388426126e-05, + "loss": 0.5978, + "step": 9391 + }, + { + "epoch": 25.591280653950953, + "grad_norm": 7.766541004180908, + "learning_rate": 1.7440554806994768e-05, + "loss": 0.5707, + "step": 9392 + }, + { + "epoch": 25.59400544959128, + "grad_norm": 9.12265682220459, + "learning_rate": 1.743996516761661e-05, + "loss": 0.5485, + "step": 9393 + }, + { + "epoch": 25.59673024523161, + "grad_norm": 8.803854942321777, + "learning_rate": 1.743937547029624e-05, + "loss": 0.7141, + "step": 9394 + }, + { + "epoch": 25.599455040871934, + "grad_norm": 9.123351097106934, + "learning_rate": 1.7438785715038253e-05, + "loss": 0.5258, + "step": 9395 + }, + { + "epoch": 25.60217983651226, + "grad_norm": 10.303979873657227, + "learning_rate": 1.7438195901847243e-05, + "loss": 0.6413, + "step": 9396 + }, + { + "epoch": 25.60490463215259, + "grad_norm": 8.321008682250977, + "learning_rate": 1.7437606030727804e-05, + "loss": 0.6555, + "step": 9397 + }, + { + "epoch": 25.607629427792915, + "grad_norm": 7.6452789306640625, + "learning_rate": 1.7437016101684526e-05, + "loss": 0.5445, + "step": 9398 + }, + { + "epoch": 25.61035422343324, + "grad_norm": 8.129426002502441, + "learning_rate": 1.7436426114722006e-05, + "loss": 0.5661, + "step": 9399 + }, + { + "epoch": 25.61307901907357, + "grad_norm": 8.526227951049805, + "learning_rate": 1.7435836069844838e-05, + "loss": 0.5932, + "step": 9400 + }, + { + "epoch": 25.615803814713896, + "grad_norm": 8.07772159576416, + "learning_rate": 1.7435245967057623e-05, + "loss": 0.7504, + "step": 9401 + }, + { + "epoch": 25.618528610354222, + "grad_norm": 8.812663078308105, + "learning_rate": 1.7434655806364945e-05, + "loss": 0.5126, + "step": 9402 + }, + { + "epoch": 25.62125340599455, + "grad_norm": 8.795720100402832, + "learning_rate": 1.7434065587771413e-05, + "loss": 0.7559, + "step": 9403 + }, + { + "epoch": 25.623978201634877, + "grad_norm": 8.46756362915039, + "learning_rate": 1.7433475311281616e-05, + "loss": 0.6748, + "step": 9404 + }, + { + "epoch": 25.626702997275203, + "grad_norm": 8.732349395751953, + "learning_rate": 1.7432884976900147e-05, + "loss": 0.5325, + "step": 9405 + }, + { + "epoch": 25.629427792915532, + "grad_norm": 9.263157844543457, + "learning_rate": 1.7432294584631616e-05, + "loss": 0.6005, + "step": 9406 + }, + { + "epoch": 25.632152588555858, + "grad_norm": 10.506868362426758, + "learning_rate": 1.7431704134480608e-05, + "loss": 0.6466, + "step": 9407 + }, + { + "epoch": 25.634877384196184, + "grad_norm": 7.771955966949463, + "learning_rate": 1.7431113626451733e-05, + "loss": 0.4752, + "step": 9408 + }, + { + "epoch": 25.637602179836513, + "grad_norm": 8.836752891540527, + "learning_rate": 1.7430523060549586e-05, + "loss": 0.5073, + "step": 9409 + }, + { + "epoch": 25.64032697547684, + "grad_norm": 8.095437049865723, + "learning_rate": 1.7429932436778755e-05, + "loss": 0.656, + "step": 9410 + }, + { + "epoch": 25.643051771117165, + "grad_norm": 7.719583988189697, + "learning_rate": 1.7429341755143857e-05, + "loss": 0.4961, + "step": 9411 + }, + { + "epoch": 25.645776566757494, + "grad_norm": 6.682363510131836, + "learning_rate": 1.7428751015649483e-05, + "loss": 0.7285, + "step": 9412 + }, + { + "epoch": 25.64850136239782, + "grad_norm": 7.992876052856445, + "learning_rate": 1.7428160218300236e-05, + "loss": 0.584, + "step": 9413 + }, + { + "epoch": 25.651226158038146, + "grad_norm": 7.828421115875244, + "learning_rate": 1.7427569363100714e-05, + "loss": 0.5701, + "step": 9414 + }, + { + "epoch": 25.653950953678475, + "grad_norm": 7.200517654418945, + "learning_rate": 1.742697845005552e-05, + "loss": 0.6543, + "step": 9415 + }, + { + "epoch": 25.6566757493188, + "grad_norm": 9.306139945983887, + "learning_rate": 1.7426387479169256e-05, + "loss": 0.5515, + "step": 9416 + }, + { + "epoch": 25.659400544959126, + "grad_norm": 6.922572612762451, + "learning_rate": 1.7425796450446532e-05, + "loss": 0.5296, + "step": 9417 + }, + { + "epoch": 25.662125340599456, + "grad_norm": 6.6560444831848145, + "learning_rate": 1.7425205363891938e-05, + "loss": 0.6051, + "step": 9418 + }, + { + "epoch": 25.66485013623978, + "grad_norm": 8.202136993408203, + "learning_rate": 1.7424614219510087e-05, + "loss": 0.8121, + "step": 9419 + }, + { + "epoch": 25.667574931880107, + "grad_norm": 7.640063285827637, + "learning_rate": 1.742402301730558e-05, + "loss": 0.6223, + "step": 9420 + }, + { + "epoch": 25.670299727520437, + "grad_norm": 7.376254081726074, + "learning_rate": 1.7423431757283018e-05, + "loss": 0.5077, + "step": 9421 + }, + { + "epoch": 25.673024523160763, + "grad_norm": 8.305665016174316, + "learning_rate": 1.742284043944701e-05, + "loss": 0.5715, + "step": 9422 + }, + { + "epoch": 25.67574931880109, + "grad_norm": 6.209292411804199, + "learning_rate": 1.742224906380216e-05, + "loss": 0.4484, + "step": 9423 + }, + { + "epoch": 25.678474114441418, + "grad_norm": 8.914823532104492, + "learning_rate": 1.7421657630353068e-05, + "loss": 0.6091, + "step": 9424 + }, + { + "epoch": 25.681198910081743, + "grad_norm": 7.535190105438232, + "learning_rate": 1.742106613910435e-05, + "loss": 0.5803, + "step": 9425 + }, + { + "epoch": 25.68392370572207, + "grad_norm": 7.564618110656738, + "learning_rate": 1.7420474590060606e-05, + "loss": 0.4732, + "step": 9426 + }, + { + "epoch": 25.6866485013624, + "grad_norm": 7.2093963623046875, + "learning_rate": 1.7419882983226446e-05, + "loss": 0.6475, + "step": 9427 + }, + { + "epoch": 25.689373297002724, + "grad_norm": 8.094961166381836, + "learning_rate": 1.7419291318606476e-05, + "loss": 0.6348, + "step": 9428 + }, + { + "epoch": 25.69209809264305, + "grad_norm": 11.35478687286377, + "learning_rate": 1.7418699596205303e-05, + "loss": 0.5717, + "step": 9429 + }, + { + "epoch": 25.69482288828338, + "grad_norm": 7.570865631103516, + "learning_rate": 1.7418107816027538e-05, + "loss": 0.5313, + "step": 9430 + }, + { + "epoch": 25.697547683923705, + "grad_norm": 7.583775043487549, + "learning_rate": 1.741751597807779e-05, + "loss": 0.5817, + "step": 9431 + }, + { + "epoch": 25.70027247956403, + "grad_norm": 7.399974346160889, + "learning_rate": 1.741692408236066e-05, + "loss": 0.4835, + "step": 9432 + }, + { + "epoch": 25.70299727520436, + "grad_norm": 7.177084922790527, + "learning_rate": 1.7416332128880768e-05, + "loss": 0.5538, + "step": 9433 + }, + { + "epoch": 25.705722070844686, + "grad_norm": 6.838465213775635, + "learning_rate": 1.7415740117642718e-05, + "loss": 0.551, + "step": 9434 + }, + { + "epoch": 25.708446866485012, + "grad_norm": 7.103573799133301, + "learning_rate": 1.7415148048651126e-05, + "loss": 0.504, + "step": 9435 + }, + { + "epoch": 25.71117166212534, + "grad_norm": 7.283553600311279, + "learning_rate": 1.7414555921910597e-05, + "loss": 0.7719, + "step": 9436 + }, + { + "epoch": 25.713896457765667, + "grad_norm": 7.7645087242126465, + "learning_rate": 1.7413963737425747e-05, + "loss": 0.5516, + "step": 9437 + }, + { + "epoch": 25.716621253405993, + "grad_norm": 8.091785430908203, + "learning_rate": 1.7413371495201183e-05, + "loss": 0.5369, + "step": 9438 + }, + { + "epoch": 25.719346049046322, + "grad_norm": 6.979974269866943, + "learning_rate": 1.7412779195241524e-05, + "loss": 0.9425, + "step": 9439 + }, + { + "epoch": 25.722070844686648, + "grad_norm": 9.18759536743164, + "learning_rate": 1.741218683755138e-05, + "loss": 0.5754, + "step": 9440 + }, + { + "epoch": 25.724795640326974, + "grad_norm": 7.882137775421143, + "learning_rate": 1.7411594422135357e-05, + "loss": 0.5159, + "step": 9441 + }, + { + "epoch": 25.727520435967303, + "grad_norm": 7.561557769775391, + "learning_rate": 1.741100194899808e-05, + "loss": 0.6474, + "step": 9442 + }, + { + "epoch": 25.73024523160763, + "grad_norm": 17.012176513671875, + "learning_rate": 1.741040941814416e-05, + "loss": 0.6215, + "step": 9443 + }, + { + "epoch": 25.732970027247955, + "grad_norm": 7.687644004821777, + "learning_rate": 1.7409816829578205e-05, + "loss": 0.6672, + "step": 9444 + }, + { + "epoch": 25.735694822888284, + "grad_norm": 6.788773059844971, + "learning_rate": 1.7409224183304836e-05, + "loss": 0.5242, + "step": 9445 + }, + { + "epoch": 25.73841961852861, + "grad_norm": 8.36744213104248, + "learning_rate": 1.740863147932867e-05, + "loss": 0.4936, + "step": 9446 + }, + { + "epoch": 25.741144414168936, + "grad_norm": 7.843606948852539, + "learning_rate": 1.740803871765432e-05, + "loss": 0.6784, + "step": 9447 + }, + { + "epoch": 25.743869209809265, + "grad_norm": 8.095901489257812, + "learning_rate": 1.7407445898286405e-05, + "loss": 0.5069, + "step": 9448 + }, + { + "epoch": 25.74659400544959, + "grad_norm": 8.641240119934082, + "learning_rate": 1.7406853021229535e-05, + "loss": 0.7564, + "step": 9449 + }, + { + "epoch": 25.749318801089917, + "grad_norm": 7.994680881500244, + "learning_rate": 1.7406260086488336e-05, + "loss": 0.5792, + "step": 9450 + }, + { + "epoch": 25.752043596730246, + "grad_norm": 7.075345993041992, + "learning_rate": 1.740566709406742e-05, + "loss": 0.6983, + "step": 9451 + }, + { + "epoch": 25.754768392370572, + "grad_norm": 7.390691757202148, + "learning_rate": 1.7405074043971407e-05, + "loss": 0.7299, + "step": 9452 + }, + { + "epoch": 25.757493188010898, + "grad_norm": 9.825465202331543, + "learning_rate": 1.7404480936204914e-05, + "loss": 0.7331, + "step": 9453 + }, + { + "epoch": 25.760217983651227, + "grad_norm": 8.008077621459961, + "learning_rate": 1.7403887770772564e-05, + "loss": 0.5295, + "step": 9454 + }, + { + "epoch": 25.762942779291553, + "grad_norm": 8.09028148651123, + "learning_rate": 1.7403294547678975e-05, + "loss": 0.6837, + "step": 9455 + }, + { + "epoch": 25.76566757493188, + "grad_norm": 7.616891384124756, + "learning_rate": 1.7402701266928767e-05, + "loss": 0.5135, + "step": 9456 + }, + { + "epoch": 25.768392370572208, + "grad_norm": 14.6254243850708, + "learning_rate": 1.7402107928526556e-05, + "loss": 0.5233, + "step": 9457 + }, + { + "epoch": 25.771117166212534, + "grad_norm": 7.203038692474365, + "learning_rate": 1.740151453247697e-05, + "loss": 0.4981, + "step": 9458 + }, + { + "epoch": 25.77384196185286, + "grad_norm": 8.74550724029541, + "learning_rate": 1.7400921078784624e-05, + "loss": 0.6011, + "step": 9459 + }, + { + "epoch": 25.77656675749319, + "grad_norm": 7.549883842468262, + "learning_rate": 1.7400327567454145e-05, + "loss": 0.4445, + "step": 9460 + }, + { + "epoch": 25.779291553133515, + "grad_norm": 7.61672306060791, + "learning_rate": 1.7399733998490152e-05, + "loss": 0.6873, + "step": 9461 + }, + { + "epoch": 25.78201634877384, + "grad_norm": 7.361455917358398, + "learning_rate": 1.739914037189727e-05, + "loss": 0.6927, + "step": 9462 + }, + { + "epoch": 25.78474114441417, + "grad_norm": 5.834643840789795, + "learning_rate": 1.739854668768012e-05, + "loss": 0.7412, + "step": 9463 + }, + { + "epoch": 25.787465940054496, + "grad_norm": 8.191956520080566, + "learning_rate": 1.7397952945843325e-05, + "loss": 0.6303, + "step": 9464 + }, + { + "epoch": 25.79019073569482, + "grad_norm": 11.40386962890625, + "learning_rate": 1.7397359146391513e-05, + "loss": 0.7029, + "step": 9465 + }, + { + "epoch": 25.79291553133515, + "grad_norm": 8.3353910446167, + "learning_rate": 1.7396765289329308e-05, + "loss": 0.5961, + "step": 9466 + }, + { + "epoch": 25.795640326975477, + "grad_norm": 8.796889305114746, + "learning_rate": 1.739617137466133e-05, + "loss": 0.6309, + "step": 9467 + }, + { + "epoch": 25.798365122615802, + "grad_norm": 7.54941987991333, + "learning_rate": 1.7395577402392208e-05, + "loss": 0.6583, + "step": 9468 + }, + { + "epoch": 25.80108991825613, + "grad_norm": 6.982385635375977, + "learning_rate": 1.739498337252657e-05, + "loss": 0.6166, + "step": 9469 + }, + { + "epoch": 25.803814713896458, + "grad_norm": 7.676999568939209, + "learning_rate": 1.7394389285069034e-05, + "loss": 0.7845, + "step": 9470 + }, + { + "epoch": 25.806539509536783, + "grad_norm": 7.578592777252197, + "learning_rate": 1.7393795140024235e-05, + "loss": 0.8047, + "step": 9471 + }, + { + "epoch": 25.809264305177113, + "grad_norm": 9.978384017944336, + "learning_rate": 1.7393200937396795e-05, + "loss": 0.5497, + "step": 9472 + }, + { + "epoch": 25.81198910081744, + "grad_norm": 13.144746780395508, + "learning_rate": 1.7392606677191345e-05, + "loss": 0.629, + "step": 9473 + }, + { + "epoch": 25.814713896457764, + "grad_norm": 8.699050903320312, + "learning_rate": 1.7392012359412517e-05, + "loss": 0.4867, + "step": 9474 + }, + { + "epoch": 25.817438692098094, + "grad_norm": 11.404301643371582, + "learning_rate": 1.7391417984064932e-05, + "loss": 0.7406, + "step": 9475 + }, + { + "epoch": 25.82016348773842, + "grad_norm": 7.311351776123047, + "learning_rate": 1.7390823551153218e-05, + "loss": 0.5009, + "step": 9476 + }, + { + "epoch": 25.822888283378745, + "grad_norm": 9.406844139099121, + "learning_rate": 1.739022906068201e-05, + "loss": 0.6615, + "step": 9477 + }, + { + "epoch": 25.825613079019075, + "grad_norm": 8.44792366027832, + "learning_rate": 1.738963451265594e-05, + "loss": 0.6606, + "step": 9478 + }, + { + "epoch": 25.8283378746594, + "grad_norm": 9.070053100585938, + "learning_rate": 1.738903990707963e-05, + "loss": 0.5695, + "step": 9479 + }, + { + "epoch": 25.831062670299726, + "grad_norm": 8.260103225708008, + "learning_rate": 1.7388445243957717e-05, + "loss": 0.5321, + "step": 9480 + }, + { + "epoch": 25.833787465940055, + "grad_norm": 8.975306510925293, + "learning_rate": 1.7387850523294827e-05, + "loss": 0.5169, + "step": 9481 + }, + { + "epoch": 25.83651226158038, + "grad_norm": 8.646730422973633, + "learning_rate": 1.7387255745095597e-05, + "loss": 0.4396, + "step": 9482 + }, + { + "epoch": 25.839237057220707, + "grad_norm": 8.46390151977539, + "learning_rate": 1.738666090936466e-05, + "loss": 0.6315, + "step": 9483 + }, + { + "epoch": 25.841961852861036, + "grad_norm": 7.23923397064209, + "learning_rate": 1.738606601610664e-05, + "loss": 0.563, + "step": 9484 + }, + { + "epoch": 25.844686648501362, + "grad_norm": 8.615715980529785, + "learning_rate": 1.738547106532618e-05, + "loss": 0.4901, + "step": 9485 + }, + { + "epoch": 25.847411444141688, + "grad_norm": 9.231773376464844, + "learning_rate": 1.7384876057027907e-05, + "loss": 0.5825, + "step": 9486 + }, + { + "epoch": 25.850136239782017, + "grad_norm": 8.428955078125, + "learning_rate": 1.7384280991216455e-05, + "loss": 0.5003, + "step": 9487 + }, + { + "epoch": 25.852861035422343, + "grad_norm": 9.66771125793457, + "learning_rate": 1.7383685867896463e-05, + "loss": 0.7293, + "step": 9488 + }, + { + "epoch": 25.85558583106267, + "grad_norm": 8.030937194824219, + "learning_rate": 1.7383090687072563e-05, + "loss": 0.4869, + "step": 9489 + }, + { + "epoch": 25.858310626703, + "grad_norm": 7.184062957763672, + "learning_rate": 1.738249544874939e-05, + "loss": 0.6099, + "step": 9490 + }, + { + "epoch": 25.861035422343324, + "grad_norm": 7.648211479187012, + "learning_rate": 1.7381900152931582e-05, + "loss": 0.7165, + "step": 9491 + }, + { + "epoch": 25.86376021798365, + "grad_norm": 7.263122081756592, + "learning_rate": 1.738130479962377e-05, + "loss": 0.4726, + "step": 9492 + }, + { + "epoch": 25.86648501362398, + "grad_norm": 9.472850799560547, + "learning_rate": 1.7380709388830595e-05, + "loss": 0.6682, + "step": 9493 + }, + { + "epoch": 25.869209809264305, + "grad_norm": 10.854084968566895, + "learning_rate": 1.738011392055669e-05, + "loss": 0.5417, + "step": 9494 + }, + { + "epoch": 25.87193460490463, + "grad_norm": 7.673418998718262, + "learning_rate": 1.7379518394806703e-05, + "loss": 0.5994, + "step": 9495 + }, + { + "epoch": 25.87465940054496, + "grad_norm": 8.981013298034668, + "learning_rate": 1.7378922811585256e-05, + "loss": 0.8358, + "step": 9496 + }, + { + "epoch": 25.877384196185286, + "grad_norm": 7.159624099731445, + "learning_rate": 1.7378327170897e-05, + "loss": 0.6071, + "step": 9497 + }, + { + "epoch": 25.88010899182561, + "grad_norm": 7.000638008117676, + "learning_rate": 1.737773147274657e-05, + "loss": 0.4789, + "step": 9498 + }, + { + "epoch": 25.88283378746594, + "grad_norm": 8.612425804138184, + "learning_rate": 1.73771357171386e-05, + "loss": 0.8832, + "step": 9499 + }, + { + "epoch": 25.885558583106267, + "grad_norm": 30.55554962158203, + "learning_rate": 1.7376539904077742e-05, + "loss": 0.6271, + "step": 9500 + }, + { + "epoch": 25.888283378746593, + "grad_norm": 7.560913562774658, + "learning_rate": 1.7375944033568625e-05, + "loss": 0.6835, + "step": 9501 + }, + { + "epoch": 25.891008174386922, + "grad_norm": 7.5395097732543945, + "learning_rate": 1.737534810561589e-05, + "loss": 0.6556, + "step": 9502 + }, + { + "epoch": 25.893732970027248, + "grad_norm": 9.153618812561035, + "learning_rate": 1.7374752120224184e-05, + "loss": 0.7285, + "step": 9503 + }, + { + "epoch": 25.896457765667574, + "grad_norm": 9.776400566101074, + "learning_rate": 1.7374156077398144e-05, + "loss": 0.705, + "step": 9504 + }, + { + "epoch": 25.899182561307903, + "grad_norm": 7.857279300689697, + "learning_rate": 1.7373559977142416e-05, + "loss": 0.5347, + "step": 9505 + }, + { + "epoch": 25.90190735694823, + "grad_norm": 7.109128475189209, + "learning_rate": 1.7372963819461642e-05, + "loss": 0.6846, + "step": 9506 + }, + { + "epoch": 25.904632152588555, + "grad_norm": 7.639939785003662, + "learning_rate": 1.737236760436046e-05, + "loss": 0.6296, + "step": 9507 + }, + { + "epoch": 25.907356948228884, + "grad_norm": 7.69437837600708, + "learning_rate": 1.7371771331843517e-05, + "loss": 0.5632, + "step": 9508 + }, + { + "epoch": 25.91008174386921, + "grad_norm": 8.280343055725098, + "learning_rate": 1.7371175001915455e-05, + "loss": 0.6794, + "step": 9509 + }, + { + "epoch": 25.912806539509535, + "grad_norm": 10.756189346313477, + "learning_rate": 1.7370578614580922e-05, + "loss": 0.6239, + "step": 9510 + }, + { + "epoch": 25.915531335149865, + "grad_norm": 9.908435821533203, + "learning_rate": 1.736998216984456e-05, + "loss": 0.6348, + "step": 9511 + }, + { + "epoch": 25.91825613079019, + "grad_norm": 8.193130493164062, + "learning_rate": 1.7369385667711013e-05, + "loss": 0.6911, + "step": 9512 + }, + { + "epoch": 25.920980926430516, + "grad_norm": 9.463773727416992, + "learning_rate": 1.7368789108184927e-05, + "loss": 0.5245, + "step": 9513 + }, + { + "epoch": 25.923705722070846, + "grad_norm": 8.20947265625, + "learning_rate": 1.7368192491270946e-05, + "loss": 0.5592, + "step": 9514 + }, + { + "epoch": 25.92643051771117, + "grad_norm": 8.28555679321289, + "learning_rate": 1.7367595816973722e-05, + "loss": 0.6529, + "step": 9515 + }, + { + "epoch": 25.929155313351497, + "grad_norm": 7.5748491287231445, + "learning_rate": 1.73669990852979e-05, + "loss": 0.5446, + "step": 9516 + }, + { + "epoch": 25.931880108991827, + "grad_norm": 7.565945148468018, + "learning_rate": 1.7366402296248126e-05, + "loss": 0.6647, + "step": 9517 + }, + { + "epoch": 25.934604904632153, + "grad_norm": 7.207835674285889, + "learning_rate": 1.7365805449829047e-05, + "loss": 0.7472, + "step": 9518 + }, + { + "epoch": 25.93732970027248, + "grad_norm": 9.150147438049316, + "learning_rate": 1.7365208546045315e-05, + "loss": 0.5984, + "step": 9519 + }, + { + "epoch": 25.940054495912808, + "grad_norm": 7.448739528656006, + "learning_rate": 1.736461158490157e-05, + "loss": 0.5756, + "step": 9520 + }, + { + "epoch": 25.942779291553133, + "grad_norm": 9.423181533813477, + "learning_rate": 1.7364014566402472e-05, + "loss": 0.6123, + "step": 9521 + }, + { + "epoch": 25.94550408719346, + "grad_norm": 7.365279197692871, + "learning_rate": 1.7363417490552664e-05, + "loss": 0.4821, + "step": 9522 + }, + { + "epoch": 25.94822888283379, + "grad_norm": 7.734255313873291, + "learning_rate": 1.7362820357356794e-05, + "loss": 0.5531, + "step": 9523 + }, + { + "epoch": 25.950953678474114, + "grad_norm": 6.780492305755615, + "learning_rate": 1.736222316681952e-05, + "loss": 0.6304, + "step": 9524 + }, + { + "epoch": 25.95367847411444, + "grad_norm": 17.256683349609375, + "learning_rate": 1.736162591894549e-05, + "loss": 0.6966, + "step": 9525 + }, + { + "epoch": 25.95640326975477, + "grad_norm": 11.581868171691895, + "learning_rate": 1.7361028613739354e-05, + "loss": 0.6542, + "step": 9526 + }, + { + "epoch": 25.959128065395095, + "grad_norm": 8.833714485168457, + "learning_rate": 1.7360431251205763e-05, + "loss": 0.6693, + "step": 9527 + }, + { + "epoch": 25.96185286103542, + "grad_norm": 7.809795379638672, + "learning_rate": 1.735983383134937e-05, + "loss": 0.7259, + "step": 9528 + }, + { + "epoch": 25.96457765667575, + "grad_norm": 7.3385820388793945, + "learning_rate": 1.7359236354174826e-05, + "loss": 0.6353, + "step": 9529 + }, + { + "epoch": 25.967302452316076, + "grad_norm": 7.326361179351807, + "learning_rate": 1.7358638819686787e-05, + "loss": 0.5353, + "step": 9530 + }, + { + "epoch": 25.970027247956402, + "grad_norm": 6.983292579650879, + "learning_rate": 1.735804122788991e-05, + "loss": 0.6599, + "step": 9531 + }, + { + "epoch": 25.97275204359673, + "grad_norm": 7.214084625244141, + "learning_rate": 1.735744357878884e-05, + "loss": 0.6243, + "step": 9532 + }, + { + "epoch": 25.975476839237057, + "grad_norm": 7.334532737731934, + "learning_rate": 1.7356845872388238e-05, + "loss": 0.8033, + "step": 9533 + }, + { + "epoch": 25.978201634877383, + "grad_norm": 9.344524383544922, + "learning_rate": 1.7356248108692758e-05, + "loss": 0.5524, + "step": 9534 + }, + { + "epoch": 25.980926430517712, + "grad_norm": 7.228560924530029, + "learning_rate": 1.735565028770705e-05, + "loss": 0.6976, + "step": 9535 + }, + { + "epoch": 25.983651226158038, + "grad_norm": 11.06403636932373, + "learning_rate": 1.735505240943578e-05, + "loss": 0.6921, + "step": 9536 + }, + { + "epoch": 25.986376021798364, + "grad_norm": 8.322148323059082, + "learning_rate": 1.7354454473883596e-05, + "loss": 0.5891, + "step": 9537 + }, + { + "epoch": 25.989100817438693, + "grad_norm": 10.034852981567383, + "learning_rate": 1.7353856481055157e-05, + "loss": 0.7438, + "step": 9538 + }, + { + "epoch": 25.99182561307902, + "grad_norm": 11.697212219238281, + "learning_rate": 1.735325843095512e-05, + "loss": 0.4705, + "step": 9539 + }, + { + "epoch": 25.994550408719345, + "grad_norm": 8.835293769836426, + "learning_rate": 1.7352660323588146e-05, + "loss": 0.7668, + "step": 9540 + }, + { + "epoch": 25.997275204359674, + "grad_norm": 7.350338935852051, + "learning_rate": 1.7352062158958887e-05, + "loss": 0.5106, + "step": 9541 + }, + { + "epoch": 26.0, + "grad_norm": 8.838607788085938, + "learning_rate": 1.7351463937072008e-05, + "loss": 0.6144, + "step": 9542 + }, + { + "epoch": 26.002724795640326, + "grad_norm": 7.957286357879639, + "learning_rate": 1.735086565793216e-05, + "loss": 0.5024, + "step": 9543 + }, + { + "epoch": 26.005449591280655, + "grad_norm": 6.296217918395996, + "learning_rate": 1.735026732154401e-05, + "loss": 0.6693, + "step": 9544 + }, + { + "epoch": 26.00817438692098, + "grad_norm": 7.643580436706543, + "learning_rate": 1.734966892791221e-05, + "loss": 0.4755, + "step": 9545 + }, + { + "epoch": 26.010899182561307, + "grad_norm": 9.448199272155762, + "learning_rate": 1.734907047704143e-05, + "loss": 0.6694, + "step": 9546 + }, + { + "epoch": 26.013623978201636, + "grad_norm": 6.621395111083984, + "learning_rate": 1.7348471968936325e-05, + "loss": 0.5294, + "step": 9547 + }, + { + "epoch": 26.016348773841962, + "grad_norm": 10.18807601928711, + "learning_rate": 1.7347873403601557e-05, + "loss": 0.5653, + "step": 9548 + }, + { + "epoch": 26.019073569482288, + "grad_norm": 6.76434850692749, + "learning_rate": 1.7347274781041784e-05, + "loss": 0.4984, + "step": 9549 + }, + { + "epoch": 26.021798365122617, + "grad_norm": 6.526801109313965, + "learning_rate": 1.7346676101261676e-05, + "loss": 0.4005, + "step": 9550 + }, + { + "epoch": 26.024523160762943, + "grad_norm": 8.109182357788086, + "learning_rate": 1.734607736426589e-05, + "loss": 0.5455, + "step": 9551 + }, + { + "epoch": 26.02724795640327, + "grad_norm": 7.0792012214660645, + "learning_rate": 1.7345478570059084e-05, + "loss": 0.5917, + "step": 9552 + }, + { + "epoch": 26.029972752043598, + "grad_norm": 8.693367958068848, + "learning_rate": 1.7344879718645934e-05, + "loss": 0.4088, + "step": 9553 + }, + { + "epoch": 26.032697547683924, + "grad_norm": 7.457730293273926, + "learning_rate": 1.7344280810031097e-05, + "loss": 0.6736, + "step": 9554 + }, + { + "epoch": 26.03542234332425, + "grad_norm": 6.975096702575684, + "learning_rate": 1.7343681844219232e-05, + "loss": 0.6584, + "step": 9555 + }, + { + "epoch": 26.03814713896458, + "grad_norm": 7.109955310821533, + "learning_rate": 1.7343082821215015e-05, + "loss": 0.5279, + "step": 9556 + }, + { + "epoch": 26.040871934604905, + "grad_norm": 9.716678619384766, + "learning_rate": 1.73424837410231e-05, + "loss": 0.4881, + "step": 9557 + }, + { + "epoch": 26.04359673024523, + "grad_norm": 7.266867160797119, + "learning_rate": 1.7341884603648164e-05, + "loss": 0.5488, + "step": 9558 + }, + { + "epoch": 26.04632152588556, + "grad_norm": 7.502307891845703, + "learning_rate": 1.7341285409094862e-05, + "loss": 0.6344, + "step": 9559 + }, + { + "epoch": 26.049046321525886, + "grad_norm": 9.43380355834961, + "learning_rate": 1.7340686157367866e-05, + "loss": 0.4438, + "step": 9560 + }, + { + "epoch": 26.05177111716621, + "grad_norm": 8.707967758178711, + "learning_rate": 1.7340086848471848e-05, + "loss": 0.5626, + "step": 9561 + }, + { + "epoch": 26.05449591280654, + "grad_norm": 20.586732864379883, + "learning_rate": 1.7339487482411464e-05, + "loss": 0.6022, + "step": 9562 + }, + { + "epoch": 26.057220708446867, + "grad_norm": 7.162247657775879, + "learning_rate": 1.733888805919139e-05, + "loss": 0.6588, + "step": 9563 + }, + { + "epoch": 26.059945504087192, + "grad_norm": 7.609987258911133, + "learning_rate": 1.7338288578816292e-05, + "loss": 0.6384, + "step": 9564 + }, + { + "epoch": 26.06267029972752, + "grad_norm": 8.76731014251709, + "learning_rate": 1.733768904129084e-05, + "loss": 0.5563, + "step": 9565 + }, + { + "epoch": 26.065395095367847, + "grad_norm": 13.402876853942871, + "learning_rate": 1.7337089446619697e-05, + "loss": 0.5977, + "step": 9566 + }, + { + "epoch": 26.068119891008173, + "grad_norm": 8.927674293518066, + "learning_rate": 1.733648979480754e-05, + "loss": 0.5298, + "step": 9567 + }, + { + "epoch": 26.070844686648503, + "grad_norm": 7.532134532928467, + "learning_rate": 1.733589008585904e-05, + "loss": 0.5392, + "step": 9568 + }, + { + "epoch": 26.07356948228883, + "grad_norm": 9.537463188171387, + "learning_rate": 1.733529031977886e-05, + "loss": 0.3874, + "step": 9569 + }, + { + "epoch": 26.076294277929154, + "grad_norm": 7.319093704223633, + "learning_rate": 1.7334690496571677e-05, + "loss": 0.4325, + "step": 9570 + }, + { + "epoch": 26.079019073569484, + "grad_norm": 10.53061580657959, + "learning_rate": 1.733409061624216e-05, + "loss": 0.5564, + "step": 9571 + }, + { + "epoch": 26.08174386920981, + "grad_norm": 7.40098237991333, + "learning_rate": 1.733349067879498e-05, + "loss": 0.6164, + "step": 9572 + }, + { + "epoch": 26.084468664850135, + "grad_norm": 6.9981865882873535, + "learning_rate": 1.7332890684234815e-05, + "loss": 0.5289, + "step": 9573 + }, + { + "epoch": 26.087193460490465, + "grad_norm": 7.324646949768066, + "learning_rate": 1.7332290632566325e-05, + "loss": 0.4944, + "step": 9574 + }, + { + "epoch": 26.08991825613079, + "grad_norm": 7.746469497680664, + "learning_rate": 1.73316905237942e-05, + "loss": 0.497, + "step": 9575 + }, + { + "epoch": 26.092643051771116, + "grad_norm": 6.78636360168457, + "learning_rate": 1.7331090357923103e-05, + "loss": 0.4863, + "step": 9576 + }, + { + "epoch": 26.095367847411445, + "grad_norm": 7.395721435546875, + "learning_rate": 1.7330490134957707e-05, + "loss": 0.4698, + "step": 9577 + }, + { + "epoch": 26.09809264305177, + "grad_norm": 8.91894817352295, + "learning_rate": 1.732988985490269e-05, + "loss": 0.5521, + "step": 9578 + }, + { + "epoch": 26.100817438692097, + "grad_norm": 8.462091445922852, + "learning_rate": 1.7329289517762733e-05, + "loss": 0.5223, + "step": 9579 + }, + { + "epoch": 26.103542234332426, + "grad_norm": 7.259838581085205, + "learning_rate": 1.73286891235425e-05, + "loss": 0.4938, + "step": 9580 + }, + { + "epoch": 26.106267029972752, + "grad_norm": 9.486263275146484, + "learning_rate": 1.7328088672246674e-05, + "loss": 0.4198, + "step": 9581 + }, + { + "epoch": 26.108991825613078, + "grad_norm": 7.32037353515625, + "learning_rate": 1.7327488163879923e-05, + "loss": 0.5327, + "step": 9582 + }, + { + "epoch": 26.111716621253407, + "grad_norm": 14.064255714416504, + "learning_rate": 1.7326887598446937e-05, + "loss": 0.5925, + "step": 9583 + }, + { + "epoch": 26.114441416893733, + "grad_norm": 7.668673515319824, + "learning_rate": 1.7326286975952387e-05, + "loss": 0.4813, + "step": 9584 + }, + { + "epoch": 26.11716621253406, + "grad_norm": 7.011399269104004, + "learning_rate": 1.7325686296400946e-05, + "loss": 0.5601, + "step": 9585 + }, + { + "epoch": 26.11989100817439, + "grad_norm": 9.075329780578613, + "learning_rate": 1.7325085559797295e-05, + "loss": 0.5008, + "step": 9586 + }, + { + "epoch": 26.122615803814714, + "grad_norm": 9.160786628723145, + "learning_rate": 1.7324484766146118e-05, + "loss": 0.6431, + "step": 9587 + }, + { + "epoch": 26.12534059945504, + "grad_norm": 6.6641130447387695, + "learning_rate": 1.7323883915452087e-05, + "loss": 0.5106, + "step": 9588 + }, + { + "epoch": 26.12806539509537, + "grad_norm": 8.302316665649414, + "learning_rate": 1.7323283007719883e-05, + "loss": 0.5582, + "step": 9589 + }, + { + "epoch": 26.130790190735695, + "grad_norm": 8.207863807678223, + "learning_rate": 1.7322682042954186e-05, + "loss": 0.5475, + "step": 9590 + }, + { + "epoch": 26.13351498637602, + "grad_norm": 8.551682472229004, + "learning_rate": 1.732208102115968e-05, + "loss": 0.7343, + "step": 9591 + }, + { + "epoch": 26.13623978201635, + "grad_norm": 17.928634643554688, + "learning_rate": 1.732147994234104e-05, + "loss": 0.4928, + "step": 9592 + }, + { + "epoch": 26.138964577656676, + "grad_norm": 8.315779685974121, + "learning_rate": 1.732087880650295e-05, + "loss": 0.4801, + "step": 9593 + }, + { + "epoch": 26.141689373297, + "grad_norm": 8.798788070678711, + "learning_rate": 1.7320277613650093e-05, + "loss": 0.5987, + "step": 9594 + }, + { + "epoch": 26.14441416893733, + "grad_norm": 7.271299839019775, + "learning_rate": 1.7319676363787146e-05, + "loss": 0.626, + "step": 9595 + }, + { + "epoch": 26.147138964577657, + "grad_norm": 7.583462715148926, + "learning_rate": 1.7319075056918798e-05, + "loss": 0.4981, + "step": 9596 + }, + { + "epoch": 26.149863760217983, + "grad_norm": 11.364434242248535, + "learning_rate": 1.731847369304973e-05, + "loss": 0.4866, + "step": 9597 + }, + { + "epoch": 26.152588555858312, + "grad_norm": 8.130598068237305, + "learning_rate": 1.7317872272184624e-05, + "loss": 0.5431, + "step": 9598 + }, + { + "epoch": 26.155313351498638, + "grad_norm": 10.138801574707031, + "learning_rate": 1.7317270794328164e-05, + "loss": 0.4934, + "step": 9599 + }, + { + "epoch": 26.158038147138964, + "grad_norm": 7.542050361633301, + "learning_rate": 1.731666925948503e-05, + "loss": 0.6616, + "step": 9600 + }, + { + "epoch": 26.160762942779293, + "grad_norm": 9.432887077331543, + "learning_rate": 1.731606766765992e-05, + "loss": 0.5143, + "step": 9601 + }, + { + "epoch": 26.16348773841962, + "grad_norm": 10.398560523986816, + "learning_rate": 1.7315466018857505e-05, + "loss": 0.5665, + "step": 9602 + }, + { + "epoch": 26.166212534059945, + "grad_norm": 17.910289764404297, + "learning_rate": 1.7314864313082477e-05, + "loss": 0.5927, + "step": 9603 + }, + { + "epoch": 26.168937329700274, + "grad_norm": 7.854093551635742, + "learning_rate": 1.731426255033952e-05, + "loss": 0.5396, + "step": 9604 + }, + { + "epoch": 26.1716621253406, + "grad_norm": 6.922926902770996, + "learning_rate": 1.7313660730633324e-05, + "loss": 0.4514, + "step": 9605 + }, + { + "epoch": 26.174386920980925, + "grad_norm": 7.1274542808532715, + "learning_rate": 1.7313058853968572e-05, + "loss": 0.6428, + "step": 9606 + }, + { + "epoch": 26.177111716621255, + "grad_norm": 9.016749382019043, + "learning_rate": 1.731245692034995e-05, + "loss": 0.4739, + "step": 9607 + }, + { + "epoch": 26.17983651226158, + "grad_norm": 7.756386756896973, + "learning_rate": 1.7311854929782154e-05, + "loss": 0.5453, + "step": 9608 + }, + { + "epoch": 26.182561307901906, + "grad_norm": 27.780536651611328, + "learning_rate": 1.7311252882269864e-05, + "loss": 0.5505, + "step": 9609 + }, + { + "epoch": 26.185286103542236, + "grad_norm": 9.53674602508545, + "learning_rate": 1.7310650777817775e-05, + "loss": 0.6656, + "step": 9610 + }, + { + "epoch": 26.18801089918256, + "grad_norm": 7.744842052459717, + "learning_rate": 1.7310048616430572e-05, + "loss": 0.6854, + "step": 9611 + }, + { + "epoch": 26.190735694822887, + "grad_norm": 7.945459842681885, + "learning_rate": 1.7309446398112942e-05, + "loss": 0.5873, + "step": 9612 + }, + { + "epoch": 26.193460490463217, + "grad_norm": 8.727627754211426, + "learning_rate": 1.7308844122869583e-05, + "loss": 0.7332, + "step": 9613 + }, + { + "epoch": 26.196185286103542, + "grad_norm": 7.102766513824463, + "learning_rate": 1.7308241790705182e-05, + "loss": 0.7229, + "step": 9614 + }, + { + "epoch": 26.19891008174387, + "grad_norm": 7.141162395477295, + "learning_rate": 1.7307639401624426e-05, + "loss": 0.4993, + "step": 9615 + }, + { + "epoch": 26.201634877384198, + "grad_norm": 7.5889201164245605, + "learning_rate": 1.730703695563201e-05, + "loss": 0.4652, + "step": 9616 + }, + { + "epoch": 26.204359673024523, + "grad_norm": 6.298281669616699, + "learning_rate": 1.7306434452732626e-05, + "loss": 0.8528, + "step": 9617 + }, + { + "epoch": 26.20708446866485, + "grad_norm": 8.14534854888916, + "learning_rate": 1.7305831892930967e-05, + "loss": 0.4977, + "step": 9618 + }, + { + "epoch": 26.20980926430518, + "grad_norm": 8.6360502243042, + "learning_rate": 1.7305229276231723e-05, + "loss": 0.5149, + "step": 9619 + }, + { + "epoch": 26.212534059945504, + "grad_norm": 6.499998092651367, + "learning_rate": 1.7304626602639586e-05, + "loss": 0.6614, + "step": 9620 + }, + { + "epoch": 26.21525885558583, + "grad_norm": 7.012277603149414, + "learning_rate": 1.7304023872159253e-05, + "loss": 0.4642, + "step": 9621 + }, + { + "epoch": 26.21798365122616, + "grad_norm": 8.445688247680664, + "learning_rate": 1.7303421084795423e-05, + "loss": 0.5104, + "step": 9622 + }, + { + "epoch": 26.220708446866485, + "grad_norm": 8.20719051361084, + "learning_rate": 1.7302818240552775e-05, + "loss": 0.5985, + "step": 9623 + }, + { + "epoch": 26.22343324250681, + "grad_norm": 7.609731197357178, + "learning_rate": 1.7302215339436022e-05, + "loss": 0.4766, + "step": 9624 + }, + { + "epoch": 26.22615803814714, + "grad_norm": 7.7689995765686035, + "learning_rate": 1.7301612381449846e-05, + "loss": 0.4874, + "step": 9625 + }, + { + "epoch": 26.228882833787466, + "grad_norm": 7.080004692077637, + "learning_rate": 1.730100936659895e-05, + "loss": 0.7334, + "step": 9626 + }, + { + "epoch": 26.231607629427792, + "grad_norm": 6.169990539550781, + "learning_rate": 1.7300406294888027e-05, + "loss": 0.6745, + "step": 9627 + }, + { + "epoch": 26.23433242506812, + "grad_norm": 9.814729690551758, + "learning_rate": 1.7299803166321778e-05, + "loss": 0.7088, + "step": 9628 + }, + { + "epoch": 26.237057220708447, + "grad_norm": 7.300668716430664, + "learning_rate": 1.729919998090489e-05, + "loss": 0.5634, + "step": 9629 + }, + { + "epoch": 26.239782016348773, + "grad_norm": 8.827960014343262, + "learning_rate": 1.7298596738642074e-05, + "loss": 0.5107, + "step": 9630 + }, + { + "epoch": 26.242506811989102, + "grad_norm": 8.249507904052734, + "learning_rate": 1.7297993439538017e-05, + "loss": 0.4824, + "step": 9631 + }, + { + "epoch": 26.245231607629428, + "grad_norm": 9.042924880981445, + "learning_rate": 1.7297390083597426e-05, + "loss": 0.5739, + "step": 9632 + }, + { + "epoch": 26.247956403269754, + "grad_norm": 7.981200218200684, + "learning_rate": 1.7296786670824993e-05, + "loss": 0.6775, + "step": 9633 + }, + { + "epoch": 26.250681198910083, + "grad_norm": 8.520824432373047, + "learning_rate": 1.7296183201225422e-05, + "loss": 0.5093, + "step": 9634 + }, + { + "epoch": 26.25340599455041, + "grad_norm": 6.9999589920043945, + "learning_rate": 1.729557967480341e-05, + "loss": 0.4789, + "step": 9635 + }, + { + "epoch": 26.256130790190735, + "grad_norm": 8.646928787231445, + "learning_rate": 1.7294976091563663e-05, + "loss": 0.5217, + "step": 9636 + }, + { + "epoch": 26.258855585831064, + "grad_norm": 7.401947498321533, + "learning_rate": 1.729437245151087e-05, + "loss": 0.4224, + "step": 9637 + }, + { + "epoch": 26.26158038147139, + "grad_norm": 22.106281280517578, + "learning_rate": 1.7293768754649743e-05, + "loss": 0.4922, + "step": 9638 + }, + { + "epoch": 26.264305177111716, + "grad_norm": 8.012722969055176, + "learning_rate": 1.7293165000984977e-05, + "loss": 0.6678, + "step": 9639 + }, + { + "epoch": 26.267029972752045, + "grad_norm": 7.759902000427246, + "learning_rate": 1.729256119052128e-05, + "loss": 0.5939, + "step": 9640 + }, + { + "epoch": 26.26975476839237, + "grad_norm": 20.350008010864258, + "learning_rate": 1.729195732326335e-05, + "loss": 0.5517, + "step": 9641 + }, + { + "epoch": 26.272479564032697, + "grad_norm": 7.252711296081543, + "learning_rate": 1.729135339921589e-05, + "loss": 0.6181, + "step": 9642 + }, + { + "epoch": 26.275204359673026, + "grad_norm": 7.245285511016846, + "learning_rate": 1.7290749418383604e-05, + "loss": 0.5903, + "step": 9643 + }, + { + "epoch": 26.277929155313352, + "grad_norm": 7.566021919250488, + "learning_rate": 1.72901453807712e-05, + "loss": 0.5847, + "step": 9644 + }, + { + "epoch": 26.280653950953678, + "grad_norm": 7.564478397369385, + "learning_rate": 1.7289541286383374e-05, + "loss": 0.609, + "step": 9645 + }, + { + "epoch": 26.283378746594007, + "grad_norm": 14.416666984558105, + "learning_rate": 1.7288937135224833e-05, + "loss": 0.4868, + "step": 9646 + }, + { + "epoch": 26.286103542234333, + "grad_norm": 9.122889518737793, + "learning_rate": 1.7288332927300292e-05, + "loss": 0.5007, + "step": 9647 + }, + { + "epoch": 26.28882833787466, + "grad_norm": 7.749236583709717, + "learning_rate": 1.7287728662614444e-05, + "loss": 0.6157, + "step": 9648 + }, + { + "epoch": 26.291553133514988, + "grad_norm": 11.464571952819824, + "learning_rate": 1.7287124341171998e-05, + "loss": 0.4988, + "step": 9649 + }, + { + "epoch": 26.294277929155314, + "grad_norm": 7.148604393005371, + "learning_rate": 1.7286519962977663e-05, + "loss": 0.5306, + "step": 9650 + }, + { + "epoch": 26.29700272479564, + "grad_norm": 7.657546043395996, + "learning_rate": 1.728591552803615e-05, + "loss": 0.5533, + "step": 9651 + }, + { + "epoch": 26.29972752043597, + "grad_norm": 8.062553405761719, + "learning_rate": 1.7285311036352156e-05, + "loss": 0.6571, + "step": 9652 + }, + { + "epoch": 26.302452316076295, + "grad_norm": 7.646594524383545, + "learning_rate": 1.7284706487930396e-05, + "loss": 0.7164, + "step": 9653 + }, + { + "epoch": 26.30517711171662, + "grad_norm": 8.308866500854492, + "learning_rate": 1.7284101882775575e-05, + "loss": 0.6648, + "step": 9654 + }, + { + "epoch": 26.30790190735695, + "grad_norm": 8.04058837890625, + "learning_rate": 1.7283497220892406e-05, + "loss": 0.4776, + "step": 9655 + }, + { + "epoch": 26.310626702997276, + "grad_norm": 8.126984596252441, + "learning_rate": 1.728289250228559e-05, + "loss": 0.5143, + "step": 9656 + }, + { + "epoch": 26.3133514986376, + "grad_norm": 6.92857027053833, + "learning_rate": 1.7282287726959847e-05, + "loss": 0.6617, + "step": 9657 + }, + { + "epoch": 26.31607629427793, + "grad_norm": 7.771056652069092, + "learning_rate": 1.728168289491988e-05, + "loss": 0.5382, + "step": 9658 + }, + { + "epoch": 26.318801089918257, + "grad_norm": 7.239190101623535, + "learning_rate": 1.72810780061704e-05, + "loss": 0.4505, + "step": 9659 + }, + { + "epoch": 26.321525885558582, + "grad_norm": 8.406765937805176, + "learning_rate": 1.728047306071612e-05, + "loss": 0.6041, + "step": 9660 + }, + { + "epoch": 26.32425068119891, + "grad_norm": 9.182141304016113, + "learning_rate": 1.727986805856175e-05, + "loss": 0.4531, + "step": 9661 + }, + { + "epoch": 26.326975476839237, + "grad_norm": 7.7115631103515625, + "learning_rate": 1.7279262999712e-05, + "loss": 0.4387, + "step": 9662 + }, + { + "epoch": 26.329700272479563, + "grad_norm": 8.787193298339844, + "learning_rate": 1.7278657884171585e-05, + "loss": 0.6171, + "step": 9663 + }, + { + "epoch": 26.332425068119893, + "grad_norm": 8.689203262329102, + "learning_rate": 1.7278052711945218e-05, + "loss": 0.5219, + "step": 9664 + }, + { + "epoch": 26.33514986376022, + "grad_norm": 6.698019027709961, + "learning_rate": 1.7277447483037608e-05, + "loss": 0.5166, + "step": 9665 + }, + { + "epoch": 26.337874659400544, + "grad_norm": 8.592679977416992, + "learning_rate": 1.7276842197453475e-05, + "loss": 0.5221, + "step": 9666 + }, + { + "epoch": 26.340599455040874, + "grad_norm": 9.411178588867188, + "learning_rate": 1.7276236855197526e-05, + "loss": 0.6801, + "step": 9667 + }, + { + "epoch": 26.3433242506812, + "grad_norm": 9.463963508605957, + "learning_rate": 1.7275631456274476e-05, + "loss": 0.5466, + "step": 9668 + }, + { + "epoch": 26.346049046321525, + "grad_norm": 7.92461633682251, + "learning_rate": 1.727502600068905e-05, + "loss": 0.5344, + "step": 9669 + }, + { + "epoch": 26.348773841961854, + "grad_norm": 6.824985504150391, + "learning_rate": 1.727442048844595e-05, + "loss": 0.755, + "step": 9670 + }, + { + "epoch": 26.35149863760218, + "grad_norm": 8.3933744430542, + "learning_rate": 1.72738149195499e-05, + "loss": 0.7602, + "step": 9671 + }, + { + "epoch": 26.354223433242506, + "grad_norm": 9.247557640075684, + "learning_rate": 1.727320929400561e-05, + "loss": 0.5687, + "step": 9672 + }, + { + "epoch": 26.356948228882835, + "grad_norm": 8.802834510803223, + "learning_rate": 1.7272603611817803e-05, + "loss": 0.5789, + "step": 9673 + }, + { + "epoch": 26.35967302452316, + "grad_norm": 24.909435272216797, + "learning_rate": 1.7271997872991192e-05, + "loss": 0.5758, + "step": 9674 + }, + { + "epoch": 26.362397820163487, + "grad_norm": 7.1943817138671875, + "learning_rate": 1.7271392077530498e-05, + "loss": 0.6175, + "step": 9675 + }, + { + "epoch": 26.365122615803816, + "grad_norm": 9.605677604675293, + "learning_rate": 1.7270786225440434e-05, + "loss": 0.4918, + "step": 9676 + }, + { + "epoch": 26.367847411444142, + "grad_norm": 8.220892906188965, + "learning_rate": 1.727018031672572e-05, + "loss": 0.6282, + "step": 9677 + }, + { + "epoch": 26.370572207084468, + "grad_norm": 10.437742233276367, + "learning_rate": 1.726957435139108e-05, + "loss": 0.5023, + "step": 9678 + }, + { + "epoch": 26.373297002724797, + "grad_norm": 17.860620498657227, + "learning_rate": 1.7268968329441226e-05, + "loss": 0.5096, + "step": 9679 + }, + { + "epoch": 26.376021798365123, + "grad_norm": 7.564548015594482, + "learning_rate": 1.7268362250880878e-05, + "loss": 0.6897, + "step": 9680 + }, + { + "epoch": 26.37874659400545, + "grad_norm": 8.498891830444336, + "learning_rate": 1.726775611571476e-05, + "loss": 0.5014, + "step": 9681 + }, + { + "epoch": 26.381471389645778, + "grad_norm": 8.183478355407715, + "learning_rate": 1.7267149923947598e-05, + "loss": 0.5712, + "step": 9682 + }, + { + "epoch": 26.384196185286104, + "grad_norm": 8.678196907043457, + "learning_rate": 1.72665436755841e-05, + "loss": 0.5667, + "step": 9683 + }, + { + "epoch": 26.38692098092643, + "grad_norm": 8.562444686889648, + "learning_rate": 1.7265937370628995e-05, + "loss": 0.5267, + "step": 9684 + }, + { + "epoch": 26.38964577656676, + "grad_norm": 6.696924686431885, + "learning_rate": 1.7265331009087004e-05, + "loss": 0.5307, + "step": 9685 + }, + { + "epoch": 26.392370572207085, + "grad_norm": 6.626930236816406, + "learning_rate": 1.7264724590962846e-05, + "loss": 0.4725, + "step": 9686 + }, + { + "epoch": 26.39509536784741, + "grad_norm": 9.666239738464355, + "learning_rate": 1.726411811626125e-05, + "loss": 0.561, + "step": 9687 + }, + { + "epoch": 26.39782016348774, + "grad_norm": 8.817061424255371, + "learning_rate": 1.7263511584986935e-05, + "loss": 0.6234, + "step": 9688 + }, + { + "epoch": 26.400544959128066, + "grad_norm": 9.749441146850586, + "learning_rate": 1.7262904997144626e-05, + "loss": 0.5256, + "step": 9689 + }, + { + "epoch": 26.40326975476839, + "grad_norm": 11.836180686950684, + "learning_rate": 1.7262298352739048e-05, + "loss": 0.5289, + "step": 9690 + }, + { + "epoch": 26.40599455040872, + "grad_norm": 8.412851333618164, + "learning_rate": 1.7261691651774922e-05, + "loss": 0.6529, + "step": 9691 + }, + { + "epoch": 26.408719346049047, + "grad_norm": 8.265201568603516, + "learning_rate": 1.7261084894256975e-05, + "loss": 0.6555, + "step": 9692 + }, + { + "epoch": 26.411444141689373, + "grad_norm": 7.24312686920166, + "learning_rate": 1.7260478080189932e-05, + "loss": 0.6314, + "step": 9693 + }, + { + "epoch": 26.414168937329702, + "grad_norm": 8.179997444152832, + "learning_rate": 1.725987120957852e-05, + "loss": 0.711, + "step": 9694 + }, + { + "epoch": 26.416893732970028, + "grad_norm": 7.774048328399658, + "learning_rate": 1.7259264282427467e-05, + "loss": 0.5784, + "step": 9695 + }, + { + "epoch": 26.419618528610354, + "grad_norm": 9.335322380065918, + "learning_rate": 1.7258657298741494e-05, + "loss": 0.4728, + "step": 9696 + }, + { + "epoch": 26.422343324250683, + "grad_norm": 8.457154273986816, + "learning_rate": 1.7258050258525335e-05, + "loss": 0.5094, + "step": 9697 + }, + { + "epoch": 26.42506811989101, + "grad_norm": 8.617023468017578, + "learning_rate": 1.7257443161783712e-05, + "loss": 0.4645, + "step": 9698 + }, + { + "epoch": 26.427792915531334, + "grad_norm": 19.97624969482422, + "learning_rate": 1.7256836008521354e-05, + "loss": 0.666, + "step": 9699 + }, + { + "epoch": 26.430517711171664, + "grad_norm": 8.577537536621094, + "learning_rate": 1.725622879874299e-05, + "loss": 0.4655, + "step": 9700 + }, + { + "epoch": 26.43324250681199, + "grad_norm": 8.199747085571289, + "learning_rate": 1.7255621532453356e-05, + "loss": 0.591, + "step": 9701 + }, + { + "epoch": 26.435967302452315, + "grad_norm": 8.759621620178223, + "learning_rate": 1.725501420965717e-05, + "loss": 0.4586, + "step": 9702 + }, + { + "epoch": 26.438692098092645, + "grad_norm": 7.397414684295654, + "learning_rate": 1.7254406830359166e-05, + "loss": 0.5256, + "step": 9703 + }, + { + "epoch": 26.44141689373297, + "grad_norm": 10.123652458190918, + "learning_rate": 1.725379939456408e-05, + "loss": 0.4986, + "step": 9704 + }, + { + "epoch": 26.444141689373296, + "grad_norm": 7.325468063354492, + "learning_rate": 1.7253191902276634e-05, + "loss": 0.5513, + "step": 9705 + }, + { + "epoch": 26.446866485013626, + "grad_norm": 11.196511268615723, + "learning_rate": 1.725258435350156e-05, + "loss": 0.6641, + "step": 9706 + }, + { + "epoch": 26.44959128065395, + "grad_norm": 15.448986053466797, + "learning_rate": 1.7251976748243597e-05, + "loss": 0.6542, + "step": 9707 + }, + { + "epoch": 26.452316076294277, + "grad_norm": 8.92198657989502, + "learning_rate": 1.7251369086507472e-05, + "loss": 0.6694, + "step": 9708 + }, + { + "epoch": 26.455040871934607, + "grad_norm": 22.12588882446289, + "learning_rate": 1.725076136829792e-05, + "loss": 0.6179, + "step": 9709 + }, + { + "epoch": 26.457765667574932, + "grad_norm": 9.834114074707031, + "learning_rate": 1.725015359361967e-05, + "loss": 0.7356, + "step": 9710 + }, + { + "epoch": 26.460490463215258, + "grad_norm": 8.150346755981445, + "learning_rate": 1.7249545762477454e-05, + "loss": 0.5803, + "step": 9711 + }, + { + "epoch": 26.463215258855588, + "grad_norm": 10.009634971618652, + "learning_rate": 1.7248937874876013e-05, + "loss": 0.5165, + "step": 9712 + }, + { + "epoch": 26.465940054495913, + "grad_norm": 9.49602222442627, + "learning_rate": 1.7248329930820076e-05, + "loss": 0.4071, + "step": 9713 + }, + { + "epoch": 26.46866485013624, + "grad_norm": 8.119736671447754, + "learning_rate": 1.7247721930314377e-05, + "loss": 0.5149, + "step": 9714 + }, + { + "epoch": 26.47138964577657, + "grad_norm": 9.511920928955078, + "learning_rate": 1.7247113873363656e-05, + "loss": 0.5853, + "step": 9715 + }, + { + "epoch": 26.474114441416894, + "grad_norm": 8.866805076599121, + "learning_rate": 1.7246505759972643e-05, + "loss": 0.559, + "step": 9716 + }, + { + "epoch": 26.47683923705722, + "grad_norm": 27.62454605102539, + "learning_rate": 1.7245897590146078e-05, + "loss": 0.6063, + "step": 9717 + }, + { + "epoch": 26.479564032697546, + "grad_norm": 12.811103820800781, + "learning_rate": 1.7245289363888694e-05, + "loss": 0.5844, + "step": 9718 + }, + { + "epoch": 26.482288828337875, + "grad_norm": 7.823066711425781, + "learning_rate": 1.7244681081205227e-05, + "loss": 0.4919, + "step": 9719 + }, + { + "epoch": 26.4850136239782, + "grad_norm": 5.938113689422607, + "learning_rate": 1.7244072742100422e-05, + "loss": 0.4162, + "step": 9720 + }, + { + "epoch": 26.48773841961853, + "grad_norm": 8.288970947265625, + "learning_rate": 1.724346434657901e-05, + "loss": 0.6464, + "step": 9721 + }, + { + "epoch": 26.490463215258856, + "grad_norm": 15.540919303894043, + "learning_rate": 1.724285589464573e-05, + "loss": 0.4741, + "step": 9722 + }, + { + "epoch": 26.493188010899182, + "grad_norm": 9.762518882751465, + "learning_rate": 1.7242247386305324e-05, + "loss": 0.5653, + "step": 9723 + }, + { + "epoch": 26.495912806539508, + "grad_norm": 9.49687385559082, + "learning_rate": 1.7241638821562526e-05, + "loss": 0.4958, + "step": 9724 + }, + { + "epoch": 26.498637602179837, + "grad_norm": 8.982109069824219, + "learning_rate": 1.7241030200422078e-05, + "loss": 0.5706, + "step": 9725 + }, + { + "epoch": 26.501362397820163, + "grad_norm": 22.22509002685547, + "learning_rate": 1.724042152288872e-05, + "loss": 0.541, + "step": 9726 + }, + { + "epoch": 26.504087193460492, + "grad_norm": 9.978806495666504, + "learning_rate": 1.7239812788967195e-05, + "loss": 0.5566, + "step": 9727 + }, + { + "epoch": 26.506811989100818, + "grad_norm": 9.385416030883789, + "learning_rate": 1.7239203998662234e-05, + "loss": 0.5651, + "step": 9728 + }, + { + "epoch": 26.509536784741144, + "grad_norm": 10.099444389343262, + "learning_rate": 1.7238595151978593e-05, + "loss": 0.526, + "step": 9729 + }, + { + "epoch": 26.51226158038147, + "grad_norm": 7.989203929901123, + "learning_rate": 1.7237986248921003e-05, + "loss": 0.5272, + "step": 9730 + }, + { + "epoch": 26.5149863760218, + "grad_norm": 7.509270668029785, + "learning_rate": 1.7237377289494207e-05, + "loss": 0.6298, + "step": 9731 + }, + { + "epoch": 26.517711171662125, + "grad_norm": 10.203505516052246, + "learning_rate": 1.7236768273702952e-05, + "loss": 0.505, + "step": 9732 + }, + { + "epoch": 26.520435967302454, + "grad_norm": 8.250483512878418, + "learning_rate": 1.7236159201551978e-05, + "loss": 0.5259, + "step": 9733 + }, + { + "epoch": 26.52316076294278, + "grad_norm": 8.439765930175781, + "learning_rate": 1.723555007304603e-05, + "loss": 0.5204, + "step": 9734 + }, + { + "epoch": 26.525885558583106, + "grad_norm": 7.641886234283447, + "learning_rate": 1.7234940888189847e-05, + "loss": 0.4673, + "step": 9735 + }, + { + "epoch": 26.52861035422343, + "grad_norm": 10.620079040527344, + "learning_rate": 1.7234331646988183e-05, + "loss": 0.5453, + "step": 9736 + }, + { + "epoch": 26.53133514986376, + "grad_norm": 7.982536315917969, + "learning_rate": 1.7233722349445774e-05, + "loss": 0.5303, + "step": 9737 + }, + { + "epoch": 26.534059945504087, + "grad_norm": 10.731901168823242, + "learning_rate": 1.7233112995567366e-05, + "loss": 0.5692, + "step": 9738 + }, + { + "epoch": 26.536784741144416, + "grad_norm": 8.416155815124512, + "learning_rate": 1.723250358535771e-05, + "loss": 0.557, + "step": 9739 + }, + { + "epoch": 26.539509536784742, + "grad_norm": 8.52946662902832, + "learning_rate": 1.723189411882155e-05, + "loss": 0.6161, + "step": 9740 + }, + { + "epoch": 26.542234332425068, + "grad_norm": 6.650148391723633, + "learning_rate": 1.723128459596363e-05, + "loss": 0.5844, + "step": 9741 + }, + { + "epoch": 26.544959128065393, + "grad_norm": 8.657482147216797, + "learning_rate": 1.7230675016788697e-05, + "loss": 0.5673, + "step": 9742 + }, + { + "epoch": 26.547683923705723, + "grad_norm": 9.079556465148926, + "learning_rate": 1.72300653813015e-05, + "loss": 0.5774, + "step": 9743 + }, + { + "epoch": 26.55040871934605, + "grad_norm": 7.331713676452637, + "learning_rate": 1.7229455689506786e-05, + "loss": 0.6069, + "step": 9744 + }, + { + "epoch": 26.553133514986374, + "grad_norm": 8.788839340209961, + "learning_rate": 1.7228845941409304e-05, + "loss": 0.6886, + "step": 9745 + }, + { + "epoch": 26.555858310626704, + "grad_norm": 16.687707901000977, + "learning_rate": 1.7228236137013804e-05, + "loss": 0.5566, + "step": 9746 + }, + { + "epoch": 26.55858310626703, + "grad_norm": 10.596636772155762, + "learning_rate": 1.7227626276325033e-05, + "loss": 0.4482, + "step": 9747 + }, + { + "epoch": 26.561307901907355, + "grad_norm": 6.884238243103027, + "learning_rate": 1.722701635934774e-05, + "loss": 0.5292, + "step": 9748 + }, + { + "epoch": 26.564032697547685, + "grad_norm": 19.73212242126465, + "learning_rate": 1.7226406386086675e-05, + "loss": 0.6209, + "step": 9749 + }, + { + "epoch": 26.56675749318801, + "grad_norm": 10.994420051574707, + "learning_rate": 1.7225796356546592e-05, + "loss": 0.7026, + "step": 9750 + }, + { + "epoch": 26.569482288828336, + "grad_norm": 10.321929931640625, + "learning_rate": 1.7225186270732242e-05, + "loss": 0.6399, + "step": 9751 + }, + { + "epoch": 26.572207084468666, + "grad_norm": 9.506365776062012, + "learning_rate": 1.722457612864837e-05, + "loss": 0.5134, + "step": 9752 + }, + { + "epoch": 26.57493188010899, + "grad_norm": 7.55317497253418, + "learning_rate": 1.7223965930299732e-05, + "loss": 0.542, + "step": 9753 + }, + { + "epoch": 26.577656675749317, + "grad_norm": 7.067741394042969, + "learning_rate": 1.722335567569108e-05, + "loss": 0.76, + "step": 9754 + }, + { + "epoch": 26.580381471389646, + "grad_norm": 8.14130687713623, + "learning_rate": 1.7222745364827167e-05, + "loss": 0.4661, + "step": 9755 + }, + { + "epoch": 26.583106267029972, + "grad_norm": 8.30457592010498, + "learning_rate": 1.7222134997712748e-05, + "loss": 0.7259, + "step": 9756 + }, + { + "epoch": 26.585831062670298, + "grad_norm": 8.38310718536377, + "learning_rate": 1.722152457435257e-05, + "loss": 0.6436, + "step": 9757 + }, + { + "epoch": 26.588555858310627, + "grad_norm": 10.805953025817871, + "learning_rate": 1.722091409475139e-05, + "loss": 0.733, + "step": 9758 + }, + { + "epoch": 26.591280653950953, + "grad_norm": 8.848837852478027, + "learning_rate": 1.722030355891397e-05, + "loss": 0.5511, + "step": 9759 + }, + { + "epoch": 26.59400544959128, + "grad_norm": 54.405826568603516, + "learning_rate": 1.721969296684505e-05, + "loss": 0.4696, + "step": 9760 + }, + { + "epoch": 26.59673024523161, + "grad_norm": 13.935903549194336, + "learning_rate": 1.72190823185494e-05, + "loss": 0.5378, + "step": 9761 + }, + { + "epoch": 26.599455040871934, + "grad_norm": 7.5879435539245605, + "learning_rate": 1.721847161403177e-05, + "loss": 0.7851, + "step": 9762 + }, + { + "epoch": 26.60217983651226, + "grad_norm": 8.205209732055664, + "learning_rate": 1.721786085329691e-05, + "loss": 0.4768, + "step": 9763 + }, + { + "epoch": 26.60490463215259, + "grad_norm": 8.208876609802246, + "learning_rate": 1.7217250036349584e-05, + "loss": 0.5588, + "step": 9764 + }, + { + "epoch": 26.607629427792915, + "grad_norm": 17.013639450073242, + "learning_rate": 1.721663916319455e-05, + "loss": 0.527, + "step": 9765 + }, + { + "epoch": 26.61035422343324, + "grad_norm": 17.2004337310791, + "learning_rate": 1.721602823383656e-05, + "loss": 0.5312, + "step": 9766 + }, + { + "epoch": 26.61307901907357, + "grad_norm": 25.651762008666992, + "learning_rate": 1.7215417248280374e-05, + "loss": 0.7311, + "step": 9767 + }, + { + "epoch": 26.615803814713896, + "grad_norm": 27.533079147338867, + "learning_rate": 1.721480620653075e-05, + "loss": 0.6274, + "step": 9768 + }, + { + "epoch": 26.618528610354222, + "grad_norm": 10.6248197555542, + "learning_rate": 1.7214195108592448e-05, + "loss": 0.6133, + "step": 9769 + }, + { + "epoch": 26.62125340599455, + "grad_norm": 10.059863090515137, + "learning_rate": 1.7213583954470228e-05, + "loss": 0.7231, + "step": 9770 + }, + { + "epoch": 26.623978201634877, + "grad_norm": 8.468740463256836, + "learning_rate": 1.721297274416885e-05, + "loss": 0.5704, + "step": 9771 + }, + { + "epoch": 26.626702997275203, + "grad_norm": 9.464869499206543, + "learning_rate": 1.7212361477693068e-05, + "loss": 0.5226, + "step": 9772 + }, + { + "epoch": 26.629427792915532, + "grad_norm": 10.510021209716797, + "learning_rate": 1.721175015504765e-05, + "loss": 0.5062, + "step": 9773 + }, + { + "epoch": 26.632152588555858, + "grad_norm": 8.539653778076172, + "learning_rate": 1.721113877623735e-05, + "loss": 0.5445, + "step": 9774 + }, + { + "epoch": 26.634877384196184, + "grad_norm": 11.123778343200684, + "learning_rate": 1.7210527341266936e-05, + "loss": 0.6424, + "step": 9775 + }, + { + "epoch": 26.637602179836513, + "grad_norm": 10.299055099487305, + "learning_rate": 1.720991585014117e-05, + "loss": 0.5608, + "step": 9776 + }, + { + "epoch": 26.64032697547684, + "grad_norm": 8.966005325317383, + "learning_rate": 1.7209304302864808e-05, + "loss": 0.543, + "step": 9777 + }, + { + "epoch": 26.643051771117165, + "grad_norm": 8.661131858825684, + "learning_rate": 1.7208692699442618e-05, + "loss": 0.4578, + "step": 9778 + }, + { + "epoch": 26.645776566757494, + "grad_norm": 8.650118827819824, + "learning_rate": 1.7208081039879355e-05, + "loss": 0.5977, + "step": 9779 + }, + { + "epoch": 26.64850136239782, + "grad_norm": 9.450804710388184, + "learning_rate": 1.7207469324179796e-05, + "loss": 0.6046, + "step": 9780 + }, + { + "epoch": 26.651226158038146, + "grad_norm": 7.290467739105225, + "learning_rate": 1.7206857552348696e-05, + "loss": 0.636, + "step": 9781 + }, + { + "epoch": 26.653950953678475, + "grad_norm": 8.39273452758789, + "learning_rate": 1.720624572439082e-05, + "loss": 0.553, + "step": 9782 + }, + { + "epoch": 26.6566757493188, + "grad_norm": 10.417442321777344, + "learning_rate": 1.7205633840310935e-05, + "loss": 0.6809, + "step": 9783 + }, + { + "epoch": 26.659400544959126, + "grad_norm": 9.35910701751709, + "learning_rate": 1.7205021900113808e-05, + "loss": 0.5734, + "step": 9784 + }, + { + "epoch": 26.662125340599456, + "grad_norm": 8.904742240905762, + "learning_rate": 1.72044099038042e-05, + "loss": 0.6603, + "step": 9785 + }, + { + "epoch": 26.66485013623978, + "grad_norm": 8.284513473510742, + "learning_rate": 1.7203797851386878e-05, + "loss": 0.5482, + "step": 9786 + }, + { + "epoch": 26.667574931880107, + "grad_norm": 7.7133870124816895, + "learning_rate": 1.720318574286661e-05, + "loss": 0.4943, + "step": 9787 + }, + { + "epoch": 26.670299727520437, + "grad_norm": 7.952728271484375, + "learning_rate": 1.7202573578248166e-05, + "loss": 0.5464, + "step": 9788 + }, + { + "epoch": 26.673024523160763, + "grad_norm": 10.20577621459961, + "learning_rate": 1.7201961357536313e-05, + "loss": 0.5574, + "step": 9789 + }, + { + "epoch": 26.67574931880109, + "grad_norm": 8.854503631591797, + "learning_rate": 1.720134908073581e-05, + "loss": 0.557, + "step": 9790 + }, + { + "epoch": 26.678474114441418, + "grad_norm": 7.459747314453125, + "learning_rate": 1.720073674785144e-05, + "loss": 0.4844, + "step": 9791 + }, + { + "epoch": 26.681198910081743, + "grad_norm": 7.778055667877197, + "learning_rate": 1.720012435888796e-05, + "loss": 0.5489, + "step": 9792 + }, + { + "epoch": 26.68392370572207, + "grad_norm": 7.30932092666626, + "learning_rate": 1.7199511913850142e-05, + "loss": 0.5255, + "step": 9793 + }, + { + "epoch": 26.6866485013624, + "grad_norm": 9.2329740524292, + "learning_rate": 1.7198899412742756e-05, + "loss": 0.6163, + "step": 9794 + }, + { + "epoch": 26.689373297002724, + "grad_norm": 9.634840965270996, + "learning_rate": 1.7198286855570575e-05, + "loss": 0.6769, + "step": 9795 + }, + { + "epoch": 26.69209809264305, + "grad_norm": 9.673457145690918, + "learning_rate": 1.719767424233837e-05, + "loss": 0.6982, + "step": 9796 + }, + { + "epoch": 26.69482288828338, + "grad_norm": 12.041887283325195, + "learning_rate": 1.719706157305091e-05, + "loss": 0.6368, + "step": 9797 + }, + { + "epoch": 26.697547683923705, + "grad_norm": 7.8084821701049805, + "learning_rate": 1.719644884771296e-05, + "loss": 0.4594, + "step": 9798 + }, + { + "epoch": 26.70027247956403, + "grad_norm": 7.280473232269287, + "learning_rate": 1.7195836066329304e-05, + "loss": 0.6399, + "step": 9799 + }, + { + "epoch": 26.70299727520436, + "grad_norm": 8.602075576782227, + "learning_rate": 1.7195223228904705e-05, + "loss": 0.5395, + "step": 9800 + }, + { + "epoch": 26.705722070844686, + "grad_norm": 7.182285785675049, + "learning_rate": 1.719461033544394e-05, + "loss": 0.4574, + "step": 9801 + }, + { + "epoch": 26.708446866485012, + "grad_norm": 13.214006423950195, + "learning_rate": 1.719399738595178e-05, + "loss": 0.6719, + "step": 9802 + }, + { + "epoch": 26.71117166212534, + "grad_norm": 6.748271942138672, + "learning_rate": 1.7193384380433e-05, + "loss": 0.5078, + "step": 9803 + }, + { + "epoch": 26.713896457765667, + "grad_norm": 8.99386978149414, + "learning_rate": 1.7192771318892377e-05, + "loss": 0.548, + "step": 9804 + }, + { + "epoch": 26.716621253405993, + "grad_norm": 7.487708568572998, + "learning_rate": 1.719215820133468e-05, + "loss": 0.4866, + "step": 9805 + }, + { + "epoch": 26.719346049046322, + "grad_norm": 8.8655366897583, + "learning_rate": 1.7191545027764686e-05, + "loss": 0.5208, + "step": 9806 + }, + { + "epoch": 26.722070844686648, + "grad_norm": 8.175238609313965, + "learning_rate": 1.7190931798187173e-05, + "loss": 0.6731, + "step": 9807 + }, + { + "epoch": 26.724795640326974, + "grad_norm": 10.522286415100098, + "learning_rate": 1.719031851260691e-05, + "loss": 0.5506, + "step": 9808 + }, + { + "epoch": 26.727520435967303, + "grad_norm": 9.17513370513916, + "learning_rate": 1.7189705171028684e-05, + "loss": 0.4948, + "step": 9809 + }, + { + "epoch": 26.73024523160763, + "grad_norm": 7.262209415435791, + "learning_rate": 1.7189091773457263e-05, + "loss": 0.5682, + "step": 9810 + }, + { + "epoch": 26.732970027247955, + "grad_norm": 7.6149373054504395, + "learning_rate": 1.7188478319897425e-05, + "loss": 0.6615, + "step": 9811 + }, + { + "epoch": 26.735694822888284, + "grad_norm": 7.136045455932617, + "learning_rate": 1.718786481035395e-05, + "loss": 0.5837, + "step": 9812 + }, + { + "epoch": 26.73841961852861, + "grad_norm": 8.332613945007324, + "learning_rate": 1.7187251244831617e-05, + "loss": 0.5957, + "step": 9813 + }, + { + "epoch": 26.741144414168936, + "grad_norm": 7.949191093444824, + "learning_rate": 1.7186637623335202e-05, + "loss": 0.5762, + "step": 9814 + }, + { + "epoch": 26.743869209809265, + "grad_norm": 8.355345726013184, + "learning_rate": 1.7186023945869482e-05, + "loss": 0.6154, + "step": 9815 + }, + { + "epoch": 26.74659400544959, + "grad_norm": 7.350244998931885, + "learning_rate": 1.718541021243924e-05, + "loss": 0.5094, + "step": 9816 + }, + { + "epoch": 26.749318801089917, + "grad_norm": 7.143017768859863, + "learning_rate": 1.7184796423049258e-05, + "loss": 0.5666, + "step": 9817 + }, + { + "epoch": 26.752043596730246, + "grad_norm": 7.0420451164245605, + "learning_rate": 1.7184182577704308e-05, + "loss": 0.7675, + "step": 9818 + }, + { + "epoch": 26.754768392370572, + "grad_norm": 7.085203647613525, + "learning_rate": 1.7183568676409177e-05, + "loss": 0.5901, + "step": 9819 + }, + { + "epoch": 26.757493188010898, + "grad_norm": 17.482250213623047, + "learning_rate": 1.7182954719168644e-05, + "loss": 0.5327, + "step": 9820 + }, + { + "epoch": 26.760217983651227, + "grad_norm": 8.615785598754883, + "learning_rate": 1.7182340705987493e-05, + "loss": 0.6075, + "step": 9821 + }, + { + "epoch": 26.762942779291553, + "grad_norm": 11.417250633239746, + "learning_rate": 1.7181726636870503e-05, + "loss": 0.6096, + "step": 9822 + }, + { + "epoch": 26.76566757493188, + "grad_norm": 7.919449806213379, + "learning_rate": 1.7181112511822454e-05, + "loss": 0.5388, + "step": 9823 + }, + { + "epoch": 26.768392370572208, + "grad_norm": 7.389474868774414, + "learning_rate": 1.7180498330848136e-05, + "loss": 0.7375, + "step": 9824 + }, + { + "epoch": 26.771117166212534, + "grad_norm": 8.586124420166016, + "learning_rate": 1.7179884093952323e-05, + "loss": 0.5284, + "step": 9825 + }, + { + "epoch": 26.77384196185286, + "grad_norm": 8.27129077911377, + "learning_rate": 1.717926980113981e-05, + "loss": 0.5146, + "step": 9826 + }, + { + "epoch": 26.77656675749319, + "grad_norm": 6.685294151306152, + "learning_rate": 1.717865545241537e-05, + "loss": 0.5565, + "step": 9827 + }, + { + "epoch": 26.779291553133515, + "grad_norm": 9.088601112365723, + "learning_rate": 1.7178041047783794e-05, + "loss": 0.5798, + "step": 9828 + }, + { + "epoch": 26.78201634877384, + "grad_norm": 8.028997421264648, + "learning_rate": 1.7177426587249867e-05, + "loss": 0.4793, + "step": 9829 + }, + { + "epoch": 26.78474114441417, + "grad_norm": 8.733445167541504, + "learning_rate": 1.717681207081837e-05, + "loss": 0.4783, + "step": 9830 + }, + { + "epoch": 26.787465940054496, + "grad_norm": 6.7583088874816895, + "learning_rate": 1.717619749849409e-05, + "loss": 0.5808, + "step": 9831 + }, + { + "epoch": 26.79019073569482, + "grad_norm": 7.639645576477051, + "learning_rate": 1.717558287028182e-05, + "loss": 0.6336, + "step": 9832 + }, + { + "epoch": 26.79291553133515, + "grad_norm": 6.987443447113037, + "learning_rate": 1.717496818618634e-05, + "loss": 0.5704, + "step": 9833 + }, + { + "epoch": 26.795640326975477, + "grad_norm": 7.344447135925293, + "learning_rate": 1.7174353446212438e-05, + "loss": 0.4557, + "step": 9834 + }, + { + "epoch": 26.798365122615802, + "grad_norm": 7.086408615112305, + "learning_rate": 1.71737386503649e-05, + "loss": 0.5657, + "step": 9835 + }, + { + "epoch": 26.80108991825613, + "grad_norm": 7.556144714355469, + "learning_rate": 1.7173123798648517e-05, + "loss": 0.6652, + "step": 9836 + }, + { + "epoch": 26.803814713896458, + "grad_norm": 15.217717170715332, + "learning_rate": 1.717250889106808e-05, + "loss": 0.5214, + "step": 9837 + }, + { + "epoch": 26.806539509536783, + "grad_norm": 9.909323692321777, + "learning_rate": 1.7171893927628374e-05, + "loss": 0.6533, + "step": 9838 + }, + { + "epoch": 26.809264305177113, + "grad_norm": 9.069902420043945, + "learning_rate": 1.7171278908334188e-05, + "loss": 0.6884, + "step": 9839 + }, + { + "epoch": 26.81198910081744, + "grad_norm": 8.221458435058594, + "learning_rate": 1.717066383319031e-05, + "loss": 0.6047, + "step": 9840 + }, + { + "epoch": 26.814713896457764, + "grad_norm": 7.048707962036133, + "learning_rate": 1.7170048702201536e-05, + "loss": 0.6982, + "step": 9841 + }, + { + "epoch": 26.817438692098094, + "grad_norm": 8.236212730407715, + "learning_rate": 1.7169433515372652e-05, + "loss": 0.6212, + "step": 9842 + }, + { + "epoch": 26.82016348773842, + "grad_norm": 13.191624641418457, + "learning_rate": 1.716881827270845e-05, + "loss": 0.5137, + "step": 9843 + }, + { + "epoch": 26.822888283378745, + "grad_norm": 6.405436038970947, + "learning_rate": 1.7168202974213723e-05, + "loss": 0.5905, + "step": 9844 + }, + { + "epoch": 26.825613079019075, + "grad_norm": 8.298712730407715, + "learning_rate": 1.7167587619893266e-05, + "loss": 0.5558, + "step": 9845 + }, + { + "epoch": 26.8283378746594, + "grad_norm": 8.389778137207031, + "learning_rate": 1.7166972209751863e-05, + "loss": 0.6276, + "step": 9846 + }, + { + "epoch": 26.831062670299726, + "grad_norm": 8.159259796142578, + "learning_rate": 1.716635674379431e-05, + "loss": 0.6414, + "step": 9847 + }, + { + "epoch": 26.833787465940055, + "grad_norm": 9.523921012878418, + "learning_rate": 1.7165741222025404e-05, + "loss": 0.5206, + "step": 9848 + }, + { + "epoch": 26.83651226158038, + "grad_norm": 8.652966499328613, + "learning_rate": 1.7165125644449935e-05, + "loss": 0.5121, + "step": 9849 + }, + { + "epoch": 26.839237057220707, + "grad_norm": 8.350944519042969, + "learning_rate": 1.7164510011072698e-05, + "loss": 0.4707, + "step": 9850 + }, + { + "epoch": 26.841961852861036, + "grad_norm": 7.804934024810791, + "learning_rate": 1.7163894321898484e-05, + "loss": 0.501, + "step": 9851 + }, + { + "epoch": 26.844686648501362, + "grad_norm": 7.301161766052246, + "learning_rate": 1.7163278576932096e-05, + "loss": 0.5817, + "step": 9852 + }, + { + "epoch": 26.847411444141688, + "grad_norm": 9.36557674407959, + "learning_rate": 1.7162662776178326e-05, + "loss": 0.4836, + "step": 9853 + }, + { + "epoch": 26.850136239782017, + "grad_norm": 7.538303375244141, + "learning_rate": 1.7162046919641965e-05, + "loss": 0.5938, + "step": 9854 + }, + { + "epoch": 26.852861035422343, + "grad_norm": 7.781804084777832, + "learning_rate": 1.7161431007327817e-05, + "loss": 0.4291, + "step": 9855 + }, + { + "epoch": 26.85558583106267, + "grad_norm": 9.716976165771484, + "learning_rate": 1.7160815039240673e-05, + "loss": 0.5191, + "step": 9856 + }, + { + "epoch": 26.858310626703, + "grad_norm": 8.597269058227539, + "learning_rate": 1.716019901538533e-05, + "loss": 0.6948, + "step": 9857 + }, + { + "epoch": 26.861035422343324, + "grad_norm": 36.90464782714844, + "learning_rate": 1.715958293576659e-05, + "loss": 0.6644, + "step": 9858 + }, + { + "epoch": 26.86376021798365, + "grad_norm": 8.590659141540527, + "learning_rate": 1.7158966800389248e-05, + "loss": 0.6661, + "step": 9859 + }, + { + "epoch": 26.86648501362398, + "grad_norm": 7.516275405883789, + "learning_rate": 1.7158350609258102e-05, + "loss": 0.5664, + "step": 9860 + }, + { + "epoch": 26.869209809264305, + "grad_norm": 8.420100212097168, + "learning_rate": 1.7157734362377954e-05, + "loss": 0.6704, + "step": 9861 + }, + { + "epoch": 26.87193460490463, + "grad_norm": 10.217272758483887, + "learning_rate": 1.71571180597536e-05, + "loss": 0.6155, + "step": 9862 + }, + { + "epoch": 26.87465940054496, + "grad_norm": 8.462159156799316, + "learning_rate": 1.715650170138984e-05, + "loss": 0.574, + "step": 9863 + }, + { + "epoch": 26.877384196185286, + "grad_norm": 8.050196647644043, + "learning_rate": 1.7155885287291477e-05, + "loss": 0.5557, + "step": 9864 + }, + { + "epoch": 26.88010899182561, + "grad_norm": 8.381481170654297, + "learning_rate": 1.715526881746331e-05, + "loss": 0.5322, + "step": 9865 + }, + { + "epoch": 26.88283378746594, + "grad_norm": 7.986210823059082, + "learning_rate": 1.7154652291910134e-05, + "loss": 0.5847, + "step": 9866 + }, + { + "epoch": 26.885558583106267, + "grad_norm": 8.827322006225586, + "learning_rate": 1.7154035710636764e-05, + "loss": 0.4438, + "step": 9867 + }, + { + "epoch": 26.888283378746593, + "grad_norm": 7.283189296722412, + "learning_rate": 1.715341907364799e-05, + "loss": 0.5301, + "step": 9868 + }, + { + "epoch": 26.891008174386922, + "grad_norm": 8.739351272583008, + "learning_rate": 1.7152802380948618e-05, + "loss": 0.5347, + "step": 9869 + }, + { + "epoch": 26.893732970027248, + "grad_norm": 8.528818130493164, + "learning_rate": 1.7152185632543453e-05, + "loss": 0.5613, + "step": 9870 + }, + { + "epoch": 26.896457765667574, + "grad_norm": 8.095894813537598, + "learning_rate": 1.7151568828437294e-05, + "loss": 0.5068, + "step": 9871 + }, + { + "epoch": 26.899182561307903, + "grad_norm": 6.297325611114502, + "learning_rate": 1.7150951968634947e-05, + "loss": 0.5719, + "step": 9872 + }, + { + "epoch": 26.90190735694823, + "grad_norm": 15.39514446258545, + "learning_rate": 1.715033505314122e-05, + "loss": 0.5058, + "step": 9873 + }, + { + "epoch": 26.904632152588555, + "grad_norm": 9.491486549377441, + "learning_rate": 1.7149718081960912e-05, + "loss": 0.6662, + "step": 9874 + }, + { + "epoch": 26.907356948228884, + "grad_norm": 9.023232460021973, + "learning_rate": 1.714910105509883e-05, + "loss": 0.566, + "step": 9875 + }, + { + "epoch": 26.91008174386921, + "grad_norm": 10.471985816955566, + "learning_rate": 1.7148483972559778e-05, + "loss": 0.5975, + "step": 9876 + }, + { + "epoch": 26.912806539509535, + "grad_norm": 7.666295528411865, + "learning_rate": 1.7147866834348567e-05, + "loss": 0.7562, + "step": 9877 + }, + { + "epoch": 26.915531335149865, + "grad_norm": 6.589531898498535, + "learning_rate": 1.7147249640469995e-05, + "loss": 0.6293, + "step": 9878 + }, + { + "epoch": 26.91825613079019, + "grad_norm": 15.742155075073242, + "learning_rate": 1.7146632390928874e-05, + "loss": 0.5092, + "step": 9879 + }, + { + "epoch": 26.920980926430516, + "grad_norm": 7.420589447021484, + "learning_rate": 1.7146015085730006e-05, + "loss": 0.5157, + "step": 9880 + }, + { + "epoch": 26.923705722070846, + "grad_norm": 7.282872676849365, + "learning_rate": 1.7145397724878208e-05, + "loss": 0.584, + "step": 9881 + }, + { + "epoch": 26.92643051771117, + "grad_norm": 6.97989559173584, + "learning_rate": 1.7144780308378283e-05, + "loss": 0.452, + "step": 9882 + }, + { + "epoch": 26.929155313351497, + "grad_norm": 7.551604747772217, + "learning_rate": 1.7144162836235036e-05, + "loss": 0.5566, + "step": 9883 + }, + { + "epoch": 26.931880108991827, + "grad_norm": 8.512497901916504, + "learning_rate": 1.7143545308453274e-05, + "loss": 0.6614, + "step": 9884 + }, + { + "epoch": 26.934604904632153, + "grad_norm": 8.548844337463379, + "learning_rate": 1.714292772503782e-05, + "loss": 0.6156, + "step": 9885 + }, + { + "epoch": 26.93732970027248, + "grad_norm": 8.930683135986328, + "learning_rate": 1.714231008599347e-05, + "loss": 0.6012, + "step": 9886 + }, + { + "epoch": 26.940054495912808, + "grad_norm": 8.837637901306152, + "learning_rate": 1.7141692391325038e-05, + "loss": 0.6991, + "step": 9887 + }, + { + "epoch": 26.942779291553133, + "grad_norm": 7.4434332847595215, + "learning_rate": 1.714107464103734e-05, + "loss": 0.6538, + "step": 9888 + }, + { + "epoch": 26.94550408719346, + "grad_norm": 6.97316837310791, + "learning_rate": 1.714045683513518e-05, + "loss": 0.5726, + "step": 9889 + }, + { + "epoch": 26.94822888283379, + "grad_norm": 7.7166008949279785, + "learning_rate": 1.7139838973623372e-05, + "loss": 0.5148, + "step": 9890 + }, + { + "epoch": 26.950953678474114, + "grad_norm": 10.185364723205566, + "learning_rate": 1.7139221056506728e-05, + "loss": 0.6141, + "step": 9891 + }, + { + "epoch": 26.95367847411444, + "grad_norm": 7.110172271728516, + "learning_rate": 1.7138603083790058e-05, + "loss": 0.4905, + "step": 9892 + }, + { + "epoch": 26.95640326975477, + "grad_norm": 21.275188446044922, + "learning_rate": 1.713798505547818e-05, + "loss": 0.5323, + "step": 9893 + }, + { + "epoch": 26.959128065395095, + "grad_norm": 14.872252464294434, + "learning_rate": 1.7137366971575905e-05, + "loss": 0.5959, + "step": 9894 + }, + { + "epoch": 26.96185286103542, + "grad_norm": 6.733795166015625, + "learning_rate": 1.7136748832088043e-05, + "loss": 0.4517, + "step": 9895 + }, + { + "epoch": 26.96457765667575, + "grad_norm": 8.441132545471191, + "learning_rate": 1.713613063701941e-05, + "loss": 0.6322, + "step": 9896 + }, + { + "epoch": 26.967302452316076, + "grad_norm": 10.844657897949219, + "learning_rate": 1.7135512386374823e-05, + "loss": 0.7972, + "step": 9897 + }, + { + "epoch": 26.970027247956402, + "grad_norm": 8.176034927368164, + "learning_rate": 1.7134894080159096e-05, + "loss": 0.7691, + "step": 9898 + }, + { + "epoch": 26.97275204359673, + "grad_norm": 9.46308708190918, + "learning_rate": 1.7134275718377043e-05, + "loss": 0.575, + "step": 9899 + }, + { + "epoch": 26.975476839237057, + "grad_norm": 8.104681015014648, + "learning_rate": 1.713365730103348e-05, + "loss": 0.6555, + "step": 9900 + }, + { + "epoch": 26.978201634877383, + "grad_norm": 8.981183052062988, + "learning_rate": 1.7133038828133224e-05, + "loss": 0.5291, + "step": 9901 + }, + { + "epoch": 26.980926430517712, + "grad_norm": 10.914739608764648, + "learning_rate": 1.713242029968109e-05, + "loss": 0.7823, + "step": 9902 + }, + { + "epoch": 26.983651226158038, + "grad_norm": 9.093073844909668, + "learning_rate": 1.71318017156819e-05, + "loss": 0.4865, + "step": 9903 + }, + { + "epoch": 26.986376021798364, + "grad_norm": 7.77921724319458, + "learning_rate": 1.7131183076140462e-05, + "loss": 0.6554, + "step": 9904 + }, + { + "epoch": 26.989100817438693, + "grad_norm": 8.578624725341797, + "learning_rate": 1.7130564381061603e-05, + "loss": 0.511, + "step": 9905 + }, + { + "epoch": 26.99182561307902, + "grad_norm": 9.18174934387207, + "learning_rate": 1.7129945630450136e-05, + "loss": 0.5055, + "step": 9906 + }, + { + "epoch": 26.994550408719345, + "grad_norm": 6.425988674163818, + "learning_rate": 1.7129326824310882e-05, + "loss": 0.7188, + "step": 9907 + }, + { + "epoch": 26.997275204359674, + "grad_norm": 8.770267486572266, + "learning_rate": 1.7128707962648662e-05, + "loss": 0.4218, + "step": 9908 + }, + { + "epoch": 27.0, + "grad_norm": 10.719183921813965, + "learning_rate": 1.7128089045468294e-05, + "loss": 0.53, + "step": 9909 + }, + { + "epoch": 27.002724795640326, + "grad_norm": 7.504054069519043, + "learning_rate": 1.71274700727746e-05, + "loss": 0.6198, + "step": 9910 + }, + { + "epoch": 27.005449591280655, + "grad_norm": 10.078618049621582, + "learning_rate": 1.7126851044572395e-05, + "loss": 0.655, + "step": 9911 + }, + { + "epoch": 27.00817438692098, + "grad_norm": 9.173070907592773, + "learning_rate": 1.7126231960866505e-05, + "loss": 0.5139, + "step": 9912 + }, + { + "epoch": 27.010899182561307, + "grad_norm": 7.0432820320129395, + "learning_rate": 1.7125612821661746e-05, + "loss": 0.4684, + "step": 9913 + }, + { + "epoch": 27.013623978201636, + "grad_norm": 7.106161117553711, + "learning_rate": 1.7124993626962946e-05, + "loss": 0.5553, + "step": 9914 + }, + { + "epoch": 27.016348773841962, + "grad_norm": 5.988898277282715, + "learning_rate": 1.7124374376774926e-05, + "loss": 0.6425, + "step": 9915 + }, + { + "epoch": 27.019073569482288, + "grad_norm": 16.35003089904785, + "learning_rate": 1.712375507110251e-05, + "loss": 0.6501, + "step": 9916 + }, + { + "epoch": 27.021798365122617, + "grad_norm": 9.020776748657227, + "learning_rate": 1.7123135709950515e-05, + "loss": 0.566, + "step": 9917 + }, + { + "epoch": 27.024523160762943, + "grad_norm": 6.925570964813232, + "learning_rate": 1.7122516293323767e-05, + "loss": 0.4954, + "step": 9918 + }, + { + "epoch": 27.02724795640327, + "grad_norm": 7.659992694854736, + "learning_rate": 1.7121896821227094e-05, + "loss": 0.4759, + "step": 9919 + }, + { + "epoch": 27.029972752043598, + "grad_norm": 12.315473556518555, + "learning_rate": 1.712127729366532e-05, + "loss": 0.5403, + "step": 9920 + }, + { + "epoch": 27.032697547683924, + "grad_norm": 7.5261383056640625, + "learning_rate": 1.7120657710643264e-05, + "loss": 0.6048, + "step": 9921 + }, + { + "epoch": 27.03542234332425, + "grad_norm": 7.493836402893066, + "learning_rate": 1.7120038072165756e-05, + "loss": 0.5029, + "step": 9922 + }, + { + "epoch": 27.03814713896458, + "grad_norm": 7.221220970153809, + "learning_rate": 1.7119418378237623e-05, + "loss": 0.6017, + "step": 9923 + }, + { + "epoch": 27.040871934604905, + "grad_norm": 7.582027435302734, + "learning_rate": 1.7118798628863685e-05, + "loss": 0.6014, + "step": 9924 + }, + { + "epoch": 27.04359673024523, + "grad_norm": 10.846917152404785, + "learning_rate": 1.7118178824048774e-05, + "loss": 0.5579, + "step": 9925 + }, + { + "epoch": 27.04632152588556, + "grad_norm": 7.30008602142334, + "learning_rate": 1.7117558963797715e-05, + "loss": 0.5022, + "step": 9926 + }, + { + "epoch": 27.049046321525886, + "grad_norm": 6.973043441772461, + "learning_rate": 1.7116939048115336e-05, + "loss": 0.4575, + "step": 9927 + }, + { + "epoch": 27.05177111716621, + "grad_norm": 7.097996711730957, + "learning_rate": 1.711631907700647e-05, + "loss": 0.4754, + "step": 9928 + }, + { + "epoch": 27.05449591280654, + "grad_norm": 9.277467727661133, + "learning_rate": 1.711569905047593e-05, + "loss": 0.676, + "step": 9929 + }, + { + "epoch": 27.057220708446867, + "grad_norm": 7.5056610107421875, + "learning_rate": 1.7115078968528563e-05, + "loss": 0.6619, + "step": 9930 + }, + { + "epoch": 27.059945504087192, + "grad_norm": 8.805801391601562, + "learning_rate": 1.7114458831169184e-05, + "loss": 0.5337, + "step": 9931 + }, + { + "epoch": 27.06267029972752, + "grad_norm": 7.667728424072266, + "learning_rate": 1.7113838638402633e-05, + "loss": 0.4593, + "step": 9932 + }, + { + "epoch": 27.065395095367847, + "grad_norm": 12.151493072509766, + "learning_rate": 1.7113218390233734e-05, + "loss": 0.6071, + "step": 9933 + }, + { + "epoch": 27.068119891008173, + "grad_norm": 7.711685657501221, + "learning_rate": 1.711259808666732e-05, + "loss": 0.5402, + "step": 9934 + }, + { + "epoch": 27.070844686648503, + "grad_norm": 10.571061134338379, + "learning_rate": 1.711197772770822e-05, + "loss": 0.3903, + "step": 9935 + }, + { + "epoch": 27.07356948228883, + "grad_norm": 7.110350608825684, + "learning_rate": 1.7111357313361264e-05, + "loss": 0.4113, + "step": 9936 + }, + { + "epoch": 27.076294277929154, + "grad_norm": 15.685750007629395, + "learning_rate": 1.7110736843631294e-05, + "loss": 0.6638, + "step": 9937 + }, + { + "epoch": 27.079019073569484, + "grad_norm": 6.967113971710205, + "learning_rate": 1.7110116318523126e-05, + "loss": 0.5338, + "step": 9938 + }, + { + "epoch": 27.08174386920981, + "grad_norm": 9.692916870117188, + "learning_rate": 1.7109495738041605e-05, + "loss": 0.5378, + "step": 9939 + }, + { + "epoch": 27.084468664850135, + "grad_norm": 6.948312282562256, + "learning_rate": 1.7108875102191557e-05, + "loss": 0.4175, + "step": 9940 + }, + { + "epoch": 27.087193460490465, + "grad_norm": 7.597878456115723, + "learning_rate": 1.7108254410977822e-05, + "loss": 0.4593, + "step": 9941 + }, + { + "epoch": 27.08991825613079, + "grad_norm": 7.904601097106934, + "learning_rate": 1.710763366440523e-05, + "loss": 0.4382, + "step": 9942 + }, + { + "epoch": 27.092643051771116, + "grad_norm": 9.962733268737793, + "learning_rate": 1.7107012862478614e-05, + "loss": 0.4148, + "step": 9943 + }, + { + "epoch": 27.095367847411445, + "grad_norm": 9.055351257324219, + "learning_rate": 1.710639200520281e-05, + "loss": 0.4607, + "step": 9944 + }, + { + "epoch": 27.09809264305177, + "grad_norm": 7.320572376251221, + "learning_rate": 1.7105771092582655e-05, + "loss": 0.5253, + "step": 9945 + }, + { + "epoch": 27.100817438692097, + "grad_norm": 7.846962928771973, + "learning_rate": 1.7105150124622985e-05, + "loss": 0.6495, + "step": 9946 + }, + { + "epoch": 27.103542234332426, + "grad_norm": 7.681886672973633, + "learning_rate": 1.7104529101328632e-05, + "loss": 0.573, + "step": 9947 + }, + { + "epoch": 27.106267029972752, + "grad_norm": 11.92682933807373, + "learning_rate": 1.7103908022704436e-05, + "loss": 0.4685, + "step": 9948 + }, + { + "epoch": 27.108991825613078, + "grad_norm": 8.032818794250488, + "learning_rate": 1.7103286888755237e-05, + "loss": 0.5396, + "step": 9949 + }, + { + "epoch": 27.111716621253407, + "grad_norm": 6.875002384185791, + "learning_rate": 1.710266569948586e-05, + "loss": 0.591, + "step": 9950 + }, + { + "epoch": 27.114441416893733, + "grad_norm": 10.565400123596191, + "learning_rate": 1.7102044454901155e-05, + "loss": 0.5151, + "step": 9951 + }, + { + "epoch": 27.11716621253406, + "grad_norm": 7.093526363372803, + "learning_rate": 1.7101423155005957e-05, + "loss": 0.5104, + "step": 9952 + }, + { + "epoch": 27.11989100817439, + "grad_norm": 7.847536563873291, + "learning_rate": 1.7100801799805104e-05, + "loss": 0.5755, + "step": 9953 + }, + { + "epoch": 27.122615803814714, + "grad_norm": 9.526288986206055, + "learning_rate": 1.7100180389303435e-05, + "loss": 0.4774, + "step": 9954 + }, + { + "epoch": 27.12534059945504, + "grad_norm": 7.164559364318848, + "learning_rate": 1.7099558923505792e-05, + "loss": 0.5342, + "step": 9955 + }, + { + "epoch": 27.12806539509537, + "grad_norm": 6.162780284881592, + "learning_rate": 1.709893740241701e-05, + "loss": 0.3869, + "step": 9956 + }, + { + "epoch": 27.130790190735695, + "grad_norm": 7.655863285064697, + "learning_rate": 1.7098315826041932e-05, + "loss": 0.4987, + "step": 9957 + }, + { + "epoch": 27.13351498637602, + "grad_norm": 7.7024359703063965, + "learning_rate": 1.7097694194385395e-05, + "loss": 0.6907, + "step": 9958 + }, + { + "epoch": 27.13623978201635, + "grad_norm": 6.282317638397217, + "learning_rate": 1.709707250745225e-05, + "loss": 0.4347, + "step": 9959 + }, + { + "epoch": 27.138964577656676, + "grad_norm": 8.424469947814941, + "learning_rate": 1.7096450765247333e-05, + "loss": 0.5565, + "step": 9960 + }, + { + "epoch": 27.141689373297, + "grad_norm": 7.163951873779297, + "learning_rate": 1.7095828967775485e-05, + "loss": 0.461, + "step": 9961 + }, + { + "epoch": 27.14441416893733, + "grad_norm": 19.0053768157959, + "learning_rate": 1.7095207115041546e-05, + "loss": 0.5612, + "step": 9962 + }, + { + "epoch": 27.147138964577657, + "grad_norm": 10.031600952148438, + "learning_rate": 1.7094585207050363e-05, + "loss": 0.6506, + "step": 9963 + }, + { + "epoch": 27.149863760217983, + "grad_norm": 6.632686614990234, + "learning_rate": 1.709396324380678e-05, + "loss": 0.4497, + "step": 9964 + }, + { + "epoch": 27.152588555858312, + "grad_norm": 6.571283340454102, + "learning_rate": 1.709334122531564e-05, + "loss": 0.6563, + "step": 9965 + }, + { + "epoch": 27.155313351498638, + "grad_norm": 10.044163703918457, + "learning_rate": 1.7092719151581786e-05, + "loss": 0.5818, + "step": 9966 + }, + { + "epoch": 27.158038147138964, + "grad_norm": 7.754175186157227, + "learning_rate": 1.7092097022610064e-05, + "loss": 0.4387, + "step": 9967 + }, + { + "epoch": 27.160762942779293, + "grad_norm": 8.865942001342773, + "learning_rate": 1.709147483840532e-05, + "loss": 0.5388, + "step": 9968 + }, + { + "epoch": 27.16348773841962, + "grad_norm": 8.810154914855957, + "learning_rate": 1.7090852598972398e-05, + "loss": 0.4935, + "step": 9969 + }, + { + "epoch": 27.166212534059945, + "grad_norm": 7.3079681396484375, + "learning_rate": 1.7090230304316142e-05, + "loss": 0.5281, + "step": 9970 + }, + { + "epoch": 27.168937329700274, + "grad_norm": 9.283902168273926, + "learning_rate": 1.7089607954441403e-05, + "loss": 0.5385, + "step": 9971 + }, + { + "epoch": 27.1716621253406, + "grad_norm": 8.04033374786377, + "learning_rate": 1.7088985549353024e-05, + "loss": 0.3656, + "step": 9972 + }, + { + "epoch": 27.174386920980925, + "grad_norm": 12.064838409423828, + "learning_rate": 1.7088363089055854e-05, + "loss": 0.488, + "step": 9973 + }, + { + "epoch": 27.177111716621255, + "grad_norm": 6.4653544425964355, + "learning_rate": 1.708774057355474e-05, + "loss": 0.6996, + "step": 9974 + }, + { + "epoch": 27.17983651226158, + "grad_norm": 7.534409046173096, + "learning_rate": 1.708711800285453e-05, + "loss": 0.5007, + "step": 9975 + }, + { + "epoch": 27.182561307901906, + "grad_norm": 7.947213172912598, + "learning_rate": 1.7086495376960073e-05, + "loss": 0.543, + "step": 9976 + }, + { + "epoch": 27.185286103542236, + "grad_norm": 8.628761291503906, + "learning_rate": 1.708587269587622e-05, + "loss": 0.4768, + "step": 9977 + }, + { + "epoch": 27.18801089918256, + "grad_norm": 8.160655975341797, + "learning_rate": 1.7085249959607818e-05, + "loss": 0.6144, + "step": 9978 + }, + { + "epoch": 27.190735694822887, + "grad_norm": 6.389145851135254, + "learning_rate": 1.7084627168159716e-05, + "loss": 0.7598, + "step": 9979 + }, + { + "epoch": 27.193460490463217, + "grad_norm": 7.102512836456299, + "learning_rate": 1.708400432153677e-05, + "loss": 0.4783, + "step": 9980 + }, + { + "epoch": 27.196185286103542, + "grad_norm": 6.776620864868164, + "learning_rate": 1.7083381419743817e-05, + "loss": 0.5002, + "step": 9981 + }, + { + "epoch": 27.19891008174387, + "grad_norm": 6.986589431762695, + "learning_rate": 1.7082758462785728e-05, + "loss": 0.5826, + "step": 9982 + }, + { + "epoch": 27.201634877384198, + "grad_norm": 6.739128589630127, + "learning_rate": 1.7082135450667335e-05, + "loss": 0.5797, + "step": 9983 + }, + { + "epoch": 27.204359673024523, + "grad_norm": 10.087153434753418, + "learning_rate": 1.7081512383393507e-05, + "loss": 0.4793, + "step": 9984 + }, + { + "epoch": 27.20708446866485, + "grad_norm": 7.079504489898682, + "learning_rate": 1.7080889260969083e-05, + "loss": 0.644, + "step": 9985 + }, + { + "epoch": 27.20980926430518, + "grad_norm": 7.418025493621826, + "learning_rate": 1.708026608339892e-05, + "loss": 0.4905, + "step": 9986 + }, + { + "epoch": 27.212534059945504, + "grad_norm": 7.351944446563721, + "learning_rate": 1.7079642850687877e-05, + "loss": 0.5712, + "step": 9987 + }, + { + "epoch": 27.21525885558583, + "grad_norm": 7.845609664916992, + "learning_rate": 1.7079019562840805e-05, + "loss": 0.7001, + "step": 9988 + }, + { + "epoch": 27.21798365122616, + "grad_norm": 9.999709129333496, + "learning_rate": 1.7078396219862555e-05, + "loss": 0.6672, + "step": 9989 + }, + { + "epoch": 27.220708446866485, + "grad_norm": 8.453604698181152, + "learning_rate": 1.707777282175798e-05, + "loss": 0.5795, + "step": 9990 + }, + { + "epoch": 27.22343324250681, + "grad_norm": 8.12509536743164, + "learning_rate": 1.707714936853194e-05, + "loss": 0.4963, + "step": 9991 + }, + { + "epoch": 27.22615803814714, + "grad_norm": 8.132515907287598, + "learning_rate": 1.7076525860189287e-05, + "loss": 0.642, + "step": 9992 + }, + { + "epoch": 27.228882833787466, + "grad_norm": 7.824767589569092, + "learning_rate": 1.707590229673488e-05, + "loss": 0.3948, + "step": 9993 + }, + { + "epoch": 27.231607629427792, + "grad_norm": 6.789891242980957, + "learning_rate": 1.7075278678173574e-05, + "loss": 0.4338, + "step": 9994 + }, + { + "epoch": 27.23433242506812, + "grad_norm": 7.379485130310059, + "learning_rate": 1.7074655004510225e-05, + "loss": 0.4098, + "step": 9995 + }, + { + "epoch": 27.237057220708447, + "grad_norm": 6.867528915405273, + "learning_rate": 1.7074031275749686e-05, + "loss": 0.575, + "step": 9996 + }, + { + "epoch": 27.239782016348773, + "grad_norm": 6.640412330627441, + "learning_rate": 1.7073407491896824e-05, + "loss": 0.5046, + "step": 9997 + }, + { + "epoch": 27.242506811989102, + "grad_norm": 7.1053786277771, + "learning_rate": 1.7072783652956493e-05, + "loss": 0.5579, + "step": 9998 + }, + { + "epoch": 27.245231607629428, + "grad_norm": 9.06983757019043, + "learning_rate": 1.707215975893355e-05, + "loss": 0.5596, + "step": 9999 + }, + { + "epoch": 27.247956403269754, + "grad_norm": 7.0437912940979, + "learning_rate": 1.7071535809832852e-05, + "loss": 0.6115, + "step": 10000 + }, + { + "epoch": 27.250681198910083, + "grad_norm": 9.336917877197266, + "learning_rate": 1.707091180565926e-05, + "loss": 0.4551, + "step": 10001 + }, + { + "epoch": 27.25340599455041, + "grad_norm": 7.803974151611328, + "learning_rate": 1.7070287746417636e-05, + "loss": 0.4794, + "step": 10002 + }, + { + "epoch": 27.256130790190735, + "grad_norm": 10.840062141418457, + "learning_rate": 1.706966363211284e-05, + "loss": 0.5307, + "step": 10003 + }, + { + "epoch": 27.258855585831064, + "grad_norm": 7.2597336769104, + "learning_rate": 1.7069039462749734e-05, + "loss": 0.6178, + "step": 10004 + }, + { + "epoch": 27.26158038147139, + "grad_norm": 7.98543119430542, + "learning_rate": 1.706841523833317e-05, + "loss": 0.5807, + "step": 10005 + }, + { + "epoch": 27.264305177111716, + "grad_norm": 9.968547821044922, + "learning_rate": 1.7067790958868017e-05, + "loss": 0.6636, + "step": 10006 + }, + { + "epoch": 27.267029972752045, + "grad_norm": 9.231914520263672, + "learning_rate": 1.7067166624359138e-05, + "loss": 0.47, + "step": 10007 + }, + { + "epoch": 27.26975476839237, + "grad_norm": 8.400660514831543, + "learning_rate": 1.706654223481139e-05, + "loss": 0.5679, + "step": 10008 + }, + { + "epoch": 27.272479564032697, + "grad_norm": 8.488985061645508, + "learning_rate": 1.706591779022964e-05, + "loss": 0.5359, + "step": 10009 + }, + { + "epoch": 27.275204359673026, + "grad_norm": 6.763240337371826, + "learning_rate": 1.706529329061875e-05, + "loss": 0.5494, + "step": 10010 + }, + { + "epoch": 27.277929155313352, + "grad_norm": 7.996668815612793, + "learning_rate": 1.706466873598358e-05, + "loss": 0.4254, + "step": 10011 + }, + { + "epoch": 27.280653950953678, + "grad_norm": 8.270384788513184, + "learning_rate": 1.7064044126329e-05, + "loss": 0.4733, + "step": 10012 + }, + { + "epoch": 27.283378746594007, + "grad_norm": 7.509069442749023, + "learning_rate": 1.706341946165987e-05, + "loss": 0.5413, + "step": 10013 + }, + { + "epoch": 27.286103542234333, + "grad_norm": 9.132331848144531, + "learning_rate": 1.706279474198106e-05, + "loss": 0.4437, + "step": 10014 + }, + { + "epoch": 27.28882833787466, + "grad_norm": 6.917953014373779, + "learning_rate": 1.7062169967297432e-05, + "loss": 0.4746, + "step": 10015 + }, + { + "epoch": 27.291553133514988, + "grad_norm": 7.6658477783203125, + "learning_rate": 1.7061545137613847e-05, + "loss": 0.7435, + "step": 10016 + }, + { + "epoch": 27.294277929155314, + "grad_norm": 7.395020961761475, + "learning_rate": 1.706092025293518e-05, + "loss": 0.4034, + "step": 10017 + }, + { + "epoch": 27.29700272479564, + "grad_norm": 6.857711315155029, + "learning_rate": 1.7060295313266292e-05, + "loss": 0.4524, + "step": 10018 + }, + { + "epoch": 27.29972752043597, + "grad_norm": 8.136479377746582, + "learning_rate": 1.7059670318612053e-05, + "loss": 0.3506, + "step": 10019 + }, + { + "epoch": 27.302452316076295, + "grad_norm": 8.787403106689453, + "learning_rate": 1.7059045268977325e-05, + "loss": 0.4917, + "step": 10020 + }, + { + "epoch": 27.30517711171662, + "grad_norm": 6.448479175567627, + "learning_rate": 1.705842016436698e-05, + "loss": 0.5216, + "step": 10021 + }, + { + "epoch": 27.30790190735695, + "grad_norm": 6.3374481201171875, + "learning_rate": 1.705779500478589e-05, + "loss": 0.5302, + "step": 10022 + }, + { + "epoch": 27.310626702997276, + "grad_norm": 7.888910293579102, + "learning_rate": 1.7057169790238916e-05, + "loss": 0.5046, + "step": 10023 + }, + { + "epoch": 27.3133514986376, + "grad_norm": 8.027619361877441, + "learning_rate": 1.705654452073093e-05, + "loss": 0.6215, + "step": 10024 + }, + { + "epoch": 27.31607629427793, + "grad_norm": 8.172956466674805, + "learning_rate": 1.7055919196266806e-05, + "loss": 0.5985, + "step": 10025 + }, + { + "epoch": 27.318801089918257, + "grad_norm": 7.377542972564697, + "learning_rate": 1.705529381685141e-05, + "loss": 0.5151, + "step": 10026 + }, + { + "epoch": 27.321525885558582, + "grad_norm": 7.448740005493164, + "learning_rate": 1.705466838248961e-05, + "loss": 0.5624, + "step": 10027 + }, + { + "epoch": 27.32425068119891, + "grad_norm": 7.380115032196045, + "learning_rate": 1.705404289318628e-05, + "loss": 0.5007, + "step": 10028 + }, + { + "epoch": 27.326975476839237, + "grad_norm": 7.7183518409729, + "learning_rate": 1.7053417348946293e-05, + "loss": 0.5818, + "step": 10029 + }, + { + "epoch": 27.329700272479563, + "grad_norm": 7.5660719871521, + "learning_rate": 1.705279174977452e-05, + "loss": 0.5103, + "step": 10030 + }, + { + "epoch": 27.332425068119893, + "grad_norm": 12.974373817443848, + "learning_rate": 1.7052166095675827e-05, + "loss": 0.645, + "step": 10031 + }, + { + "epoch": 27.33514986376022, + "grad_norm": 7.177042484283447, + "learning_rate": 1.7051540386655094e-05, + "loss": 0.4811, + "step": 10032 + }, + { + "epoch": 27.337874659400544, + "grad_norm": 9.889019012451172, + "learning_rate": 1.705091462271719e-05, + "loss": 0.7004, + "step": 10033 + }, + { + "epoch": 27.340599455040874, + "grad_norm": 7.093506813049316, + "learning_rate": 1.7050288803866992e-05, + "loss": 0.6276, + "step": 10034 + }, + { + "epoch": 27.3433242506812, + "grad_norm": 9.160090446472168, + "learning_rate": 1.7049662930109373e-05, + "loss": 0.6492, + "step": 10035 + }, + { + "epoch": 27.346049046321525, + "grad_norm": 8.586556434631348, + "learning_rate": 1.7049037001449202e-05, + "loss": 0.5503, + "step": 10036 + }, + { + "epoch": 27.348773841961854, + "grad_norm": 7.525806903839111, + "learning_rate": 1.704841101789136e-05, + "loss": 0.4617, + "step": 10037 + }, + { + "epoch": 27.35149863760218, + "grad_norm": 6.517123699188232, + "learning_rate": 1.704778497944072e-05, + "loss": 0.4512, + "step": 10038 + }, + { + "epoch": 27.354223433242506, + "grad_norm": 8.63493824005127, + "learning_rate": 1.704715888610216e-05, + "loss": 0.5289, + "step": 10039 + }, + { + "epoch": 27.356948228882835, + "grad_norm": 7.07725191116333, + "learning_rate": 1.704653273788055e-05, + "loss": 0.7155, + "step": 10040 + }, + { + "epoch": 27.35967302452316, + "grad_norm": 7.394663333892822, + "learning_rate": 1.704590653478077e-05, + "loss": 0.5936, + "step": 10041 + }, + { + "epoch": 27.362397820163487, + "grad_norm": 7.452281951904297, + "learning_rate": 1.7045280276807697e-05, + "loss": 0.6404, + "step": 10042 + }, + { + "epoch": 27.365122615803816, + "grad_norm": 8.40842056274414, + "learning_rate": 1.7044653963966206e-05, + "loss": 0.7006, + "step": 10043 + }, + { + "epoch": 27.367847411444142, + "grad_norm": 7.894318580627441, + "learning_rate": 1.7044027596261178e-05, + "loss": 0.5676, + "step": 10044 + }, + { + "epoch": 27.370572207084468, + "grad_norm": 8.687544822692871, + "learning_rate": 1.704340117369749e-05, + "loss": 0.4442, + "step": 10045 + }, + { + "epoch": 27.373297002724797, + "grad_norm": 6.665185928344727, + "learning_rate": 1.7042774696280023e-05, + "loss": 0.7184, + "step": 10046 + }, + { + "epoch": 27.376021798365123, + "grad_norm": 6.788980960845947, + "learning_rate": 1.704214816401365e-05, + "loss": 0.6483, + "step": 10047 + }, + { + "epoch": 27.37874659400545, + "grad_norm": 8.649880409240723, + "learning_rate": 1.7041521576903254e-05, + "loss": 0.4934, + "step": 10048 + }, + { + "epoch": 27.381471389645778, + "grad_norm": 6.84049654006958, + "learning_rate": 1.7040894934953715e-05, + "loss": 0.5432, + "step": 10049 + }, + { + "epoch": 27.384196185286104, + "grad_norm": 7.426638126373291, + "learning_rate": 1.7040268238169916e-05, + "loss": 0.4585, + "step": 10050 + }, + { + "epoch": 27.38692098092643, + "grad_norm": 7.961089611053467, + "learning_rate": 1.7039641486556732e-05, + "loss": 0.5002, + "step": 10051 + }, + { + "epoch": 27.38964577656676, + "grad_norm": 8.751544952392578, + "learning_rate": 1.7039014680119046e-05, + "loss": 0.6028, + "step": 10052 + }, + { + "epoch": 27.392370572207085, + "grad_norm": 7.071634292602539, + "learning_rate": 1.703838781886174e-05, + "loss": 0.485, + "step": 10053 + }, + { + "epoch": 27.39509536784741, + "grad_norm": 7.8563456535339355, + "learning_rate": 1.7037760902789696e-05, + "loss": 0.6389, + "step": 10054 + }, + { + "epoch": 27.39782016348774, + "grad_norm": 7.355616569519043, + "learning_rate": 1.7037133931907797e-05, + "loss": 0.4425, + "step": 10055 + }, + { + "epoch": 27.400544959128066, + "grad_norm": 8.382254600524902, + "learning_rate": 1.7036506906220928e-05, + "loss": 0.4914, + "step": 10056 + }, + { + "epoch": 27.40326975476839, + "grad_norm": 7.880213260650635, + "learning_rate": 1.7035879825733965e-05, + "loss": 0.5283, + "step": 10057 + }, + { + "epoch": 27.40599455040872, + "grad_norm": 7.893124103546143, + "learning_rate": 1.70352526904518e-05, + "loss": 0.5607, + "step": 10058 + }, + { + "epoch": 27.408719346049047, + "grad_norm": 8.816205024719238, + "learning_rate": 1.7034625500379312e-05, + "loss": 0.4796, + "step": 10059 + }, + { + "epoch": 27.411444141689373, + "grad_norm": 6.785427093505859, + "learning_rate": 1.7033998255521388e-05, + "loss": 0.7288, + "step": 10060 + }, + { + "epoch": 27.414168937329702, + "grad_norm": 8.814774513244629, + "learning_rate": 1.703337095588291e-05, + "loss": 0.4966, + "step": 10061 + }, + { + "epoch": 27.416893732970028, + "grad_norm": 9.867323875427246, + "learning_rate": 1.703274360146877e-05, + "loss": 0.5505, + "step": 10062 + }, + { + "epoch": 27.419618528610354, + "grad_norm": 12.343128204345703, + "learning_rate": 1.7032116192283844e-05, + "loss": 0.5804, + "step": 10063 + }, + { + "epoch": 27.422343324250683, + "grad_norm": 7.334210395812988, + "learning_rate": 1.7031488728333025e-05, + "loss": 0.4539, + "step": 10064 + }, + { + "epoch": 27.42506811989101, + "grad_norm": 7.609729766845703, + "learning_rate": 1.70308612096212e-05, + "loss": 0.5215, + "step": 10065 + }, + { + "epoch": 27.427792915531334, + "grad_norm": 7.235856533050537, + "learning_rate": 1.703023363615325e-05, + "loss": 0.6719, + "step": 10066 + }, + { + "epoch": 27.430517711171664, + "grad_norm": 10.903604507446289, + "learning_rate": 1.7029606007934073e-05, + "loss": 0.4841, + "step": 10067 + }, + { + "epoch": 27.43324250681199, + "grad_norm": 6.353349685668945, + "learning_rate": 1.7028978324968543e-05, + "loss": 0.616, + "step": 10068 + }, + { + "epoch": 27.435967302452315, + "grad_norm": 9.866066932678223, + "learning_rate": 1.702835058726156e-05, + "loss": 0.5229, + "step": 10069 + }, + { + "epoch": 27.438692098092645, + "grad_norm": 7.57305383682251, + "learning_rate": 1.7027722794818008e-05, + "loss": 0.3775, + "step": 10070 + }, + { + "epoch": 27.44141689373297, + "grad_norm": 22.632381439208984, + "learning_rate": 1.702709494764278e-05, + "loss": 0.4514, + "step": 10071 + }, + { + "epoch": 27.444141689373296, + "grad_norm": 7.173084735870361, + "learning_rate": 1.7026467045740762e-05, + "loss": 0.5573, + "step": 10072 + }, + { + "epoch": 27.446866485013626, + "grad_norm": 8.10495376586914, + "learning_rate": 1.7025839089116843e-05, + "loss": 0.4835, + "step": 10073 + }, + { + "epoch": 27.44959128065395, + "grad_norm": 7.458191394805908, + "learning_rate": 1.7025211077775915e-05, + "loss": 0.4229, + "step": 10074 + }, + { + "epoch": 27.452316076294277, + "grad_norm": 7.296041011810303, + "learning_rate": 1.702458301172287e-05, + "loss": 0.5245, + "step": 10075 + }, + { + "epoch": 27.455040871934607, + "grad_norm": 8.165763854980469, + "learning_rate": 1.70239548909626e-05, + "loss": 0.3905, + "step": 10076 + }, + { + "epoch": 27.457765667574932, + "grad_norm": 10.956998825073242, + "learning_rate": 1.7023326715499994e-05, + "loss": 0.555, + "step": 10077 + }, + { + "epoch": 27.460490463215258, + "grad_norm": 7.5906805992126465, + "learning_rate": 1.7022698485339945e-05, + "loss": 0.6392, + "step": 10078 + }, + { + "epoch": 27.463215258855588, + "grad_norm": 5.883872032165527, + "learning_rate": 1.7022070200487344e-05, + "loss": 0.4222, + "step": 10079 + }, + { + "epoch": 27.465940054495913, + "grad_norm": 7.269608974456787, + "learning_rate": 1.702144186094709e-05, + "loss": 0.4908, + "step": 10080 + }, + { + "epoch": 27.46866485013624, + "grad_norm": 6.971725940704346, + "learning_rate": 1.7020813466724072e-05, + "loss": 0.4449, + "step": 10081 + }, + { + "epoch": 27.47138964577657, + "grad_norm": 7.517458915710449, + "learning_rate": 1.7020185017823185e-05, + "loss": 0.459, + "step": 10082 + }, + { + "epoch": 27.474114441416894, + "grad_norm": 8.003358840942383, + "learning_rate": 1.7019556514249323e-05, + "loss": 0.5072, + "step": 10083 + }, + { + "epoch": 27.47683923705722, + "grad_norm": 7.887994766235352, + "learning_rate": 1.701892795600738e-05, + "loss": 0.4629, + "step": 10084 + }, + { + "epoch": 27.479564032697546, + "grad_norm": 7.413704872131348, + "learning_rate": 1.7018299343102252e-05, + "loss": 0.4489, + "step": 10085 + }, + { + "epoch": 27.482288828337875, + "grad_norm": 8.17776107788086, + "learning_rate": 1.7017670675538834e-05, + "loss": 0.5391, + "step": 10086 + }, + { + "epoch": 27.4850136239782, + "grad_norm": 8.881941795349121, + "learning_rate": 1.7017041953322025e-05, + "loss": 0.4822, + "step": 10087 + }, + { + "epoch": 27.48773841961853, + "grad_norm": 8.7860107421875, + "learning_rate": 1.7016413176456717e-05, + "loss": 0.6063, + "step": 10088 + }, + { + "epoch": 27.490463215258856, + "grad_norm": 8.136934280395508, + "learning_rate": 1.701578434494781e-05, + "loss": 0.5015, + "step": 10089 + }, + { + "epoch": 27.493188010899182, + "grad_norm": 7.738018989562988, + "learning_rate": 1.70151554588002e-05, + "loss": 0.5712, + "step": 10090 + }, + { + "epoch": 27.495912806539508, + "grad_norm": 8.951044082641602, + "learning_rate": 1.7014526518018787e-05, + "loss": 0.4677, + "step": 10091 + }, + { + "epoch": 27.498637602179837, + "grad_norm": 8.95796012878418, + "learning_rate": 1.7013897522608464e-05, + "loss": 0.4974, + "step": 10092 + }, + { + "epoch": 27.501362397820163, + "grad_norm": 6.817696571350098, + "learning_rate": 1.7013268472574133e-05, + "loss": 0.586, + "step": 10093 + }, + { + "epoch": 27.504087193460492, + "grad_norm": 9.146210670471191, + "learning_rate": 1.7012639367920694e-05, + "loss": 0.5119, + "step": 10094 + }, + { + "epoch": 27.506811989100818, + "grad_norm": 8.180194854736328, + "learning_rate": 1.7012010208653044e-05, + "loss": 0.5262, + "step": 10095 + }, + { + "epoch": 27.509536784741144, + "grad_norm": 7.886168956756592, + "learning_rate": 1.7011380994776086e-05, + "loss": 0.55, + "step": 10096 + }, + { + "epoch": 27.51226158038147, + "grad_norm": 7.781095027923584, + "learning_rate": 1.701075172629472e-05, + "loss": 0.4719, + "step": 10097 + }, + { + "epoch": 27.5149863760218, + "grad_norm": 9.938278198242188, + "learning_rate": 1.701012240321384e-05, + "loss": 0.4791, + "step": 10098 + }, + { + "epoch": 27.517711171662125, + "grad_norm": 8.60433578491211, + "learning_rate": 1.7009493025538356e-05, + "loss": 0.5984, + "step": 10099 + }, + { + "epoch": 27.520435967302454, + "grad_norm": 7.6925740242004395, + "learning_rate": 1.7008863593273167e-05, + "loss": 0.4728, + "step": 10100 + }, + { + "epoch": 27.52316076294278, + "grad_norm": 10.18087387084961, + "learning_rate": 1.7008234106423175e-05, + "loss": 0.5426, + "step": 10101 + }, + { + "epoch": 27.525885558583106, + "grad_norm": 8.223434448242188, + "learning_rate": 1.7007604564993277e-05, + "loss": 0.4843, + "step": 10102 + }, + { + "epoch": 27.52861035422343, + "grad_norm": 7.773364067077637, + "learning_rate": 1.7006974968988382e-05, + "loss": 0.5776, + "step": 10103 + }, + { + "epoch": 27.53133514986376, + "grad_norm": 7.327798366546631, + "learning_rate": 1.700634531841339e-05, + "loss": 0.5204, + "step": 10104 + }, + { + "epoch": 27.534059945504087, + "grad_norm": 7.9707512855529785, + "learning_rate": 1.7005715613273206e-05, + "loss": 0.3813, + "step": 10105 + }, + { + "epoch": 27.536784741144416, + "grad_norm": 8.973421096801758, + "learning_rate": 1.7005085853572736e-05, + "loss": 0.5999, + "step": 10106 + }, + { + "epoch": 27.539509536784742, + "grad_norm": 6.864203453063965, + "learning_rate": 1.7004456039316883e-05, + "loss": 0.4249, + "step": 10107 + }, + { + "epoch": 27.542234332425068, + "grad_norm": 8.282187461853027, + "learning_rate": 1.700382617051055e-05, + "loss": 0.6014, + "step": 10108 + }, + { + "epoch": 27.544959128065393, + "grad_norm": 12.412527084350586, + "learning_rate": 1.700319624715865e-05, + "loss": 0.4525, + "step": 10109 + }, + { + "epoch": 27.547683923705723, + "grad_norm": 9.558048248291016, + "learning_rate": 1.7002566269266078e-05, + "loss": 0.3632, + "step": 10110 + }, + { + "epoch": 27.55040871934605, + "grad_norm": 9.724501609802246, + "learning_rate": 1.7001936236837743e-05, + "loss": 0.6462, + "step": 10111 + }, + { + "epoch": 27.553133514986374, + "grad_norm": 8.310857772827148, + "learning_rate": 1.700130614987856e-05, + "loss": 0.5931, + "step": 10112 + }, + { + "epoch": 27.555858310626704, + "grad_norm": 14.585291862487793, + "learning_rate": 1.700067600839342e-05, + "loss": 0.4228, + "step": 10113 + }, + { + "epoch": 27.55858310626703, + "grad_norm": 7.609127044677734, + "learning_rate": 1.7000045812387253e-05, + "loss": 0.4537, + "step": 10114 + }, + { + "epoch": 27.561307901907355, + "grad_norm": 8.360729217529297, + "learning_rate": 1.6999415561864946e-05, + "loss": 0.5504, + "step": 10115 + }, + { + "epoch": 27.564032697547685, + "grad_norm": 10.392511367797852, + "learning_rate": 1.699878525683142e-05, + "loss": 0.6907, + "step": 10116 + }, + { + "epoch": 27.56675749318801, + "grad_norm": 9.930464744567871, + "learning_rate": 1.699815489729158e-05, + "loss": 0.5182, + "step": 10117 + }, + { + "epoch": 27.569482288828336, + "grad_norm": 8.100626945495605, + "learning_rate": 1.699752448325033e-05, + "loss": 0.4962, + "step": 10118 + }, + { + "epoch": 27.572207084468666, + "grad_norm": 9.099678039550781, + "learning_rate": 1.699689401471259e-05, + "loss": 0.5587, + "step": 10119 + }, + { + "epoch": 27.57493188010899, + "grad_norm": 8.464005470275879, + "learning_rate": 1.6996263491683263e-05, + "loss": 0.5463, + "step": 10120 + }, + { + "epoch": 27.577656675749317, + "grad_norm": 7.654876232147217, + "learning_rate": 1.699563291416726e-05, + "loss": 0.495, + "step": 10121 + }, + { + "epoch": 27.580381471389646, + "grad_norm": 8.215298652648926, + "learning_rate": 1.699500228216949e-05, + "loss": 0.5095, + "step": 10122 + }, + { + "epoch": 27.583106267029972, + "grad_norm": 8.29395580291748, + "learning_rate": 1.6994371595694875e-05, + "loss": 0.5142, + "step": 10123 + }, + { + "epoch": 27.585831062670298, + "grad_norm": 7.2489190101623535, + "learning_rate": 1.6993740854748315e-05, + "loss": 0.576, + "step": 10124 + }, + { + "epoch": 27.588555858310627, + "grad_norm": 8.529529571533203, + "learning_rate": 1.6993110059334725e-05, + "loss": 0.4901, + "step": 10125 + }, + { + "epoch": 27.591280653950953, + "grad_norm": 9.240521430969238, + "learning_rate": 1.699247920945902e-05, + "loss": 0.7894, + "step": 10126 + }, + { + "epoch": 27.59400544959128, + "grad_norm": 8.59414005279541, + "learning_rate": 1.6991848305126113e-05, + "loss": 0.3962, + "step": 10127 + }, + { + "epoch": 27.59673024523161, + "grad_norm": 7.808393478393555, + "learning_rate": 1.6991217346340917e-05, + "loss": 0.4674, + "step": 10128 + }, + { + "epoch": 27.599455040871934, + "grad_norm": 9.266545295715332, + "learning_rate": 1.6990586333108342e-05, + "loss": 0.4837, + "step": 10129 + }, + { + "epoch": 27.60217983651226, + "grad_norm": 10.481103897094727, + "learning_rate": 1.698995526543331e-05, + "loss": 0.5045, + "step": 10130 + }, + { + "epoch": 27.60490463215259, + "grad_norm": 8.234030723571777, + "learning_rate": 1.698932414332073e-05, + "loss": 0.6446, + "step": 10131 + }, + { + "epoch": 27.607629427792915, + "grad_norm": 8.013397216796875, + "learning_rate": 1.6988692966775515e-05, + "loss": 0.5372, + "step": 10132 + }, + { + "epoch": 27.61035422343324, + "grad_norm": 11.488170623779297, + "learning_rate": 1.6988061735802587e-05, + "loss": 0.5749, + "step": 10133 + }, + { + "epoch": 27.61307901907357, + "grad_norm": 8.59324836730957, + "learning_rate": 1.6987430450406857e-05, + "loss": 0.4888, + "step": 10134 + }, + { + "epoch": 27.615803814713896, + "grad_norm": 6.613129138946533, + "learning_rate": 1.698679911059325e-05, + "loss": 0.6968, + "step": 10135 + }, + { + "epoch": 27.618528610354222, + "grad_norm": 8.80296802520752, + "learning_rate": 1.698616771636667e-05, + "loss": 0.4436, + "step": 10136 + }, + { + "epoch": 27.62125340599455, + "grad_norm": 9.776527404785156, + "learning_rate": 1.698553626773204e-05, + "loss": 0.5546, + "step": 10137 + }, + { + "epoch": 27.623978201634877, + "grad_norm": 9.341790199279785, + "learning_rate": 1.6984904764694282e-05, + "loss": 0.548, + "step": 10138 + }, + { + "epoch": 27.626702997275203, + "grad_norm": 8.773140907287598, + "learning_rate": 1.6984273207258312e-05, + "loss": 0.5074, + "step": 10139 + }, + { + "epoch": 27.629427792915532, + "grad_norm": 7.1406025886535645, + "learning_rate": 1.698364159542904e-05, + "loss": 0.4796, + "step": 10140 + }, + { + "epoch": 27.632152588555858, + "grad_norm": 8.004528999328613, + "learning_rate": 1.6983009929211397e-05, + "loss": 0.4002, + "step": 10141 + }, + { + "epoch": 27.634877384196184, + "grad_norm": 14.518450736999512, + "learning_rate": 1.6982378208610298e-05, + "loss": 0.4852, + "step": 10142 + }, + { + "epoch": 27.637602179836513, + "grad_norm": 12.912113189697266, + "learning_rate": 1.698174643363066e-05, + "loss": 0.5564, + "step": 10143 + }, + { + "epoch": 27.64032697547684, + "grad_norm": 7.492455005645752, + "learning_rate": 1.698111460427741e-05, + "loss": 0.4921, + "step": 10144 + }, + { + "epoch": 27.643051771117165, + "grad_norm": 8.511575698852539, + "learning_rate": 1.6980482720555457e-05, + "loss": 0.562, + "step": 10145 + }, + { + "epoch": 27.645776566757494, + "grad_norm": 8.994081497192383, + "learning_rate": 1.6979850782469734e-05, + "loss": 0.3861, + "step": 10146 + }, + { + "epoch": 27.64850136239782, + "grad_norm": 10.454629898071289, + "learning_rate": 1.6979218790025157e-05, + "loss": 0.5139, + "step": 10147 + }, + { + "epoch": 27.651226158038146, + "grad_norm": 6.342076778411865, + "learning_rate": 1.6978586743226646e-05, + "loss": 0.4712, + "step": 10148 + }, + { + "epoch": 27.653950953678475, + "grad_norm": 7.370853900909424, + "learning_rate": 1.697795464207913e-05, + "loss": 0.4252, + "step": 10149 + }, + { + "epoch": 27.6566757493188, + "grad_norm": 7.944183349609375, + "learning_rate": 1.6977322486587527e-05, + "loss": 0.48, + "step": 10150 + }, + { + "epoch": 27.659400544959126, + "grad_norm": 9.738842964172363, + "learning_rate": 1.697669027675676e-05, + "loss": 0.5269, + "step": 10151 + }, + { + "epoch": 27.662125340599456, + "grad_norm": 10.647909164428711, + "learning_rate": 1.6976058012591755e-05, + "loss": 0.5145, + "step": 10152 + }, + { + "epoch": 27.66485013623978, + "grad_norm": 7.026835918426514, + "learning_rate": 1.697542569409743e-05, + "loss": 0.5372, + "step": 10153 + }, + { + "epoch": 27.667574931880107, + "grad_norm": 7.8032684326171875, + "learning_rate": 1.697479332127872e-05, + "loss": 0.722, + "step": 10154 + }, + { + "epoch": 27.670299727520437, + "grad_norm": 7.139540672302246, + "learning_rate": 1.697416089414054e-05, + "loss": 0.5872, + "step": 10155 + }, + { + "epoch": 27.673024523160763, + "grad_norm": 8.369836807250977, + "learning_rate": 1.6973528412687824e-05, + "loss": 0.6517, + "step": 10156 + }, + { + "epoch": 27.67574931880109, + "grad_norm": 8.08837604522705, + "learning_rate": 1.697289587692549e-05, + "loss": 0.5886, + "step": 10157 + }, + { + "epoch": 27.678474114441418, + "grad_norm": 11.793229103088379, + "learning_rate": 1.6972263286858467e-05, + "loss": 0.4599, + "step": 10158 + }, + { + "epoch": 27.681198910081743, + "grad_norm": 7.740310192108154, + "learning_rate": 1.6971630642491683e-05, + "loss": 0.4795, + "step": 10159 + }, + { + "epoch": 27.68392370572207, + "grad_norm": 17.676279067993164, + "learning_rate": 1.6970997943830062e-05, + "loss": 0.422, + "step": 10160 + }, + { + "epoch": 27.6866485013624, + "grad_norm": 7.5012617111206055, + "learning_rate": 1.6970365190878536e-05, + "loss": 0.5285, + "step": 10161 + }, + { + "epoch": 27.689373297002724, + "grad_norm": 8.547582626342773, + "learning_rate": 1.696973238364203e-05, + "loss": 0.4307, + "step": 10162 + }, + { + "epoch": 27.69209809264305, + "grad_norm": 9.068389892578125, + "learning_rate": 1.6969099522125475e-05, + "loss": 0.6285, + "step": 10163 + }, + { + "epoch": 27.69482288828338, + "grad_norm": 9.725485801696777, + "learning_rate": 1.6968466606333792e-05, + "loss": 0.5322, + "step": 10164 + }, + { + "epoch": 27.697547683923705, + "grad_norm": 8.065115928649902, + "learning_rate": 1.6967833636271916e-05, + "loss": 0.5037, + "step": 10165 + }, + { + "epoch": 27.70027247956403, + "grad_norm": 7.664557456970215, + "learning_rate": 1.6967200611944776e-05, + "loss": 0.4163, + "step": 10166 + }, + { + "epoch": 27.70299727520436, + "grad_norm": 8.630768775939941, + "learning_rate": 1.69665675333573e-05, + "loss": 0.5409, + "step": 10167 + }, + { + "epoch": 27.705722070844686, + "grad_norm": 7.188152313232422, + "learning_rate": 1.696593440051443e-05, + "loss": 0.5503, + "step": 10168 + }, + { + "epoch": 27.708446866485012, + "grad_norm": 10.388522148132324, + "learning_rate": 1.6965301213421075e-05, + "loss": 0.6546, + "step": 10169 + }, + { + "epoch": 27.71117166212534, + "grad_norm": 9.461798667907715, + "learning_rate": 1.6964667972082187e-05, + "loss": 0.5003, + "step": 10170 + }, + { + "epoch": 27.713896457765667, + "grad_norm": 10.95566463470459, + "learning_rate": 1.6964034676502686e-05, + "loss": 0.5399, + "step": 10171 + }, + { + "epoch": 27.716621253405993, + "grad_norm": 14.988588333129883, + "learning_rate": 1.6963401326687506e-05, + "loss": 0.5426, + "step": 10172 + }, + { + "epoch": 27.719346049046322, + "grad_norm": 7.101005554199219, + "learning_rate": 1.696276792264158e-05, + "loss": 0.476, + "step": 10173 + }, + { + "epoch": 27.722070844686648, + "grad_norm": 8.343110084533691, + "learning_rate": 1.6962134464369846e-05, + "loss": 0.5077, + "step": 10174 + }, + { + "epoch": 27.724795640326974, + "grad_norm": 12.384000778198242, + "learning_rate": 1.696150095187723e-05, + "loss": 0.5668, + "step": 10175 + }, + { + "epoch": 27.727520435967303, + "grad_norm": 7.71723747253418, + "learning_rate": 1.6960867385168668e-05, + "loss": 0.4366, + "step": 10176 + }, + { + "epoch": 27.73024523160763, + "grad_norm": 7.035843372344971, + "learning_rate": 1.6960233764249095e-05, + "loss": 0.6004, + "step": 10177 + }, + { + "epoch": 27.732970027247955, + "grad_norm": 8.7925386428833, + "learning_rate": 1.6959600089123447e-05, + "loss": 0.5704, + "step": 10178 + }, + { + "epoch": 27.735694822888284, + "grad_norm": 7.859381198883057, + "learning_rate": 1.6958966359796657e-05, + "loss": 0.4832, + "step": 10179 + }, + { + "epoch": 27.73841961852861, + "grad_norm": 7.379161834716797, + "learning_rate": 1.695833257627366e-05, + "loss": 0.6636, + "step": 10180 + }, + { + "epoch": 27.741144414168936, + "grad_norm": 7.621696949005127, + "learning_rate": 1.695769873855939e-05, + "loss": 0.4753, + "step": 10181 + }, + { + "epoch": 27.743869209809265, + "grad_norm": 7.432315349578857, + "learning_rate": 1.695706484665879e-05, + "loss": 0.6271, + "step": 10182 + }, + { + "epoch": 27.74659400544959, + "grad_norm": 8.763675689697266, + "learning_rate": 1.695643090057679e-05, + "loss": 0.5212, + "step": 10183 + }, + { + "epoch": 27.749318801089917, + "grad_norm": 8.227683067321777, + "learning_rate": 1.6955796900318337e-05, + "loss": 0.5168, + "step": 10184 + }, + { + "epoch": 27.752043596730246, + "grad_norm": 8.002479553222656, + "learning_rate": 1.6955162845888354e-05, + "loss": 0.5506, + "step": 10185 + }, + { + "epoch": 27.754768392370572, + "grad_norm": 7.464667320251465, + "learning_rate": 1.6954528737291787e-05, + "loss": 0.3843, + "step": 10186 + }, + { + "epoch": 27.757493188010898, + "grad_norm": 8.782455444335938, + "learning_rate": 1.695389457453358e-05, + "loss": 0.4337, + "step": 10187 + }, + { + "epoch": 27.760217983651227, + "grad_norm": 6.0465922355651855, + "learning_rate": 1.6953260357618662e-05, + "loss": 0.3922, + "step": 10188 + }, + { + "epoch": 27.762942779291553, + "grad_norm": 9.327617645263672, + "learning_rate": 1.6952626086551977e-05, + "loss": 0.49, + "step": 10189 + }, + { + "epoch": 27.76566757493188, + "grad_norm": 8.79337215423584, + "learning_rate": 1.6951991761338463e-05, + "loss": 0.6237, + "step": 10190 + }, + { + "epoch": 27.768392370572208, + "grad_norm": 8.579442977905273, + "learning_rate": 1.695135738198306e-05, + "loss": 0.5703, + "step": 10191 + }, + { + "epoch": 27.771117166212534, + "grad_norm": 8.197420120239258, + "learning_rate": 1.6950722948490713e-05, + "loss": 0.5209, + "step": 10192 + }, + { + "epoch": 27.77384196185286, + "grad_norm": 8.335177421569824, + "learning_rate": 1.6950088460866357e-05, + "loss": 0.5037, + "step": 10193 + }, + { + "epoch": 27.77656675749319, + "grad_norm": 7.469491958618164, + "learning_rate": 1.694945391911493e-05, + "loss": 0.4836, + "step": 10194 + }, + { + "epoch": 27.779291553133515, + "grad_norm": 8.92253303527832, + "learning_rate": 1.694881932324139e-05, + "loss": 0.4843, + "step": 10195 + }, + { + "epoch": 27.78201634877384, + "grad_norm": 8.606045722961426, + "learning_rate": 1.6948184673250665e-05, + "loss": 0.5375, + "step": 10196 + }, + { + "epoch": 27.78474114441417, + "grad_norm": 7.045773506164551, + "learning_rate": 1.69475499691477e-05, + "loss": 0.4955, + "step": 10197 + }, + { + "epoch": 27.787465940054496, + "grad_norm": 8.528428077697754, + "learning_rate": 1.694691521093744e-05, + "loss": 0.4139, + "step": 10198 + }, + { + "epoch": 27.79019073569482, + "grad_norm": 11.833290100097656, + "learning_rate": 1.6946280398624828e-05, + "loss": 0.5298, + "step": 10199 + }, + { + "epoch": 27.79291553133515, + "grad_norm": 7.898739337921143, + "learning_rate": 1.6945645532214805e-05, + "loss": 0.6686, + "step": 10200 + }, + { + "epoch": 27.795640326975477, + "grad_norm": 8.228962898254395, + "learning_rate": 1.694501061171232e-05, + "loss": 0.493, + "step": 10201 + }, + { + "epoch": 27.798365122615802, + "grad_norm": 10.405641555786133, + "learning_rate": 1.6944375637122318e-05, + "loss": 0.5291, + "step": 10202 + }, + { + "epoch": 27.80108991825613, + "grad_norm": 8.502785682678223, + "learning_rate": 1.694374060844974e-05, + "loss": 0.5408, + "step": 10203 + }, + { + "epoch": 27.803814713896458, + "grad_norm": 8.7985200881958, + "learning_rate": 1.6943105525699534e-05, + "loss": 0.6182, + "step": 10204 + }, + { + "epoch": 27.806539509536783, + "grad_norm": 8.150802612304688, + "learning_rate": 1.6942470388876645e-05, + "loss": 0.692, + "step": 10205 + }, + { + "epoch": 27.809264305177113, + "grad_norm": 6.949302673339844, + "learning_rate": 1.6941835197986023e-05, + "loss": 0.564, + "step": 10206 + }, + { + "epoch": 27.81198910081744, + "grad_norm": 11.274639129638672, + "learning_rate": 1.694119995303261e-05, + "loss": 0.5856, + "step": 10207 + }, + { + "epoch": 27.814713896457764, + "grad_norm": 7.7016072273254395, + "learning_rate": 1.6940564654021355e-05, + "loss": 0.5806, + "step": 10208 + }, + { + "epoch": 27.817438692098094, + "grad_norm": 8.560013771057129, + "learning_rate": 1.6939929300957206e-05, + "loss": 0.6448, + "step": 10209 + }, + { + "epoch": 27.82016348773842, + "grad_norm": 6.942630290985107, + "learning_rate": 1.693929389384511e-05, + "loss": 0.4706, + "step": 10210 + }, + { + "epoch": 27.822888283378745, + "grad_norm": 6.969632148742676, + "learning_rate": 1.6938658432690016e-05, + "loss": 0.4278, + "step": 10211 + }, + { + "epoch": 27.825613079019075, + "grad_norm": 7.503054618835449, + "learning_rate": 1.6938022917496876e-05, + "loss": 0.4682, + "step": 10212 + }, + { + "epoch": 27.8283378746594, + "grad_norm": 8.342432975769043, + "learning_rate": 1.6937387348270636e-05, + "loss": 0.4071, + "step": 10213 + }, + { + "epoch": 27.831062670299726, + "grad_norm": 7.85593318939209, + "learning_rate": 1.6936751725016248e-05, + "loss": 0.6279, + "step": 10214 + }, + { + "epoch": 27.833787465940055, + "grad_norm": 6.302553653717041, + "learning_rate": 1.6936116047738657e-05, + "loss": 0.5239, + "step": 10215 + }, + { + "epoch": 27.83651226158038, + "grad_norm": 8.658904075622559, + "learning_rate": 1.6935480316442818e-05, + "loss": 0.5029, + "step": 10216 + }, + { + "epoch": 27.839237057220707, + "grad_norm": 7.880286693572998, + "learning_rate": 1.6934844531133686e-05, + "loss": 0.509, + "step": 10217 + }, + { + "epoch": 27.841961852861036, + "grad_norm": 6.384045124053955, + "learning_rate": 1.6934208691816203e-05, + "loss": 0.4031, + "step": 10218 + }, + { + "epoch": 27.844686648501362, + "grad_norm": 7.981046199798584, + "learning_rate": 1.6933572798495327e-05, + "loss": 0.4557, + "step": 10219 + }, + { + "epoch": 27.847411444141688, + "grad_norm": 7.138590335845947, + "learning_rate": 1.6932936851176013e-05, + "loss": 0.6566, + "step": 10220 + }, + { + "epoch": 27.850136239782017, + "grad_norm": 6.986456871032715, + "learning_rate": 1.6932300849863207e-05, + "loss": 0.4547, + "step": 10221 + }, + { + "epoch": 27.852861035422343, + "grad_norm": 7.824373245239258, + "learning_rate": 1.6931664794561862e-05, + "loss": 0.5171, + "step": 10222 + }, + { + "epoch": 27.85558583106267, + "grad_norm": 8.812350273132324, + "learning_rate": 1.693102868527694e-05, + "loss": 0.6844, + "step": 10223 + }, + { + "epoch": 27.858310626703, + "grad_norm": 6.86625862121582, + "learning_rate": 1.693039252201339e-05, + "loss": 0.3973, + "step": 10224 + }, + { + "epoch": 27.861035422343324, + "grad_norm": 10.785688400268555, + "learning_rate": 1.692975630477616e-05, + "loss": 0.7382, + "step": 10225 + }, + { + "epoch": 27.86376021798365, + "grad_norm": 42.3944091796875, + "learning_rate": 1.6929120033570218e-05, + "loss": 0.5722, + "step": 10226 + }, + { + "epoch": 27.86648501362398, + "grad_norm": 7.785507678985596, + "learning_rate": 1.6928483708400504e-05, + "loss": 0.4921, + "step": 10227 + }, + { + "epoch": 27.869209809264305, + "grad_norm": 6.294122695922852, + "learning_rate": 1.692784732927199e-05, + "loss": 0.4783, + "step": 10228 + }, + { + "epoch": 27.87193460490463, + "grad_norm": 7.572083950042725, + "learning_rate": 1.692721089618962e-05, + "loss": 0.4753, + "step": 10229 + }, + { + "epoch": 27.87465940054496, + "grad_norm": 10.167337417602539, + "learning_rate": 1.6926574409158354e-05, + "loss": 0.5658, + "step": 10230 + }, + { + "epoch": 27.877384196185286, + "grad_norm": 7.328114986419678, + "learning_rate": 1.692593786818315e-05, + "loss": 0.5149, + "step": 10231 + }, + { + "epoch": 27.88010899182561, + "grad_norm": 7.156718730926514, + "learning_rate": 1.6925301273268965e-05, + "loss": 0.5066, + "step": 10232 + }, + { + "epoch": 27.88283378746594, + "grad_norm": 11.570022583007812, + "learning_rate": 1.6924664624420758e-05, + "loss": 0.5504, + "step": 10233 + }, + { + "epoch": 27.885558583106267, + "grad_norm": 7.075197219848633, + "learning_rate": 1.6924027921643485e-05, + "loss": 0.4808, + "step": 10234 + }, + { + "epoch": 27.888283378746593, + "grad_norm": 8.273008346557617, + "learning_rate": 1.6923391164942106e-05, + "loss": 0.703, + "step": 10235 + }, + { + "epoch": 27.891008174386922, + "grad_norm": 6.79816198348999, + "learning_rate": 1.6922754354321577e-05, + "loss": 0.713, + "step": 10236 + }, + { + "epoch": 27.893732970027248, + "grad_norm": 7.069867134094238, + "learning_rate": 1.6922117489786863e-05, + "loss": 0.6285, + "step": 10237 + }, + { + "epoch": 27.896457765667574, + "grad_norm": 6.594805717468262, + "learning_rate": 1.6921480571342916e-05, + "loss": 0.5786, + "step": 10238 + }, + { + "epoch": 27.899182561307903, + "grad_norm": 8.521928787231445, + "learning_rate": 1.6920843598994707e-05, + "loss": 0.4567, + "step": 10239 + }, + { + "epoch": 27.90190735694823, + "grad_norm": 9.371071815490723, + "learning_rate": 1.6920206572747186e-05, + "loss": 0.4895, + "step": 10240 + }, + { + "epoch": 27.904632152588555, + "grad_norm": 7.50525426864624, + "learning_rate": 1.691956949260532e-05, + "loss": 0.4757, + "step": 10241 + }, + { + "epoch": 27.907356948228884, + "grad_norm": 9.543774604797363, + "learning_rate": 1.691893235857407e-05, + "loss": 0.4894, + "step": 10242 + }, + { + "epoch": 27.91008174386921, + "grad_norm": 7.727305889129639, + "learning_rate": 1.69182951706584e-05, + "loss": 0.6274, + "step": 10243 + }, + { + "epoch": 27.912806539509535, + "grad_norm": 8.318642616271973, + "learning_rate": 1.6917657928863267e-05, + "loss": 0.4711, + "step": 10244 + }, + { + "epoch": 27.915531335149865, + "grad_norm": 7.303012847900391, + "learning_rate": 1.691702063319364e-05, + "loss": 0.5171, + "step": 10245 + }, + { + "epoch": 27.91825613079019, + "grad_norm": 7.7373247146606445, + "learning_rate": 1.6916383283654478e-05, + "loss": 0.6812, + "step": 10246 + }, + { + "epoch": 27.920980926430516, + "grad_norm": 8.06027889251709, + "learning_rate": 1.691574588025074e-05, + "loss": 0.6066, + "step": 10247 + }, + { + "epoch": 27.923705722070846, + "grad_norm": 8.682061195373535, + "learning_rate": 1.6915108422987402e-05, + "loss": 0.5661, + "step": 10248 + }, + { + "epoch": 27.92643051771117, + "grad_norm": 6.264842510223389, + "learning_rate": 1.691447091186942e-05, + "loss": 0.5078, + "step": 10249 + }, + { + "epoch": 27.929155313351497, + "grad_norm": 8.2464017868042, + "learning_rate": 1.6913833346901758e-05, + "loss": 0.615, + "step": 10250 + }, + { + "epoch": 27.931880108991827, + "grad_norm": 14.93500804901123, + "learning_rate": 1.6913195728089388e-05, + "loss": 0.55, + "step": 10251 + }, + { + "epoch": 27.934604904632153, + "grad_norm": 8.586822509765625, + "learning_rate": 1.6912558055437273e-05, + "loss": 0.4811, + "step": 10252 + }, + { + "epoch": 27.93732970027248, + "grad_norm": 6.676853656768799, + "learning_rate": 1.6911920328950376e-05, + "loss": 0.547, + "step": 10253 + }, + { + "epoch": 27.940054495912808, + "grad_norm": 10.004607200622559, + "learning_rate": 1.6911282548633664e-05, + "loss": 0.751, + "step": 10254 + }, + { + "epoch": 27.942779291553133, + "grad_norm": 9.108039855957031, + "learning_rate": 1.691064471449211e-05, + "loss": 0.4478, + "step": 10255 + }, + { + "epoch": 27.94550408719346, + "grad_norm": 7.818694114685059, + "learning_rate": 1.691000682653068e-05, + "loss": 0.5316, + "step": 10256 + }, + { + "epoch": 27.94822888283379, + "grad_norm": 6.828567028045654, + "learning_rate": 1.690936888475433e-05, + "loss": 0.4294, + "step": 10257 + }, + { + "epoch": 27.950953678474114, + "grad_norm": 9.278924942016602, + "learning_rate": 1.6908730889168047e-05, + "loss": 0.4493, + "step": 10258 + }, + { + "epoch": 27.95367847411444, + "grad_norm": 8.610934257507324, + "learning_rate": 1.690809283977678e-05, + "loss": 0.62, + "step": 10259 + }, + { + "epoch": 27.95640326975477, + "grad_norm": 7.227691650390625, + "learning_rate": 1.6907454736585517e-05, + "loss": 0.5197, + "step": 10260 + }, + { + "epoch": 27.959128065395095, + "grad_norm": 6.648590087890625, + "learning_rate": 1.6906816579599217e-05, + "loss": 0.5727, + "step": 10261 + }, + { + "epoch": 27.96185286103542, + "grad_norm": 6.574821949005127, + "learning_rate": 1.690617836882285e-05, + "loss": 0.4755, + "step": 10262 + }, + { + "epoch": 27.96457765667575, + "grad_norm": 7.378173351287842, + "learning_rate": 1.690554010426139e-05, + "loss": 0.5754, + "step": 10263 + }, + { + "epoch": 27.967302452316076, + "grad_norm": 10.361187934875488, + "learning_rate": 1.6904901785919806e-05, + "loss": 0.6264, + "step": 10264 + }, + { + "epoch": 27.970027247956402, + "grad_norm": 7.284205436706543, + "learning_rate": 1.6904263413803068e-05, + "loss": 0.446, + "step": 10265 + }, + { + "epoch": 27.97275204359673, + "grad_norm": 7.510517597198486, + "learning_rate": 1.6903624987916147e-05, + "loss": 0.5075, + "step": 10266 + }, + { + "epoch": 27.975476839237057, + "grad_norm": 8.687686920166016, + "learning_rate": 1.690298650826402e-05, + "loss": 0.5695, + "step": 10267 + }, + { + "epoch": 27.978201634877383, + "grad_norm": 7.612741470336914, + "learning_rate": 1.6902347974851653e-05, + "loss": 0.4938, + "step": 10268 + }, + { + "epoch": 27.980926430517712, + "grad_norm": 8.871014595031738, + "learning_rate": 1.6901709387684025e-05, + "loss": 0.5045, + "step": 10269 + }, + { + "epoch": 27.983651226158038, + "grad_norm": 7.562943458557129, + "learning_rate": 1.6901070746766108e-05, + "loss": 0.5377, + "step": 10270 + }, + { + "epoch": 27.986376021798364, + "grad_norm": 9.494495391845703, + "learning_rate": 1.690043205210287e-05, + "loss": 0.5172, + "step": 10271 + }, + { + "epoch": 27.989100817438693, + "grad_norm": 8.3716459274292, + "learning_rate": 1.689979330369929e-05, + "loss": 0.5178, + "step": 10272 + }, + { + "epoch": 27.99182561307902, + "grad_norm": 9.27304744720459, + "learning_rate": 1.6899154501560344e-05, + "loss": 0.4353, + "step": 10273 + }, + { + "epoch": 27.994550408719345, + "grad_norm": 7.550212383270264, + "learning_rate": 1.6898515645691002e-05, + "loss": 0.4103, + "step": 10274 + }, + { + "epoch": 27.997275204359674, + "grad_norm": 8.311297416687012, + "learning_rate": 1.6897876736096247e-05, + "loss": 0.4959, + "step": 10275 + }, + { + "epoch": 28.0, + "grad_norm": 6.824106216430664, + "learning_rate": 1.6897237772781046e-05, + "loss": 0.6491, + "step": 10276 + }, + { + "epoch": 28.002724795640326, + "grad_norm": 7.665373802185059, + "learning_rate": 1.6896598755750376e-05, + "loss": 0.606, + "step": 10277 + }, + { + "epoch": 28.005449591280655, + "grad_norm": 6.007593631744385, + "learning_rate": 1.689595968500922e-05, + "loss": 0.4334, + "step": 10278 + }, + { + "epoch": 28.00817438692098, + "grad_norm": 7.365853309631348, + "learning_rate": 1.6895320560562554e-05, + "loss": 0.4828, + "step": 10279 + }, + { + "epoch": 28.010899182561307, + "grad_norm": 8.586054801940918, + "learning_rate": 1.6894681382415353e-05, + "loss": 0.532, + "step": 10280 + }, + { + "epoch": 28.013623978201636, + "grad_norm": 9.997074127197266, + "learning_rate": 1.6894042150572594e-05, + "loss": 0.4187, + "step": 10281 + }, + { + "epoch": 28.016348773841962, + "grad_norm": 8.226503372192383, + "learning_rate": 1.6893402865039257e-05, + "loss": 0.4926, + "step": 10282 + }, + { + "epoch": 28.019073569482288, + "grad_norm": 7.064162731170654, + "learning_rate": 1.689276352582032e-05, + "loss": 0.5343, + "step": 10283 + }, + { + "epoch": 28.021798365122617, + "grad_norm": 18.196016311645508, + "learning_rate": 1.6892124132920763e-05, + "loss": 0.4216, + "step": 10284 + }, + { + "epoch": 28.024523160762943, + "grad_norm": 6.422055721282959, + "learning_rate": 1.6891484686345565e-05, + "loss": 0.5878, + "step": 10285 + }, + { + "epoch": 28.02724795640327, + "grad_norm": 6.667153835296631, + "learning_rate": 1.6890845186099705e-05, + "loss": 0.6854, + "step": 10286 + }, + { + "epoch": 28.029972752043598, + "grad_norm": 5.945711135864258, + "learning_rate": 1.6890205632188166e-05, + "loss": 0.396, + "step": 10287 + }, + { + "epoch": 28.032697547683924, + "grad_norm": 8.55396556854248, + "learning_rate": 1.6889566024615928e-05, + "loss": 0.4163, + "step": 10288 + }, + { + "epoch": 28.03542234332425, + "grad_norm": 6.2634406089782715, + "learning_rate": 1.688892636338797e-05, + "loss": 0.3436, + "step": 10289 + }, + { + "epoch": 28.03814713896458, + "grad_norm": 8.88974666595459, + "learning_rate": 1.6888286648509272e-05, + "loss": 0.4431, + "step": 10290 + }, + { + "epoch": 28.040871934604905, + "grad_norm": 6.603543758392334, + "learning_rate": 1.6887646879984826e-05, + "loss": 0.4554, + "step": 10291 + }, + { + "epoch": 28.04359673024523, + "grad_norm": 7.227399826049805, + "learning_rate": 1.6887007057819606e-05, + "loss": 0.5347, + "step": 10292 + }, + { + "epoch": 28.04632152588556, + "grad_norm": 7.476388931274414, + "learning_rate": 1.6886367182018593e-05, + "loss": 0.5303, + "step": 10293 + }, + { + "epoch": 28.049046321525886, + "grad_norm": 8.124524116516113, + "learning_rate": 1.6885727252586774e-05, + "loss": 0.479, + "step": 10294 + }, + { + "epoch": 28.05177111716621, + "grad_norm": 7.9931640625, + "learning_rate": 1.6885087269529136e-05, + "loss": 0.7098, + "step": 10295 + }, + { + "epoch": 28.05449591280654, + "grad_norm": 6.5644636154174805, + "learning_rate": 1.6884447232850657e-05, + "loss": 0.5326, + "step": 10296 + }, + { + "epoch": 28.057220708446867, + "grad_norm": 7.5684285163879395, + "learning_rate": 1.688380714255633e-05, + "loss": 0.6125, + "step": 10297 + }, + { + "epoch": 28.059945504087192, + "grad_norm": 7.379377841949463, + "learning_rate": 1.688316699865113e-05, + "loss": 0.4286, + "step": 10298 + }, + { + "epoch": 28.06267029972752, + "grad_norm": 8.864320755004883, + "learning_rate": 1.6882526801140046e-05, + "loss": 0.5087, + "step": 10299 + }, + { + "epoch": 28.065395095367847, + "grad_norm": 8.201573371887207, + "learning_rate": 1.6881886550028068e-05, + "loss": 0.372, + "step": 10300 + }, + { + "epoch": 28.068119891008173, + "grad_norm": 6.924935817718506, + "learning_rate": 1.688124624532018e-05, + "loss": 0.3792, + "step": 10301 + }, + { + "epoch": 28.070844686648503, + "grad_norm": 17.250703811645508, + "learning_rate": 1.6880605887021362e-05, + "loss": 0.4113, + "step": 10302 + }, + { + "epoch": 28.07356948228883, + "grad_norm": 7.773608207702637, + "learning_rate": 1.687996547513661e-05, + "loss": 0.5192, + "step": 10303 + }, + { + "epoch": 28.076294277929154, + "grad_norm": 11.720868110656738, + "learning_rate": 1.6879325009670912e-05, + "loss": 0.5282, + "step": 10304 + }, + { + "epoch": 28.079019073569484, + "grad_norm": 8.303223609924316, + "learning_rate": 1.6878684490629247e-05, + "loss": 0.4907, + "step": 10305 + }, + { + "epoch": 28.08174386920981, + "grad_norm": 5.874635219573975, + "learning_rate": 1.687804391801661e-05, + "loss": 0.5293, + "step": 10306 + }, + { + "epoch": 28.084468664850135, + "grad_norm": 6.997998237609863, + "learning_rate": 1.687740329183799e-05, + "loss": 0.3651, + "step": 10307 + }, + { + "epoch": 28.087193460490465, + "grad_norm": 11.347203254699707, + "learning_rate": 1.687676261209837e-05, + "loss": 0.4861, + "step": 10308 + }, + { + "epoch": 28.08991825613079, + "grad_norm": 9.801603317260742, + "learning_rate": 1.6876121878802748e-05, + "loss": 0.5014, + "step": 10309 + }, + { + "epoch": 28.092643051771116, + "grad_norm": 7.367988586425781, + "learning_rate": 1.687548109195611e-05, + "loss": 0.5709, + "step": 10310 + }, + { + "epoch": 28.095367847411445, + "grad_norm": 8.178997993469238, + "learning_rate": 1.6874840251563448e-05, + "loss": 0.5577, + "step": 10311 + }, + { + "epoch": 28.09809264305177, + "grad_norm": 10.153870582580566, + "learning_rate": 1.6874199357629747e-05, + "loss": 0.5374, + "step": 10312 + }, + { + "epoch": 28.100817438692097, + "grad_norm": 7.0586066246032715, + "learning_rate": 1.6873558410160006e-05, + "loss": 0.373, + "step": 10313 + }, + { + "epoch": 28.103542234332426, + "grad_norm": 6.657742977142334, + "learning_rate": 1.6872917409159213e-05, + "loss": 0.3198, + "step": 10314 + }, + { + "epoch": 28.106267029972752, + "grad_norm": 8.027143478393555, + "learning_rate": 1.6872276354632358e-05, + "loss": 0.5042, + "step": 10315 + }, + { + "epoch": 28.108991825613078, + "grad_norm": 6.80226993560791, + "learning_rate": 1.687163524658444e-05, + "loss": 0.4276, + "step": 10316 + }, + { + "epoch": 28.111716621253407, + "grad_norm": 7.309327602386475, + "learning_rate": 1.6870994085020446e-05, + "loss": 0.4528, + "step": 10317 + }, + { + "epoch": 28.114441416893733, + "grad_norm": 9.73857593536377, + "learning_rate": 1.687035286994537e-05, + "loss": 0.483, + "step": 10318 + }, + { + "epoch": 28.11716621253406, + "grad_norm": 7.97163200378418, + "learning_rate": 1.6869711601364206e-05, + "loss": 0.4059, + "step": 10319 + }, + { + "epoch": 28.11989100817439, + "grad_norm": 6.555824279785156, + "learning_rate": 1.686907027928195e-05, + "loss": 0.4689, + "step": 10320 + }, + { + "epoch": 28.122615803814714, + "grad_norm": 7.380853652954102, + "learning_rate": 1.6868428903703598e-05, + "loss": 0.4585, + "step": 10321 + }, + { + "epoch": 28.12534059945504, + "grad_norm": 7.245654106140137, + "learning_rate": 1.6867787474634142e-05, + "loss": 0.5209, + "step": 10322 + }, + { + "epoch": 28.12806539509537, + "grad_norm": 7.773459434509277, + "learning_rate": 1.6867145992078577e-05, + "loss": 0.5188, + "step": 10323 + }, + { + "epoch": 28.130790190735695, + "grad_norm": 7.523104667663574, + "learning_rate": 1.68665044560419e-05, + "loss": 0.3985, + "step": 10324 + }, + { + "epoch": 28.13351498637602, + "grad_norm": 7.532975673675537, + "learning_rate": 1.686586286652911e-05, + "loss": 0.4188, + "step": 10325 + }, + { + "epoch": 28.13623978201635, + "grad_norm": 8.93874740600586, + "learning_rate": 1.6865221223545198e-05, + "loss": 0.4528, + "step": 10326 + }, + { + "epoch": 28.138964577656676, + "grad_norm": 7.237036228179932, + "learning_rate": 1.6864579527095163e-05, + "loss": 0.491, + "step": 10327 + }, + { + "epoch": 28.141689373297, + "grad_norm": 7.244105339050293, + "learning_rate": 1.6863937777184006e-05, + "loss": 0.4947, + "step": 10328 + }, + { + "epoch": 28.14441416893733, + "grad_norm": 13.066157341003418, + "learning_rate": 1.686329597381672e-05, + "loss": 0.5469, + "step": 10329 + }, + { + "epoch": 28.147138964577657, + "grad_norm": 6.924302577972412, + "learning_rate": 1.686265411699831e-05, + "loss": 0.4539, + "step": 10330 + }, + { + "epoch": 28.149863760217983, + "grad_norm": 7.257571697235107, + "learning_rate": 1.6862012206733768e-05, + "loss": 0.6908, + "step": 10331 + }, + { + "epoch": 28.152588555858312, + "grad_norm": 10.561065673828125, + "learning_rate": 1.6861370243028097e-05, + "loss": 0.6219, + "step": 10332 + }, + { + "epoch": 28.155313351498638, + "grad_norm": 8.823827743530273, + "learning_rate": 1.6860728225886295e-05, + "loss": 0.4505, + "step": 10333 + }, + { + "epoch": 28.158038147138964, + "grad_norm": 6.851810932159424, + "learning_rate": 1.6860086155313364e-05, + "loss": 0.5002, + "step": 10334 + }, + { + "epoch": 28.160762942779293, + "grad_norm": 8.059377670288086, + "learning_rate": 1.6859444031314297e-05, + "loss": 0.4726, + "step": 10335 + }, + { + "epoch": 28.16348773841962, + "grad_norm": 9.536529541015625, + "learning_rate": 1.6858801853894105e-05, + "loss": 0.3778, + "step": 10336 + }, + { + "epoch": 28.166212534059945, + "grad_norm": 6.575474739074707, + "learning_rate": 1.6858159623057787e-05, + "loss": 0.4834, + "step": 10337 + }, + { + "epoch": 28.168937329700274, + "grad_norm": 13.317432403564453, + "learning_rate": 1.685751733881034e-05, + "loss": 0.4341, + "step": 10338 + }, + { + "epoch": 28.1716621253406, + "grad_norm": 8.081430435180664, + "learning_rate": 1.685687500115677e-05, + "loss": 0.6339, + "step": 10339 + }, + { + "epoch": 28.174386920980925, + "grad_norm": 8.51950454711914, + "learning_rate": 1.6856232610102074e-05, + "loss": 0.5239, + "step": 10340 + }, + { + "epoch": 28.177111716621255, + "grad_norm": 9.547775268554688, + "learning_rate": 1.6855590165651263e-05, + "loss": 0.6049, + "step": 10341 + }, + { + "epoch": 28.17983651226158, + "grad_norm": 7.281281471252441, + "learning_rate": 1.6854947667809333e-05, + "loss": 0.4608, + "step": 10342 + }, + { + "epoch": 28.182561307901906, + "grad_norm": 8.876697540283203, + "learning_rate": 1.6854305116581294e-05, + "loss": 0.5292, + "step": 10343 + }, + { + "epoch": 28.185286103542236, + "grad_norm": 7.376714706420898, + "learning_rate": 1.685366251197215e-05, + "loss": 0.5331, + "step": 10344 + }, + { + "epoch": 28.18801089918256, + "grad_norm": 6.850920677185059, + "learning_rate": 1.68530198539869e-05, + "loss": 0.4112, + "step": 10345 + }, + { + "epoch": 28.190735694822887, + "grad_norm": 8.650160789489746, + "learning_rate": 1.685237714263055e-05, + "loss": 0.7314, + "step": 10346 + }, + { + "epoch": 28.193460490463217, + "grad_norm": 14.532156944274902, + "learning_rate": 1.6851734377908106e-05, + "loss": 0.4206, + "step": 10347 + }, + { + "epoch": 28.196185286103542, + "grad_norm": 8.100082397460938, + "learning_rate": 1.685109155982458e-05, + "loss": 0.5037, + "step": 10348 + }, + { + "epoch": 28.19891008174387, + "grad_norm": 6.799877166748047, + "learning_rate": 1.6850448688384972e-05, + "loss": 0.4937, + "step": 10349 + }, + { + "epoch": 28.201634877384198, + "grad_norm": 7.809359550476074, + "learning_rate": 1.6849805763594293e-05, + "loss": 0.5504, + "step": 10350 + }, + { + "epoch": 28.204359673024523, + "grad_norm": 6.646524429321289, + "learning_rate": 1.684916278545754e-05, + "loss": 0.3853, + "step": 10351 + }, + { + "epoch": 28.20708446866485, + "grad_norm": 10.917232513427734, + "learning_rate": 1.6848519753979732e-05, + "loss": 0.3925, + "step": 10352 + }, + { + "epoch": 28.20980926430518, + "grad_norm": 6.854604721069336, + "learning_rate": 1.6847876669165874e-05, + "loss": 0.56, + "step": 10353 + }, + { + "epoch": 28.212534059945504, + "grad_norm": 8.6856689453125, + "learning_rate": 1.684723353102097e-05, + "loss": 0.5193, + "step": 10354 + }, + { + "epoch": 28.21525885558583, + "grad_norm": 7.57242488861084, + "learning_rate": 1.684659033955003e-05, + "loss": 0.5102, + "step": 10355 + }, + { + "epoch": 28.21798365122616, + "grad_norm": 7.709518909454346, + "learning_rate": 1.684594709475807e-05, + "loss": 0.5396, + "step": 10356 + }, + { + "epoch": 28.220708446866485, + "grad_norm": 8.30573558807373, + "learning_rate": 1.6845303796650094e-05, + "loss": 0.3871, + "step": 10357 + }, + { + "epoch": 28.22343324250681, + "grad_norm": 9.018017768859863, + "learning_rate": 1.684466044523111e-05, + "loss": 0.4784, + "step": 10358 + }, + { + "epoch": 28.22615803814714, + "grad_norm": 8.360239028930664, + "learning_rate": 1.6844017040506132e-05, + "loss": 0.5625, + "step": 10359 + }, + { + "epoch": 28.228882833787466, + "grad_norm": 7.19600772857666, + "learning_rate": 1.6843373582480168e-05, + "loss": 0.3723, + "step": 10360 + }, + { + "epoch": 28.231607629427792, + "grad_norm": 26.532180786132812, + "learning_rate": 1.684273007115823e-05, + "loss": 0.4842, + "step": 10361 + }, + { + "epoch": 28.23433242506812, + "grad_norm": 7.297877788543701, + "learning_rate": 1.6842086506545334e-05, + "loss": 0.3293, + "step": 10362 + }, + { + "epoch": 28.237057220708447, + "grad_norm": 10.168774604797363, + "learning_rate": 1.6841442888646483e-05, + "loss": 0.4346, + "step": 10363 + }, + { + "epoch": 28.239782016348773, + "grad_norm": 9.161511421203613, + "learning_rate": 1.68407992174667e-05, + "loss": 0.527, + "step": 10364 + }, + { + "epoch": 28.242506811989102, + "grad_norm": 8.480376243591309, + "learning_rate": 1.684015549301099e-05, + "loss": 0.4944, + "step": 10365 + }, + { + "epoch": 28.245231607629428, + "grad_norm": 8.92908763885498, + "learning_rate": 1.6839511715284372e-05, + "loss": 0.5138, + "step": 10366 + }, + { + "epoch": 28.247956403269754, + "grad_norm": 8.959177017211914, + "learning_rate": 1.6838867884291855e-05, + "loss": 0.4398, + "step": 10367 + }, + { + "epoch": 28.250681198910083, + "grad_norm": 14.875165939331055, + "learning_rate": 1.6838224000038455e-05, + "loss": 0.5484, + "step": 10368 + }, + { + "epoch": 28.25340599455041, + "grad_norm": 7.646803855895996, + "learning_rate": 1.683758006252919e-05, + "loss": 0.6553, + "step": 10369 + }, + { + "epoch": 28.256130790190735, + "grad_norm": 7.4817705154418945, + "learning_rate": 1.6836936071769064e-05, + "loss": 0.5055, + "step": 10370 + }, + { + "epoch": 28.258855585831064, + "grad_norm": 10.627854347229004, + "learning_rate": 1.6836292027763102e-05, + "loss": 0.453, + "step": 10371 + }, + { + "epoch": 28.26158038147139, + "grad_norm": 8.66915512084961, + "learning_rate": 1.6835647930516322e-05, + "loss": 0.5134, + "step": 10372 + }, + { + "epoch": 28.264305177111716, + "grad_norm": 6.920253753662109, + "learning_rate": 1.6835003780033738e-05, + "loss": 0.5014, + "step": 10373 + }, + { + "epoch": 28.267029972752045, + "grad_norm": 8.081284523010254, + "learning_rate": 1.6834359576320357e-05, + "loss": 0.41, + "step": 10374 + }, + { + "epoch": 28.26975476839237, + "grad_norm": 7.855467796325684, + "learning_rate": 1.683371531938121e-05, + "loss": 0.5132, + "step": 10375 + }, + { + "epoch": 28.272479564032697, + "grad_norm": 13.5990629196167, + "learning_rate": 1.6833071009221306e-05, + "loss": 0.551, + "step": 10376 + }, + { + "epoch": 28.275204359673026, + "grad_norm": 11.321314811706543, + "learning_rate": 1.683242664584566e-05, + "loss": 0.5769, + "step": 10377 + }, + { + "epoch": 28.277929155313352, + "grad_norm": 11.942986488342285, + "learning_rate": 1.68317822292593e-05, + "loss": 0.4187, + "step": 10378 + }, + { + "epoch": 28.280653950953678, + "grad_norm": 8.610215187072754, + "learning_rate": 1.683113775946724e-05, + "loss": 0.6056, + "step": 10379 + }, + { + "epoch": 28.283378746594007, + "grad_norm": 8.839770317077637, + "learning_rate": 1.6830493236474497e-05, + "loss": 0.3628, + "step": 10380 + }, + { + "epoch": 28.286103542234333, + "grad_norm": 7.970127105712891, + "learning_rate": 1.6829848660286093e-05, + "loss": 0.6532, + "step": 10381 + }, + { + "epoch": 28.28882833787466, + "grad_norm": 6.654072284698486, + "learning_rate": 1.6829204030907045e-05, + "loss": 0.5068, + "step": 10382 + }, + { + "epoch": 28.291553133514988, + "grad_norm": 9.671961784362793, + "learning_rate": 1.6828559348342382e-05, + "loss": 0.4399, + "step": 10383 + }, + { + "epoch": 28.294277929155314, + "grad_norm": 9.164841651916504, + "learning_rate": 1.6827914612597115e-05, + "loss": 0.3484, + "step": 10384 + }, + { + "epoch": 28.29700272479564, + "grad_norm": 8.438698768615723, + "learning_rate": 1.682726982367627e-05, + "loss": 0.4659, + "step": 10385 + }, + { + "epoch": 28.29972752043597, + "grad_norm": 7.779649257659912, + "learning_rate": 1.6826624981584868e-05, + "loss": 0.663, + "step": 10386 + }, + { + "epoch": 28.302452316076295, + "grad_norm": 7.599969387054443, + "learning_rate": 1.6825980086327927e-05, + "loss": 0.4323, + "step": 10387 + }, + { + "epoch": 28.30517711171662, + "grad_norm": 7.940140724182129, + "learning_rate": 1.6825335137910474e-05, + "loss": 0.3535, + "step": 10388 + }, + { + "epoch": 28.30790190735695, + "grad_norm": 6.6571807861328125, + "learning_rate": 1.6824690136337533e-05, + "loss": 0.5281, + "step": 10389 + }, + { + "epoch": 28.310626702997276, + "grad_norm": 14.657061576843262, + "learning_rate": 1.682404508161412e-05, + "loss": 0.6565, + "step": 10390 + }, + { + "epoch": 28.3133514986376, + "grad_norm": 7.262669563293457, + "learning_rate": 1.682339997374527e-05, + "loss": 0.5697, + "step": 10391 + }, + { + "epoch": 28.31607629427793, + "grad_norm": 7.552542209625244, + "learning_rate": 1.6822754812735995e-05, + "loss": 0.4747, + "step": 10392 + }, + { + "epoch": 28.318801089918257, + "grad_norm": 9.409974098205566, + "learning_rate": 1.6822109598591327e-05, + "loss": 0.4474, + "step": 10393 + }, + { + "epoch": 28.321525885558582, + "grad_norm": 7.490232467651367, + "learning_rate": 1.682146433131629e-05, + "loss": 0.4171, + "step": 10394 + }, + { + "epoch": 28.32425068119891, + "grad_norm": 10.111641883850098, + "learning_rate": 1.682081901091591e-05, + "loss": 0.4914, + "step": 10395 + }, + { + "epoch": 28.326975476839237, + "grad_norm": 8.32813835144043, + "learning_rate": 1.6820173637395208e-05, + "loss": 0.5367, + "step": 10396 + }, + { + "epoch": 28.329700272479563, + "grad_norm": 6.854457378387451, + "learning_rate": 1.6819528210759216e-05, + "loss": 0.4817, + "step": 10397 + }, + { + "epoch": 28.332425068119893, + "grad_norm": 7.725712299346924, + "learning_rate": 1.6818882731012954e-05, + "loss": 0.6059, + "step": 10398 + }, + { + "epoch": 28.33514986376022, + "grad_norm": 6.47776460647583, + "learning_rate": 1.6818237198161456e-05, + "loss": 0.6245, + "step": 10399 + }, + { + "epoch": 28.337874659400544, + "grad_norm": 7.381679534912109, + "learning_rate": 1.6817591612209744e-05, + "loss": 0.4849, + "step": 10400 + }, + { + "epoch": 28.340599455040874, + "grad_norm": 7.378352642059326, + "learning_rate": 1.681694597316285e-05, + "loss": 0.4969, + "step": 10401 + }, + { + "epoch": 28.3433242506812, + "grad_norm": 6.980203628540039, + "learning_rate": 1.6816300281025796e-05, + "loss": 0.5902, + "step": 10402 + }, + { + "epoch": 28.346049046321525, + "grad_norm": 9.453960418701172, + "learning_rate": 1.681565453580362e-05, + "loss": 0.5278, + "step": 10403 + }, + { + "epoch": 28.348773841961854, + "grad_norm": 7.603379726409912, + "learning_rate": 1.681500873750134e-05, + "loss": 0.5557, + "step": 10404 + }, + { + "epoch": 28.35149863760218, + "grad_norm": 7.9871039390563965, + "learning_rate": 1.6814362886123994e-05, + "loss": 0.4535, + "step": 10405 + }, + { + "epoch": 28.354223433242506, + "grad_norm": 8.485020637512207, + "learning_rate": 1.6813716981676612e-05, + "loss": 0.5384, + "step": 10406 + }, + { + "epoch": 28.356948228882835, + "grad_norm": 7.360891819000244, + "learning_rate": 1.681307102416422e-05, + "loss": 0.4211, + "step": 10407 + }, + { + "epoch": 28.35967302452316, + "grad_norm": 8.2415771484375, + "learning_rate": 1.681242501359185e-05, + "loss": 0.4482, + "step": 10408 + }, + { + "epoch": 28.362397820163487, + "grad_norm": 7.84987735748291, + "learning_rate": 1.681177894996453e-05, + "loss": 0.5217, + "step": 10409 + }, + { + "epoch": 28.365122615803816, + "grad_norm": 11.041234970092773, + "learning_rate": 1.6811132833287296e-05, + "loss": 0.5422, + "step": 10410 + }, + { + "epoch": 28.367847411444142, + "grad_norm": 9.216878890991211, + "learning_rate": 1.6810486663565183e-05, + "loss": 0.4366, + "step": 10411 + }, + { + "epoch": 28.370572207084468, + "grad_norm": 8.009267807006836, + "learning_rate": 1.680984044080322e-05, + "loss": 0.6246, + "step": 10412 + }, + { + "epoch": 28.373297002724797, + "grad_norm": 8.616374969482422, + "learning_rate": 1.680919416500643e-05, + "loss": 0.4103, + "step": 10413 + }, + { + "epoch": 28.376021798365123, + "grad_norm": 8.781277656555176, + "learning_rate": 1.6808547836179862e-05, + "loss": 0.5015, + "step": 10414 + }, + { + "epoch": 28.37874659400545, + "grad_norm": 7.765417098999023, + "learning_rate": 1.680790145432854e-05, + "loss": 0.5505, + "step": 10415 + }, + { + "epoch": 28.381471389645778, + "grad_norm": 6.382985591888428, + "learning_rate": 1.6807255019457503e-05, + "loss": 0.3701, + "step": 10416 + }, + { + "epoch": 28.384196185286104, + "grad_norm": 8.345076560974121, + "learning_rate": 1.680660853157178e-05, + "loss": 0.5445, + "step": 10417 + }, + { + "epoch": 28.38692098092643, + "grad_norm": 6.24092960357666, + "learning_rate": 1.680596199067641e-05, + "loss": 0.5378, + "step": 10418 + }, + { + "epoch": 28.38964577656676, + "grad_norm": 8.847549438476562, + "learning_rate": 1.6805315396776427e-05, + "loss": 0.5143, + "step": 10419 + }, + { + "epoch": 28.392370572207085, + "grad_norm": 8.919387817382812, + "learning_rate": 1.6804668749876867e-05, + "loss": 0.5549, + "step": 10420 + }, + { + "epoch": 28.39509536784741, + "grad_norm": 8.392271995544434, + "learning_rate": 1.6804022049982768e-05, + "loss": 0.5368, + "step": 10421 + }, + { + "epoch": 28.39782016348774, + "grad_norm": 8.466325759887695, + "learning_rate": 1.6803375297099162e-05, + "loss": 0.4869, + "step": 10422 + }, + { + "epoch": 28.400544959128066, + "grad_norm": 7.85569953918457, + "learning_rate": 1.6802728491231083e-05, + "loss": 0.407, + "step": 10423 + }, + { + "epoch": 28.40326975476839, + "grad_norm": 9.220958709716797, + "learning_rate": 1.680208163238358e-05, + "loss": 0.4977, + "step": 10424 + }, + { + "epoch": 28.40599455040872, + "grad_norm": 7.3440141677856445, + "learning_rate": 1.6801434720561683e-05, + "loss": 0.576, + "step": 10425 + }, + { + "epoch": 28.408719346049047, + "grad_norm": 6.604451656341553, + "learning_rate": 1.680078775577043e-05, + "loss": 0.481, + "step": 10426 + }, + { + "epoch": 28.411444141689373, + "grad_norm": 6.42094612121582, + "learning_rate": 1.680014073801486e-05, + "loss": 0.4882, + "step": 10427 + }, + { + "epoch": 28.414168937329702, + "grad_norm": 8.168827056884766, + "learning_rate": 1.6799493667300018e-05, + "loss": 0.4686, + "step": 10428 + }, + { + "epoch": 28.416893732970028, + "grad_norm": 7.647387504577637, + "learning_rate": 1.6798846543630934e-05, + "loss": 0.47, + "step": 10429 + }, + { + "epoch": 28.419618528610354, + "grad_norm": 8.366386413574219, + "learning_rate": 1.6798199367012652e-05, + "loss": 0.4745, + "step": 10430 + }, + { + "epoch": 28.422343324250683, + "grad_norm": 8.590060234069824, + "learning_rate": 1.6797552137450214e-05, + "loss": 0.514, + "step": 10431 + }, + { + "epoch": 28.42506811989101, + "grad_norm": 6.036066055297852, + "learning_rate": 1.6796904854948656e-05, + "loss": 0.4146, + "step": 10432 + }, + { + "epoch": 28.427792915531334, + "grad_norm": 8.050939559936523, + "learning_rate": 1.6796257519513024e-05, + "loss": 0.457, + "step": 10433 + }, + { + "epoch": 28.430517711171664, + "grad_norm": 11.273110389709473, + "learning_rate": 1.6795610131148357e-05, + "loss": 0.663, + "step": 10434 + }, + { + "epoch": 28.43324250681199, + "grad_norm": 7.349226951599121, + "learning_rate": 1.6794962689859696e-05, + "loss": 0.5003, + "step": 10435 + }, + { + "epoch": 28.435967302452315, + "grad_norm": 7.010150909423828, + "learning_rate": 1.6794315195652085e-05, + "loss": 0.4498, + "step": 10436 + }, + { + "epoch": 28.438692098092645, + "grad_norm": 8.3838529586792, + "learning_rate": 1.6793667648530567e-05, + "loss": 0.5936, + "step": 10437 + }, + { + "epoch": 28.44141689373297, + "grad_norm": 25.742835998535156, + "learning_rate": 1.6793020048500183e-05, + "loss": 0.4208, + "step": 10438 + }, + { + "epoch": 28.444141689373296, + "grad_norm": 7.778672218322754, + "learning_rate": 1.6792372395565978e-05, + "loss": 0.7396, + "step": 10439 + }, + { + "epoch": 28.446866485013626, + "grad_norm": 7.268556594848633, + "learning_rate": 1.6791724689732992e-05, + "loss": 0.6994, + "step": 10440 + }, + { + "epoch": 28.44959128065395, + "grad_norm": 8.157234191894531, + "learning_rate": 1.6791076931006276e-05, + "loss": 0.4328, + "step": 10441 + }, + { + "epoch": 28.452316076294277, + "grad_norm": 7.949583530426025, + "learning_rate": 1.679042911939087e-05, + "loss": 0.3544, + "step": 10442 + }, + { + "epoch": 28.455040871934607, + "grad_norm": 6.344139575958252, + "learning_rate": 1.6789781254891822e-05, + "loss": 0.4261, + "step": 10443 + }, + { + "epoch": 28.457765667574932, + "grad_norm": 13.322134017944336, + "learning_rate": 1.6789133337514178e-05, + "loss": 0.562, + "step": 10444 + }, + { + "epoch": 28.460490463215258, + "grad_norm": 7.682892322540283, + "learning_rate": 1.6788485367262975e-05, + "loss": 0.6436, + "step": 10445 + }, + { + "epoch": 28.463215258855588, + "grad_norm": 10.428749084472656, + "learning_rate": 1.6787837344143273e-05, + "loss": 0.6119, + "step": 10446 + }, + { + "epoch": 28.465940054495913, + "grad_norm": 11.043083190917969, + "learning_rate": 1.678718926816011e-05, + "loss": 0.5913, + "step": 10447 + }, + { + "epoch": 28.46866485013624, + "grad_norm": 8.230341911315918, + "learning_rate": 1.6786541139318537e-05, + "loss": 0.4512, + "step": 10448 + }, + { + "epoch": 28.47138964577657, + "grad_norm": 7.745244026184082, + "learning_rate": 1.6785892957623598e-05, + "loss": 0.5378, + "step": 10449 + }, + { + "epoch": 28.474114441416894, + "grad_norm": 18.82840347290039, + "learning_rate": 1.678524472308034e-05, + "loss": 0.4413, + "step": 10450 + }, + { + "epoch": 28.47683923705722, + "grad_norm": 6.365556240081787, + "learning_rate": 1.678459643569382e-05, + "loss": 0.5273, + "step": 10451 + }, + { + "epoch": 28.479564032697546, + "grad_norm": 5.9933037757873535, + "learning_rate": 1.6783948095469082e-05, + "loss": 0.3474, + "step": 10452 + }, + { + "epoch": 28.482288828337875, + "grad_norm": 9.864625930786133, + "learning_rate": 1.678329970241117e-05, + "loss": 0.4769, + "step": 10453 + }, + { + "epoch": 28.4850136239782, + "grad_norm": 7.456377029418945, + "learning_rate": 1.678265125652514e-05, + "loss": 0.5831, + "step": 10454 + }, + { + "epoch": 28.48773841961853, + "grad_norm": 8.414080619812012, + "learning_rate": 1.6782002757816043e-05, + "loss": 0.5112, + "step": 10455 + }, + { + "epoch": 28.490463215258856, + "grad_norm": 14.215851783752441, + "learning_rate": 1.6781354206288924e-05, + "loss": 0.5678, + "step": 10456 + }, + { + "epoch": 28.493188010899182, + "grad_norm": 8.581607818603516, + "learning_rate": 1.6780705601948833e-05, + "loss": 0.4189, + "step": 10457 + }, + { + "epoch": 28.495912806539508, + "grad_norm": 10.440707206726074, + "learning_rate": 1.6780056944800833e-05, + "loss": 0.4722, + "step": 10458 + }, + { + "epoch": 28.498637602179837, + "grad_norm": 8.628376960754395, + "learning_rate": 1.6779408234849964e-05, + "loss": 0.4987, + "step": 10459 + }, + { + "epoch": 28.501362397820163, + "grad_norm": 9.071776390075684, + "learning_rate": 1.677875947210128e-05, + "loss": 0.5309, + "step": 10460 + }, + { + "epoch": 28.504087193460492, + "grad_norm": 52.496681213378906, + "learning_rate": 1.6778110656559837e-05, + "loss": 0.4279, + "step": 10461 + }, + { + "epoch": 28.506811989100818, + "grad_norm": 9.852365493774414, + "learning_rate": 1.677746178823069e-05, + "loss": 0.5231, + "step": 10462 + }, + { + "epoch": 28.509536784741144, + "grad_norm": 7.248706340789795, + "learning_rate": 1.6776812867118885e-05, + "loss": 0.5611, + "step": 10463 + }, + { + "epoch": 28.51226158038147, + "grad_norm": 12.963179588317871, + "learning_rate": 1.6776163893229476e-05, + "loss": 0.4556, + "step": 10464 + }, + { + "epoch": 28.5149863760218, + "grad_norm": 8.917076110839844, + "learning_rate": 1.6775514866567527e-05, + "loss": 0.6695, + "step": 10465 + }, + { + "epoch": 28.517711171662125, + "grad_norm": 10.566930770874023, + "learning_rate": 1.677486578713808e-05, + "loss": 0.4056, + "step": 10466 + }, + { + "epoch": 28.520435967302454, + "grad_norm": 9.388032913208008, + "learning_rate": 1.6774216654946203e-05, + "loss": 0.4838, + "step": 10467 + }, + { + "epoch": 28.52316076294278, + "grad_norm": 16.75680160522461, + "learning_rate": 1.677356746999694e-05, + "loss": 0.5612, + "step": 10468 + }, + { + "epoch": 28.525885558583106, + "grad_norm": 8.811739921569824, + "learning_rate": 1.6772918232295353e-05, + "loss": 0.4979, + "step": 10469 + }, + { + "epoch": 28.52861035422343, + "grad_norm": 13.264880180358887, + "learning_rate": 1.6772268941846496e-05, + "loss": 0.4393, + "step": 10470 + }, + { + "epoch": 28.53133514986376, + "grad_norm": 7.859387397766113, + "learning_rate": 1.6771619598655432e-05, + "loss": 0.4305, + "step": 10471 + }, + { + "epoch": 28.534059945504087, + "grad_norm": 7.618261814117432, + "learning_rate": 1.6770970202727206e-05, + "loss": 0.6329, + "step": 10472 + }, + { + "epoch": 28.536784741144416, + "grad_norm": 9.38042163848877, + "learning_rate": 1.6770320754066886e-05, + "loss": 0.6401, + "step": 10473 + }, + { + "epoch": 28.539509536784742, + "grad_norm": 9.186793327331543, + "learning_rate": 1.676967125267952e-05, + "loss": 0.4864, + "step": 10474 + }, + { + "epoch": 28.542234332425068, + "grad_norm": 8.843674659729004, + "learning_rate": 1.6769021698570178e-05, + "loss": 0.5904, + "step": 10475 + }, + { + "epoch": 28.544959128065393, + "grad_norm": 8.38227367401123, + "learning_rate": 1.676837209174391e-05, + "loss": 0.4263, + "step": 10476 + }, + { + "epoch": 28.547683923705723, + "grad_norm": 7.939977169036865, + "learning_rate": 1.676772243220578e-05, + "loss": 0.5242, + "step": 10477 + }, + { + "epoch": 28.55040871934605, + "grad_norm": 15.47470760345459, + "learning_rate": 1.6767072719960845e-05, + "loss": 0.5037, + "step": 10478 + }, + { + "epoch": 28.553133514986374, + "grad_norm": 9.203507423400879, + "learning_rate": 1.6766422955014164e-05, + "loss": 0.467, + "step": 10479 + }, + { + "epoch": 28.555858310626704, + "grad_norm": 7.513101577758789, + "learning_rate": 1.67657731373708e-05, + "loss": 0.6239, + "step": 10480 + }, + { + "epoch": 28.55858310626703, + "grad_norm": 12.132689476013184, + "learning_rate": 1.6765123267035813e-05, + "loss": 0.6172, + "step": 10481 + }, + { + "epoch": 28.561307901907355, + "grad_norm": 8.619035720825195, + "learning_rate": 1.6764473344014264e-05, + "loss": 0.4727, + "step": 10482 + }, + { + "epoch": 28.564032697547685, + "grad_norm": 7.933316230773926, + "learning_rate": 1.6763823368311213e-05, + "loss": 0.4595, + "step": 10483 + }, + { + "epoch": 28.56675749318801, + "grad_norm": 9.0542573928833, + "learning_rate": 1.6763173339931718e-05, + "loss": 0.3766, + "step": 10484 + }, + { + "epoch": 28.569482288828336, + "grad_norm": 12.085680961608887, + "learning_rate": 1.6762523258880855e-05, + "loss": 0.4951, + "step": 10485 + }, + { + "epoch": 28.572207084468666, + "grad_norm": 8.230812072753906, + "learning_rate": 1.6761873125163676e-05, + "loss": 0.4879, + "step": 10486 + }, + { + "epoch": 28.57493188010899, + "grad_norm": 13.951199531555176, + "learning_rate": 1.6761222938785245e-05, + "loss": 0.3983, + "step": 10487 + }, + { + "epoch": 28.577656675749317, + "grad_norm": 8.826639175415039, + "learning_rate": 1.676057269975063e-05, + "loss": 0.5461, + "step": 10488 + }, + { + "epoch": 28.580381471389646, + "grad_norm": 10.449169158935547, + "learning_rate": 1.675992240806489e-05, + "loss": 0.4296, + "step": 10489 + }, + { + "epoch": 28.583106267029972, + "grad_norm": 6.757328510284424, + "learning_rate": 1.6759272063733094e-05, + "loss": 0.549, + "step": 10490 + }, + { + "epoch": 28.585831062670298, + "grad_norm": 9.143452644348145, + "learning_rate": 1.6758621666760304e-05, + "loss": 0.4813, + "step": 10491 + }, + { + "epoch": 28.588555858310627, + "grad_norm": 36.08699417114258, + "learning_rate": 1.675797121715159e-05, + "loss": 0.4719, + "step": 10492 + }, + { + "epoch": 28.591280653950953, + "grad_norm": 12.879393577575684, + "learning_rate": 1.6757320714912007e-05, + "loss": 0.4965, + "step": 10493 + }, + { + "epoch": 28.59400544959128, + "grad_norm": 8.112102508544922, + "learning_rate": 1.6756670160046628e-05, + "loss": 0.4584, + "step": 10494 + }, + { + "epoch": 28.59673024523161, + "grad_norm": 6.9734392166137695, + "learning_rate": 1.6756019552560522e-05, + "loss": 0.5682, + "step": 10495 + }, + { + "epoch": 28.599455040871934, + "grad_norm": 7.311095714569092, + "learning_rate": 1.6755368892458753e-05, + "loss": 0.5016, + "step": 10496 + }, + { + "epoch": 28.60217983651226, + "grad_norm": 8.643707275390625, + "learning_rate": 1.675471817974639e-05, + "loss": 0.6283, + "step": 10497 + }, + { + "epoch": 28.60490463215259, + "grad_norm": 7.092410564422607, + "learning_rate": 1.6754067414428497e-05, + "loss": 0.6003, + "step": 10498 + }, + { + "epoch": 28.607629427792915, + "grad_norm": 9.788068771362305, + "learning_rate": 1.6753416596510144e-05, + "loss": 0.45, + "step": 10499 + }, + { + "epoch": 28.61035422343324, + "grad_norm": 9.50992488861084, + "learning_rate": 1.6752765725996402e-05, + "loss": 0.5356, + "step": 10500 + }, + { + "epoch": 28.61307901907357, + "grad_norm": 7.4705281257629395, + "learning_rate": 1.6752114802892332e-05, + "loss": 0.5111, + "step": 10501 + }, + { + "epoch": 28.615803814713896, + "grad_norm": 12.41318416595459, + "learning_rate": 1.6751463827203018e-05, + "loss": 0.4525, + "step": 10502 + }, + { + "epoch": 28.618528610354222, + "grad_norm": 10.357723236083984, + "learning_rate": 1.6750812798933512e-05, + "loss": 0.6619, + "step": 10503 + }, + { + "epoch": 28.62125340599455, + "grad_norm": 8.30016803741455, + "learning_rate": 1.6750161718088902e-05, + "loss": 0.4381, + "step": 10504 + }, + { + "epoch": 28.623978201634877, + "grad_norm": 9.020997047424316, + "learning_rate": 1.6749510584674243e-05, + "loss": 0.4266, + "step": 10505 + }, + { + "epoch": 28.626702997275203, + "grad_norm": 7.495340347290039, + "learning_rate": 1.6748859398694616e-05, + "loss": 0.3745, + "step": 10506 + }, + { + "epoch": 28.629427792915532, + "grad_norm": 11.160477638244629, + "learning_rate": 1.674820816015509e-05, + "loss": 0.4176, + "step": 10507 + }, + { + "epoch": 28.632152588555858, + "grad_norm": 9.42709732055664, + "learning_rate": 1.6747556869060735e-05, + "loss": 0.5268, + "step": 10508 + }, + { + "epoch": 28.634877384196184, + "grad_norm": 7.919163227081299, + "learning_rate": 1.6746905525416625e-05, + "loss": 0.39, + "step": 10509 + }, + { + "epoch": 28.637602179836513, + "grad_norm": 10.078733444213867, + "learning_rate": 1.674625412922783e-05, + "loss": 0.5568, + "step": 10510 + }, + { + "epoch": 28.64032697547684, + "grad_norm": 9.338096618652344, + "learning_rate": 1.6745602680499426e-05, + "loss": 0.5707, + "step": 10511 + }, + { + "epoch": 28.643051771117165, + "grad_norm": 8.589585304260254, + "learning_rate": 1.6744951179236487e-05, + "loss": 0.5765, + "step": 10512 + }, + { + "epoch": 28.645776566757494, + "grad_norm": 8.227743148803711, + "learning_rate": 1.6744299625444082e-05, + "loss": 0.4916, + "step": 10513 + }, + { + "epoch": 28.64850136239782, + "grad_norm": 12.171733856201172, + "learning_rate": 1.674364801912729e-05, + "loss": 0.5273, + "step": 10514 + }, + { + "epoch": 28.651226158038146, + "grad_norm": 8.201462745666504, + "learning_rate": 1.6742996360291184e-05, + "loss": 0.5538, + "step": 10515 + }, + { + "epoch": 28.653950953678475, + "grad_norm": 7.957534313201904, + "learning_rate": 1.674234464894084e-05, + "loss": 0.4372, + "step": 10516 + }, + { + "epoch": 28.6566757493188, + "grad_norm": 11.711692810058594, + "learning_rate": 1.6741692885081333e-05, + "loss": 0.535, + "step": 10517 + }, + { + "epoch": 28.659400544959126, + "grad_norm": 7.344912052154541, + "learning_rate": 1.6741041068717737e-05, + "loss": 0.578, + "step": 10518 + }, + { + "epoch": 28.662125340599456, + "grad_norm": 17.266468048095703, + "learning_rate": 1.674038919985513e-05, + "loss": 0.4063, + "step": 10519 + }, + { + "epoch": 28.66485013623978, + "grad_norm": 7.3692626953125, + "learning_rate": 1.6739737278498595e-05, + "loss": 0.5085, + "step": 10520 + }, + { + "epoch": 28.667574931880107, + "grad_norm": 8.309320449829102, + "learning_rate": 1.6739085304653197e-05, + "loss": 0.4993, + "step": 10521 + }, + { + "epoch": 28.670299727520437, + "grad_norm": 9.00151538848877, + "learning_rate": 1.673843327832402e-05, + "loss": 0.5508, + "step": 10522 + }, + { + "epoch": 28.673024523160763, + "grad_norm": 7.283410549163818, + "learning_rate": 1.6737781199516143e-05, + "loss": 0.481, + "step": 10523 + }, + { + "epoch": 28.67574931880109, + "grad_norm": 9.720575332641602, + "learning_rate": 1.6737129068234642e-05, + "loss": 0.5471, + "step": 10524 + }, + { + "epoch": 28.678474114441418, + "grad_norm": 7.802993297576904, + "learning_rate": 1.67364768844846e-05, + "loss": 0.6346, + "step": 10525 + }, + { + "epoch": 28.681198910081743, + "grad_norm": 9.069677352905273, + "learning_rate": 1.6735824648271085e-05, + "loss": 0.442, + "step": 10526 + }, + { + "epoch": 28.68392370572207, + "grad_norm": 12.54915714263916, + "learning_rate": 1.6735172359599193e-05, + "loss": 0.7076, + "step": 10527 + }, + { + "epoch": 28.6866485013624, + "grad_norm": 7.4631853103637695, + "learning_rate": 1.673452001847399e-05, + "loss": 0.5363, + "step": 10528 + }, + { + "epoch": 28.689373297002724, + "grad_norm": 7.945371627807617, + "learning_rate": 1.6733867624900565e-05, + "loss": 0.5799, + "step": 10529 + }, + { + "epoch": 28.69209809264305, + "grad_norm": 8.726821899414062, + "learning_rate": 1.6733215178883996e-05, + "loss": 0.4099, + "step": 10530 + }, + { + "epoch": 28.69482288828338, + "grad_norm": 7.770522594451904, + "learning_rate": 1.6732562680429358e-05, + "loss": 0.4289, + "step": 10531 + }, + { + "epoch": 28.697547683923705, + "grad_norm": 7.258590221405029, + "learning_rate": 1.6731910129541745e-05, + "loss": 0.5604, + "step": 10532 + }, + { + "epoch": 28.70027247956403, + "grad_norm": 7.198451995849609, + "learning_rate": 1.673125752622623e-05, + "loss": 0.5089, + "step": 10533 + }, + { + "epoch": 28.70299727520436, + "grad_norm": 7.6721882820129395, + "learning_rate": 1.67306048704879e-05, + "loss": 0.4549, + "step": 10534 + }, + { + "epoch": 28.705722070844686, + "grad_norm": 9.911489486694336, + "learning_rate": 1.672995216233183e-05, + "loss": 0.5649, + "step": 10535 + }, + { + "epoch": 28.708446866485012, + "grad_norm": 8.163591384887695, + "learning_rate": 1.6729299401763116e-05, + "loss": 0.4192, + "step": 10536 + }, + { + "epoch": 28.71117166212534, + "grad_norm": 8.404854774475098, + "learning_rate": 1.672864658878683e-05, + "loss": 0.4542, + "step": 10537 + }, + { + "epoch": 28.713896457765667, + "grad_norm": 8.87028694152832, + "learning_rate": 1.6727993723408066e-05, + "loss": 0.4514, + "step": 10538 + }, + { + "epoch": 28.716621253405993, + "grad_norm": 10.431681632995605, + "learning_rate": 1.67273408056319e-05, + "loss": 0.4138, + "step": 10539 + }, + { + "epoch": 28.719346049046322, + "grad_norm": 8.951879501342773, + "learning_rate": 1.672668783546342e-05, + "loss": 0.5924, + "step": 10540 + }, + { + "epoch": 28.722070844686648, + "grad_norm": 14.982688903808594, + "learning_rate": 1.6726034812907713e-05, + "loss": 0.4955, + "step": 10541 + }, + { + "epoch": 28.724795640326974, + "grad_norm": 12.39867115020752, + "learning_rate": 1.672538173796986e-05, + "loss": 0.5046, + "step": 10542 + }, + { + "epoch": 28.727520435967303, + "grad_norm": 8.843228340148926, + "learning_rate": 1.6724728610654955e-05, + "loss": 0.4193, + "step": 10543 + }, + { + "epoch": 28.73024523160763, + "grad_norm": 8.99812126159668, + "learning_rate": 1.672407543096808e-05, + "loss": 0.4847, + "step": 10544 + }, + { + "epoch": 28.732970027247955, + "grad_norm": 7.509914398193359, + "learning_rate": 1.6723422198914317e-05, + "loss": 0.448, + "step": 10545 + }, + { + "epoch": 28.735694822888284, + "grad_norm": 7.077925682067871, + "learning_rate": 1.6722768914498763e-05, + "loss": 0.3459, + "step": 10546 + }, + { + "epoch": 28.73841961852861, + "grad_norm": 13.859886169433594, + "learning_rate": 1.6722115577726497e-05, + "loss": 0.6188, + "step": 10547 + }, + { + "epoch": 28.741144414168936, + "grad_norm": 8.113566398620605, + "learning_rate": 1.6721462188602618e-05, + "loss": 0.4128, + "step": 10548 + }, + { + "epoch": 28.743869209809265, + "grad_norm": 7.334417819976807, + "learning_rate": 1.6720808747132204e-05, + "loss": 0.3771, + "step": 10549 + }, + { + "epoch": 28.74659400544959, + "grad_norm": 7.81968879699707, + "learning_rate": 1.6720155253320348e-05, + "loss": 0.4758, + "step": 10550 + }, + { + "epoch": 28.749318801089917, + "grad_norm": 7.863037586212158, + "learning_rate": 1.6719501707172135e-05, + "loss": 0.3486, + "step": 10551 + }, + { + "epoch": 28.752043596730246, + "grad_norm": 7.974241256713867, + "learning_rate": 1.6718848108692665e-05, + "loss": 0.5805, + "step": 10552 + }, + { + "epoch": 28.754768392370572, + "grad_norm": 14.860568046569824, + "learning_rate": 1.671819445788702e-05, + "loss": 0.562, + "step": 10553 + }, + { + "epoch": 28.757493188010898, + "grad_norm": 7.626082420349121, + "learning_rate": 1.671754075476029e-05, + "loss": 0.6777, + "step": 10554 + }, + { + "epoch": 28.760217983651227, + "grad_norm": 8.53664779663086, + "learning_rate": 1.6716886999317573e-05, + "loss": 0.4551, + "step": 10555 + }, + { + "epoch": 28.762942779291553, + "grad_norm": 8.117570877075195, + "learning_rate": 1.6716233191563956e-05, + "loss": 0.4374, + "step": 10556 + }, + { + "epoch": 28.76566757493188, + "grad_norm": 9.303681373596191, + "learning_rate": 1.671557933150453e-05, + "loss": 0.5538, + "step": 10557 + }, + { + "epoch": 28.768392370572208, + "grad_norm": 10.377424240112305, + "learning_rate": 1.6714925419144384e-05, + "loss": 0.5431, + "step": 10558 + }, + { + "epoch": 28.771117166212534, + "grad_norm": 10.983673095703125, + "learning_rate": 1.671427145448862e-05, + "loss": 0.4244, + "step": 10559 + }, + { + "epoch": 28.77384196185286, + "grad_norm": 8.11573314666748, + "learning_rate": 1.6713617437542328e-05, + "loss": 0.3999, + "step": 10560 + }, + { + "epoch": 28.77656675749319, + "grad_norm": 18.627511978149414, + "learning_rate": 1.6712963368310596e-05, + "loss": 0.6816, + "step": 10561 + }, + { + "epoch": 28.779291553133515, + "grad_norm": 7.47135591506958, + "learning_rate": 1.671230924679852e-05, + "loss": 0.6332, + "step": 10562 + }, + { + "epoch": 28.78201634877384, + "grad_norm": 8.145977973937988, + "learning_rate": 1.6711655073011196e-05, + "loss": 0.5015, + "step": 10563 + }, + { + "epoch": 28.78474114441417, + "grad_norm": 7.705799102783203, + "learning_rate": 1.6711000846953722e-05, + "loss": 0.5104, + "step": 10564 + }, + { + "epoch": 28.787465940054496, + "grad_norm": 6.46087121963501, + "learning_rate": 1.671034656863119e-05, + "loss": 0.6451, + "step": 10565 + }, + { + "epoch": 28.79019073569482, + "grad_norm": 7.06374454498291, + "learning_rate": 1.6709692238048688e-05, + "loss": 0.4239, + "step": 10566 + }, + { + "epoch": 28.79291553133515, + "grad_norm": 20.436994552612305, + "learning_rate": 1.670903785521132e-05, + "loss": 0.5519, + "step": 10567 + }, + { + "epoch": 28.795640326975477, + "grad_norm": 8.40551471710205, + "learning_rate": 1.670838342012419e-05, + "loss": 0.4232, + "step": 10568 + }, + { + "epoch": 28.798365122615802, + "grad_norm": 7.828116416931152, + "learning_rate": 1.6707728932792376e-05, + "loss": 0.5026, + "step": 10569 + }, + { + "epoch": 28.80108991825613, + "grad_norm": 8.556410789489746, + "learning_rate": 1.670707439322099e-05, + "loss": 0.499, + "step": 10570 + }, + { + "epoch": 28.803814713896458, + "grad_norm": 7.418813228607178, + "learning_rate": 1.6706419801415122e-05, + "loss": 0.5561, + "step": 10571 + }, + { + "epoch": 28.806539509536783, + "grad_norm": 9.093198776245117, + "learning_rate": 1.6705765157379876e-05, + "loss": 0.4318, + "step": 10572 + }, + { + "epoch": 28.809264305177113, + "grad_norm": 6.8813252449035645, + "learning_rate": 1.6705110461120343e-05, + "loss": 0.5348, + "step": 10573 + }, + { + "epoch": 28.81198910081744, + "grad_norm": 9.664884567260742, + "learning_rate": 1.670445571264163e-05, + "loss": 0.5199, + "step": 10574 + }, + { + "epoch": 28.814713896457764, + "grad_norm": 6.698128700256348, + "learning_rate": 1.6703800911948825e-05, + "loss": 0.5584, + "step": 10575 + }, + { + "epoch": 28.817438692098094, + "grad_norm": 8.184273719787598, + "learning_rate": 1.6703146059047038e-05, + "loss": 0.5055, + "step": 10576 + }, + { + "epoch": 28.82016348773842, + "grad_norm": 10.05097484588623, + "learning_rate": 1.6702491153941367e-05, + "loss": 0.5341, + "step": 10577 + }, + { + "epoch": 28.822888283378745, + "grad_norm": 7.727924346923828, + "learning_rate": 1.6701836196636908e-05, + "loss": 0.5427, + "step": 10578 + }, + { + "epoch": 28.825613079019075, + "grad_norm": 7.529411792755127, + "learning_rate": 1.6701181187138767e-05, + "loss": 0.5878, + "step": 10579 + }, + { + "epoch": 28.8283378746594, + "grad_norm": 7.188710689544678, + "learning_rate": 1.670052612545204e-05, + "loss": 0.4862, + "step": 10580 + }, + { + "epoch": 28.831062670299726, + "grad_norm": 12.786149978637695, + "learning_rate": 1.669987101158183e-05, + "loss": 0.5767, + "step": 10581 + }, + { + "epoch": 28.833787465940055, + "grad_norm": 10.405355453491211, + "learning_rate": 1.6699215845533244e-05, + "loss": 0.4841, + "step": 10582 + }, + { + "epoch": 28.83651226158038, + "grad_norm": 7.407323360443115, + "learning_rate": 1.6698560627311378e-05, + "loss": 0.4706, + "step": 10583 + }, + { + "epoch": 28.839237057220707, + "grad_norm": 8.080324172973633, + "learning_rate": 1.669790535692134e-05, + "loss": 0.5331, + "step": 10584 + }, + { + "epoch": 28.841961852861036, + "grad_norm": 11.468756675720215, + "learning_rate": 1.6697250034368226e-05, + "loss": 0.4819, + "step": 10585 + }, + { + "epoch": 28.844686648501362, + "grad_norm": 7.990210056304932, + "learning_rate": 1.669659465965715e-05, + "loss": 0.5371, + "step": 10586 + }, + { + "epoch": 28.847411444141688, + "grad_norm": 8.95950698852539, + "learning_rate": 1.6695939232793206e-05, + "loss": 0.5915, + "step": 10587 + }, + { + "epoch": 28.850136239782017, + "grad_norm": 8.210714340209961, + "learning_rate": 1.66952837537815e-05, + "loss": 0.5724, + "step": 10588 + }, + { + "epoch": 28.852861035422343, + "grad_norm": 10.971351623535156, + "learning_rate": 1.6694628222627148e-05, + "loss": 0.5953, + "step": 10589 + }, + { + "epoch": 28.85558583106267, + "grad_norm": 7.6229448318481445, + "learning_rate": 1.669397263933524e-05, + "loss": 0.5294, + "step": 10590 + }, + { + "epoch": 28.858310626703, + "grad_norm": 8.125885963439941, + "learning_rate": 1.6693317003910895e-05, + "loss": 0.635, + "step": 10591 + }, + { + "epoch": 28.861035422343324, + "grad_norm": 8.368759155273438, + "learning_rate": 1.6692661316359206e-05, + "loss": 0.5388, + "step": 10592 + }, + { + "epoch": 28.86376021798365, + "grad_norm": 8.914116859436035, + "learning_rate": 1.6692005576685288e-05, + "loss": 0.4432, + "step": 10593 + }, + { + "epoch": 28.86648501362398, + "grad_norm": 9.29539966583252, + "learning_rate": 1.669134978489425e-05, + "loss": 0.589, + "step": 10594 + }, + { + "epoch": 28.869209809264305, + "grad_norm": 11.241096496582031, + "learning_rate": 1.669069394099119e-05, + "loss": 0.5644, + "step": 10595 + }, + { + "epoch": 28.87193460490463, + "grad_norm": 7.38763427734375, + "learning_rate": 1.6690038044981222e-05, + "loss": 0.5002, + "step": 10596 + }, + { + "epoch": 28.87465940054496, + "grad_norm": 7.305187225341797, + "learning_rate": 1.6689382096869457e-05, + "loss": 0.4514, + "step": 10597 + }, + { + "epoch": 28.877384196185286, + "grad_norm": 9.493101119995117, + "learning_rate": 1.6688726096660994e-05, + "loss": 0.4852, + "step": 10598 + }, + { + "epoch": 28.88010899182561, + "grad_norm": 8.345754623413086, + "learning_rate": 1.668807004436095e-05, + "loss": 0.4807, + "step": 10599 + }, + { + "epoch": 28.88283378746594, + "grad_norm": 8.172216415405273, + "learning_rate": 1.668741393997443e-05, + "loss": 0.7126, + "step": 10600 + }, + { + "epoch": 28.885558583106267, + "grad_norm": 8.099128723144531, + "learning_rate": 1.668675778350655e-05, + "loss": 0.4258, + "step": 10601 + }, + { + "epoch": 28.888283378746593, + "grad_norm": 8.967839241027832, + "learning_rate": 1.6686101574962413e-05, + "loss": 0.4801, + "step": 10602 + }, + { + "epoch": 28.891008174386922, + "grad_norm": 8.110413551330566, + "learning_rate": 1.668544531434713e-05, + "loss": 0.5353, + "step": 10603 + }, + { + "epoch": 28.893732970027248, + "grad_norm": 8.122382164001465, + "learning_rate": 1.668478900166582e-05, + "loss": 0.597, + "step": 10604 + }, + { + "epoch": 28.896457765667574, + "grad_norm": 8.046221733093262, + "learning_rate": 1.668413263692358e-05, + "loss": 0.5664, + "step": 10605 + }, + { + "epoch": 28.899182561307903, + "grad_norm": 6.769096851348877, + "learning_rate": 1.6683476220125535e-05, + "loss": 0.4942, + "step": 10606 + }, + { + "epoch": 28.90190735694823, + "grad_norm": 7.824985504150391, + "learning_rate": 1.668281975127679e-05, + "loss": 0.5683, + "step": 10607 + }, + { + "epoch": 28.904632152588555, + "grad_norm": 9.089848518371582, + "learning_rate": 1.6682163230382465e-05, + "loss": 0.5217, + "step": 10608 + }, + { + "epoch": 28.907356948228884, + "grad_norm": 8.377856254577637, + "learning_rate": 1.6681506657447664e-05, + "loss": 0.4709, + "step": 10609 + }, + { + "epoch": 28.91008174386921, + "grad_norm": 7.7487382888793945, + "learning_rate": 1.6680850032477504e-05, + "loss": 0.4902, + "step": 10610 + }, + { + "epoch": 28.912806539509535, + "grad_norm": 6.764167308807373, + "learning_rate": 1.66801933554771e-05, + "loss": 0.4218, + "step": 10611 + }, + { + "epoch": 28.915531335149865, + "grad_norm": 7.561228275299072, + "learning_rate": 1.6679536626451565e-05, + "loss": 0.4656, + "step": 10612 + }, + { + "epoch": 28.91825613079019, + "grad_norm": 7.498943328857422, + "learning_rate": 1.6678879845406014e-05, + "loss": 0.5511, + "step": 10613 + }, + { + "epoch": 28.920980926430516, + "grad_norm": 7.2002153396606445, + "learning_rate": 1.667822301234556e-05, + "loss": 0.3559, + "step": 10614 + }, + { + "epoch": 28.923705722070846, + "grad_norm": 9.295483589172363, + "learning_rate": 1.667756612727532e-05, + "loss": 0.661, + "step": 10615 + }, + { + "epoch": 28.92643051771117, + "grad_norm": 9.446654319763184, + "learning_rate": 1.6676909190200416e-05, + "loss": 0.428, + "step": 10616 + }, + { + "epoch": 28.929155313351497, + "grad_norm": 8.02613353729248, + "learning_rate": 1.667625220112595e-05, + "loss": 0.5871, + "step": 10617 + }, + { + "epoch": 28.931880108991827, + "grad_norm": 7.79987096786499, + "learning_rate": 1.6675595160057053e-05, + "loss": 0.592, + "step": 10618 + }, + { + "epoch": 28.934604904632153, + "grad_norm": 7.361390590667725, + "learning_rate": 1.667493806699883e-05, + "loss": 0.6436, + "step": 10619 + }, + { + "epoch": 28.93732970027248, + "grad_norm": 8.387858390808105, + "learning_rate": 1.667428092195641e-05, + "loss": 0.4167, + "step": 10620 + }, + { + "epoch": 28.940054495912808, + "grad_norm": 8.999015808105469, + "learning_rate": 1.6673623724934898e-05, + "loss": 0.5012, + "step": 10621 + }, + { + "epoch": 28.942779291553133, + "grad_norm": 6.0761823654174805, + "learning_rate": 1.6672966475939426e-05, + "loss": 0.4583, + "step": 10622 + }, + { + "epoch": 28.94550408719346, + "grad_norm": 7.447052955627441, + "learning_rate": 1.66723091749751e-05, + "loss": 0.4194, + "step": 10623 + }, + { + "epoch": 28.94822888283379, + "grad_norm": 7.755176067352295, + "learning_rate": 1.6671651822047052e-05, + "loss": 0.3965, + "step": 10624 + }, + { + "epoch": 28.950953678474114, + "grad_norm": 8.58421516418457, + "learning_rate": 1.667099441716039e-05, + "loss": 0.5266, + "step": 10625 + }, + { + "epoch": 28.95367847411444, + "grad_norm": 6.611844062805176, + "learning_rate": 1.6670336960320237e-05, + "loss": 0.5188, + "step": 10626 + }, + { + "epoch": 28.95640326975477, + "grad_norm": 11.779068946838379, + "learning_rate": 1.6669679451531716e-05, + "loss": 0.4384, + "step": 10627 + }, + { + "epoch": 28.959128065395095, + "grad_norm": 7.734330654144287, + "learning_rate": 1.666902189079995e-05, + "loss": 0.5486, + "step": 10628 + }, + { + "epoch": 28.96185286103542, + "grad_norm": 7.206127166748047, + "learning_rate": 1.6668364278130047e-05, + "loss": 0.4609, + "step": 10629 + }, + { + "epoch": 28.96457765667575, + "grad_norm": 7.38665771484375, + "learning_rate": 1.6667706613527142e-05, + "loss": 0.5, + "step": 10630 + }, + { + "epoch": 28.967302452316076, + "grad_norm": 9.11385726928711, + "learning_rate": 1.6667048896996357e-05, + "loss": 0.4606, + "step": 10631 + }, + { + "epoch": 28.970027247956402, + "grad_norm": 7.674446105957031, + "learning_rate": 1.6666391128542802e-05, + "loss": 0.4459, + "step": 10632 + }, + { + "epoch": 28.97275204359673, + "grad_norm": 7.57926607131958, + "learning_rate": 1.6665733308171615e-05, + "loss": 0.596, + "step": 10633 + }, + { + "epoch": 28.975476839237057, + "grad_norm": 7.778857231140137, + "learning_rate": 1.6665075435887907e-05, + "loss": 0.6039, + "step": 10634 + }, + { + "epoch": 28.978201634877383, + "grad_norm": 9.085589408874512, + "learning_rate": 1.6664417511696807e-05, + "loss": 0.4991, + "step": 10635 + }, + { + "epoch": 28.980926430517712, + "grad_norm": 7.43651819229126, + "learning_rate": 1.6663759535603438e-05, + "loss": 0.4854, + "step": 10636 + }, + { + "epoch": 28.983651226158038, + "grad_norm": 7.128672122955322, + "learning_rate": 1.6663101507612926e-05, + "loss": 0.4504, + "step": 10637 + }, + { + "epoch": 28.986376021798364, + "grad_norm": 8.316488265991211, + "learning_rate": 1.666244342773039e-05, + "loss": 0.4891, + "step": 10638 + }, + { + "epoch": 28.989100817438693, + "grad_norm": 9.425989151000977, + "learning_rate": 1.666178529596096e-05, + "loss": 0.546, + "step": 10639 + }, + { + "epoch": 28.99182561307902, + "grad_norm": 7.048205852508545, + "learning_rate": 1.666112711230976e-05, + "loss": 0.4882, + "step": 10640 + }, + { + "epoch": 28.994550408719345, + "grad_norm": 7.403781890869141, + "learning_rate": 1.666046887678192e-05, + "loss": 0.6663, + "step": 10641 + }, + { + "epoch": 28.997275204359674, + "grad_norm": 6.79907751083374, + "learning_rate": 1.665981058938256e-05, + "loss": 0.6273, + "step": 10642 + }, + { + "epoch": 29.0, + "grad_norm": 6.791356563568115, + "learning_rate": 1.665915225011681e-05, + "loss": 0.5466, + "step": 10643 + }, + { + "epoch": 29.002724795640326, + "grad_norm": 6.716793537139893, + "learning_rate": 1.66584938589898e-05, + "loss": 0.5327, + "step": 10644 + }, + { + "epoch": 29.005449591280655, + "grad_norm": 6.785096168518066, + "learning_rate": 1.665783541600665e-05, + "loss": 0.3464, + "step": 10645 + }, + { + "epoch": 29.00817438692098, + "grad_norm": 7.015567302703857, + "learning_rate": 1.6657176921172492e-05, + "loss": 0.5493, + "step": 10646 + }, + { + "epoch": 29.010899182561307, + "grad_norm": 6.1250834465026855, + "learning_rate": 1.6656518374492458e-05, + "loss": 0.3676, + "step": 10647 + }, + { + "epoch": 29.013623978201636, + "grad_norm": 6.8189873695373535, + "learning_rate": 1.665585977597167e-05, + "loss": 0.4194, + "step": 10648 + }, + { + "epoch": 29.016348773841962, + "grad_norm": 6.028426170349121, + "learning_rate": 1.6655201125615263e-05, + "loss": 0.4869, + "step": 10649 + }, + { + "epoch": 29.019073569482288, + "grad_norm": 8.195756912231445, + "learning_rate": 1.665454242342836e-05, + "loss": 0.5178, + "step": 10650 + }, + { + "epoch": 29.021798365122617, + "grad_norm": 7.648116111755371, + "learning_rate": 1.6653883669416098e-05, + "loss": 0.5685, + "step": 10651 + }, + { + "epoch": 29.024523160762943, + "grad_norm": 6.029077529907227, + "learning_rate": 1.6653224863583602e-05, + "loss": 0.55, + "step": 10652 + }, + { + "epoch": 29.02724795640327, + "grad_norm": 6.578215599060059, + "learning_rate": 1.6652566005936004e-05, + "loss": 0.3692, + "step": 10653 + }, + { + "epoch": 29.029972752043598, + "grad_norm": 6.456214904785156, + "learning_rate": 1.6651907096478436e-05, + "loss": 0.359, + "step": 10654 + }, + { + "epoch": 29.032697547683924, + "grad_norm": 8.54837703704834, + "learning_rate": 1.6651248135216032e-05, + "loss": 0.4001, + "step": 10655 + }, + { + "epoch": 29.03542234332425, + "grad_norm": 8.930901527404785, + "learning_rate": 1.665058912215392e-05, + "loss": 0.4656, + "step": 10656 + }, + { + "epoch": 29.03814713896458, + "grad_norm": 7.996654987335205, + "learning_rate": 1.6649930057297235e-05, + "loss": 0.3322, + "step": 10657 + }, + { + "epoch": 29.040871934604905, + "grad_norm": 7.286412715911865, + "learning_rate": 1.664927094065111e-05, + "loss": 0.4208, + "step": 10658 + }, + { + "epoch": 29.04359673024523, + "grad_norm": 9.534561157226562, + "learning_rate": 1.6648611772220675e-05, + "loss": 0.4321, + "step": 10659 + }, + { + "epoch": 29.04632152588556, + "grad_norm": 7.3517985343933105, + "learning_rate": 1.664795255201107e-05, + "loss": 0.5556, + "step": 10660 + }, + { + "epoch": 29.049046321525886, + "grad_norm": 6.535494327545166, + "learning_rate": 1.664729328002742e-05, + "loss": 0.4312, + "step": 10661 + }, + { + "epoch": 29.05177111716621, + "grad_norm": 6.648280143737793, + "learning_rate": 1.6646633956274862e-05, + "loss": 0.7457, + "step": 10662 + }, + { + "epoch": 29.05449591280654, + "grad_norm": 7.089462757110596, + "learning_rate": 1.6645974580758533e-05, + "loss": 0.431, + "step": 10663 + }, + { + "epoch": 29.057220708446867, + "grad_norm": 7.128489971160889, + "learning_rate": 1.6645315153483572e-05, + "loss": 0.614, + "step": 10664 + }, + { + "epoch": 29.059945504087192, + "grad_norm": 7.6592183113098145, + "learning_rate": 1.6644655674455107e-05, + "loss": 0.3837, + "step": 10665 + }, + { + "epoch": 29.06267029972752, + "grad_norm": 7.780344009399414, + "learning_rate": 1.664399614367828e-05, + "loss": 0.5763, + "step": 10666 + }, + { + "epoch": 29.065395095367847, + "grad_norm": 8.125530242919922, + "learning_rate": 1.6643336561158222e-05, + "loss": 0.4218, + "step": 10667 + }, + { + "epoch": 29.068119891008173, + "grad_norm": 7.207923889160156, + "learning_rate": 1.6642676926900077e-05, + "loss": 0.5035, + "step": 10668 + }, + { + "epoch": 29.070844686648503, + "grad_norm": 8.001280784606934, + "learning_rate": 1.6642017240908975e-05, + "loss": 0.377, + "step": 10669 + }, + { + "epoch": 29.07356948228883, + "grad_norm": 6.393892765045166, + "learning_rate": 1.6641357503190055e-05, + "loss": 0.4096, + "step": 10670 + }, + { + "epoch": 29.076294277929154, + "grad_norm": 6.3388214111328125, + "learning_rate": 1.664069771374846e-05, + "loss": 0.4064, + "step": 10671 + }, + { + "epoch": 29.079019073569484, + "grad_norm": 5.872392177581787, + "learning_rate": 1.664003787258932e-05, + "loss": 0.3359, + "step": 10672 + }, + { + "epoch": 29.08174386920981, + "grad_norm": 7.228592872619629, + "learning_rate": 1.6639377979717784e-05, + "loss": 0.4145, + "step": 10673 + }, + { + "epoch": 29.084468664850135, + "grad_norm": 7.437412261962891, + "learning_rate": 1.6638718035138985e-05, + "loss": 0.4682, + "step": 10674 + }, + { + "epoch": 29.087193460490465, + "grad_norm": 7.387948989868164, + "learning_rate": 1.663805803885806e-05, + "loss": 0.469, + "step": 10675 + }, + { + "epoch": 29.08991825613079, + "grad_norm": 40.065284729003906, + "learning_rate": 1.6637397990880158e-05, + "loss": 0.3711, + "step": 10676 + }, + { + "epoch": 29.092643051771116, + "grad_norm": 7.11245059967041, + "learning_rate": 1.6636737891210412e-05, + "loss": 0.4128, + "step": 10677 + }, + { + "epoch": 29.095367847411445, + "grad_norm": 7.460601329803467, + "learning_rate": 1.663607773985396e-05, + "loss": 0.4702, + "step": 10678 + }, + { + "epoch": 29.09809264305177, + "grad_norm": 13.630023956298828, + "learning_rate": 1.6635417536815953e-05, + "loss": 0.626, + "step": 10679 + }, + { + "epoch": 29.100817438692097, + "grad_norm": 6.180692195892334, + "learning_rate": 1.663475728210153e-05, + "loss": 0.4881, + "step": 10680 + }, + { + "epoch": 29.103542234332426, + "grad_norm": 7.246993541717529, + "learning_rate": 1.6634096975715825e-05, + "loss": 0.4967, + "step": 10681 + }, + { + "epoch": 29.106267029972752, + "grad_norm": 7.189358711242676, + "learning_rate": 1.6633436617663988e-05, + "loss": 0.3922, + "step": 10682 + }, + { + "epoch": 29.108991825613078, + "grad_norm": 8.475040435791016, + "learning_rate": 1.6632776207951165e-05, + "loss": 0.4345, + "step": 10683 + }, + { + "epoch": 29.111716621253407, + "grad_norm": 6.120608329772949, + "learning_rate": 1.663211574658249e-05, + "loss": 0.3836, + "step": 10684 + }, + { + "epoch": 29.114441416893733, + "grad_norm": 7.1794281005859375, + "learning_rate": 1.6631455233563113e-05, + "loss": 0.4676, + "step": 10685 + }, + { + "epoch": 29.11716621253406, + "grad_norm": 7.182884693145752, + "learning_rate": 1.6630794668898175e-05, + "loss": 0.4496, + "step": 10686 + }, + { + "epoch": 29.11989100817439, + "grad_norm": 6.465396881103516, + "learning_rate": 1.6630134052592823e-05, + "loss": 0.4851, + "step": 10687 + }, + { + "epoch": 29.122615803814714, + "grad_norm": 6.79514741897583, + "learning_rate": 1.6629473384652197e-05, + "loss": 0.4568, + "step": 10688 + }, + { + "epoch": 29.12534059945504, + "grad_norm": 8.822425842285156, + "learning_rate": 1.6628812665081446e-05, + "loss": 0.4444, + "step": 10689 + }, + { + "epoch": 29.12806539509537, + "grad_norm": 9.892768859863281, + "learning_rate": 1.6628151893885715e-05, + "loss": 0.5513, + "step": 10690 + }, + { + "epoch": 29.130790190735695, + "grad_norm": 7.1043620109558105, + "learning_rate": 1.6627491071070152e-05, + "loss": 0.3967, + "step": 10691 + }, + { + "epoch": 29.13351498637602, + "grad_norm": 7.769501686096191, + "learning_rate": 1.66268301966399e-05, + "loss": 0.452, + "step": 10692 + }, + { + "epoch": 29.13623978201635, + "grad_norm": 9.14890193939209, + "learning_rate": 1.6626169270600113e-05, + "loss": 0.601, + "step": 10693 + }, + { + "epoch": 29.138964577656676, + "grad_norm": 6.528905391693115, + "learning_rate": 1.662550829295593e-05, + "loss": 0.3549, + "step": 10694 + }, + { + "epoch": 29.141689373297, + "grad_norm": 7.674026966094971, + "learning_rate": 1.66248472637125e-05, + "loss": 0.4982, + "step": 10695 + }, + { + "epoch": 29.14441416893733, + "grad_norm": 6.87601900100708, + "learning_rate": 1.6624186182874977e-05, + "loss": 0.3966, + "step": 10696 + }, + { + "epoch": 29.147138964577657, + "grad_norm": 7.0147552490234375, + "learning_rate": 1.66235250504485e-05, + "loss": 0.4487, + "step": 10697 + }, + { + "epoch": 29.149863760217983, + "grad_norm": 6.048093318939209, + "learning_rate": 1.6622863866438223e-05, + "loss": 0.4211, + "step": 10698 + }, + { + "epoch": 29.152588555858312, + "grad_norm": 6.146883010864258, + "learning_rate": 1.66222026308493e-05, + "loss": 0.4698, + "step": 10699 + }, + { + "epoch": 29.155313351498638, + "grad_norm": 8.4680814743042, + "learning_rate": 1.662154134368687e-05, + "loss": 0.339, + "step": 10700 + }, + { + "epoch": 29.158038147138964, + "grad_norm": 7.185520648956299, + "learning_rate": 1.6620880004956095e-05, + "loss": 0.3368, + "step": 10701 + }, + { + "epoch": 29.160762942779293, + "grad_norm": 7.100562572479248, + "learning_rate": 1.662021861466212e-05, + "loss": 0.5181, + "step": 10702 + }, + { + "epoch": 29.16348773841962, + "grad_norm": 8.350886344909668, + "learning_rate": 1.661955717281009e-05, + "loss": 0.5449, + "step": 10703 + }, + { + "epoch": 29.166212534059945, + "grad_norm": 8.237159729003906, + "learning_rate": 1.6618895679405165e-05, + "loss": 0.4541, + "step": 10704 + }, + { + "epoch": 29.168937329700274, + "grad_norm": 7.449276447296143, + "learning_rate": 1.6618234134452493e-05, + "loss": 0.3835, + "step": 10705 + }, + { + "epoch": 29.1716621253406, + "grad_norm": 7.251029014587402, + "learning_rate": 1.661757253795723e-05, + "loss": 0.5143, + "step": 10706 + }, + { + "epoch": 29.174386920980925, + "grad_norm": 6.984391212463379, + "learning_rate": 1.661691088992452e-05, + "loss": 0.4431, + "step": 10707 + }, + { + "epoch": 29.177111716621255, + "grad_norm": 8.196168899536133, + "learning_rate": 1.661624919035952e-05, + "loss": 0.4003, + "step": 10708 + }, + { + "epoch": 29.17983651226158, + "grad_norm": 7.046302318572998, + "learning_rate": 1.661558743926739e-05, + "loss": 0.4662, + "step": 10709 + }, + { + "epoch": 29.182561307901906, + "grad_norm": 7.18446683883667, + "learning_rate": 1.6614925636653274e-05, + "loss": 0.5267, + "step": 10710 + }, + { + "epoch": 29.185286103542236, + "grad_norm": 7.664499759674072, + "learning_rate": 1.6614263782522332e-05, + "loss": 0.4207, + "step": 10711 + }, + { + "epoch": 29.18801089918256, + "grad_norm": 5.894651412963867, + "learning_rate": 1.6613601876879714e-05, + "loss": 0.5299, + "step": 10712 + }, + { + "epoch": 29.190735694822887, + "grad_norm": 7.169234275817871, + "learning_rate": 1.6612939919730578e-05, + "loss": 0.4573, + "step": 10713 + }, + { + "epoch": 29.193460490463217, + "grad_norm": 10.233022689819336, + "learning_rate": 1.661227791108008e-05, + "loss": 0.4675, + "step": 10714 + }, + { + "epoch": 29.196185286103542, + "grad_norm": 6.739607810974121, + "learning_rate": 1.6611615850933374e-05, + "loss": 0.4117, + "step": 10715 + }, + { + "epoch": 29.19891008174387, + "grad_norm": 6.349090099334717, + "learning_rate": 1.6610953739295617e-05, + "loss": 0.4535, + "step": 10716 + }, + { + "epoch": 29.201634877384198, + "grad_norm": 7.4584479331970215, + "learning_rate": 1.6610291576171965e-05, + "loss": 0.4776, + "step": 10717 + }, + { + "epoch": 29.204359673024523, + "grad_norm": 7.474863529205322, + "learning_rate": 1.6609629361567578e-05, + "loss": 0.3361, + "step": 10718 + }, + { + "epoch": 29.20708446866485, + "grad_norm": 7.306474685668945, + "learning_rate": 1.6608967095487606e-05, + "loss": 0.5182, + "step": 10719 + }, + { + "epoch": 29.20980926430518, + "grad_norm": 6.636267185211182, + "learning_rate": 1.660830477793721e-05, + "loss": 0.5018, + "step": 10720 + }, + { + "epoch": 29.212534059945504, + "grad_norm": 8.042543411254883, + "learning_rate": 1.6607642408921552e-05, + "loss": 0.4495, + "step": 10721 + }, + { + "epoch": 29.21525885558583, + "grad_norm": 7.184332847595215, + "learning_rate": 1.6606979988445787e-05, + "loss": 0.3229, + "step": 10722 + }, + { + "epoch": 29.21798365122616, + "grad_norm": 6.720614433288574, + "learning_rate": 1.6606317516515074e-05, + "loss": 0.4746, + "step": 10723 + }, + { + "epoch": 29.220708446866485, + "grad_norm": 8.756359100341797, + "learning_rate": 1.660565499313457e-05, + "loss": 0.3661, + "step": 10724 + }, + { + "epoch": 29.22343324250681, + "grad_norm": 6.875161647796631, + "learning_rate": 1.6604992418309443e-05, + "loss": 0.3187, + "step": 10725 + }, + { + "epoch": 29.22615803814714, + "grad_norm": 8.915993690490723, + "learning_rate": 1.6604329792044845e-05, + "loss": 0.4139, + "step": 10726 + }, + { + "epoch": 29.228882833787466, + "grad_norm": 14.585935592651367, + "learning_rate": 1.660366711434594e-05, + "loss": 0.3608, + "step": 10727 + }, + { + "epoch": 29.231607629427792, + "grad_norm": 7.285501480102539, + "learning_rate": 1.6603004385217887e-05, + "loss": 0.3971, + "step": 10728 + }, + { + "epoch": 29.23433242506812, + "grad_norm": 7.343924045562744, + "learning_rate": 1.6602341604665848e-05, + "loss": 0.5458, + "step": 10729 + }, + { + "epoch": 29.237057220708447, + "grad_norm": 8.615266799926758, + "learning_rate": 1.6601678772694985e-05, + "loss": 0.5154, + "step": 10730 + }, + { + "epoch": 29.239782016348773, + "grad_norm": 8.476104736328125, + "learning_rate": 1.6601015889310462e-05, + "loss": 0.5087, + "step": 10731 + }, + { + "epoch": 29.242506811989102, + "grad_norm": 6.7297682762146, + "learning_rate": 1.6600352954517437e-05, + "loss": 0.444, + "step": 10732 + }, + { + "epoch": 29.245231607629428, + "grad_norm": 12.848528861999512, + "learning_rate": 1.659968996832108e-05, + "loss": 0.4996, + "step": 10733 + }, + { + "epoch": 29.247956403269754, + "grad_norm": 7.561726093292236, + "learning_rate": 1.6599026930726544e-05, + "loss": 0.3617, + "step": 10734 + }, + { + "epoch": 29.250681198910083, + "grad_norm": 6.653961658477783, + "learning_rate": 1.6598363841739004e-05, + "loss": 0.4031, + "step": 10735 + }, + { + "epoch": 29.25340599455041, + "grad_norm": 7.954012870788574, + "learning_rate": 1.6597700701363615e-05, + "loss": 0.4294, + "step": 10736 + }, + { + "epoch": 29.256130790190735, + "grad_norm": 7.65130090713501, + "learning_rate": 1.6597037509605546e-05, + "loss": 0.5634, + "step": 10737 + }, + { + "epoch": 29.258855585831064, + "grad_norm": 6.7763519287109375, + "learning_rate": 1.6596374266469963e-05, + "loss": 0.5255, + "step": 10738 + }, + { + "epoch": 29.26158038147139, + "grad_norm": 7.821353435516357, + "learning_rate": 1.6595710971962028e-05, + "loss": 0.5572, + "step": 10739 + }, + { + "epoch": 29.264305177111716, + "grad_norm": 6.62902307510376, + "learning_rate": 1.6595047626086908e-05, + "loss": 0.3801, + "step": 10740 + }, + { + "epoch": 29.267029972752045, + "grad_norm": 7.1971564292907715, + "learning_rate": 1.659438422884977e-05, + "loss": 0.5649, + "step": 10741 + }, + { + "epoch": 29.26975476839237, + "grad_norm": 19.59003257751465, + "learning_rate": 1.6593720780255778e-05, + "loss": 0.3581, + "step": 10742 + }, + { + "epoch": 29.272479564032697, + "grad_norm": 7.921016693115234, + "learning_rate": 1.6593057280310105e-05, + "loss": 0.3824, + "step": 10743 + }, + { + "epoch": 29.275204359673026, + "grad_norm": 7.749704837799072, + "learning_rate": 1.659239372901791e-05, + "loss": 0.3783, + "step": 10744 + }, + { + "epoch": 29.277929155313352, + "grad_norm": 7.899710655212402, + "learning_rate": 1.659173012638437e-05, + "loss": 0.475, + "step": 10745 + }, + { + "epoch": 29.280653950953678, + "grad_norm": 7.129073143005371, + "learning_rate": 1.6591066472414647e-05, + "loss": 0.5405, + "step": 10746 + }, + { + "epoch": 29.283378746594007, + "grad_norm": 6.995426654815674, + "learning_rate": 1.6590402767113903e-05, + "loss": 0.6329, + "step": 10747 + }, + { + "epoch": 29.286103542234333, + "grad_norm": 6.966623783111572, + "learning_rate": 1.6589739010487323e-05, + "loss": 0.5219, + "step": 10748 + }, + { + "epoch": 29.28882833787466, + "grad_norm": 6.712077617645264, + "learning_rate": 1.6589075202540064e-05, + "loss": 0.37, + "step": 10749 + }, + { + "epoch": 29.291553133514988, + "grad_norm": 8.465301513671875, + "learning_rate": 1.65884113432773e-05, + "loss": 0.5001, + "step": 10750 + }, + { + "epoch": 29.294277929155314, + "grad_norm": 9.476337432861328, + "learning_rate": 1.65877474327042e-05, + "loss": 0.5214, + "step": 10751 + }, + { + "epoch": 29.29700272479564, + "grad_norm": 26.010038375854492, + "learning_rate": 1.6587083470825933e-05, + "loss": 0.4188, + "step": 10752 + }, + { + "epoch": 29.29972752043597, + "grad_norm": 8.532973289489746, + "learning_rate": 1.6586419457647673e-05, + "loss": 0.485, + "step": 10753 + }, + { + "epoch": 29.302452316076295, + "grad_norm": 7.86745023727417, + "learning_rate": 1.658575539317459e-05, + "loss": 0.444, + "step": 10754 + }, + { + "epoch": 29.30517711171662, + "grad_norm": 7.497247695922852, + "learning_rate": 1.658509127741186e-05, + "loss": 0.4146, + "step": 10755 + }, + { + "epoch": 29.30790190735695, + "grad_norm": 6.255491733551025, + "learning_rate": 1.658442711036465e-05, + "loss": 0.439, + "step": 10756 + }, + { + "epoch": 29.310626702997276, + "grad_norm": 7.498615741729736, + "learning_rate": 1.658376289203813e-05, + "loss": 0.5736, + "step": 10757 + }, + { + "epoch": 29.3133514986376, + "grad_norm": 7.252074718475342, + "learning_rate": 1.6583098622437477e-05, + "loss": 0.5148, + "step": 10758 + }, + { + "epoch": 29.31607629427793, + "grad_norm": 6.788809776306152, + "learning_rate": 1.6582434301567865e-05, + "loss": 0.5305, + "step": 10759 + }, + { + "epoch": 29.318801089918257, + "grad_norm": 8.381567001342773, + "learning_rate": 1.6581769929434467e-05, + "loss": 0.4646, + "step": 10760 + }, + { + "epoch": 29.321525885558582, + "grad_norm": 8.161211967468262, + "learning_rate": 1.6581105506042456e-05, + "loss": 0.5881, + "step": 10761 + }, + { + "epoch": 29.32425068119891, + "grad_norm": 10.112963676452637, + "learning_rate": 1.6580441031397008e-05, + "loss": 0.4094, + "step": 10762 + }, + { + "epoch": 29.326975476839237, + "grad_norm": 8.371186256408691, + "learning_rate": 1.6579776505503294e-05, + "loss": 0.4287, + "step": 10763 + }, + { + "epoch": 29.329700272479563, + "grad_norm": 7.590577602386475, + "learning_rate": 1.65791119283665e-05, + "loss": 0.3506, + "step": 10764 + }, + { + "epoch": 29.332425068119893, + "grad_norm": 7.688154697418213, + "learning_rate": 1.6578447299991788e-05, + "loss": 0.4612, + "step": 10765 + }, + { + "epoch": 29.33514986376022, + "grad_norm": 6.572022914886475, + "learning_rate": 1.657778262038434e-05, + "loss": 0.4254, + "step": 10766 + }, + { + "epoch": 29.337874659400544, + "grad_norm": 8.043402671813965, + "learning_rate": 1.657711788954933e-05, + "loss": 0.4941, + "step": 10767 + }, + { + "epoch": 29.340599455040874, + "grad_norm": 7.502988815307617, + "learning_rate": 1.6576453107491945e-05, + "loss": 0.4216, + "step": 10768 + }, + { + "epoch": 29.3433242506812, + "grad_norm": 6.928520202636719, + "learning_rate": 1.6575788274217347e-05, + "loss": 0.3849, + "step": 10769 + }, + { + "epoch": 29.346049046321525, + "grad_norm": 8.919737815856934, + "learning_rate": 1.6575123389730728e-05, + "loss": 0.4212, + "step": 10770 + }, + { + "epoch": 29.348773841961854, + "grad_norm": 6.961564064025879, + "learning_rate": 1.6574458454037256e-05, + "loss": 0.4708, + "step": 10771 + }, + { + "epoch": 29.35149863760218, + "grad_norm": 7.387964725494385, + "learning_rate": 1.6573793467142114e-05, + "loss": 0.5485, + "step": 10772 + }, + { + "epoch": 29.354223433242506, + "grad_norm": 9.136253356933594, + "learning_rate": 1.657312842905048e-05, + "loss": 0.4797, + "step": 10773 + }, + { + "epoch": 29.356948228882835, + "grad_norm": 7.161242961883545, + "learning_rate": 1.6572463339767537e-05, + "loss": 0.3954, + "step": 10774 + }, + { + "epoch": 29.35967302452316, + "grad_norm": 7.878520488739014, + "learning_rate": 1.6571798199298457e-05, + "loss": 0.4626, + "step": 10775 + }, + { + "epoch": 29.362397820163487, + "grad_norm": 8.14638900756836, + "learning_rate": 1.6571133007648424e-05, + "loss": 0.5304, + "step": 10776 + }, + { + "epoch": 29.365122615803816, + "grad_norm": 8.658432006835938, + "learning_rate": 1.657046776482262e-05, + "loss": 0.5071, + "step": 10777 + }, + { + "epoch": 29.367847411444142, + "grad_norm": 8.138938903808594, + "learning_rate": 1.6569802470826226e-05, + "loss": 0.6318, + "step": 10778 + }, + { + "epoch": 29.370572207084468, + "grad_norm": 6.878420829772949, + "learning_rate": 1.6569137125664417e-05, + "loss": 0.5325, + "step": 10779 + }, + { + "epoch": 29.373297002724797, + "grad_norm": 8.385366439819336, + "learning_rate": 1.6568471729342384e-05, + "loss": 0.5004, + "step": 10780 + }, + { + "epoch": 29.376021798365123, + "grad_norm": 8.681464195251465, + "learning_rate": 1.6567806281865305e-05, + "loss": 0.5396, + "step": 10781 + }, + { + "epoch": 29.37874659400545, + "grad_norm": 6.902587413787842, + "learning_rate": 1.6567140783238358e-05, + "loss": 0.4479, + "step": 10782 + }, + { + "epoch": 29.381471389645778, + "grad_norm": 9.539426803588867, + "learning_rate": 1.6566475233466732e-05, + "loss": 0.5034, + "step": 10783 + }, + { + "epoch": 29.384196185286104, + "grad_norm": 7.421967029571533, + "learning_rate": 1.6565809632555607e-05, + "loss": 0.5312, + "step": 10784 + }, + { + "epoch": 29.38692098092643, + "grad_norm": 8.303641319274902, + "learning_rate": 1.656514398051017e-05, + "loss": 0.5323, + "step": 10785 + }, + { + "epoch": 29.38964577656676, + "grad_norm": 8.001503944396973, + "learning_rate": 1.65644782773356e-05, + "loss": 0.4594, + "step": 10786 + }, + { + "epoch": 29.392370572207085, + "grad_norm": 8.343440055847168, + "learning_rate": 1.6563812523037087e-05, + "loss": 0.4363, + "step": 10787 + }, + { + "epoch": 29.39509536784741, + "grad_norm": 7.275823593139648, + "learning_rate": 1.6563146717619814e-05, + "loss": 0.4149, + "step": 10788 + }, + { + "epoch": 29.39782016348774, + "grad_norm": 7.187505722045898, + "learning_rate": 1.6562480861088966e-05, + "loss": 0.5338, + "step": 10789 + }, + { + "epoch": 29.400544959128066, + "grad_norm": 7.029732704162598, + "learning_rate": 1.6561814953449728e-05, + "loss": 0.3399, + "step": 10790 + }, + { + "epoch": 29.40326975476839, + "grad_norm": 8.944703102111816, + "learning_rate": 1.6561148994707285e-05, + "loss": 0.451, + "step": 10791 + }, + { + "epoch": 29.40599455040872, + "grad_norm": 6.436709880828857, + "learning_rate": 1.6560482984866823e-05, + "loss": 0.5174, + "step": 10792 + }, + { + "epoch": 29.408719346049047, + "grad_norm": 6.83833646774292, + "learning_rate": 1.655981692393353e-05, + "loss": 0.4771, + "step": 10793 + }, + { + "epoch": 29.411444141689373, + "grad_norm": 6.635432243347168, + "learning_rate": 1.65591508119126e-05, + "loss": 0.6338, + "step": 10794 + }, + { + "epoch": 29.414168937329702, + "grad_norm": 7.787850856781006, + "learning_rate": 1.655848464880921e-05, + "loss": 0.4234, + "step": 10795 + }, + { + "epoch": 29.416893732970028, + "grad_norm": 6.895452499389648, + "learning_rate": 1.6557818434628555e-05, + "loss": 0.3962, + "step": 10796 + }, + { + "epoch": 29.419618528610354, + "grad_norm": 14.239097595214844, + "learning_rate": 1.655715216937582e-05, + "loss": 0.5432, + "step": 10797 + }, + { + "epoch": 29.422343324250683, + "grad_norm": 7.626240253448486, + "learning_rate": 1.6556485853056194e-05, + "loss": 0.5251, + "step": 10798 + }, + { + "epoch": 29.42506811989101, + "grad_norm": 7.327658653259277, + "learning_rate": 1.6555819485674865e-05, + "loss": 0.5409, + "step": 10799 + }, + { + "epoch": 29.427792915531334, + "grad_norm": 8.085366249084473, + "learning_rate": 1.655515306723703e-05, + "loss": 0.4064, + "step": 10800 + }, + { + "epoch": 29.430517711171664, + "grad_norm": 8.021275520324707, + "learning_rate": 1.655448659774787e-05, + "loss": 0.4655, + "step": 10801 + }, + { + "epoch": 29.43324250681199, + "grad_norm": 7.704780101776123, + "learning_rate": 1.6553820077212585e-05, + "loss": 0.4886, + "step": 10802 + }, + { + "epoch": 29.435967302452315, + "grad_norm": 8.516914367675781, + "learning_rate": 1.6553153505636356e-05, + "loss": 0.5174, + "step": 10803 + }, + { + "epoch": 29.438692098092645, + "grad_norm": 7.043200492858887, + "learning_rate": 1.6552486883024376e-05, + "loss": 0.3714, + "step": 10804 + }, + { + "epoch": 29.44141689373297, + "grad_norm": 7.265212535858154, + "learning_rate": 1.6551820209381843e-05, + "loss": 0.4593, + "step": 10805 + }, + { + "epoch": 29.444141689373296, + "grad_norm": 6.623559951782227, + "learning_rate": 1.6551153484713943e-05, + "loss": 0.5319, + "step": 10806 + }, + { + "epoch": 29.446866485013626, + "grad_norm": 7.270200252532959, + "learning_rate": 1.655048670902587e-05, + "loss": 0.371, + "step": 10807 + }, + { + "epoch": 29.44959128065395, + "grad_norm": 8.101445198059082, + "learning_rate": 1.654981988232282e-05, + "loss": 0.5175, + "step": 10808 + }, + { + "epoch": 29.452316076294277, + "grad_norm": 6.925370693206787, + "learning_rate": 1.6549153004609982e-05, + "loss": 0.4874, + "step": 10809 + }, + { + "epoch": 29.455040871934607, + "grad_norm": 7.511909008026123, + "learning_rate": 1.654848607589255e-05, + "loss": 0.6361, + "step": 10810 + }, + { + "epoch": 29.457765667574932, + "grad_norm": 10.822510719299316, + "learning_rate": 1.6547819096175722e-05, + "loss": 0.5509, + "step": 10811 + }, + { + "epoch": 29.460490463215258, + "grad_norm": 8.81610107421875, + "learning_rate": 1.6547152065464688e-05, + "loss": 0.4535, + "step": 10812 + }, + { + "epoch": 29.463215258855588, + "grad_norm": 6.656589031219482, + "learning_rate": 1.6546484983764646e-05, + "loss": 0.4775, + "step": 10813 + }, + { + "epoch": 29.465940054495913, + "grad_norm": 10.142149925231934, + "learning_rate": 1.6545817851080785e-05, + "loss": 0.5012, + "step": 10814 + }, + { + "epoch": 29.46866485013624, + "grad_norm": 9.494502067565918, + "learning_rate": 1.654515066741831e-05, + "loss": 0.3914, + "step": 10815 + }, + { + "epoch": 29.47138964577657, + "grad_norm": 6.635324954986572, + "learning_rate": 1.654448343278241e-05, + "loss": 0.5041, + "step": 10816 + }, + { + "epoch": 29.474114441416894, + "grad_norm": 5.768138408660889, + "learning_rate": 1.6543816147178283e-05, + "loss": 0.3553, + "step": 10817 + }, + { + "epoch": 29.47683923705722, + "grad_norm": 8.109676361083984, + "learning_rate": 1.654314881061113e-05, + "loss": 0.4941, + "step": 10818 + }, + { + "epoch": 29.479564032697546, + "grad_norm": 7.911977291107178, + "learning_rate": 1.6542481423086145e-05, + "loss": 0.4431, + "step": 10819 + }, + { + "epoch": 29.482288828337875, + "grad_norm": 5.9850311279296875, + "learning_rate": 1.654181398460852e-05, + "loss": 0.4828, + "step": 10820 + }, + { + "epoch": 29.4850136239782, + "grad_norm": 8.306781768798828, + "learning_rate": 1.6541146495183463e-05, + "loss": 0.5159, + "step": 10821 + }, + { + "epoch": 29.48773841961853, + "grad_norm": 9.13083267211914, + "learning_rate": 1.6540478954816164e-05, + "loss": 0.4634, + "step": 10822 + }, + { + "epoch": 29.490463215258856, + "grad_norm": 7.0769267082214355, + "learning_rate": 1.6539811363511827e-05, + "loss": 0.3601, + "step": 10823 + }, + { + "epoch": 29.493188010899182, + "grad_norm": 8.102646827697754, + "learning_rate": 1.653914372127565e-05, + "loss": 0.4487, + "step": 10824 + }, + { + "epoch": 29.495912806539508, + "grad_norm": 7.4217681884765625, + "learning_rate": 1.6538476028112832e-05, + "loss": 0.3892, + "step": 10825 + }, + { + "epoch": 29.498637602179837, + "grad_norm": 7.808663845062256, + "learning_rate": 1.653780828402857e-05, + "loss": 0.3923, + "step": 10826 + }, + { + "epoch": 29.501362397820163, + "grad_norm": 6.494418144226074, + "learning_rate": 1.6537140489028073e-05, + "loss": 0.5069, + "step": 10827 + }, + { + "epoch": 29.504087193460492, + "grad_norm": 7.85498571395874, + "learning_rate": 1.653647264311653e-05, + "loss": 0.5422, + "step": 10828 + }, + { + "epoch": 29.506811989100818, + "grad_norm": 8.364899635314941, + "learning_rate": 1.6535804746299154e-05, + "loss": 0.4385, + "step": 10829 + }, + { + "epoch": 29.509536784741144, + "grad_norm": 6.561302185058594, + "learning_rate": 1.653513679858114e-05, + "loss": 0.3771, + "step": 10830 + }, + { + "epoch": 29.51226158038147, + "grad_norm": 7.510750770568848, + "learning_rate": 1.6534468799967692e-05, + "loss": 0.7035, + "step": 10831 + }, + { + "epoch": 29.5149863760218, + "grad_norm": 7.323873519897461, + "learning_rate": 1.6533800750464006e-05, + "loss": 0.3801, + "step": 10832 + }, + { + "epoch": 29.517711171662125, + "grad_norm": 7.319087028503418, + "learning_rate": 1.6533132650075293e-05, + "loss": 0.4436, + "step": 10833 + }, + { + "epoch": 29.520435967302454, + "grad_norm": 7.902466297149658, + "learning_rate": 1.6532464498806755e-05, + "loss": 0.3191, + "step": 10834 + }, + { + "epoch": 29.52316076294278, + "grad_norm": 8.569283485412598, + "learning_rate": 1.6531796296663595e-05, + "loss": 0.3892, + "step": 10835 + }, + { + "epoch": 29.525885558583106, + "grad_norm": 9.558220863342285, + "learning_rate": 1.653112804365101e-05, + "loss": 0.4821, + "step": 10836 + }, + { + "epoch": 29.52861035422343, + "grad_norm": 8.228992462158203, + "learning_rate": 1.653045973977421e-05, + "loss": 0.4522, + "step": 10837 + }, + { + "epoch": 29.53133514986376, + "grad_norm": 7.123694896697998, + "learning_rate": 1.6529791385038404e-05, + "loss": 0.4266, + "step": 10838 + }, + { + "epoch": 29.534059945504087, + "grad_norm": 7.235476493835449, + "learning_rate": 1.6529122979448792e-05, + "loss": 0.5008, + "step": 10839 + }, + { + "epoch": 29.536784741144416, + "grad_norm": 7.183542251586914, + "learning_rate": 1.6528454523010583e-05, + "loss": 0.4805, + "step": 10840 + }, + { + "epoch": 29.539509536784742, + "grad_norm": 7.383785724639893, + "learning_rate": 1.6527786015728975e-05, + "loss": 0.5205, + "step": 10841 + }, + { + "epoch": 29.542234332425068, + "grad_norm": 9.598885536193848, + "learning_rate": 1.652711745760918e-05, + "loss": 0.4417, + "step": 10842 + }, + { + "epoch": 29.544959128065393, + "grad_norm": 9.335498809814453, + "learning_rate": 1.6526448848656407e-05, + "loss": 0.5446, + "step": 10843 + }, + { + "epoch": 29.547683923705723, + "grad_norm": 7.628083229064941, + "learning_rate": 1.652578018887586e-05, + "loss": 0.4476, + "step": 10844 + }, + { + "epoch": 29.55040871934605, + "grad_norm": 7.617641448974609, + "learning_rate": 1.6525111478272748e-05, + "loss": 0.4086, + "step": 10845 + }, + { + "epoch": 29.553133514986374, + "grad_norm": 7.333584785461426, + "learning_rate": 1.6524442716852273e-05, + "loss": 0.5005, + "step": 10846 + }, + { + "epoch": 29.555858310626704, + "grad_norm": 7.800898551940918, + "learning_rate": 1.6523773904619653e-05, + "loss": 0.4606, + "step": 10847 + }, + { + "epoch": 29.55858310626703, + "grad_norm": 7.886172294616699, + "learning_rate": 1.652310504158009e-05, + "loss": 0.4534, + "step": 10848 + }, + { + "epoch": 29.561307901907355, + "grad_norm": 9.152216911315918, + "learning_rate": 1.6522436127738797e-05, + "loss": 0.4162, + "step": 10849 + }, + { + "epoch": 29.564032697547685, + "grad_norm": 24.142454147338867, + "learning_rate": 1.652176716310098e-05, + "loss": 0.5763, + "step": 10850 + }, + { + "epoch": 29.56675749318801, + "grad_norm": 7.811501979827881, + "learning_rate": 1.6521098147671847e-05, + "loss": 0.4875, + "step": 10851 + }, + { + "epoch": 29.569482288828336, + "grad_norm": 8.617351531982422, + "learning_rate": 1.6520429081456615e-05, + "loss": 0.4185, + "step": 10852 + }, + { + "epoch": 29.572207084468666, + "grad_norm": 7.524698734283447, + "learning_rate": 1.6519759964460488e-05, + "loss": 0.6508, + "step": 10853 + }, + { + "epoch": 29.57493188010899, + "grad_norm": 8.168391227722168, + "learning_rate": 1.6519090796688685e-05, + "loss": 0.4301, + "step": 10854 + }, + { + "epoch": 29.577656675749317, + "grad_norm": 8.772461891174316, + "learning_rate": 1.651842157814641e-05, + "loss": 0.3873, + "step": 10855 + }, + { + "epoch": 29.580381471389646, + "grad_norm": 7.3811211585998535, + "learning_rate": 1.6517752308838877e-05, + "loss": 0.4337, + "step": 10856 + }, + { + "epoch": 29.583106267029972, + "grad_norm": 6.60532283782959, + "learning_rate": 1.65170829887713e-05, + "loss": 0.4587, + "step": 10857 + }, + { + "epoch": 29.585831062670298, + "grad_norm": 7.635605335235596, + "learning_rate": 1.651641361794889e-05, + "loss": 0.7336, + "step": 10858 + }, + { + "epoch": 29.588555858310627, + "grad_norm": 9.370646476745605, + "learning_rate": 1.6515744196376863e-05, + "loss": 0.5171, + "step": 10859 + }, + { + "epoch": 29.591280653950953, + "grad_norm": 9.356303215026855, + "learning_rate": 1.6515074724060425e-05, + "loss": 0.5969, + "step": 10860 + }, + { + "epoch": 29.59400544959128, + "grad_norm": 13.548718452453613, + "learning_rate": 1.6514405201004797e-05, + "loss": 0.4778, + "step": 10861 + }, + { + "epoch": 29.59673024523161, + "grad_norm": 7.7641472816467285, + "learning_rate": 1.6513735627215192e-05, + "loss": 0.4249, + "step": 10862 + }, + { + "epoch": 29.599455040871934, + "grad_norm": 9.723471641540527, + "learning_rate": 1.651306600269682e-05, + "loss": 0.4331, + "step": 10863 + }, + { + "epoch": 29.60217983651226, + "grad_norm": 6.466434478759766, + "learning_rate": 1.65123963274549e-05, + "loss": 0.4282, + "step": 10864 + }, + { + "epoch": 29.60490463215259, + "grad_norm": 18.430665969848633, + "learning_rate": 1.6511726601494655e-05, + "loss": 0.6192, + "step": 10865 + }, + { + "epoch": 29.607629427792915, + "grad_norm": 6.94656229019165, + "learning_rate": 1.6511056824821285e-05, + "loss": 0.385, + "step": 10866 + }, + { + "epoch": 29.61035422343324, + "grad_norm": 5.463720798492432, + "learning_rate": 1.6510386997440017e-05, + "loss": 0.6242, + "step": 10867 + }, + { + "epoch": 29.61307901907357, + "grad_norm": 7.205257892608643, + "learning_rate": 1.6509717119356065e-05, + "loss": 0.5305, + "step": 10868 + }, + { + "epoch": 29.615803814713896, + "grad_norm": 6.175645351409912, + "learning_rate": 1.6509047190574643e-05, + "loss": 0.4505, + "step": 10869 + }, + { + "epoch": 29.618528610354222, + "grad_norm": 6.795779228210449, + "learning_rate": 1.650837721110097e-05, + "loss": 0.5634, + "step": 10870 + }, + { + "epoch": 29.62125340599455, + "grad_norm": 6.857511520385742, + "learning_rate": 1.6507707180940268e-05, + "loss": 0.4543, + "step": 10871 + }, + { + "epoch": 29.623978201634877, + "grad_norm": 7.351967811584473, + "learning_rate": 1.650703710009775e-05, + "loss": 0.3824, + "step": 10872 + }, + { + "epoch": 29.626702997275203, + "grad_norm": 7.04655647277832, + "learning_rate": 1.6506366968578637e-05, + "loss": 0.4796, + "step": 10873 + }, + { + "epoch": 29.629427792915532, + "grad_norm": 7.237663745880127, + "learning_rate": 1.650569678638815e-05, + "loss": 0.6383, + "step": 10874 + }, + { + "epoch": 29.632152588555858, + "grad_norm": 6.777371406555176, + "learning_rate": 1.65050265535315e-05, + "loss": 0.5815, + "step": 10875 + }, + { + "epoch": 29.634877384196184, + "grad_norm": 6.713928699493408, + "learning_rate": 1.650435627001392e-05, + "loss": 0.4886, + "step": 10876 + }, + { + "epoch": 29.637602179836513, + "grad_norm": 7.542415142059326, + "learning_rate": 1.650368593584062e-05, + "loss": 0.4447, + "step": 10877 + }, + { + "epoch": 29.64032697547684, + "grad_norm": 6.431827068328857, + "learning_rate": 1.650301555101682e-05, + "loss": 0.4555, + "step": 10878 + }, + { + "epoch": 29.643051771117165, + "grad_norm": 7.300482273101807, + "learning_rate": 1.6502345115547745e-05, + "loss": 0.411, + "step": 10879 + }, + { + "epoch": 29.645776566757494, + "grad_norm": 9.059066772460938, + "learning_rate": 1.6501674629438617e-05, + "loss": 0.4895, + "step": 10880 + }, + { + "epoch": 29.64850136239782, + "grad_norm": 7.237509250640869, + "learning_rate": 1.6501004092694655e-05, + "loss": 0.3969, + "step": 10881 + }, + { + "epoch": 29.651226158038146, + "grad_norm": 7.097210884094238, + "learning_rate": 1.6500333505321085e-05, + "loss": 0.4492, + "step": 10882 + }, + { + "epoch": 29.653950953678475, + "grad_norm": 8.74032211303711, + "learning_rate": 1.6499662867323127e-05, + "loss": 0.4481, + "step": 10883 + }, + { + "epoch": 29.6566757493188, + "grad_norm": 7.301566123962402, + "learning_rate": 1.6498992178706002e-05, + "loss": 0.3846, + "step": 10884 + }, + { + "epoch": 29.659400544959126, + "grad_norm": 7.869488716125488, + "learning_rate": 1.6498321439474935e-05, + "loss": 0.5212, + "step": 10885 + }, + { + "epoch": 29.662125340599456, + "grad_norm": 9.363385200500488, + "learning_rate": 1.649765064963515e-05, + "loss": 0.4977, + "step": 10886 + }, + { + "epoch": 29.66485013623978, + "grad_norm": 6.198626518249512, + "learning_rate": 1.649697980919187e-05, + "loss": 0.5959, + "step": 10887 + }, + { + "epoch": 29.667574931880107, + "grad_norm": 6.578914642333984, + "learning_rate": 1.6496308918150323e-05, + "loss": 0.4032, + "step": 10888 + }, + { + "epoch": 29.670299727520437, + "grad_norm": 9.510456085205078, + "learning_rate": 1.649563797651573e-05, + "loss": 0.418, + "step": 10889 + }, + { + "epoch": 29.673024523160763, + "grad_norm": 6.486546039581299, + "learning_rate": 1.6494966984293316e-05, + "loss": 0.3596, + "step": 10890 + }, + { + "epoch": 29.67574931880109, + "grad_norm": 6.955389499664307, + "learning_rate": 1.6494295941488307e-05, + "loss": 0.4252, + "step": 10891 + }, + { + "epoch": 29.678474114441418, + "grad_norm": 6.365244388580322, + "learning_rate": 1.6493624848105934e-05, + "loss": 0.4741, + "step": 10892 + }, + { + "epoch": 29.681198910081743, + "grad_norm": 7.88081169128418, + "learning_rate": 1.649295370415142e-05, + "loss": 0.5278, + "step": 10893 + }, + { + "epoch": 29.68392370572207, + "grad_norm": 7.345284461975098, + "learning_rate": 1.649228250962999e-05, + "loss": 0.4361, + "step": 10894 + }, + { + "epoch": 29.6866485013624, + "grad_norm": 6.725378513336182, + "learning_rate": 1.6491611264546868e-05, + "loss": 0.5792, + "step": 10895 + }, + { + "epoch": 29.689373297002724, + "grad_norm": 8.338081359863281, + "learning_rate": 1.6490939968907295e-05, + "loss": 0.4827, + "step": 10896 + }, + { + "epoch": 29.69209809264305, + "grad_norm": 6.808753967285156, + "learning_rate": 1.6490268622716484e-05, + "loss": 0.4923, + "step": 10897 + }, + { + "epoch": 29.69482288828338, + "grad_norm": 11.013527870178223, + "learning_rate": 1.6489597225979673e-05, + "loss": 0.298, + "step": 10898 + }, + { + "epoch": 29.697547683923705, + "grad_norm": 8.209692001342773, + "learning_rate": 1.6488925778702084e-05, + "loss": 0.4075, + "step": 10899 + }, + { + "epoch": 29.70027247956403, + "grad_norm": 5.375641345977783, + "learning_rate": 1.6488254280888956e-05, + "loss": 0.5535, + "step": 10900 + }, + { + "epoch": 29.70299727520436, + "grad_norm": 9.399170875549316, + "learning_rate": 1.6487582732545506e-05, + "loss": 0.5728, + "step": 10901 + }, + { + "epoch": 29.705722070844686, + "grad_norm": 13.955491065979004, + "learning_rate": 1.6486911133676974e-05, + "loss": 0.4485, + "step": 10902 + }, + { + "epoch": 29.708446866485012, + "grad_norm": 7.763715744018555, + "learning_rate": 1.6486239484288585e-05, + "loss": 0.592, + "step": 10903 + }, + { + "epoch": 29.71117166212534, + "grad_norm": 10.498160362243652, + "learning_rate": 1.6485567784385574e-05, + "loss": 0.4219, + "step": 10904 + }, + { + "epoch": 29.713896457765667, + "grad_norm": 6.306120872497559, + "learning_rate": 1.6484896033973168e-05, + "loss": 0.485, + "step": 10905 + }, + { + "epoch": 29.716621253405993, + "grad_norm": 8.809769630432129, + "learning_rate": 1.6484224233056602e-05, + "loss": 0.4487, + "step": 10906 + }, + { + "epoch": 29.719346049046322, + "grad_norm": 10.231396675109863, + "learning_rate": 1.6483552381641107e-05, + "loss": 0.5508, + "step": 10907 + }, + { + "epoch": 29.722070844686648, + "grad_norm": 8.767487525939941, + "learning_rate": 1.6482880479731912e-05, + "loss": 0.5564, + "step": 10908 + }, + { + "epoch": 29.724795640326974, + "grad_norm": 7.6702375411987305, + "learning_rate": 1.6482208527334257e-05, + "loss": 0.667, + "step": 10909 + }, + { + "epoch": 29.727520435967303, + "grad_norm": 9.525460243225098, + "learning_rate": 1.6481536524453365e-05, + "loss": 0.4465, + "step": 10910 + }, + { + "epoch": 29.73024523160763, + "grad_norm": 6.9797163009643555, + "learning_rate": 1.648086447109448e-05, + "loss": 0.3654, + "step": 10911 + }, + { + "epoch": 29.732970027247955, + "grad_norm": 7.111659049987793, + "learning_rate": 1.6480192367262827e-05, + "loss": 0.4361, + "step": 10912 + }, + { + "epoch": 29.735694822888284, + "grad_norm": 9.03895378112793, + "learning_rate": 1.6479520212963644e-05, + "loss": 0.4158, + "step": 10913 + }, + { + "epoch": 29.73841961852861, + "grad_norm": 7.492087364196777, + "learning_rate": 1.647884800820217e-05, + "loss": 0.3877, + "step": 10914 + }, + { + "epoch": 29.741144414168936, + "grad_norm": 7.278896331787109, + "learning_rate": 1.6478175752983632e-05, + "loss": 0.4546, + "step": 10915 + }, + { + "epoch": 29.743869209809265, + "grad_norm": 8.521524429321289, + "learning_rate": 1.6477503447313276e-05, + "loss": 0.43, + "step": 10916 + }, + { + "epoch": 29.74659400544959, + "grad_norm": 7.021545886993408, + "learning_rate": 1.6476831091196327e-05, + "loss": 0.3748, + "step": 10917 + }, + { + "epoch": 29.749318801089917, + "grad_norm": 7.985683917999268, + "learning_rate": 1.6476158684638027e-05, + "loss": 0.6056, + "step": 10918 + }, + { + "epoch": 29.752043596730246, + "grad_norm": 8.665266036987305, + "learning_rate": 1.647548622764361e-05, + "loss": 0.477, + "step": 10919 + }, + { + "epoch": 29.754768392370572, + "grad_norm": 8.756564140319824, + "learning_rate": 1.6474813720218318e-05, + "loss": 0.542, + "step": 10920 + }, + { + "epoch": 29.757493188010898, + "grad_norm": 7.334249019622803, + "learning_rate": 1.6474141162367384e-05, + "loss": 0.4863, + "step": 10921 + }, + { + "epoch": 29.760217983651227, + "grad_norm": 8.4699125289917, + "learning_rate": 1.6473468554096045e-05, + "loss": 0.601, + "step": 10922 + }, + { + "epoch": 29.762942779291553, + "grad_norm": 7.529186725616455, + "learning_rate": 1.6472795895409542e-05, + "loss": 0.3366, + "step": 10923 + }, + { + "epoch": 29.76566757493188, + "grad_norm": 8.458430290222168, + "learning_rate": 1.6472123186313114e-05, + "loss": 0.5209, + "step": 10924 + }, + { + "epoch": 29.768392370572208, + "grad_norm": 8.96320915222168, + "learning_rate": 1.6471450426811997e-05, + "loss": 0.5283, + "step": 10925 + }, + { + "epoch": 29.771117166212534, + "grad_norm": 11.148738861083984, + "learning_rate": 1.6470777616911435e-05, + "loss": 0.4584, + "step": 10926 + }, + { + "epoch": 29.77384196185286, + "grad_norm": 8.912113189697266, + "learning_rate": 1.6470104756616664e-05, + "loss": 0.5006, + "step": 10927 + }, + { + "epoch": 29.77656675749319, + "grad_norm": 7.305341720581055, + "learning_rate": 1.6469431845932923e-05, + "loss": 0.5061, + "step": 10928 + }, + { + "epoch": 29.779291553133515, + "grad_norm": 6.873284339904785, + "learning_rate": 1.646875888486546e-05, + "loss": 0.3441, + "step": 10929 + }, + { + "epoch": 29.78201634877384, + "grad_norm": 5.6703290939331055, + "learning_rate": 1.6468085873419502e-05, + "loss": 0.6736, + "step": 10930 + }, + { + "epoch": 29.78474114441417, + "grad_norm": 7.85083532333374, + "learning_rate": 1.646741281160031e-05, + "loss": 0.3551, + "step": 10931 + }, + { + "epoch": 29.787465940054496, + "grad_norm": 6.734079360961914, + "learning_rate": 1.646673969941311e-05, + "loss": 0.3798, + "step": 10932 + }, + { + "epoch": 29.79019073569482, + "grad_norm": 6.857694149017334, + "learning_rate": 1.646606653686315e-05, + "loss": 0.5082, + "step": 10933 + }, + { + "epoch": 29.79291553133515, + "grad_norm": 17.572439193725586, + "learning_rate": 1.6465393323955673e-05, + "loss": 0.4622, + "step": 10934 + }, + { + "epoch": 29.795640326975477, + "grad_norm": 6.712080955505371, + "learning_rate": 1.6464720060695918e-05, + "loss": 0.4265, + "step": 10935 + }, + { + "epoch": 29.798365122615802, + "grad_norm": 9.340763092041016, + "learning_rate": 1.6464046747089134e-05, + "loss": 0.5399, + "step": 10936 + }, + { + "epoch": 29.80108991825613, + "grad_norm": 7.187861442565918, + "learning_rate": 1.6463373383140563e-05, + "loss": 0.4803, + "step": 10937 + }, + { + "epoch": 29.803814713896458, + "grad_norm": 7.087644577026367, + "learning_rate": 1.6462699968855446e-05, + "loss": 0.5294, + "step": 10938 + }, + { + "epoch": 29.806539509536783, + "grad_norm": 8.618359565734863, + "learning_rate": 1.6462026504239026e-05, + "loss": 0.5131, + "step": 10939 + }, + { + "epoch": 29.809264305177113, + "grad_norm": 9.606124877929688, + "learning_rate": 1.6461352989296556e-05, + "loss": 0.4279, + "step": 10940 + }, + { + "epoch": 29.81198910081744, + "grad_norm": 8.291728019714355, + "learning_rate": 1.6460679424033278e-05, + "loss": 0.3738, + "step": 10941 + }, + { + "epoch": 29.814713896457764, + "grad_norm": 8.681512832641602, + "learning_rate": 1.6460005808454434e-05, + "loss": 0.4538, + "step": 10942 + }, + { + "epoch": 29.817438692098094, + "grad_norm": 7.411059379577637, + "learning_rate": 1.6459332142565275e-05, + "loss": 0.4568, + "step": 10943 + }, + { + "epoch": 29.82016348773842, + "grad_norm": 11.733348846435547, + "learning_rate": 1.6458658426371043e-05, + "loss": 0.351, + "step": 10944 + }, + { + "epoch": 29.822888283378745, + "grad_norm": 8.563687324523926, + "learning_rate": 1.645798465987699e-05, + "loss": 0.6837, + "step": 10945 + }, + { + "epoch": 29.825613079019075, + "grad_norm": 6.435044765472412, + "learning_rate": 1.6457310843088355e-05, + "loss": 0.2955, + "step": 10946 + }, + { + "epoch": 29.8283378746594, + "grad_norm": 11.304015159606934, + "learning_rate": 1.6456636976010396e-05, + "loss": 0.3521, + "step": 10947 + }, + { + "epoch": 29.831062670299726, + "grad_norm": 8.280211448669434, + "learning_rate": 1.6455963058648353e-05, + "loss": 0.6414, + "step": 10948 + }, + { + "epoch": 29.833787465940055, + "grad_norm": 6.6961259841918945, + "learning_rate": 1.6455289091007478e-05, + "loss": 0.3734, + "step": 10949 + }, + { + "epoch": 29.83651226158038, + "grad_norm": 7.7939372062683105, + "learning_rate": 1.645461507309302e-05, + "loss": 0.4768, + "step": 10950 + }, + { + "epoch": 29.839237057220707, + "grad_norm": 8.741804122924805, + "learning_rate": 1.6453941004910227e-05, + "loss": 0.4564, + "step": 10951 + }, + { + "epoch": 29.841961852861036, + "grad_norm": 7.31764554977417, + "learning_rate": 1.645326688646435e-05, + "loss": 0.576, + "step": 10952 + }, + { + "epoch": 29.844686648501362, + "grad_norm": 6.965038776397705, + "learning_rate": 1.645259271776064e-05, + "loss": 0.5383, + "step": 10953 + }, + { + "epoch": 29.847411444141688, + "grad_norm": 10.115130424499512, + "learning_rate": 1.6451918498804343e-05, + "loss": 0.5702, + "step": 10954 + }, + { + "epoch": 29.850136239782017, + "grad_norm": 7.532892227172852, + "learning_rate": 1.645124422960071e-05, + "loss": 0.4471, + "step": 10955 + }, + { + "epoch": 29.852861035422343, + "grad_norm": 7.694735050201416, + "learning_rate": 1.6450569910154998e-05, + "loss": 0.4386, + "step": 10956 + }, + { + "epoch": 29.85558583106267, + "grad_norm": 7.561770439147949, + "learning_rate": 1.6449895540472455e-05, + "loss": 0.5721, + "step": 10957 + }, + { + "epoch": 29.858310626703, + "grad_norm": 7.428245544433594, + "learning_rate": 1.6449221120558334e-05, + "loss": 0.7021, + "step": 10958 + }, + { + "epoch": 29.861035422343324, + "grad_norm": 8.777802467346191, + "learning_rate": 1.6448546650417883e-05, + "loss": 0.3962, + "step": 10959 + }, + { + "epoch": 29.86376021798365, + "grad_norm": 6.817665100097656, + "learning_rate": 1.644787213005636e-05, + "loss": 0.6262, + "step": 10960 + }, + { + "epoch": 29.86648501362398, + "grad_norm": 7.662132263183594, + "learning_rate": 1.6447197559479017e-05, + "loss": 0.5568, + "step": 10961 + }, + { + "epoch": 29.869209809264305, + "grad_norm": 7.989658832550049, + "learning_rate": 1.6446522938691107e-05, + "loss": 0.5452, + "step": 10962 + }, + { + "epoch": 29.87193460490463, + "grad_norm": 5.7323126792907715, + "learning_rate": 1.6445848267697884e-05, + "loss": 0.5826, + "step": 10963 + }, + { + "epoch": 29.87465940054496, + "grad_norm": 6.911271095275879, + "learning_rate": 1.6445173546504603e-05, + "loss": 0.6467, + "step": 10964 + }, + { + "epoch": 29.877384196185286, + "grad_norm": 6.319054126739502, + "learning_rate": 1.6444498775116512e-05, + "loss": 0.4939, + "step": 10965 + }, + { + "epoch": 29.88010899182561, + "grad_norm": 8.498305320739746, + "learning_rate": 1.6443823953538876e-05, + "loss": 0.4156, + "step": 10966 + }, + { + "epoch": 29.88283378746594, + "grad_norm": 8.051203727722168, + "learning_rate": 1.644314908177695e-05, + "loss": 0.5158, + "step": 10967 + }, + { + "epoch": 29.885558583106267, + "grad_norm": 7.078332901000977, + "learning_rate": 1.6442474159835984e-05, + "loss": 0.5493, + "step": 10968 + }, + { + "epoch": 29.888283378746593, + "grad_norm": 8.033302307128906, + "learning_rate": 1.6441799187721237e-05, + "loss": 0.5834, + "step": 10969 + }, + { + "epoch": 29.891008174386922, + "grad_norm": 7.197174549102783, + "learning_rate": 1.6441124165437962e-05, + "loss": 0.3835, + "step": 10970 + }, + { + "epoch": 29.893732970027248, + "grad_norm": 7.283804416656494, + "learning_rate": 1.6440449092991424e-05, + "loss": 0.4468, + "step": 10971 + }, + { + "epoch": 29.896457765667574, + "grad_norm": 7.508810043334961, + "learning_rate": 1.643977397038687e-05, + "loss": 0.561, + "step": 10972 + }, + { + "epoch": 29.899182561307903, + "grad_norm": 6.808213710784912, + "learning_rate": 1.6439098797629565e-05, + "loss": 0.4292, + "step": 10973 + }, + { + "epoch": 29.90190735694823, + "grad_norm": 7.95700216293335, + "learning_rate": 1.6438423574724768e-05, + "loss": 0.5316, + "step": 10974 + }, + { + "epoch": 29.904632152588555, + "grad_norm": 7.048412799835205, + "learning_rate": 1.6437748301677738e-05, + "loss": 0.5133, + "step": 10975 + }, + { + "epoch": 29.907356948228884, + "grad_norm": 9.064624786376953, + "learning_rate": 1.643707297849373e-05, + "loss": 0.5742, + "step": 10976 + }, + { + "epoch": 29.91008174386921, + "grad_norm": 6.609524250030518, + "learning_rate": 1.6436397605178e-05, + "loss": 0.4809, + "step": 10977 + }, + { + "epoch": 29.912806539509535, + "grad_norm": 6.805055618286133, + "learning_rate": 1.6435722181735817e-05, + "loss": 0.499, + "step": 10978 + }, + { + "epoch": 29.915531335149865, + "grad_norm": 7.3713250160217285, + "learning_rate": 1.6435046708172436e-05, + "loss": 0.42, + "step": 10979 + }, + { + "epoch": 29.91825613079019, + "grad_norm": 10.440509796142578, + "learning_rate": 1.6434371184493117e-05, + "loss": 0.4354, + "step": 10980 + }, + { + "epoch": 29.920980926430516, + "grad_norm": 8.879534721374512, + "learning_rate": 1.6433695610703123e-05, + "loss": 0.4551, + "step": 10981 + }, + { + "epoch": 29.923705722070846, + "grad_norm": 6.668054103851318, + "learning_rate": 1.6433019986807714e-05, + "loss": 0.4812, + "step": 10982 + }, + { + "epoch": 29.92643051771117, + "grad_norm": 9.760262489318848, + "learning_rate": 1.6432344312812153e-05, + "loss": 0.4534, + "step": 10983 + }, + { + "epoch": 29.929155313351497, + "grad_norm": 6.852321147918701, + "learning_rate": 1.64316685887217e-05, + "loss": 0.3206, + "step": 10984 + }, + { + "epoch": 29.931880108991827, + "grad_norm": 17.207426071166992, + "learning_rate": 1.6430992814541625e-05, + "loss": 0.6734, + "step": 10985 + }, + { + "epoch": 29.934604904632153, + "grad_norm": 8.152406692504883, + "learning_rate": 1.643031699027718e-05, + "loss": 0.5496, + "step": 10986 + }, + { + "epoch": 29.93732970027248, + "grad_norm": 7.128805160522461, + "learning_rate": 1.6429641115933635e-05, + "loss": 0.5237, + "step": 10987 + }, + { + "epoch": 29.940054495912808, + "grad_norm": 6.745392322540283, + "learning_rate": 1.642896519151625e-05, + "loss": 0.3401, + "step": 10988 + }, + { + "epoch": 29.942779291553133, + "grad_norm": 6.946228981018066, + "learning_rate": 1.642828921703029e-05, + "loss": 0.3607, + "step": 10989 + }, + { + "epoch": 29.94550408719346, + "grad_norm": 10.81572437286377, + "learning_rate": 1.6427613192481025e-05, + "loss": 0.3947, + "step": 10990 + }, + { + "epoch": 29.94822888283379, + "grad_norm": 7.242533206939697, + "learning_rate": 1.6426937117873713e-05, + "loss": 0.3457, + "step": 10991 + }, + { + "epoch": 29.950953678474114, + "grad_norm": 6.762942314147949, + "learning_rate": 1.642626099321362e-05, + "loss": 0.358, + "step": 10992 + }, + { + "epoch": 29.95367847411444, + "grad_norm": 7.605253219604492, + "learning_rate": 1.6425584818506016e-05, + "loss": 0.4045, + "step": 10993 + }, + { + "epoch": 29.95640326975477, + "grad_norm": 8.510704040527344, + "learning_rate": 1.6424908593756162e-05, + "loss": 0.4006, + "step": 10994 + }, + { + "epoch": 29.959128065395095, + "grad_norm": 8.417881965637207, + "learning_rate": 1.6424232318969327e-05, + "loss": 0.4297, + "step": 10995 + }, + { + "epoch": 29.96185286103542, + "grad_norm": 6.6445536613464355, + "learning_rate": 1.6423555994150776e-05, + "loss": 0.4922, + "step": 10996 + }, + { + "epoch": 29.96457765667575, + "grad_norm": 13.118285179138184, + "learning_rate": 1.6422879619305782e-05, + "loss": 0.5127, + "step": 10997 + }, + { + "epoch": 29.967302452316076, + "grad_norm": 8.387615203857422, + "learning_rate": 1.6422203194439606e-05, + "loss": 0.3346, + "step": 10998 + }, + { + "epoch": 29.970027247956402, + "grad_norm": 8.093526840209961, + "learning_rate": 1.6421526719557514e-05, + "loss": 0.5449, + "step": 10999 + }, + { + "epoch": 29.97275204359673, + "grad_norm": 6.561741828918457, + "learning_rate": 1.6420850194664787e-05, + "loss": 0.4216, + "step": 11000 + }, + { + "epoch": 29.975476839237057, + "grad_norm": 6.173132419586182, + "learning_rate": 1.642017361976668e-05, + "loss": 0.4457, + "step": 11001 + }, + { + "epoch": 29.978201634877383, + "grad_norm": 7.232378005981445, + "learning_rate": 1.6419496994868467e-05, + "loss": 0.4089, + "step": 11002 + }, + { + "epoch": 29.980926430517712, + "grad_norm": 7.017350673675537, + "learning_rate": 1.6418820319975418e-05, + "loss": 0.4875, + "step": 11003 + }, + { + "epoch": 29.983651226158038, + "grad_norm": 7.370197296142578, + "learning_rate": 1.6418143595092805e-05, + "loss": 0.3418, + "step": 11004 + }, + { + "epoch": 29.986376021798364, + "grad_norm": 6.696606636047363, + "learning_rate": 1.6417466820225896e-05, + "loss": 0.5358, + "step": 11005 + }, + { + "epoch": 29.989100817438693, + "grad_norm": 11.178949356079102, + "learning_rate": 1.641678999537996e-05, + "loss": 0.4545, + "step": 11006 + }, + { + "epoch": 29.99182561307902, + "grad_norm": 8.079872131347656, + "learning_rate": 1.6416113120560275e-05, + "loss": 0.3928, + "step": 11007 + }, + { + "epoch": 29.994550408719345, + "grad_norm": 20.830598831176758, + "learning_rate": 1.64154361957721e-05, + "loss": 0.446, + "step": 11008 + }, + { + "epoch": 29.997275204359674, + "grad_norm": 8.717055320739746, + "learning_rate": 1.641475922102072e-05, + "loss": 0.4711, + "step": 11009 + }, + { + "epoch": 30.0, + "grad_norm": 7.055100917816162, + "learning_rate": 1.6414082196311402e-05, + "loss": 0.5015, + "step": 11010 + }, + { + "epoch": 30.002724795640326, + "grad_norm": 6.0088300704956055, + "learning_rate": 1.6413405121649416e-05, + "loss": 0.3615, + "step": 11011 + }, + { + "epoch": 30.005449591280655, + "grad_norm": 5.820860385894775, + "learning_rate": 1.6412727997040036e-05, + "loss": 0.3237, + "step": 11012 + }, + { + "epoch": 30.00817438692098, + "grad_norm": 6.502038955688477, + "learning_rate": 1.641205082248854e-05, + "loss": 0.5334, + "step": 11013 + }, + { + "epoch": 30.010899182561307, + "grad_norm": 7.3135151863098145, + "learning_rate": 1.64113735980002e-05, + "loss": 0.485, + "step": 11014 + }, + { + "epoch": 30.013623978201636, + "grad_norm": 6.81199836730957, + "learning_rate": 1.641069632358028e-05, + "loss": 0.438, + "step": 11015 + }, + { + "epoch": 30.016348773841962, + "grad_norm": 6.724306106567383, + "learning_rate": 1.641001899923407e-05, + "loss": 0.2847, + "step": 11016 + }, + { + "epoch": 30.019073569482288, + "grad_norm": 12.282051086425781, + "learning_rate": 1.640934162496684e-05, + "loss": 0.4241, + "step": 11017 + }, + { + "epoch": 30.021798365122617, + "grad_norm": 7.175605773925781, + "learning_rate": 1.640866420078386e-05, + "loss": 0.3946, + "step": 11018 + }, + { + "epoch": 30.024523160762943, + "grad_norm": 6.926136016845703, + "learning_rate": 1.640798672669041e-05, + "loss": 0.3102, + "step": 11019 + }, + { + "epoch": 30.02724795640327, + "grad_norm": 7.437623500823975, + "learning_rate": 1.6407309202691765e-05, + "loss": 0.463, + "step": 11020 + }, + { + "epoch": 30.029972752043598, + "grad_norm": 6.733150959014893, + "learning_rate": 1.6406631628793205e-05, + "loss": 0.3729, + "step": 11021 + }, + { + "epoch": 30.032697547683924, + "grad_norm": 5.76999044418335, + "learning_rate": 1.6405954005e-05, + "loss": 0.3857, + "step": 11022 + }, + { + "epoch": 30.03542234332425, + "grad_norm": 7.99325704574585, + "learning_rate": 1.6405276331317437e-05, + "loss": 0.452, + "step": 11023 + }, + { + "epoch": 30.03814713896458, + "grad_norm": 6.218040943145752, + "learning_rate": 1.6404598607750785e-05, + "loss": 0.3005, + "step": 11024 + }, + { + "epoch": 30.040871934604905, + "grad_norm": 6.658420085906982, + "learning_rate": 1.6403920834305324e-05, + "loss": 0.3451, + "step": 11025 + }, + { + "epoch": 30.04359673024523, + "grad_norm": 7.311766624450684, + "learning_rate": 1.6403243010986332e-05, + "loss": 0.3774, + "step": 11026 + }, + { + "epoch": 30.04632152588556, + "grad_norm": 8.474394798278809, + "learning_rate": 1.6402565137799096e-05, + "loss": 0.3843, + "step": 11027 + }, + { + "epoch": 30.049046321525886, + "grad_norm": 7.289997577667236, + "learning_rate": 1.6401887214748887e-05, + "loss": 0.4448, + "step": 11028 + }, + { + "epoch": 30.05177111716621, + "grad_norm": 6.859222412109375, + "learning_rate": 1.6401209241840984e-05, + "loss": 0.3199, + "step": 11029 + }, + { + "epoch": 30.05449591280654, + "grad_norm": 6.75163459777832, + "learning_rate": 1.640053121908067e-05, + "loss": 0.438, + "step": 11030 + }, + { + "epoch": 30.057220708446867, + "grad_norm": 6.317370891571045, + "learning_rate": 1.6399853146473223e-05, + "loss": 0.2949, + "step": 11031 + }, + { + "epoch": 30.059945504087192, + "grad_norm": 8.458065032958984, + "learning_rate": 1.6399175024023927e-05, + "loss": 0.4216, + "step": 11032 + }, + { + "epoch": 30.06267029972752, + "grad_norm": 6.969457626342773, + "learning_rate": 1.6398496851738064e-05, + "loss": 0.3399, + "step": 11033 + }, + { + "epoch": 30.065395095367847, + "grad_norm": 6.142038345336914, + "learning_rate": 1.639781862962091e-05, + "loss": 0.2935, + "step": 11034 + }, + { + "epoch": 30.068119891008173, + "grad_norm": 7.265402317047119, + "learning_rate": 1.6397140357677753e-05, + "loss": 0.5065, + "step": 11035 + }, + { + "epoch": 30.070844686648503, + "grad_norm": 8.197349548339844, + "learning_rate": 1.6396462035913872e-05, + "loss": 0.456, + "step": 11036 + }, + { + "epoch": 30.07356948228883, + "grad_norm": 7.076777458190918, + "learning_rate": 1.639578366433455e-05, + "loss": 0.5262, + "step": 11037 + }, + { + "epoch": 30.076294277929154, + "grad_norm": 5.244971752166748, + "learning_rate": 1.639510524294507e-05, + "loss": 0.3103, + "step": 11038 + }, + { + "epoch": 30.079019073569484, + "grad_norm": 6.139191150665283, + "learning_rate": 1.639442677175072e-05, + "loss": 0.3783, + "step": 11039 + }, + { + "epoch": 30.08174386920981, + "grad_norm": 6.427220821380615, + "learning_rate": 1.639374825075678e-05, + "loss": 0.5044, + "step": 11040 + }, + { + "epoch": 30.084468664850135, + "grad_norm": 8.533020973205566, + "learning_rate": 1.639306967996853e-05, + "loss": 0.5481, + "step": 11041 + }, + { + "epoch": 30.087193460490465, + "grad_norm": 6.449970722198486, + "learning_rate": 1.6392391059391258e-05, + "loss": 0.4382, + "step": 11042 + }, + { + "epoch": 30.08991825613079, + "grad_norm": 10.026012420654297, + "learning_rate": 1.6391712389030253e-05, + "loss": 0.4258, + "step": 11043 + }, + { + "epoch": 30.092643051771116, + "grad_norm": 6.1092610359191895, + "learning_rate": 1.63910336688908e-05, + "loss": 0.3223, + "step": 11044 + }, + { + "epoch": 30.095367847411445, + "grad_norm": 9.438382148742676, + "learning_rate": 1.639035489897818e-05, + "loss": 0.4528, + "step": 11045 + }, + { + "epoch": 30.09809264305177, + "grad_norm": 6.647580146789551, + "learning_rate": 1.6389676079297684e-05, + "loss": 0.3857, + "step": 11046 + }, + { + "epoch": 30.100817438692097, + "grad_norm": 5.792067050933838, + "learning_rate": 1.6388997209854595e-05, + "loss": 0.655, + "step": 11047 + }, + { + "epoch": 30.103542234332426, + "grad_norm": 6.984425067901611, + "learning_rate": 1.63883182906542e-05, + "loss": 0.396, + "step": 11048 + }, + { + "epoch": 30.106267029972752, + "grad_norm": 7.124753475189209, + "learning_rate": 1.6387639321701787e-05, + "loss": 0.4637, + "step": 11049 + }, + { + "epoch": 30.108991825613078, + "grad_norm": 9.646773338317871, + "learning_rate": 1.6386960303002647e-05, + "loss": 0.4193, + "step": 11050 + }, + { + "epoch": 30.111716621253407, + "grad_norm": 6.347529888153076, + "learning_rate": 1.6386281234562065e-05, + "loss": 0.3469, + "step": 11051 + }, + { + "epoch": 30.114441416893733, + "grad_norm": 6.188181400299072, + "learning_rate": 1.638560211638533e-05, + "loss": 0.3493, + "step": 11052 + }, + { + "epoch": 30.11716621253406, + "grad_norm": 5.9739251136779785, + "learning_rate": 1.638492294847773e-05, + "loss": 0.4186, + "step": 11053 + }, + { + "epoch": 30.11989100817439, + "grad_norm": 8.596823692321777, + "learning_rate": 1.6384243730844556e-05, + "loss": 0.5058, + "step": 11054 + }, + { + "epoch": 30.122615803814714, + "grad_norm": 7.194712162017822, + "learning_rate": 1.63835644634911e-05, + "loss": 0.3762, + "step": 11055 + }, + { + "epoch": 30.12534059945504, + "grad_norm": 8.324389457702637, + "learning_rate": 1.6382885146422646e-05, + "loss": 0.4172, + "step": 11056 + }, + { + "epoch": 30.12806539509537, + "grad_norm": 6.283515930175781, + "learning_rate": 1.6382205779644487e-05, + "loss": 0.4075, + "step": 11057 + }, + { + "epoch": 30.130790190735695, + "grad_norm": 7.6013312339782715, + "learning_rate": 1.638152636316192e-05, + "loss": 0.4424, + "step": 11058 + }, + { + "epoch": 30.13351498637602, + "grad_norm": 6.367516994476318, + "learning_rate": 1.638084689698023e-05, + "loss": 0.523, + "step": 11059 + }, + { + "epoch": 30.13623978201635, + "grad_norm": 7.755098342895508, + "learning_rate": 1.6380167381104706e-05, + "loss": 0.4693, + "step": 11060 + }, + { + "epoch": 30.138964577656676, + "grad_norm": 7.197167873382568, + "learning_rate": 1.6379487815540648e-05, + "loss": 0.3907, + "step": 11061 + }, + { + "epoch": 30.141689373297, + "grad_norm": 6.419443130493164, + "learning_rate": 1.6378808200293343e-05, + "loss": 0.5005, + "step": 11062 + }, + { + "epoch": 30.14441416893733, + "grad_norm": 6.293830871582031, + "learning_rate": 1.6378128535368084e-05, + "loss": 0.3582, + "step": 11063 + }, + { + "epoch": 30.147138964577657, + "grad_norm": 6.32768440246582, + "learning_rate": 1.6377448820770164e-05, + "loss": 0.3264, + "step": 11064 + }, + { + "epoch": 30.149863760217983, + "grad_norm": 7.156543254852295, + "learning_rate": 1.637676905650488e-05, + "loss": 0.3628, + "step": 11065 + }, + { + "epoch": 30.152588555858312, + "grad_norm": 6.288056373596191, + "learning_rate": 1.637608924257752e-05, + "loss": 0.5111, + "step": 11066 + }, + { + "epoch": 30.155313351498638, + "grad_norm": 6.886847496032715, + "learning_rate": 1.6375409378993387e-05, + "loss": 0.3865, + "step": 11067 + }, + { + "epoch": 30.158038147138964, + "grad_norm": 7.042550086975098, + "learning_rate": 1.637472946575777e-05, + "loss": 0.6097, + "step": 11068 + }, + { + "epoch": 30.160762942779293, + "grad_norm": 6.211397171020508, + "learning_rate": 1.6374049502875963e-05, + "loss": 0.493, + "step": 11069 + }, + { + "epoch": 30.16348773841962, + "grad_norm": 6.925831317901611, + "learning_rate": 1.6373369490353265e-05, + "loss": 0.564, + "step": 11070 + }, + { + "epoch": 30.166212534059945, + "grad_norm": 7.403109073638916, + "learning_rate": 1.637268942819497e-05, + "loss": 0.4129, + "step": 11071 + }, + { + "epoch": 30.168937329700274, + "grad_norm": 5.961977481842041, + "learning_rate": 1.6372009316406376e-05, + "loss": 0.4259, + "step": 11072 + }, + { + "epoch": 30.1716621253406, + "grad_norm": 5.775633335113525, + "learning_rate": 1.6371329154992775e-05, + "loss": 0.5584, + "step": 11073 + }, + { + "epoch": 30.174386920980925, + "grad_norm": 6.836814880371094, + "learning_rate": 1.6370648943959473e-05, + "loss": 0.3898, + "step": 11074 + }, + { + "epoch": 30.177111716621255, + "grad_norm": 7.935107707977295, + "learning_rate": 1.6369968683311758e-05, + "loss": 0.5857, + "step": 11075 + }, + { + "epoch": 30.17983651226158, + "grad_norm": 5.413071155548096, + "learning_rate": 1.6369288373054936e-05, + "loss": 0.6349, + "step": 11076 + }, + { + "epoch": 30.182561307901906, + "grad_norm": 5.701023101806641, + "learning_rate": 1.6368608013194296e-05, + "loss": 0.5304, + "step": 11077 + }, + { + "epoch": 30.185286103542236, + "grad_norm": 6.271266460418701, + "learning_rate": 1.6367927603735144e-05, + "loss": 0.4534, + "step": 11078 + }, + { + "epoch": 30.18801089918256, + "grad_norm": 5.906961441040039, + "learning_rate": 1.636724714468278e-05, + "loss": 0.3754, + "step": 11079 + }, + { + "epoch": 30.190735694822887, + "grad_norm": 6.097695827484131, + "learning_rate": 1.6366566636042495e-05, + "loss": 0.463, + "step": 11080 + }, + { + "epoch": 30.193460490463217, + "grad_norm": 5.9541335105896, + "learning_rate": 1.6365886077819597e-05, + "loss": 0.5026, + "step": 11081 + }, + { + "epoch": 30.196185286103542, + "grad_norm": 7.629851341247559, + "learning_rate": 1.6365205470019383e-05, + "loss": 0.5601, + "step": 11082 + }, + { + "epoch": 30.19891008174387, + "grad_norm": 6.487632751464844, + "learning_rate": 1.6364524812647155e-05, + "loss": 0.4403, + "step": 11083 + }, + { + "epoch": 30.201634877384198, + "grad_norm": 8.499356269836426, + "learning_rate": 1.636384410570821e-05, + "loss": 0.5285, + "step": 11084 + }, + { + "epoch": 30.204359673024523, + "grad_norm": 12.487041473388672, + "learning_rate": 1.636316334920785e-05, + "loss": 0.4891, + "step": 11085 + }, + { + "epoch": 30.20708446866485, + "grad_norm": 6.921417713165283, + "learning_rate": 1.6362482543151382e-05, + "loss": 0.4167, + "step": 11086 + }, + { + "epoch": 30.20980926430518, + "grad_norm": 7.392184257507324, + "learning_rate": 1.6361801687544103e-05, + "loss": 0.4371, + "step": 11087 + }, + { + "epoch": 30.212534059945504, + "grad_norm": 8.208747863769531, + "learning_rate": 1.636112078239132e-05, + "loss": 0.3515, + "step": 11088 + }, + { + "epoch": 30.21525885558583, + "grad_norm": 6.039959907531738, + "learning_rate": 1.636043982769833e-05, + "loss": 0.5775, + "step": 11089 + }, + { + "epoch": 30.21798365122616, + "grad_norm": 5.5182600021362305, + "learning_rate": 1.635975882347044e-05, + "loss": 0.4808, + "step": 11090 + }, + { + "epoch": 30.220708446866485, + "grad_norm": 8.186211585998535, + "learning_rate": 1.6359077769712955e-05, + "loss": 0.3456, + "step": 11091 + }, + { + "epoch": 30.22343324250681, + "grad_norm": 6.7575459480285645, + "learning_rate": 1.6358396666431176e-05, + "loss": 0.4275, + "step": 11092 + }, + { + "epoch": 30.22615803814714, + "grad_norm": 6.863185405731201, + "learning_rate": 1.6357715513630407e-05, + "loss": 0.3653, + "step": 11093 + }, + { + "epoch": 30.228882833787466, + "grad_norm": 7.599756717681885, + "learning_rate": 1.6357034311315954e-05, + "loss": 0.3335, + "step": 11094 + }, + { + "epoch": 30.231607629427792, + "grad_norm": 7.023427486419678, + "learning_rate": 1.635635305949312e-05, + "loss": 0.3951, + "step": 11095 + }, + { + "epoch": 30.23433242506812, + "grad_norm": 5.927885055541992, + "learning_rate": 1.6355671758167218e-05, + "loss": 0.3515, + "step": 11096 + }, + { + "epoch": 30.237057220708447, + "grad_norm": 6.024624347686768, + "learning_rate": 1.635499040734355e-05, + "loss": 0.3495, + "step": 11097 + }, + { + "epoch": 30.239782016348773, + "grad_norm": 6.806307315826416, + "learning_rate": 1.6354309007027417e-05, + "loss": 0.413, + "step": 11098 + }, + { + "epoch": 30.242506811989102, + "grad_norm": 6.517013072967529, + "learning_rate": 1.635362755722413e-05, + "loss": 0.4623, + "step": 11099 + }, + { + "epoch": 30.245231607629428, + "grad_norm": 6.914282321929932, + "learning_rate": 1.6352946057938998e-05, + "loss": 0.3395, + "step": 11100 + }, + { + "epoch": 30.247956403269754, + "grad_norm": 7.303252220153809, + "learning_rate": 1.635226450917733e-05, + "loss": 0.3323, + "step": 11101 + }, + { + "epoch": 30.250681198910083, + "grad_norm": 6.682431697845459, + "learning_rate": 1.635158291094442e-05, + "loss": 0.4211, + "step": 11102 + }, + { + "epoch": 30.25340599455041, + "grad_norm": 5.761322021484375, + "learning_rate": 1.6350901263245594e-05, + "loss": 0.3323, + "step": 11103 + }, + { + "epoch": 30.256130790190735, + "grad_norm": 6.29879093170166, + "learning_rate": 1.6350219566086156e-05, + "loss": 0.4701, + "step": 11104 + }, + { + "epoch": 30.258855585831064, + "grad_norm": 7.568106174468994, + "learning_rate": 1.6349537819471408e-05, + "loss": 0.4886, + "step": 11105 + }, + { + "epoch": 30.26158038147139, + "grad_norm": 6.222177028656006, + "learning_rate": 1.6348856023406666e-05, + "loss": 0.4187, + "step": 11106 + }, + { + "epoch": 30.264305177111716, + "grad_norm": 7.444094657897949, + "learning_rate": 1.6348174177897237e-05, + "loss": 0.4895, + "step": 11107 + }, + { + "epoch": 30.267029972752045, + "grad_norm": 7.142608165740967, + "learning_rate": 1.634749228294843e-05, + "loss": 0.5111, + "step": 11108 + }, + { + "epoch": 30.26975476839237, + "grad_norm": 9.366308212280273, + "learning_rate": 1.634681033856556e-05, + "loss": 0.4298, + "step": 11109 + }, + { + "epoch": 30.272479564032697, + "grad_norm": 6.9632720947265625, + "learning_rate": 1.6346128344753932e-05, + "loss": 0.4662, + "step": 11110 + }, + { + "epoch": 30.275204359673026, + "grad_norm": 6.712884902954102, + "learning_rate": 1.6345446301518864e-05, + "loss": 0.3194, + "step": 11111 + }, + { + "epoch": 30.277929155313352, + "grad_norm": 7.170973777770996, + "learning_rate": 1.634476420886566e-05, + "loss": 0.4743, + "step": 11112 + }, + { + "epoch": 30.280653950953678, + "grad_norm": 6.807126045227051, + "learning_rate": 1.634408206679964e-05, + "loss": 0.3461, + "step": 11113 + }, + { + "epoch": 30.283378746594007, + "grad_norm": 6.459092140197754, + "learning_rate": 1.6343399875326115e-05, + "loss": 0.4248, + "step": 11114 + }, + { + "epoch": 30.286103542234333, + "grad_norm": 6.9402289390563965, + "learning_rate": 1.6342717634450393e-05, + "loss": 0.4156, + "step": 11115 + }, + { + "epoch": 30.28882833787466, + "grad_norm": 7.605564594268799, + "learning_rate": 1.634203534417779e-05, + "loss": 0.5897, + "step": 11116 + }, + { + "epoch": 30.291553133514988, + "grad_norm": 8.335100173950195, + "learning_rate": 1.6341353004513622e-05, + "loss": 0.5774, + "step": 11117 + }, + { + "epoch": 30.294277929155314, + "grad_norm": 7.1958112716674805, + "learning_rate": 1.63406706154632e-05, + "loss": 0.5863, + "step": 11118 + }, + { + "epoch": 30.29700272479564, + "grad_norm": 6.38262939453125, + "learning_rate": 1.633998817703184e-05, + "loss": 0.392, + "step": 11119 + }, + { + "epoch": 30.29972752043597, + "grad_norm": 6.995018005371094, + "learning_rate": 1.6339305689224853e-05, + "loss": 0.4524, + "step": 11120 + }, + { + "epoch": 30.302452316076295, + "grad_norm": 6.139112949371338, + "learning_rate": 1.633862315204756e-05, + "loss": 0.4032, + "step": 11121 + }, + { + "epoch": 30.30517711171662, + "grad_norm": 7.4238362312316895, + "learning_rate": 1.6337940565505275e-05, + "loss": 0.4225, + "step": 11122 + }, + { + "epoch": 30.30790190735695, + "grad_norm": 6.557679176330566, + "learning_rate": 1.633725792960331e-05, + "loss": 0.4968, + "step": 11123 + }, + { + "epoch": 30.310626702997276, + "grad_norm": 7.154829978942871, + "learning_rate": 1.6336575244346983e-05, + "loss": 0.3633, + "step": 11124 + }, + { + "epoch": 30.3133514986376, + "grad_norm": 7.474669933319092, + "learning_rate": 1.6335892509741618e-05, + "loss": 0.4091, + "step": 11125 + }, + { + "epoch": 30.31607629427793, + "grad_norm": 9.34608268737793, + "learning_rate": 1.633520972579252e-05, + "loss": 0.4148, + "step": 11126 + }, + { + "epoch": 30.318801089918257, + "grad_norm": 6.975616931915283, + "learning_rate": 1.6334526892505015e-05, + "loss": 0.3524, + "step": 11127 + }, + { + "epoch": 30.321525885558582, + "grad_norm": 6.626901149749756, + "learning_rate": 1.633384400988442e-05, + "loss": 0.649, + "step": 11128 + }, + { + "epoch": 30.32425068119891, + "grad_norm": 9.110139846801758, + "learning_rate": 1.633316107793605e-05, + "loss": 0.4517, + "step": 11129 + }, + { + "epoch": 30.326975476839237, + "grad_norm": 7.414907932281494, + "learning_rate": 1.6332478096665222e-05, + "loss": 0.4903, + "step": 11130 + }, + { + "epoch": 30.329700272479563, + "grad_norm": 6.143207550048828, + "learning_rate": 1.6331795066077262e-05, + "loss": 0.2961, + "step": 11131 + }, + { + "epoch": 30.332425068119893, + "grad_norm": 7.663824081420898, + "learning_rate": 1.633111198617749e-05, + "loss": 0.3638, + "step": 11132 + }, + { + "epoch": 30.33514986376022, + "grad_norm": 6.809144020080566, + "learning_rate": 1.6330428856971217e-05, + "loss": 0.3295, + "step": 11133 + }, + { + "epoch": 30.337874659400544, + "grad_norm": 6.921654224395752, + "learning_rate": 1.6329745678463765e-05, + "loss": 0.4185, + "step": 11134 + }, + { + "epoch": 30.340599455040874, + "grad_norm": 6.478837013244629, + "learning_rate": 1.6329062450660463e-05, + "loss": 0.4489, + "step": 11135 + }, + { + "epoch": 30.3433242506812, + "grad_norm": 12.89828109741211, + "learning_rate": 1.6328379173566623e-05, + "loss": 0.4382, + "step": 11136 + }, + { + "epoch": 30.346049046321525, + "grad_norm": 9.292570114135742, + "learning_rate": 1.632769584718757e-05, + "loss": 0.4523, + "step": 11137 + }, + { + "epoch": 30.348773841961854, + "grad_norm": 6.0499267578125, + "learning_rate": 1.6327012471528626e-05, + "loss": 0.2988, + "step": 11138 + }, + { + "epoch": 30.35149863760218, + "grad_norm": 6.418890953063965, + "learning_rate": 1.6326329046595112e-05, + "loss": 0.4348, + "step": 11139 + }, + { + "epoch": 30.354223433242506, + "grad_norm": 7.002811431884766, + "learning_rate": 1.632564557239235e-05, + "loss": 0.3316, + "step": 11140 + }, + { + "epoch": 30.356948228882835, + "grad_norm": 8.295167922973633, + "learning_rate": 1.6324962048925666e-05, + "loss": 0.2808, + "step": 11141 + }, + { + "epoch": 30.35967302452316, + "grad_norm": 6.577081203460693, + "learning_rate": 1.632427847620038e-05, + "loss": 0.4397, + "step": 11142 + }, + { + "epoch": 30.362397820163487, + "grad_norm": 9.08464527130127, + "learning_rate": 1.632359485422182e-05, + "loss": 0.4562, + "step": 11143 + }, + { + "epoch": 30.365122615803816, + "grad_norm": 6.9909844398498535, + "learning_rate": 1.63229111829953e-05, + "loss": 0.4818, + "step": 11144 + }, + { + "epoch": 30.367847411444142, + "grad_norm": 9.277730941772461, + "learning_rate": 1.6322227462526157e-05, + "loss": 0.442, + "step": 11145 + }, + { + "epoch": 30.370572207084468, + "grad_norm": 7.0915985107421875, + "learning_rate": 1.6321543692819707e-05, + "loss": 0.3355, + "step": 11146 + }, + { + "epoch": 30.373297002724797, + "grad_norm": 6.999594211578369, + "learning_rate": 1.6320859873881282e-05, + "loss": 0.5162, + "step": 11147 + }, + { + "epoch": 30.376021798365123, + "grad_norm": 7.807701587677002, + "learning_rate": 1.63201760057162e-05, + "loss": 0.5061, + "step": 11148 + }, + { + "epoch": 30.37874659400545, + "grad_norm": 8.793044090270996, + "learning_rate": 1.6319492088329792e-05, + "loss": 0.5065, + "step": 11149 + }, + { + "epoch": 30.381471389645778, + "grad_norm": 8.298761367797852, + "learning_rate": 1.631880812172738e-05, + "loss": 0.3995, + "step": 11150 + }, + { + "epoch": 30.384196185286104, + "grad_norm": 8.38496208190918, + "learning_rate": 1.63181241059143e-05, + "loss": 0.3788, + "step": 11151 + }, + { + "epoch": 30.38692098092643, + "grad_norm": 6.298509120941162, + "learning_rate": 1.631744004089587e-05, + "loss": 0.3848, + "step": 11152 + }, + { + "epoch": 30.38964577656676, + "grad_norm": 7.297521591186523, + "learning_rate": 1.6316755926677415e-05, + "loss": 0.4926, + "step": 11153 + }, + { + "epoch": 30.392370572207085, + "grad_norm": 6.584827423095703, + "learning_rate": 1.6316071763264277e-05, + "loss": 0.5525, + "step": 11154 + }, + { + "epoch": 30.39509536784741, + "grad_norm": 6.54464864730835, + "learning_rate": 1.631538755066177e-05, + "loss": 0.5013, + "step": 11155 + }, + { + "epoch": 30.39782016348774, + "grad_norm": 8.183076858520508, + "learning_rate": 1.631470328887523e-05, + "loss": 0.4586, + "step": 11156 + }, + { + "epoch": 30.400544959128066, + "grad_norm": 6.126870632171631, + "learning_rate": 1.6314018977909982e-05, + "loss": 0.3919, + "step": 11157 + }, + { + "epoch": 30.40326975476839, + "grad_norm": 7.185279846191406, + "learning_rate": 1.631333461777136e-05, + "loss": 0.3845, + "step": 11158 + }, + { + "epoch": 30.40599455040872, + "grad_norm": 6.868136882781982, + "learning_rate": 1.631265020846469e-05, + "loss": 0.4161, + "step": 11159 + }, + { + "epoch": 30.408719346049047, + "grad_norm": 7.411529064178467, + "learning_rate": 1.63119657499953e-05, + "loss": 0.4904, + "step": 11160 + }, + { + "epoch": 30.411444141689373, + "grad_norm": 6.574433326721191, + "learning_rate": 1.631128124236853e-05, + "loss": 0.4001, + "step": 11161 + }, + { + "epoch": 30.414168937329702, + "grad_norm": 6.144572734832764, + "learning_rate": 1.6310596685589703e-05, + "loss": 0.4123, + "step": 11162 + }, + { + "epoch": 30.416893732970028, + "grad_norm": 6.900004863739014, + "learning_rate": 1.6309912079664147e-05, + "loss": 0.4342, + "step": 11163 + }, + { + "epoch": 30.419618528610354, + "grad_norm": 6.595589637756348, + "learning_rate": 1.6309227424597207e-05, + "loss": 0.4882, + "step": 11164 + }, + { + "epoch": 30.422343324250683, + "grad_norm": 7.083584308624268, + "learning_rate": 1.63085427203942e-05, + "loss": 0.4852, + "step": 11165 + }, + { + "epoch": 30.42506811989101, + "grad_norm": 7.238770484924316, + "learning_rate": 1.6307857967060466e-05, + "loss": 0.5204, + "step": 11166 + }, + { + "epoch": 30.427792915531334, + "grad_norm": 7.944159507751465, + "learning_rate": 1.630717316460134e-05, + "loss": 0.3906, + "step": 11167 + }, + { + "epoch": 30.430517711171664, + "grad_norm": 9.476786613464355, + "learning_rate": 1.630648831302215e-05, + "loss": 0.4355, + "step": 11168 + }, + { + "epoch": 30.43324250681199, + "grad_norm": 8.080235481262207, + "learning_rate": 1.6305803412328236e-05, + "loss": 0.4662, + "step": 11169 + }, + { + "epoch": 30.435967302452315, + "grad_norm": 8.67461109161377, + "learning_rate": 1.6305118462524926e-05, + "loss": 0.4588, + "step": 11170 + }, + { + "epoch": 30.438692098092645, + "grad_norm": 6.554092884063721, + "learning_rate": 1.6304433463617554e-05, + "loss": 0.3947, + "step": 11171 + }, + { + "epoch": 30.44141689373297, + "grad_norm": 6.492825984954834, + "learning_rate": 1.630374841561146e-05, + "loss": 0.5317, + "step": 11172 + }, + { + "epoch": 30.444141689373296, + "grad_norm": 6.715017795562744, + "learning_rate": 1.6303063318511973e-05, + "loss": 0.3394, + "step": 11173 + }, + { + "epoch": 30.446866485013626, + "grad_norm": 7.301937580108643, + "learning_rate": 1.6302378172324436e-05, + "loss": 0.4982, + "step": 11174 + }, + { + "epoch": 30.44959128065395, + "grad_norm": 6.503893852233887, + "learning_rate": 1.6301692977054177e-05, + "loss": 0.3516, + "step": 11175 + }, + { + "epoch": 30.452316076294277, + "grad_norm": 7.567931652069092, + "learning_rate": 1.630100773270654e-05, + "loss": 0.4438, + "step": 11176 + }, + { + "epoch": 30.455040871934607, + "grad_norm": 6.096273899078369, + "learning_rate": 1.6300322439286852e-05, + "loss": 0.4471, + "step": 11177 + }, + { + "epoch": 30.457765667574932, + "grad_norm": 7.5801472663879395, + "learning_rate": 1.629963709680046e-05, + "loss": 0.3835, + "step": 11178 + }, + { + "epoch": 30.460490463215258, + "grad_norm": 6.825669765472412, + "learning_rate": 1.6298951705252697e-05, + "loss": 0.4557, + "step": 11179 + }, + { + "epoch": 30.463215258855588, + "grad_norm": 6.852964401245117, + "learning_rate": 1.6298266264648898e-05, + "loss": 0.4685, + "step": 11180 + }, + { + "epoch": 30.465940054495913, + "grad_norm": 6.547214508056641, + "learning_rate": 1.6297580774994404e-05, + "loss": 0.5506, + "step": 11181 + }, + { + "epoch": 30.46866485013624, + "grad_norm": 6.798362731933594, + "learning_rate": 1.6296895236294558e-05, + "loss": 0.3712, + "step": 11182 + }, + { + "epoch": 30.47138964577657, + "grad_norm": 6.006402015686035, + "learning_rate": 1.629620964855469e-05, + "loss": 0.6051, + "step": 11183 + }, + { + "epoch": 30.474114441416894, + "grad_norm": 7.253655433654785, + "learning_rate": 1.6295524011780147e-05, + "loss": 0.5779, + "step": 11184 + }, + { + "epoch": 30.47683923705722, + "grad_norm": 13.01401424407959, + "learning_rate": 1.629483832597626e-05, + "loss": 0.3723, + "step": 11185 + }, + { + "epoch": 30.479564032697546, + "grad_norm": 7.651995658874512, + "learning_rate": 1.6294152591148386e-05, + "loss": 0.46, + "step": 11186 + }, + { + "epoch": 30.482288828337875, + "grad_norm": 8.617700576782227, + "learning_rate": 1.6293466807301843e-05, + "loss": 0.4051, + "step": 11187 + }, + { + "epoch": 30.4850136239782, + "grad_norm": 6.405218601226807, + "learning_rate": 1.629278097444199e-05, + "loss": 0.3129, + "step": 11188 + }, + { + "epoch": 30.48773841961853, + "grad_norm": 8.3556489944458, + "learning_rate": 1.6292095092574154e-05, + "loss": 0.4845, + "step": 11189 + }, + { + "epoch": 30.490463215258856, + "grad_norm": 11.176692008972168, + "learning_rate": 1.629140916170369e-05, + "loss": 0.5119, + "step": 11190 + }, + { + "epoch": 30.493188010899182, + "grad_norm": 7.346235275268555, + "learning_rate": 1.6290723181835933e-05, + "loss": 0.5363, + "step": 11191 + }, + { + "epoch": 30.495912806539508, + "grad_norm": 7.172322750091553, + "learning_rate": 1.6290037152976227e-05, + "loss": 0.4497, + "step": 11192 + }, + { + "epoch": 30.498637602179837, + "grad_norm": 6.90130615234375, + "learning_rate": 1.628935107512991e-05, + "loss": 0.4502, + "step": 11193 + }, + { + "epoch": 30.501362397820163, + "grad_norm": 8.490738868713379, + "learning_rate": 1.6288664948302333e-05, + "loss": 0.3503, + "step": 11194 + }, + { + "epoch": 30.504087193460492, + "grad_norm": 6.3047709465026855, + "learning_rate": 1.6287978772498836e-05, + "loss": 0.2864, + "step": 11195 + }, + { + "epoch": 30.506811989100818, + "grad_norm": 6.159095287322998, + "learning_rate": 1.628729254772476e-05, + "loss": 0.4874, + "step": 11196 + }, + { + "epoch": 30.509536784741144, + "grad_norm": 6.74845027923584, + "learning_rate": 1.6286606273985452e-05, + "loss": 0.3663, + "step": 11197 + }, + { + "epoch": 30.51226158038147, + "grad_norm": 7.2375383377075195, + "learning_rate": 1.628591995128626e-05, + "loss": 0.4338, + "step": 11198 + }, + { + "epoch": 30.5149863760218, + "grad_norm": 6.118013381958008, + "learning_rate": 1.6285233579632525e-05, + "loss": 0.5677, + "step": 11199 + }, + { + "epoch": 30.517711171662125, + "grad_norm": 7.088701248168945, + "learning_rate": 1.628454715902959e-05, + "loss": 0.4264, + "step": 11200 + }, + { + "epoch": 30.520435967302454, + "grad_norm": 8.072192192077637, + "learning_rate": 1.628386068948281e-05, + "loss": 0.4079, + "step": 11201 + }, + { + "epoch": 30.52316076294278, + "grad_norm": 6.230062007904053, + "learning_rate": 1.6283174170997516e-05, + "loss": 0.4247, + "step": 11202 + }, + { + "epoch": 30.525885558583106, + "grad_norm": 7.471052169799805, + "learning_rate": 1.6282487603579073e-05, + "loss": 0.4824, + "step": 11203 + }, + { + "epoch": 30.52861035422343, + "grad_norm": 8.514483451843262, + "learning_rate": 1.6281800987232815e-05, + "loss": 0.4504, + "step": 11204 + }, + { + "epoch": 30.53133514986376, + "grad_norm": 8.606267929077148, + "learning_rate": 1.628111432196409e-05, + "loss": 0.4247, + "step": 11205 + }, + { + "epoch": 30.534059945504087, + "grad_norm": 7.907001495361328, + "learning_rate": 1.628042760777825e-05, + "loss": 0.3819, + "step": 11206 + }, + { + "epoch": 30.536784741144416, + "grad_norm": 7.460330009460449, + "learning_rate": 1.6279740844680647e-05, + "loss": 0.4031, + "step": 11207 + }, + { + "epoch": 30.539509536784742, + "grad_norm": 6.786050319671631, + "learning_rate": 1.627905403267662e-05, + "loss": 0.3704, + "step": 11208 + }, + { + "epoch": 30.542234332425068, + "grad_norm": 7.479556560516357, + "learning_rate": 1.6278367171771522e-05, + "loss": 0.3909, + "step": 11209 + }, + { + "epoch": 30.544959128065393, + "grad_norm": 5.854247093200684, + "learning_rate": 1.6277680261970706e-05, + "loss": 0.4698, + "step": 11210 + }, + { + "epoch": 30.547683923705723, + "grad_norm": 8.77616024017334, + "learning_rate": 1.6276993303279514e-05, + "loss": 0.4579, + "step": 11211 + }, + { + "epoch": 30.55040871934605, + "grad_norm": 8.852252960205078, + "learning_rate": 1.6276306295703307e-05, + "loss": 0.4197, + "step": 11212 + }, + { + "epoch": 30.553133514986374, + "grad_norm": 7.174180507659912, + "learning_rate": 1.6275619239247423e-05, + "loss": 0.3899, + "step": 11213 + }, + { + "epoch": 30.555858310626704, + "grad_norm": 7.6936211585998535, + "learning_rate": 1.6274932133917217e-05, + "loss": 0.4662, + "step": 11214 + }, + { + "epoch": 30.55858310626703, + "grad_norm": 7.429311275482178, + "learning_rate": 1.6274244979718044e-05, + "loss": 0.429, + "step": 11215 + }, + { + "epoch": 30.561307901907355, + "grad_norm": 6.269425868988037, + "learning_rate": 1.627355777665525e-05, + "loss": 0.3629, + "step": 11216 + }, + { + "epoch": 30.564032697547685, + "grad_norm": 7.538383483886719, + "learning_rate": 1.6272870524734193e-05, + "loss": 0.3674, + "step": 11217 + }, + { + "epoch": 30.56675749318801, + "grad_norm": 7.07504940032959, + "learning_rate": 1.6272183223960224e-05, + "loss": 0.4295, + "step": 11218 + }, + { + "epoch": 30.569482288828336, + "grad_norm": 7.453427314758301, + "learning_rate": 1.6271495874338692e-05, + "loss": 0.391, + "step": 11219 + }, + { + "epoch": 30.572207084468666, + "grad_norm": 8.222543716430664, + "learning_rate": 1.6270808475874953e-05, + "loss": 0.475, + "step": 11220 + }, + { + "epoch": 30.57493188010899, + "grad_norm": 6.086309909820557, + "learning_rate": 1.6270121028574358e-05, + "loss": 0.5153, + "step": 11221 + }, + { + "epoch": 30.577656675749317, + "grad_norm": 6.072343349456787, + "learning_rate": 1.6269433532442262e-05, + "loss": 0.4074, + "step": 11222 + }, + { + "epoch": 30.580381471389646, + "grad_norm": 11.468491554260254, + "learning_rate": 1.626874598748402e-05, + "loss": 0.4034, + "step": 11223 + }, + { + "epoch": 30.583106267029972, + "grad_norm": 7.184165954589844, + "learning_rate": 1.6268058393704986e-05, + "loss": 0.2477, + "step": 11224 + }, + { + "epoch": 30.585831062670298, + "grad_norm": 7.140717029571533, + "learning_rate": 1.6267370751110516e-05, + "loss": 0.3927, + "step": 11225 + }, + { + "epoch": 30.588555858310627, + "grad_norm": 7.32138729095459, + "learning_rate": 1.626668305970596e-05, + "loss": 0.4031, + "step": 11226 + }, + { + "epoch": 30.591280653950953, + "grad_norm": 5.864624500274658, + "learning_rate": 1.626599531949668e-05, + "loss": 0.5443, + "step": 11227 + }, + { + "epoch": 30.59400544959128, + "grad_norm": 5.666828632354736, + "learning_rate": 1.626530753048803e-05, + "loss": 0.3853, + "step": 11228 + }, + { + "epoch": 30.59673024523161, + "grad_norm": 5.726497173309326, + "learning_rate": 1.626461969268537e-05, + "loss": 0.4012, + "step": 11229 + }, + { + "epoch": 30.599455040871934, + "grad_norm": 8.0853271484375, + "learning_rate": 1.6263931806094053e-05, + "loss": 0.4961, + "step": 11230 + }, + { + "epoch": 30.60217983651226, + "grad_norm": 10.106380462646484, + "learning_rate": 1.6263243870719436e-05, + "loss": 0.4315, + "step": 11231 + }, + { + "epoch": 30.60490463215259, + "grad_norm": 8.311697959899902, + "learning_rate": 1.6262555886566874e-05, + "loss": 0.3714, + "step": 11232 + }, + { + "epoch": 30.607629427792915, + "grad_norm": 7.060946941375732, + "learning_rate": 1.626186785364173e-05, + "loss": 0.4977, + "step": 11233 + }, + { + "epoch": 30.61035422343324, + "grad_norm": 7.943112373352051, + "learning_rate": 1.6261179771949364e-05, + "loss": 0.4243, + "step": 11234 + }, + { + "epoch": 30.61307901907357, + "grad_norm": 6.9223222732543945, + "learning_rate": 1.6260491641495127e-05, + "loss": 0.5494, + "step": 11235 + }, + { + "epoch": 30.615803814713896, + "grad_norm": 7.2110161781311035, + "learning_rate": 1.6259803462284383e-05, + "loss": 0.5115, + "step": 11236 + }, + { + "epoch": 30.618528610354222, + "grad_norm": 40.30569839477539, + "learning_rate": 1.6259115234322492e-05, + "loss": 0.3106, + "step": 11237 + }, + { + "epoch": 30.62125340599455, + "grad_norm": 6.456710338592529, + "learning_rate": 1.6258426957614814e-05, + "loss": 0.4498, + "step": 11238 + }, + { + "epoch": 30.623978201634877, + "grad_norm": 8.054564476013184, + "learning_rate": 1.625773863216671e-05, + "loss": 0.4762, + "step": 11239 + }, + { + "epoch": 30.626702997275203, + "grad_norm": 6.941972732543945, + "learning_rate": 1.6257050257983536e-05, + "loss": 0.4694, + "step": 11240 + }, + { + "epoch": 30.629427792915532, + "grad_norm": 8.115713119506836, + "learning_rate": 1.625636183507066e-05, + "loss": 0.5095, + "step": 11241 + }, + { + "epoch": 30.632152588555858, + "grad_norm": 13.512476921081543, + "learning_rate": 1.6255673363433432e-05, + "loss": 0.4984, + "step": 11242 + }, + { + "epoch": 30.634877384196184, + "grad_norm": 5.05262565612793, + "learning_rate": 1.6254984843077228e-05, + "loss": 0.4244, + "step": 11243 + }, + { + "epoch": 30.637602179836513, + "grad_norm": 6.971745491027832, + "learning_rate": 1.62542962740074e-05, + "loss": 0.4017, + "step": 11244 + }, + { + "epoch": 30.64032697547684, + "grad_norm": 7.403254985809326, + "learning_rate": 1.625360765622931e-05, + "loss": 0.6022, + "step": 11245 + }, + { + "epoch": 30.643051771117165, + "grad_norm": 7.056795597076416, + "learning_rate": 1.6252918989748333e-05, + "loss": 0.5388, + "step": 11246 + }, + { + "epoch": 30.645776566757494, + "grad_norm": 7.612959384918213, + "learning_rate": 1.625223027456982e-05, + "loss": 0.4792, + "step": 11247 + }, + { + "epoch": 30.64850136239782, + "grad_norm": 6.716630458831787, + "learning_rate": 1.625154151069914e-05, + "loss": 0.4965, + "step": 11248 + }, + { + "epoch": 30.651226158038146, + "grad_norm": 7.09428596496582, + "learning_rate": 1.6250852698141654e-05, + "loss": 0.3607, + "step": 11249 + }, + { + "epoch": 30.653950953678475, + "grad_norm": 6.382897853851318, + "learning_rate": 1.625016383690273e-05, + "loss": 0.3431, + "step": 11250 + }, + { + "epoch": 30.6566757493188, + "grad_norm": 7.352816104888916, + "learning_rate": 1.624947492698773e-05, + "loss": 0.5231, + "step": 11251 + }, + { + "epoch": 30.659400544959126, + "grad_norm": 15.394720077514648, + "learning_rate": 1.624878596840202e-05, + "loss": 0.4471, + "step": 11252 + }, + { + "epoch": 30.662125340599456, + "grad_norm": 9.968376159667969, + "learning_rate": 1.624809696115097e-05, + "loss": 0.476, + "step": 11253 + }, + { + "epoch": 30.66485013623978, + "grad_norm": 9.12043285369873, + "learning_rate": 1.624740790523994e-05, + "loss": 0.684, + "step": 11254 + }, + { + "epoch": 30.667574931880107, + "grad_norm": 7.758697986602783, + "learning_rate": 1.6246718800674296e-05, + "loss": 0.5054, + "step": 11255 + }, + { + "epoch": 30.670299727520437, + "grad_norm": 6.44129753112793, + "learning_rate": 1.624602964745941e-05, + "loss": 0.4493, + "step": 11256 + }, + { + "epoch": 30.673024523160763, + "grad_norm": 7.188642501831055, + "learning_rate": 1.6245340445600643e-05, + "loss": 0.3573, + "step": 11257 + }, + { + "epoch": 30.67574931880109, + "grad_norm": 8.696399688720703, + "learning_rate": 1.6244651195103367e-05, + "loss": 0.5812, + "step": 11258 + }, + { + "epoch": 30.678474114441418, + "grad_norm": 13.490169525146484, + "learning_rate": 1.6243961895972948e-05, + "loss": 0.5551, + "step": 11259 + }, + { + "epoch": 30.681198910081743, + "grad_norm": 7.445071220397949, + "learning_rate": 1.6243272548214758e-05, + "loss": 0.2846, + "step": 11260 + }, + { + "epoch": 30.68392370572207, + "grad_norm": 6.342952251434326, + "learning_rate": 1.624258315183416e-05, + "loss": 0.5732, + "step": 11261 + }, + { + "epoch": 30.6866485013624, + "grad_norm": 7.206576347351074, + "learning_rate": 1.6241893706836525e-05, + "loss": 0.621, + "step": 11262 + }, + { + "epoch": 30.689373297002724, + "grad_norm": 6.406331539154053, + "learning_rate": 1.6241204213227223e-05, + "loss": 0.4424, + "step": 11263 + }, + { + "epoch": 30.69209809264305, + "grad_norm": 6.325895309448242, + "learning_rate": 1.6240514671011623e-05, + "loss": 0.4019, + "step": 11264 + }, + { + "epoch": 30.69482288828338, + "grad_norm": 6.496794700622559, + "learning_rate": 1.6239825080195096e-05, + "loss": 0.442, + "step": 11265 + }, + { + "epoch": 30.697547683923705, + "grad_norm": 6.719447612762451, + "learning_rate": 1.623913544078301e-05, + "loss": 0.4412, + "step": 11266 + }, + { + "epoch": 30.70027247956403, + "grad_norm": 7.510452747344971, + "learning_rate": 1.6238445752780742e-05, + "loss": 0.4723, + "step": 11267 + }, + { + "epoch": 30.70299727520436, + "grad_norm": 7.245124340057373, + "learning_rate": 1.623775601619366e-05, + "loss": 0.462, + "step": 11268 + }, + { + "epoch": 30.705722070844686, + "grad_norm": 7.671139717102051, + "learning_rate": 1.623706623102713e-05, + "loss": 0.4833, + "step": 11269 + }, + { + "epoch": 30.708446866485012, + "grad_norm": 7.977005958557129, + "learning_rate": 1.623637639728653e-05, + "loss": 0.4939, + "step": 11270 + }, + { + "epoch": 30.71117166212534, + "grad_norm": 7.758381366729736, + "learning_rate": 1.623568651497723e-05, + "loss": 0.4451, + "step": 11271 + }, + { + "epoch": 30.713896457765667, + "grad_norm": 8.436704635620117, + "learning_rate": 1.623499658410461e-05, + "loss": 0.3275, + "step": 11272 + }, + { + "epoch": 30.716621253405993, + "grad_norm": 7.324213981628418, + "learning_rate": 1.6234306604674034e-05, + "loss": 0.3871, + "step": 11273 + }, + { + "epoch": 30.719346049046322, + "grad_norm": 6.613918781280518, + "learning_rate": 1.6233616576690876e-05, + "loss": 0.4449, + "step": 11274 + }, + { + "epoch": 30.722070844686648, + "grad_norm": 7.338347434997559, + "learning_rate": 1.6232926500160514e-05, + "loss": 0.5445, + "step": 11275 + }, + { + "epoch": 30.724795640326974, + "grad_norm": 7.05747652053833, + "learning_rate": 1.6232236375088322e-05, + "loss": 0.5292, + "step": 11276 + }, + { + "epoch": 30.727520435967303, + "grad_norm": 10.454824447631836, + "learning_rate": 1.6231546201479676e-05, + "loss": 0.5487, + "step": 11277 + }, + { + "epoch": 30.73024523160763, + "grad_norm": 8.207958221435547, + "learning_rate": 1.623085597933995e-05, + "loss": 0.4236, + "step": 11278 + }, + { + "epoch": 30.732970027247955, + "grad_norm": 7.944293022155762, + "learning_rate": 1.6230165708674513e-05, + "loss": 0.4565, + "step": 11279 + }, + { + "epoch": 30.735694822888284, + "grad_norm": 7.1323137283325195, + "learning_rate": 1.622947538948875e-05, + "loss": 0.4794, + "step": 11280 + }, + { + "epoch": 30.73841961852861, + "grad_norm": 7.217621803283691, + "learning_rate": 1.622878502178803e-05, + "loss": 0.5521, + "step": 11281 + }, + { + "epoch": 30.741144414168936, + "grad_norm": 6.7949652671813965, + "learning_rate": 1.6228094605577734e-05, + "loss": 0.387, + "step": 11282 + }, + { + "epoch": 30.743869209809265, + "grad_norm": 7.413728713989258, + "learning_rate": 1.6227404140863233e-05, + "loss": 0.3795, + "step": 11283 + }, + { + "epoch": 30.74659400544959, + "grad_norm": 5.315408229827881, + "learning_rate": 1.6226713627649914e-05, + "loss": 0.2813, + "step": 11284 + }, + { + "epoch": 30.749318801089917, + "grad_norm": 7.66859245300293, + "learning_rate": 1.622602306594315e-05, + "loss": 0.428, + "step": 11285 + }, + { + "epoch": 30.752043596730246, + "grad_norm": 7.728278636932373, + "learning_rate": 1.622533245574832e-05, + "loss": 0.3884, + "step": 11286 + }, + { + "epoch": 30.754768392370572, + "grad_norm": 5.734921455383301, + "learning_rate": 1.62246417970708e-05, + "loss": 0.3226, + "step": 11287 + }, + { + "epoch": 30.757493188010898, + "grad_norm": 7.37510871887207, + "learning_rate": 1.6223951089915968e-05, + "loss": 0.4894, + "step": 11288 + }, + { + "epoch": 30.760217983651227, + "grad_norm": 6.9354143142700195, + "learning_rate": 1.6223260334289208e-05, + "loss": 0.5839, + "step": 11289 + }, + { + "epoch": 30.762942779291553, + "grad_norm": 7.1436944007873535, + "learning_rate": 1.6222569530195894e-05, + "loss": 0.5088, + "step": 11290 + }, + { + "epoch": 30.76566757493188, + "grad_norm": 6.357337951660156, + "learning_rate": 1.622187867764141e-05, + "loss": 0.4811, + "step": 11291 + }, + { + "epoch": 30.768392370572208, + "grad_norm": 7.193835258483887, + "learning_rate": 1.6221187776631134e-05, + "loss": 0.3481, + "step": 11292 + }, + { + "epoch": 30.771117166212534, + "grad_norm": 6.292130470275879, + "learning_rate": 1.622049682717045e-05, + "loss": 0.4471, + "step": 11293 + }, + { + "epoch": 30.77384196185286, + "grad_norm": 7.480403900146484, + "learning_rate": 1.6219805829264738e-05, + "loss": 0.3723, + "step": 11294 + }, + { + "epoch": 30.77656675749319, + "grad_norm": 6.53055477142334, + "learning_rate": 1.621911478291937e-05, + "loss": 0.5594, + "step": 11295 + }, + { + "epoch": 30.779291553133515, + "grad_norm": 6.633364677429199, + "learning_rate": 1.6218423688139748e-05, + "loss": 0.3906, + "step": 11296 + }, + { + "epoch": 30.78201634877384, + "grad_norm": 6.3846917152404785, + "learning_rate": 1.6217732544931237e-05, + "loss": 0.3395, + "step": 11297 + }, + { + "epoch": 30.78474114441417, + "grad_norm": 5.787449359893799, + "learning_rate": 1.6217041353299224e-05, + "loss": 0.4193, + "step": 11298 + }, + { + "epoch": 30.787465940054496, + "grad_norm": 6.977640151977539, + "learning_rate": 1.6216350113249094e-05, + "loss": 0.4863, + "step": 11299 + }, + { + "epoch": 30.79019073569482, + "grad_norm": 6.857836723327637, + "learning_rate": 1.6215658824786226e-05, + "loss": 0.4244, + "step": 11300 + }, + { + "epoch": 30.79291553133515, + "grad_norm": 6.683234691619873, + "learning_rate": 1.6214967487916012e-05, + "loss": 0.3848, + "step": 11301 + }, + { + "epoch": 30.795640326975477, + "grad_norm": 6.261143684387207, + "learning_rate": 1.6214276102643828e-05, + "loss": 0.331, + "step": 11302 + }, + { + "epoch": 30.798365122615802, + "grad_norm": 8.550078392028809, + "learning_rate": 1.6213584668975064e-05, + "loss": 0.3848, + "step": 11303 + }, + { + "epoch": 30.80108991825613, + "grad_norm": 6.435115814208984, + "learning_rate": 1.6212893186915105e-05, + "loss": 0.3448, + "step": 11304 + }, + { + "epoch": 30.803814713896458, + "grad_norm": 7.466169834136963, + "learning_rate": 1.6212201656469328e-05, + "loss": 0.5968, + "step": 11305 + }, + { + "epoch": 30.806539509536783, + "grad_norm": 7.373120307922363, + "learning_rate": 1.621151007764313e-05, + "loss": 0.3631, + "step": 11306 + }, + { + "epoch": 30.809264305177113, + "grad_norm": 6.224044322967529, + "learning_rate": 1.621081845044189e-05, + "loss": 0.3088, + "step": 11307 + }, + { + "epoch": 30.81198910081744, + "grad_norm": 10.48534107208252, + "learning_rate": 1.6210126774870992e-05, + "loss": 0.44, + "step": 11308 + }, + { + "epoch": 30.814713896457764, + "grad_norm": 6.622835159301758, + "learning_rate": 1.620943505093583e-05, + "loss": 0.4076, + "step": 11309 + }, + { + "epoch": 30.817438692098094, + "grad_norm": 6.534196376800537, + "learning_rate": 1.620874327864179e-05, + "loss": 0.3479, + "step": 11310 + }, + { + "epoch": 30.82016348773842, + "grad_norm": 7.377260208129883, + "learning_rate": 1.620805145799425e-05, + "loss": 0.4688, + "step": 11311 + }, + { + "epoch": 30.822888283378745, + "grad_norm": 9.587128639221191, + "learning_rate": 1.6207359588998608e-05, + "loss": 0.4082, + "step": 11312 + }, + { + "epoch": 30.825613079019075, + "grad_norm": 6.322308540344238, + "learning_rate": 1.620666767166025e-05, + "loss": 0.4466, + "step": 11313 + }, + { + "epoch": 30.8283378746594, + "grad_norm": 10.123698234558105, + "learning_rate": 1.6205975705984565e-05, + "loss": 0.3615, + "step": 11314 + }, + { + "epoch": 30.831062670299726, + "grad_norm": 7.531373977661133, + "learning_rate": 1.620528369197694e-05, + "loss": 0.3455, + "step": 11315 + }, + { + "epoch": 30.833787465940055, + "grad_norm": 6.879456996917725, + "learning_rate": 1.6204591629642767e-05, + "loss": 0.3533, + "step": 11316 + }, + { + "epoch": 30.83651226158038, + "grad_norm": 8.004433631896973, + "learning_rate": 1.620389951898743e-05, + "loss": 0.3981, + "step": 11317 + }, + { + "epoch": 30.839237057220707, + "grad_norm": 7.241403102874756, + "learning_rate": 1.6203207360016328e-05, + "loss": 0.4425, + "step": 11318 + }, + { + "epoch": 30.841961852861036, + "grad_norm": 7.608405113220215, + "learning_rate": 1.6202515152734844e-05, + "loss": 0.448, + "step": 11319 + }, + { + "epoch": 30.844686648501362, + "grad_norm": 6.407038688659668, + "learning_rate": 1.620182289714837e-05, + "loss": 0.38, + "step": 11320 + }, + { + "epoch": 30.847411444141688, + "grad_norm": 6.163354396820068, + "learning_rate": 1.62011305932623e-05, + "loss": 0.4984, + "step": 11321 + }, + { + "epoch": 30.850136239782017, + "grad_norm": 7.411386966705322, + "learning_rate": 1.6200438241082032e-05, + "loss": 0.4138, + "step": 11322 + }, + { + "epoch": 30.852861035422343, + "grad_norm": 7.78454065322876, + "learning_rate": 1.6199745840612942e-05, + "loss": 0.3887, + "step": 11323 + }, + { + "epoch": 30.85558583106267, + "grad_norm": 6.8289794921875, + "learning_rate": 1.619905339186043e-05, + "loss": 0.5495, + "step": 11324 + }, + { + "epoch": 30.858310626703, + "grad_norm": 7.852591037750244, + "learning_rate": 1.6198360894829893e-05, + "loss": 0.543, + "step": 11325 + }, + { + "epoch": 30.861035422343324, + "grad_norm": 6.447912693023682, + "learning_rate": 1.619766834952672e-05, + "loss": 0.5576, + "step": 11326 + }, + { + "epoch": 30.86376021798365, + "grad_norm": 12.491286277770996, + "learning_rate": 1.6196975755956308e-05, + "loss": 0.3752, + "step": 11327 + }, + { + "epoch": 30.86648501362398, + "grad_norm": 7.9670610427856445, + "learning_rate": 1.6196283114124045e-05, + "loss": 0.5906, + "step": 11328 + }, + { + "epoch": 30.869209809264305, + "grad_norm": 6.724163055419922, + "learning_rate": 1.619559042403533e-05, + "loss": 0.412, + "step": 11329 + }, + { + "epoch": 30.87193460490463, + "grad_norm": 7.976020336151123, + "learning_rate": 1.6194897685695558e-05, + "loss": 0.4774, + "step": 11330 + }, + { + "epoch": 30.87465940054496, + "grad_norm": 6.1216607093811035, + "learning_rate": 1.6194204899110118e-05, + "loss": 0.435, + "step": 11331 + }, + { + "epoch": 30.877384196185286, + "grad_norm": 11.007805824279785, + "learning_rate": 1.619351206428441e-05, + "loss": 0.418, + "step": 11332 + }, + { + "epoch": 30.88010899182561, + "grad_norm": 11.148780822753906, + "learning_rate": 1.6192819181223835e-05, + "loss": 0.3734, + "step": 11333 + }, + { + "epoch": 30.88283378746594, + "grad_norm": 6.831493377685547, + "learning_rate": 1.6192126249933776e-05, + "loss": 0.8787, + "step": 11334 + }, + { + "epoch": 30.885558583106267, + "grad_norm": 7.386627197265625, + "learning_rate": 1.619143327041964e-05, + "loss": 0.5354, + "step": 11335 + }, + { + "epoch": 30.888283378746593, + "grad_norm": 14.94681167602539, + "learning_rate": 1.619074024268682e-05, + "loss": 0.4447, + "step": 11336 + }, + { + "epoch": 30.891008174386922, + "grad_norm": 9.879965782165527, + "learning_rate": 1.619004716674072e-05, + "loss": 0.5003, + "step": 11337 + }, + { + "epoch": 30.893732970027248, + "grad_norm": 7.779361248016357, + "learning_rate": 1.6189354042586728e-05, + "loss": 0.4738, + "step": 11338 + }, + { + "epoch": 30.896457765667574, + "grad_norm": 6.914754390716553, + "learning_rate": 1.6188660870230246e-05, + "loss": 0.3867, + "step": 11339 + }, + { + "epoch": 30.899182561307903, + "grad_norm": 6.506638050079346, + "learning_rate": 1.6187967649676674e-05, + "loss": 0.4524, + "step": 11340 + }, + { + "epoch": 30.90190735694823, + "grad_norm": 13.945359230041504, + "learning_rate": 1.6187274380931403e-05, + "loss": 0.423, + "step": 11341 + }, + { + "epoch": 30.904632152588555, + "grad_norm": 8.164636611938477, + "learning_rate": 1.6186581063999844e-05, + "loss": 0.4088, + "step": 11342 + }, + { + "epoch": 30.907356948228884, + "grad_norm": 8.097151756286621, + "learning_rate": 1.6185887698887388e-05, + "loss": 0.5584, + "step": 11343 + }, + { + "epoch": 30.91008174386921, + "grad_norm": 6.8635149002075195, + "learning_rate": 1.618519428559944e-05, + "loss": 0.3417, + "step": 11344 + }, + { + "epoch": 30.912806539509535, + "grad_norm": 7.3902907371521, + "learning_rate": 1.6184500824141395e-05, + "loss": 0.5122, + "step": 11345 + }, + { + "epoch": 30.915531335149865, + "grad_norm": 7.98119592666626, + "learning_rate": 1.618380731451866e-05, + "loss": 0.495, + "step": 11346 + }, + { + "epoch": 30.91825613079019, + "grad_norm": 8.91533374786377, + "learning_rate": 1.618311375673663e-05, + "loss": 0.2698, + "step": 11347 + }, + { + "epoch": 30.920980926430516, + "grad_norm": 6.444336891174316, + "learning_rate": 1.6182420150800712e-05, + "loss": 0.4418, + "step": 11348 + }, + { + "epoch": 30.923705722070846, + "grad_norm": 6.765807628631592, + "learning_rate": 1.6181726496716304e-05, + "loss": 0.5147, + "step": 11349 + }, + { + "epoch": 30.92643051771117, + "grad_norm": 8.13369369506836, + "learning_rate": 1.6181032794488807e-05, + "loss": 0.43, + "step": 11350 + }, + { + "epoch": 30.929155313351497, + "grad_norm": 7.940556526184082, + "learning_rate": 1.6180339044123625e-05, + "loss": 0.4167, + "step": 11351 + }, + { + "epoch": 30.931880108991827, + "grad_norm": 8.560213088989258, + "learning_rate": 1.6179645245626165e-05, + "loss": 0.3338, + "step": 11352 + }, + { + "epoch": 30.934604904632153, + "grad_norm": 8.294337272644043, + "learning_rate": 1.617895139900182e-05, + "loss": 0.4414, + "step": 11353 + }, + { + "epoch": 30.93732970027248, + "grad_norm": 6.885270595550537, + "learning_rate": 1.6178257504256006e-05, + "loss": 0.4163, + "step": 11354 + }, + { + "epoch": 30.940054495912808, + "grad_norm": 9.962544441223145, + "learning_rate": 1.6177563561394123e-05, + "loss": 0.5212, + "step": 11355 + }, + { + "epoch": 30.942779291553133, + "grad_norm": 7.879058837890625, + "learning_rate": 1.617686957042157e-05, + "loss": 0.4608, + "step": 11356 + }, + { + "epoch": 30.94550408719346, + "grad_norm": 9.151025772094727, + "learning_rate": 1.617617553134376e-05, + "loss": 0.5252, + "step": 11357 + }, + { + "epoch": 30.94822888283379, + "grad_norm": 7.61784553527832, + "learning_rate": 1.617548144416609e-05, + "loss": 0.3527, + "step": 11358 + }, + { + "epoch": 30.950953678474114, + "grad_norm": 7.675395965576172, + "learning_rate": 1.617478730889397e-05, + "loss": 0.4101, + "step": 11359 + }, + { + "epoch": 30.95367847411444, + "grad_norm": 7.265422344207764, + "learning_rate": 1.6174093125532803e-05, + "loss": 0.5717, + "step": 11360 + }, + { + "epoch": 30.95640326975477, + "grad_norm": 8.320547103881836, + "learning_rate": 1.6173398894088e-05, + "loss": 0.5793, + "step": 11361 + }, + { + "epoch": 30.959128065395095, + "grad_norm": 7.721741676330566, + "learning_rate": 1.617270461456496e-05, + "loss": 0.3912, + "step": 11362 + }, + { + "epoch": 30.96185286103542, + "grad_norm": 7.551270961761475, + "learning_rate": 1.6172010286969105e-05, + "loss": 0.3861, + "step": 11363 + }, + { + "epoch": 30.96457765667575, + "grad_norm": 7.487505912780762, + "learning_rate": 1.6171315911305824e-05, + "loss": 0.5294, + "step": 11364 + }, + { + "epoch": 30.967302452316076, + "grad_norm": 9.483017921447754, + "learning_rate": 1.6170621487580538e-05, + "loss": 0.3951, + "step": 11365 + }, + { + "epoch": 30.970027247956402, + "grad_norm": 8.659347534179688, + "learning_rate": 1.616992701579865e-05, + "loss": 0.423, + "step": 11366 + }, + { + "epoch": 30.97275204359673, + "grad_norm": 7.702268600463867, + "learning_rate": 1.616923249596557e-05, + "loss": 0.5224, + "step": 11367 + }, + { + "epoch": 30.975476839237057, + "grad_norm": 6.881136417388916, + "learning_rate": 1.6168537928086703e-05, + "loss": 0.4398, + "step": 11368 + }, + { + "epoch": 30.978201634877383, + "grad_norm": 7.698774337768555, + "learning_rate": 1.616784331216746e-05, + "loss": 0.4814, + "step": 11369 + }, + { + "epoch": 30.980926430517712, + "grad_norm": 7.118900775909424, + "learning_rate": 1.6167148648213255e-05, + "loss": 0.5659, + "step": 11370 + }, + { + "epoch": 30.983651226158038, + "grad_norm": 6.75089693069458, + "learning_rate": 1.616645393622949e-05, + "loss": 0.4426, + "step": 11371 + }, + { + "epoch": 30.986376021798364, + "grad_norm": 8.22135066986084, + "learning_rate": 1.6165759176221588e-05, + "loss": 0.364, + "step": 11372 + }, + { + "epoch": 30.989100817438693, + "grad_norm": 6.734350204467773, + "learning_rate": 1.6165064368194946e-05, + "loss": 0.4398, + "step": 11373 + }, + { + "epoch": 30.99182561307902, + "grad_norm": 6.77470588684082, + "learning_rate": 1.6164369512154984e-05, + "loss": 0.428, + "step": 11374 + }, + { + "epoch": 30.994550408719345, + "grad_norm": 7.893370628356934, + "learning_rate": 1.616367460810711e-05, + "loss": 0.5637, + "step": 11375 + }, + { + "epoch": 30.997275204359674, + "grad_norm": 6.426718711853027, + "learning_rate": 1.6162979656056735e-05, + "loss": 0.428, + "step": 11376 + }, + { + "epoch": 31.0, + "grad_norm": 8.785823822021484, + "learning_rate": 1.6162284656009276e-05, + "loss": 0.3823, + "step": 11377 + }, + { + "epoch": 31.002724795640326, + "grad_norm": 7.742459297180176, + "learning_rate": 1.6161589607970137e-05, + "loss": 0.4664, + "step": 11378 + }, + { + "epoch": 31.005449591280655, + "grad_norm": 6.6974992752075195, + "learning_rate": 1.616089451194474e-05, + "loss": 0.3357, + "step": 11379 + }, + { + "epoch": 31.00817438692098, + "grad_norm": 8.149337768554688, + "learning_rate": 1.6160199367938494e-05, + "loss": 0.3966, + "step": 11380 + }, + { + "epoch": 31.010899182561307, + "grad_norm": 6.426740646362305, + "learning_rate": 1.6159504175956815e-05, + "loss": 0.4183, + "step": 11381 + }, + { + "epoch": 31.013623978201636, + "grad_norm": 18.186363220214844, + "learning_rate": 1.6158808936005116e-05, + "loss": 0.4672, + "step": 11382 + }, + { + "epoch": 31.016348773841962, + "grad_norm": 17.358253479003906, + "learning_rate": 1.615811364808881e-05, + "loss": 0.3635, + "step": 11383 + }, + { + "epoch": 31.019073569482288, + "grad_norm": 7.258265972137451, + "learning_rate": 1.6157418312213313e-05, + "loss": 0.4673, + "step": 11384 + }, + { + "epoch": 31.021798365122617, + "grad_norm": 5.632544040679932, + "learning_rate": 1.6156722928384042e-05, + "loss": 0.4389, + "step": 11385 + }, + { + "epoch": 31.024523160762943, + "grad_norm": 6.65710973739624, + "learning_rate": 1.6156027496606408e-05, + "loss": 0.3953, + "step": 11386 + }, + { + "epoch": 31.02724795640327, + "grad_norm": 8.200004577636719, + "learning_rate": 1.615533201688583e-05, + "loss": 0.2825, + "step": 11387 + }, + { + "epoch": 31.029972752043598, + "grad_norm": 6.341181755065918, + "learning_rate": 1.6154636489227726e-05, + "loss": 0.4567, + "step": 11388 + }, + { + "epoch": 31.032697547683924, + "grad_norm": 8.055546760559082, + "learning_rate": 1.615394091363751e-05, + "loss": 0.3899, + "step": 11389 + }, + { + "epoch": 31.03542234332425, + "grad_norm": 6.492162704467773, + "learning_rate": 1.6153245290120602e-05, + "loss": 0.3247, + "step": 11390 + }, + { + "epoch": 31.03814713896458, + "grad_norm": 5.917665958404541, + "learning_rate": 1.6152549618682418e-05, + "loss": 0.3828, + "step": 11391 + }, + { + "epoch": 31.040871934604905, + "grad_norm": 6.391448497772217, + "learning_rate": 1.6151853899328377e-05, + "loss": 0.4669, + "step": 11392 + }, + { + "epoch": 31.04359673024523, + "grad_norm": 7.711374282836914, + "learning_rate": 1.6151158132063892e-05, + "loss": 0.3836, + "step": 11393 + }, + { + "epoch": 31.04632152588556, + "grad_norm": 8.410181045532227, + "learning_rate": 1.615046231689439e-05, + "loss": 0.5526, + "step": 11394 + }, + { + "epoch": 31.049046321525886, + "grad_norm": 9.054497718811035, + "learning_rate": 1.614976645382528e-05, + "loss": 0.4236, + "step": 11395 + }, + { + "epoch": 31.05177111716621, + "grad_norm": 7.943727493286133, + "learning_rate": 1.614907054286199e-05, + "loss": 0.4403, + "step": 11396 + }, + { + "epoch": 31.05449591280654, + "grad_norm": 7.074095726013184, + "learning_rate": 1.6148374584009934e-05, + "loss": 0.2817, + "step": 11397 + }, + { + "epoch": 31.057220708446867, + "grad_norm": 11.083065032958984, + "learning_rate": 1.6147678577274537e-05, + "loss": 0.4228, + "step": 11398 + }, + { + "epoch": 31.059945504087192, + "grad_norm": 6.933168411254883, + "learning_rate": 1.6146982522661216e-05, + "loss": 0.3752, + "step": 11399 + }, + { + "epoch": 31.06267029972752, + "grad_norm": 6.469690322875977, + "learning_rate": 1.6146286420175393e-05, + "loss": 0.3382, + "step": 11400 + }, + { + "epoch": 31.065395095367847, + "grad_norm": 12.152203559875488, + "learning_rate": 1.6145590269822487e-05, + "loss": 0.3333, + "step": 11401 + }, + { + "epoch": 31.068119891008173, + "grad_norm": 6.3950724601745605, + "learning_rate": 1.6144894071607927e-05, + "loss": 0.4603, + "step": 11402 + }, + { + "epoch": 31.070844686648503, + "grad_norm": 6.445328712463379, + "learning_rate": 1.6144197825537127e-05, + "loss": 0.4309, + "step": 11403 + }, + { + "epoch": 31.07356948228883, + "grad_norm": 6.3824334144592285, + "learning_rate": 1.614350153161551e-05, + "loss": 0.4089, + "step": 11404 + }, + { + "epoch": 31.076294277929154, + "grad_norm": 6.513887882232666, + "learning_rate": 1.6142805189848504e-05, + "loss": 0.3729, + "step": 11405 + }, + { + "epoch": 31.079019073569484, + "grad_norm": 9.495572090148926, + "learning_rate": 1.6142108800241527e-05, + "loss": 0.4035, + "step": 11406 + }, + { + "epoch": 31.08174386920981, + "grad_norm": 5.747984409332275, + "learning_rate": 1.6141412362800007e-05, + "loss": 0.2485, + "step": 11407 + }, + { + "epoch": 31.084468664850135, + "grad_norm": 6.530543804168701, + "learning_rate": 1.6140715877529363e-05, + "loss": 0.287, + "step": 11408 + }, + { + "epoch": 31.087193460490465, + "grad_norm": 6.833845615386963, + "learning_rate": 1.614001934443502e-05, + "loss": 0.3145, + "step": 11409 + }, + { + "epoch": 31.08991825613079, + "grad_norm": 6.342391014099121, + "learning_rate": 1.613932276352241e-05, + "loss": 0.4034, + "step": 11410 + }, + { + "epoch": 31.092643051771116, + "grad_norm": 6.921346664428711, + "learning_rate": 1.6138626134796945e-05, + "loss": 0.3413, + "step": 11411 + }, + { + "epoch": 31.095367847411445, + "grad_norm": 5.6658525466918945, + "learning_rate": 1.613792945826406e-05, + "loss": 0.4648, + "step": 11412 + }, + { + "epoch": 31.09809264305177, + "grad_norm": 6.347414493560791, + "learning_rate": 1.6137232733929176e-05, + "loss": 0.3158, + "step": 11413 + }, + { + "epoch": 31.100817438692097, + "grad_norm": 6.033417701721191, + "learning_rate": 1.6136535961797722e-05, + "loss": 0.6105, + "step": 11414 + }, + { + "epoch": 31.103542234332426, + "grad_norm": 8.13783073425293, + "learning_rate": 1.6135839141875127e-05, + "loss": 0.3212, + "step": 11415 + }, + { + "epoch": 31.106267029972752, + "grad_norm": 6.720310688018799, + "learning_rate": 1.613514227416681e-05, + "loss": 0.2846, + "step": 11416 + }, + { + "epoch": 31.108991825613078, + "grad_norm": 6.779971122741699, + "learning_rate": 1.6134445358678205e-05, + "loss": 0.287, + "step": 11417 + }, + { + "epoch": 31.111716621253407, + "grad_norm": 7.640523433685303, + "learning_rate": 1.613374839541474e-05, + "loss": 0.3868, + "step": 11418 + }, + { + "epoch": 31.114441416893733, + "grad_norm": 8.470203399658203, + "learning_rate": 1.6133051384381833e-05, + "loss": 0.3141, + "step": 11419 + }, + { + "epoch": 31.11716621253406, + "grad_norm": 8.201193809509277, + "learning_rate": 1.613235432558492e-05, + "loss": 0.3012, + "step": 11420 + }, + { + "epoch": 31.11989100817439, + "grad_norm": 8.012935638427734, + "learning_rate": 1.6131657219029428e-05, + "loss": 0.5099, + "step": 11421 + }, + { + "epoch": 31.122615803814714, + "grad_norm": 9.044227600097656, + "learning_rate": 1.613096006472079e-05, + "loss": 0.3509, + "step": 11422 + }, + { + "epoch": 31.12534059945504, + "grad_norm": 7.542146682739258, + "learning_rate": 1.6130262862664432e-05, + "loss": 0.3584, + "step": 11423 + }, + { + "epoch": 31.12806539509537, + "grad_norm": 6.187380313873291, + "learning_rate": 1.6129565612865786e-05, + "loss": 0.511, + "step": 11424 + }, + { + "epoch": 31.130790190735695, + "grad_norm": 7.63981294631958, + "learning_rate": 1.6128868315330278e-05, + "loss": 0.4031, + "step": 11425 + }, + { + "epoch": 31.13351498637602, + "grad_norm": 6.212061405181885, + "learning_rate": 1.612817097006334e-05, + "loss": 0.4166, + "step": 11426 + }, + { + "epoch": 31.13623978201635, + "grad_norm": 6.52099609375, + "learning_rate": 1.6127473577070408e-05, + "loss": 0.4107, + "step": 11427 + }, + { + "epoch": 31.138964577656676, + "grad_norm": 7.275450706481934, + "learning_rate": 1.6126776136356906e-05, + "loss": 0.365, + "step": 11428 + }, + { + "epoch": 31.141689373297, + "grad_norm": 7.747114181518555, + "learning_rate": 1.6126078647928266e-05, + "loss": 0.3631, + "step": 11429 + }, + { + "epoch": 31.14441416893733, + "grad_norm": 6.333340644836426, + "learning_rate": 1.6125381111789926e-05, + "loss": 0.3771, + "step": 11430 + }, + { + "epoch": 31.147138964577657, + "grad_norm": 6.653792381286621, + "learning_rate": 1.6124683527947317e-05, + "loss": 0.3546, + "step": 11431 + }, + { + "epoch": 31.149863760217983, + "grad_norm": 7.549876689910889, + "learning_rate": 1.6123985896405863e-05, + "loss": 0.3541, + "step": 11432 + }, + { + "epoch": 31.152588555858312, + "grad_norm": 8.709712982177734, + "learning_rate": 1.612328821717101e-05, + "loss": 0.4449, + "step": 11433 + }, + { + "epoch": 31.155313351498638, + "grad_norm": 7.690953254699707, + "learning_rate": 1.6122590490248185e-05, + "loss": 0.5591, + "step": 11434 + }, + { + "epoch": 31.158038147138964, + "grad_norm": 5.91731595993042, + "learning_rate": 1.612189271564282e-05, + "loss": 0.3455, + "step": 11435 + }, + { + "epoch": 31.160762942779293, + "grad_norm": 6.265995502471924, + "learning_rate": 1.612119489336035e-05, + "loss": 0.4231, + "step": 11436 + }, + { + "epoch": 31.16348773841962, + "grad_norm": 6.31031608581543, + "learning_rate": 1.6120497023406215e-05, + "loss": 0.6752, + "step": 11437 + }, + { + "epoch": 31.166212534059945, + "grad_norm": 6.493164539337158, + "learning_rate": 1.6119799105785845e-05, + "loss": 0.2769, + "step": 11438 + }, + { + "epoch": 31.168937329700274, + "grad_norm": 5.690825939178467, + "learning_rate": 1.6119101140504676e-05, + "loss": 0.2941, + "step": 11439 + }, + { + "epoch": 31.1716621253406, + "grad_norm": 9.791960716247559, + "learning_rate": 1.6118403127568142e-05, + "loss": 0.4533, + "step": 11440 + }, + { + "epoch": 31.174386920980925, + "grad_norm": 5.588350296020508, + "learning_rate": 1.6117705066981685e-05, + "loss": 0.4198, + "step": 11441 + }, + { + "epoch": 31.177111716621255, + "grad_norm": 9.831247329711914, + "learning_rate": 1.611700695875074e-05, + "loss": 0.3397, + "step": 11442 + }, + { + "epoch": 31.17983651226158, + "grad_norm": 8.07266902923584, + "learning_rate": 1.6116308802880737e-05, + "loss": 0.4969, + "step": 11443 + }, + { + "epoch": 31.182561307901906, + "grad_norm": 9.771881103515625, + "learning_rate": 1.6115610599377118e-05, + "loss": 0.5136, + "step": 11444 + }, + { + "epoch": 31.185286103542236, + "grad_norm": 6.985413074493408, + "learning_rate": 1.6114912348245324e-05, + "loss": 0.4005, + "step": 11445 + }, + { + "epoch": 31.18801089918256, + "grad_norm": 9.464669227600098, + "learning_rate": 1.6114214049490787e-05, + "loss": 0.4031, + "step": 11446 + }, + { + "epoch": 31.190735694822887, + "grad_norm": 7.2476487159729, + "learning_rate": 1.6113515703118948e-05, + "loss": 0.3992, + "step": 11447 + }, + { + "epoch": 31.193460490463217, + "grad_norm": 8.128005981445312, + "learning_rate": 1.6112817309135244e-05, + "loss": 0.4161, + "step": 11448 + }, + { + "epoch": 31.196185286103542, + "grad_norm": 5.896011829376221, + "learning_rate": 1.6112118867545118e-05, + "loss": 0.5424, + "step": 11449 + }, + { + "epoch": 31.19891008174387, + "grad_norm": 6.663732051849365, + "learning_rate": 1.6111420378354003e-05, + "loss": 0.3523, + "step": 11450 + }, + { + "epoch": 31.201634877384198, + "grad_norm": 7.829227447509766, + "learning_rate": 1.611072184156735e-05, + "loss": 0.5641, + "step": 11451 + }, + { + "epoch": 31.204359673024523, + "grad_norm": 6.647010326385498, + "learning_rate": 1.6110023257190587e-05, + "loss": 0.5236, + "step": 11452 + }, + { + "epoch": 31.20708446866485, + "grad_norm": 7.284354209899902, + "learning_rate": 1.6109324625229158e-05, + "loss": 0.4636, + "step": 11453 + }, + { + "epoch": 31.20980926430518, + "grad_norm": 6.334175109863281, + "learning_rate": 1.610862594568851e-05, + "loss": 0.3138, + "step": 11454 + }, + { + "epoch": 31.212534059945504, + "grad_norm": 7.065399169921875, + "learning_rate": 1.6107927218574076e-05, + "loss": 0.3054, + "step": 11455 + }, + { + "epoch": 31.21525885558583, + "grad_norm": 6.003612995147705, + "learning_rate": 1.6107228443891303e-05, + "loss": 0.3783, + "step": 11456 + }, + { + "epoch": 31.21798365122616, + "grad_norm": 5.7851667404174805, + "learning_rate": 1.610652962164563e-05, + "loss": 0.3906, + "step": 11457 + }, + { + "epoch": 31.220708446866485, + "grad_norm": 7.043871879577637, + "learning_rate": 1.6105830751842503e-05, + "loss": 0.3427, + "step": 11458 + }, + { + "epoch": 31.22343324250681, + "grad_norm": 5.8861823081970215, + "learning_rate": 1.6105131834487364e-05, + "loss": 0.3306, + "step": 11459 + }, + { + "epoch": 31.22615803814714, + "grad_norm": 6.036689758300781, + "learning_rate": 1.6104432869585652e-05, + "loss": 0.455, + "step": 11460 + }, + { + "epoch": 31.228882833787466, + "grad_norm": 6.158356666564941, + "learning_rate": 1.610373385714281e-05, + "loss": 0.427, + "step": 11461 + }, + { + "epoch": 31.231607629427792, + "grad_norm": 6.051694869995117, + "learning_rate": 1.6103034797164294e-05, + "loss": 0.3, + "step": 11462 + }, + { + "epoch": 31.23433242506812, + "grad_norm": 9.04263973236084, + "learning_rate": 1.6102335689655533e-05, + "loss": 0.4077, + "step": 11463 + }, + { + "epoch": 31.237057220708447, + "grad_norm": 7.521633625030518, + "learning_rate": 1.610163653462198e-05, + "loss": 0.4977, + "step": 11464 + }, + { + "epoch": 31.239782016348773, + "grad_norm": 8.390018463134766, + "learning_rate": 1.6100937332069074e-05, + "loss": 0.3568, + "step": 11465 + }, + { + "epoch": 31.242506811989102, + "grad_norm": 6.256731033325195, + "learning_rate": 1.610023808200227e-05, + "loss": 0.5061, + "step": 11466 + }, + { + "epoch": 31.245231607629428, + "grad_norm": 6.731732368469238, + "learning_rate": 1.6099538784427005e-05, + "loss": 0.3767, + "step": 11467 + }, + { + "epoch": 31.247956403269754, + "grad_norm": 6.79564094543457, + "learning_rate": 1.609883943934873e-05, + "loss": 0.4227, + "step": 11468 + }, + { + "epoch": 31.250681198910083, + "grad_norm": 6.176658630371094, + "learning_rate": 1.609814004677289e-05, + "loss": 0.4348, + "step": 11469 + }, + { + "epoch": 31.25340599455041, + "grad_norm": 5.946808338165283, + "learning_rate": 1.6097440606704928e-05, + "loss": 0.4133, + "step": 11470 + }, + { + "epoch": 31.256130790190735, + "grad_norm": 6.666254043579102, + "learning_rate": 1.60967411191503e-05, + "loss": 0.433, + "step": 11471 + }, + { + "epoch": 31.258855585831064, + "grad_norm": 8.007935523986816, + "learning_rate": 1.6096041584114444e-05, + "loss": 0.4609, + "step": 11472 + }, + { + "epoch": 31.26158038147139, + "grad_norm": 7.5098724365234375, + "learning_rate": 1.6095342001602813e-05, + "loss": 0.4758, + "step": 11473 + }, + { + "epoch": 31.264305177111716, + "grad_norm": 6.390965938568115, + "learning_rate": 1.6094642371620857e-05, + "loss": 0.2469, + "step": 11474 + }, + { + "epoch": 31.267029972752045, + "grad_norm": 6.606525897979736, + "learning_rate": 1.6093942694174024e-05, + "loss": 0.3356, + "step": 11475 + }, + { + "epoch": 31.26975476839237, + "grad_norm": 8.822193145751953, + "learning_rate": 1.609324296926776e-05, + "loss": 0.3881, + "step": 11476 + }, + { + "epoch": 31.272479564032697, + "grad_norm": 7.46927547454834, + "learning_rate": 1.609254319690751e-05, + "loss": 0.4776, + "step": 11477 + }, + { + "epoch": 31.275204359673026, + "grad_norm": 6.187511920928955, + "learning_rate": 1.6091843377098734e-05, + "loss": 0.4377, + "step": 11478 + }, + { + "epoch": 31.277929155313352, + "grad_norm": 6.347655773162842, + "learning_rate": 1.609114350984688e-05, + "loss": 0.3725, + "step": 11479 + }, + { + "epoch": 31.280653950953678, + "grad_norm": 6.0924248695373535, + "learning_rate": 1.6090443595157396e-05, + "loss": 0.5453, + "step": 11480 + }, + { + "epoch": 31.283378746594007, + "grad_norm": 8.578104972839355, + "learning_rate": 1.6089743633035732e-05, + "loss": 0.3582, + "step": 11481 + }, + { + "epoch": 31.286103542234333, + "grad_norm": 8.714938163757324, + "learning_rate": 1.6089043623487338e-05, + "loss": 0.4052, + "step": 11482 + }, + { + "epoch": 31.28882833787466, + "grad_norm": 8.156457901000977, + "learning_rate": 1.608834356651767e-05, + "loss": 0.3929, + "step": 11483 + }, + { + "epoch": 31.291553133514988, + "grad_norm": 7.4753618240356445, + "learning_rate": 1.608764346213218e-05, + "loss": 0.4719, + "step": 11484 + }, + { + "epoch": 31.294277929155314, + "grad_norm": 6.959665775299072, + "learning_rate": 1.6086943310336315e-05, + "loss": 0.2707, + "step": 11485 + }, + { + "epoch": 31.29700272479564, + "grad_norm": 6.778475761413574, + "learning_rate": 1.6086243111135537e-05, + "loss": 0.2784, + "step": 11486 + }, + { + "epoch": 31.29972752043597, + "grad_norm": 8.395167350769043, + "learning_rate": 1.608554286453529e-05, + "loss": 0.5805, + "step": 11487 + }, + { + "epoch": 31.302452316076295, + "grad_norm": 6.569278717041016, + "learning_rate": 1.608484257054103e-05, + "loss": 0.5439, + "step": 11488 + }, + { + "epoch": 31.30517711171662, + "grad_norm": 7.05552339553833, + "learning_rate": 1.6084142229158214e-05, + "loss": 0.4718, + "step": 11489 + }, + { + "epoch": 31.30790190735695, + "grad_norm": 6.05991792678833, + "learning_rate": 1.608344184039229e-05, + "loss": 0.4052, + "step": 11490 + }, + { + "epoch": 31.310626702997276, + "grad_norm": 11.234015464782715, + "learning_rate": 1.6082741404248724e-05, + "loss": 0.4645, + "step": 11491 + }, + { + "epoch": 31.3133514986376, + "grad_norm": 6.1989006996154785, + "learning_rate": 1.608204092073296e-05, + "loss": 0.2135, + "step": 11492 + }, + { + "epoch": 31.31607629427793, + "grad_norm": 6.016495227813721, + "learning_rate": 1.608134038985046e-05, + "loss": 0.339, + "step": 11493 + }, + { + "epoch": 31.318801089918257, + "grad_norm": 7.02424955368042, + "learning_rate": 1.608063981160667e-05, + "loss": 0.4274, + "step": 11494 + }, + { + "epoch": 31.321525885558582, + "grad_norm": 6.882099628448486, + "learning_rate": 1.6079939186007058e-05, + "loss": 0.4521, + "step": 11495 + }, + { + "epoch": 31.32425068119891, + "grad_norm": 7.710224628448486, + "learning_rate": 1.6079238513057073e-05, + "loss": 0.3906, + "step": 11496 + }, + { + "epoch": 31.326975476839237, + "grad_norm": 7.994422912597656, + "learning_rate": 1.6078537792762174e-05, + "loss": 0.4096, + "step": 11497 + }, + { + "epoch": 31.329700272479563, + "grad_norm": 11.75682544708252, + "learning_rate": 1.6077837025127817e-05, + "loss": 0.4886, + "step": 11498 + }, + { + "epoch": 31.332425068119893, + "grad_norm": 7.2599077224731445, + "learning_rate": 1.6077136210159466e-05, + "loss": 0.4537, + "step": 11499 + }, + { + "epoch": 31.33514986376022, + "grad_norm": 6.902833461761475, + "learning_rate": 1.607643534786257e-05, + "loss": 0.4366, + "step": 11500 + }, + { + "epoch": 31.337874659400544, + "grad_norm": 6.804143905639648, + "learning_rate": 1.607573443824259e-05, + "loss": 0.4904, + "step": 11501 + }, + { + "epoch": 31.340599455040874, + "grad_norm": 6.350834846496582, + "learning_rate": 1.6075033481304993e-05, + "loss": 0.3763, + "step": 11502 + }, + { + "epoch": 31.3433242506812, + "grad_norm": 7.131535530090332, + "learning_rate": 1.6074332477055224e-05, + "loss": 0.3984, + "step": 11503 + }, + { + "epoch": 31.346049046321525, + "grad_norm": 6.9918389320373535, + "learning_rate": 1.607363142549875e-05, + "loss": 0.3341, + "step": 11504 + }, + { + "epoch": 31.348773841961854, + "grad_norm": 9.504937171936035, + "learning_rate": 1.607293032664103e-05, + "loss": 0.4984, + "step": 11505 + }, + { + "epoch": 31.35149863760218, + "grad_norm": 6.146029949188232, + "learning_rate": 1.6072229180487523e-05, + "loss": 0.4451, + "step": 11506 + }, + { + "epoch": 31.354223433242506, + "grad_norm": 31.787803649902344, + "learning_rate": 1.6071527987043693e-05, + "loss": 0.463, + "step": 11507 + }, + { + "epoch": 31.356948228882835, + "grad_norm": 6.9770121574401855, + "learning_rate": 1.6070826746314997e-05, + "loss": 0.3743, + "step": 11508 + }, + { + "epoch": 31.35967302452316, + "grad_norm": 6.07723331451416, + "learning_rate": 1.60701254583069e-05, + "loss": 0.4515, + "step": 11509 + }, + { + "epoch": 31.362397820163487, + "grad_norm": 6.7611985206604, + "learning_rate": 1.606942412302486e-05, + "loss": 0.4048, + "step": 11510 + }, + { + "epoch": 31.365122615803816, + "grad_norm": 5.638869762420654, + "learning_rate": 1.606872274047434e-05, + "loss": 0.4251, + "step": 11511 + }, + { + "epoch": 31.367847411444142, + "grad_norm": 13.817146301269531, + "learning_rate": 1.6068021310660806e-05, + "loss": 0.4402, + "step": 11512 + }, + { + "epoch": 31.370572207084468, + "grad_norm": 7.954291343688965, + "learning_rate": 1.606731983358971e-05, + "loss": 0.3469, + "step": 11513 + }, + { + "epoch": 31.373297002724797, + "grad_norm": 6.273427486419678, + "learning_rate": 1.6066618309266527e-05, + "loss": 0.3446, + "step": 11514 + }, + { + "epoch": 31.376021798365123, + "grad_norm": 6.062036991119385, + "learning_rate": 1.6065916737696713e-05, + "loss": 0.5062, + "step": 11515 + }, + { + "epoch": 31.37874659400545, + "grad_norm": 6.418720722198486, + "learning_rate": 1.6065215118885737e-05, + "loss": 0.4177, + "step": 11516 + }, + { + "epoch": 31.381471389645778, + "grad_norm": 5.220983028411865, + "learning_rate": 1.6064513452839064e-05, + "loss": 0.296, + "step": 11517 + }, + { + "epoch": 31.384196185286104, + "grad_norm": 13.341872215270996, + "learning_rate": 1.6063811739562153e-05, + "loss": 0.4035, + "step": 11518 + }, + { + "epoch": 31.38692098092643, + "grad_norm": 7.2220964431762695, + "learning_rate": 1.606310997906047e-05, + "loss": 0.5966, + "step": 11519 + }, + { + "epoch": 31.38964577656676, + "grad_norm": 7.388582229614258, + "learning_rate": 1.606240817133948e-05, + "loss": 0.4999, + "step": 11520 + }, + { + "epoch": 31.392370572207085, + "grad_norm": 6.779852867126465, + "learning_rate": 1.6061706316404653e-05, + "loss": 0.4079, + "step": 11521 + }, + { + "epoch": 31.39509536784741, + "grad_norm": 8.740653991699219, + "learning_rate": 1.606100441426145e-05, + "loss": 0.469, + "step": 11522 + }, + { + "epoch": 31.39782016348774, + "grad_norm": 7.6170854568481445, + "learning_rate": 1.6060302464915346e-05, + "loss": 0.3007, + "step": 11523 + }, + { + "epoch": 31.400544959128066, + "grad_norm": 9.081851959228516, + "learning_rate": 1.6059600468371792e-05, + "loss": 0.3765, + "step": 11524 + }, + { + "epoch": 31.40326975476839, + "grad_norm": 7.019375801086426, + "learning_rate": 1.605889842463627e-05, + "loss": 0.3902, + "step": 11525 + }, + { + "epoch": 31.40599455040872, + "grad_norm": 7.206212043762207, + "learning_rate": 1.605819633371424e-05, + "loss": 0.3379, + "step": 11526 + }, + { + "epoch": 31.408719346049047, + "grad_norm": 7.50978946685791, + "learning_rate": 1.6057494195611177e-05, + "loss": 0.3466, + "step": 11527 + }, + { + "epoch": 31.411444141689373, + "grad_norm": 6.506180763244629, + "learning_rate": 1.605679201033254e-05, + "loss": 0.477, + "step": 11528 + }, + { + "epoch": 31.414168937329702, + "grad_norm": 6.759514331817627, + "learning_rate": 1.6056089777883803e-05, + "loss": 0.4097, + "step": 11529 + }, + { + "epoch": 31.416893732970028, + "grad_norm": 5.902039527893066, + "learning_rate": 1.6055387498270435e-05, + "loss": 0.4765, + "step": 11530 + }, + { + "epoch": 31.419618528610354, + "grad_norm": 6.8216729164123535, + "learning_rate": 1.60546851714979e-05, + "loss": 0.4055, + "step": 11531 + }, + { + "epoch": 31.422343324250683, + "grad_norm": 6.676670074462891, + "learning_rate": 1.6053982797571675e-05, + "loss": 0.3519, + "step": 11532 + }, + { + "epoch": 31.42506811989101, + "grad_norm": 8.04570198059082, + "learning_rate": 1.6053280376497224e-05, + "loss": 0.3382, + "step": 11533 + }, + { + "epoch": 31.427792915531334, + "grad_norm": 8.004631042480469, + "learning_rate": 1.6052577908280022e-05, + "loss": 0.3306, + "step": 11534 + }, + { + "epoch": 31.430517711171664, + "grad_norm": 7.521023750305176, + "learning_rate": 1.605187539292554e-05, + "loss": 0.4975, + "step": 11535 + }, + { + "epoch": 31.43324250681199, + "grad_norm": 12.086722373962402, + "learning_rate": 1.6051172830439243e-05, + "loss": 0.3757, + "step": 11536 + }, + { + "epoch": 31.435967302452315, + "grad_norm": 6.613288879394531, + "learning_rate": 1.605047022082661e-05, + "loss": 0.3819, + "step": 11537 + }, + { + "epoch": 31.438692098092645, + "grad_norm": 6.143130779266357, + "learning_rate": 1.6049767564093107e-05, + "loss": 0.3684, + "step": 11538 + }, + { + "epoch": 31.44141689373297, + "grad_norm": 7.905948638916016, + "learning_rate": 1.604906486024421e-05, + "loss": 0.455, + "step": 11539 + }, + { + "epoch": 31.444141689373296, + "grad_norm": 11.131954193115234, + "learning_rate": 1.6048362109285393e-05, + "loss": 0.3509, + "step": 11540 + }, + { + "epoch": 31.446866485013626, + "grad_norm": 7.644253730773926, + "learning_rate": 1.6047659311222124e-05, + "loss": 0.3681, + "step": 11541 + }, + { + "epoch": 31.44959128065395, + "grad_norm": 6.650498867034912, + "learning_rate": 1.604695646605988e-05, + "loss": 0.3637, + "step": 11542 + }, + { + "epoch": 31.452316076294277, + "grad_norm": 6.839574337005615, + "learning_rate": 1.6046253573804134e-05, + "loss": 0.3998, + "step": 11543 + }, + { + "epoch": 31.455040871934607, + "grad_norm": 7.17881965637207, + "learning_rate": 1.6045550634460357e-05, + "loss": 0.3868, + "step": 11544 + }, + { + "epoch": 31.457765667574932, + "grad_norm": 6.631476402282715, + "learning_rate": 1.6044847648034026e-05, + "loss": 0.36, + "step": 11545 + }, + { + "epoch": 31.460490463215258, + "grad_norm": 11.95763874053955, + "learning_rate": 1.604414461453062e-05, + "loss": 0.343, + "step": 11546 + }, + { + "epoch": 31.463215258855588, + "grad_norm": 7.350583076477051, + "learning_rate": 1.604344153395561e-05, + "loss": 0.4047, + "step": 11547 + }, + { + "epoch": 31.465940054495913, + "grad_norm": 8.300507545471191, + "learning_rate": 1.604273840631447e-05, + "loss": 0.4782, + "step": 11548 + }, + { + "epoch": 31.46866485013624, + "grad_norm": 9.675360679626465, + "learning_rate": 1.6042035231612678e-05, + "loss": 0.412, + "step": 11549 + }, + { + "epoch": 31.47138964577657, + "grad_norm": 7.928048610687256, + "learning_rate": 1.604133200985571e-05, + "loss": 0.5042, + "step": 11550 + }, + { + "epoch": 31.474114441416894, + "grad_norm": 7.155492782592773, + "learning_rate": 1.6040628741049044e-05, + "loss": 0.4232, + "step": 11551 + }, + { + "epoch": 31.47683923705722, + "grad_norm": 10.458273887634277, + "learning_rate": 1.6039925425198156e-05, + "loss": 0.4533, + "step": 11552 + }, + { + "epoch": 31.479564032697546, + "grad_norm": 7.096415042877197, + "learning_rate": 1.603922206230852e-05, + "loss": 0.356, + "step": 11553 + }, + { + "epoch": 31.482288828337875, + "grad_norm": 6.542632102966309, + "learning_rate": 1.603851865238562e-05, + "loss": 0.4031, + "step": 11554 + }, + { + "epoch": 31.4850136239782, + "grad_norm": 6.910850524902344, + "learning_rate": 1.6037815195434928e-05, + "loss": 0.376, + "step": 11555 + }, + { + "epoch": 31.48773841961853, + "grad_norm": 6.508656978607178, + "learning_rate": 1.6037111691461932e-05, + "loss": 0.2852, + "step": 11556 + }, + { + "epoch": 31.490463215258856, + "grad_norm": 8.075109481811523, + "learning_rate": 1.6036408140472096e-05, + "loss": 0.3422, + "step": 11557 + }, + { + "epoch": 31.493188010899182, + "grad_norm": 7.133546352386475, + "learning_rate": 1.6035704542470915e-05, + "loss": 0.3654, + "step": 11558 + }, + { + "epoch": 31.495912806539508, + "grad_norm": 7.562647342681885, + "learning_rate": 1.6035000897463857e-05, + "loss": 0.4445, + "step": 11559 + }, + { + "epoch": 31.498637602179837, + "grad_norm": 6.576021194458008, + "learning_rate": 1.603429720545641e-05, + "loss": 0.5146, + "step": 11560 + }, + { + "epoch": 31.501362397820163, + "grad_norm": 6.826038837432861, + "learning_rate": 1.6033593466454043e-05, + "loss": 0.3154, + "step": 11561 + }, + { + "epoch": 31.504087193460492, + "grad_norm": 7.488579750061035, + "learning_rate": 1.603288968046225e-05, + "loss": 0.382, + "step": 11562 + }, + { + "epoch": 31.506811989100818, + "grad_norm": 7.069460391998291, + "learning_rate": 1.6032185847486504e-05, + "loss": 0.3824, + "step": 11563 + }, + { + "epoch": 31.509536784741144, + "grad_norm": 6.662590980529785, + "learning_rate": 1.6031481967532293e-05, + "loss": 0.5184, + "step": 11564 + }, + { + "epoch": 31.51226158038147, + "grad_norm": 6.6659722328186035, + "learning_rate": 1.603077804060509e-05, + "loss": 0.4854, + "step": 11565 + }, + { + "epoch": 31.5149863760218, + "grad_norm": 8.528528213500977, + "learning_rate": 1.6030074066710387e-05, + "loss": 0.479, + "step": 11566 + }, + { + "epoch": 31.517711171662125, + "grad_norm": 7.04036808013916, + "learning_rate": 1.6029370045853655e-05, + "loss": 0.3589, + "step": 11567 + }, + { + "epoch": 31.520435967302454, + "grad_norm": 8.598791122436523, + "learning_rate": 1.6028665978040388e-05, + "loss": 0.3669, + "step": 11568 + }, + { + "epoch": 31.52316076294278, + "grad_norm": 7.442421913146973, + "learning_rate": 1.602796186327606e-05, + "loss": 0.3, + "step": 11569 + }, + { + "epoch": 31.525885558583106, + "grad_norm": 7.288723468780518, + "learning_rate": 1.6027257701566162e-05, + "loss": 0.4641, + "step": 11570 + }, + { + "epoch": 31.52861035422343, + "grad_norm": 7.482388019561768, + "learning_rate": 1.6026553492916175e-05, + "loss": 0.3338, + "step": 11571 + }, + { + "epoch": 31.53133514986376, + "grad_norm": 8.168521881103516, + "learning_rate": 1.6025849237331583e-05, + "loss": 0.4507, + "step": 11572 + }, + { + "epoch": 31.534059945504087, + "grad_norm": 8.634714126586914, + "learning_rate": 1.602514493481787e-05, + "loss": 0.3071, + "step": 11573 + }, + { + "epoch": 31.536784741144416, + "grad_norm": 7.620938301086426, + "learning_rate": 1.6024440585380524e-05, + "loss": 0.452, + "step": 11574 + }, + { + "epoch": 31.539509536784742, + "grad_norm": 6.787168025970459, + "learning_rate": 1.6023736189025027e-05, + "loss": 0.4082, + "step": 11575 + }, + { + "epoch": 31.542234332425068, + "grad_norm": 7.074665069580078, + "learning_rate": 1.6023031745756864e-05, + "loss": 0.3651, + "step": 11576 + }, + { + "epoch": 31.544959128065393, + "grad_norm": 8.468385696411133, + "learning_rate": 1.602232725558153e-05, + "loss": 0.5849, + "step": 11577 + }, + { + "epoch": 31.547683923705723, + "grad_norm": 10.36236572265625, + "learning_rate": 1.6021622718504503e-05, + "loss": 0.4119, + "step": 11578 + }, + { + "epoch": 31.55040871934605, + "grad_norm": 8.830389022827148, + "learning_rate": 1.602091813453127e-05, + "loss": 0.4364, + "step": 11579 + }, + { + "epoch": 31.553133514986374, + "grad_norm": 7.7621846199035645, + "learning_rate": 1.602021350366732e-05, + "loss": 0.4208, + "step": 11580 + }, + { + "epoch": 31.555858310626704, + "grad_norm": 7.33500337600708, + "learning_rate": 1.6019508825918144e-05, + "loss": 0.427, + "step": 11581 + }, + { + "epoch": 31.55858310626703, + "grad_norm": 8.304717063903809, + "learning_rate": 1.6018804101289224e-05, + "loss": 0.6447, + "step": 11582 + }, + { + "epoch": 31.561307901907355, + "grad_norm": 7.474731922149658, + "learning_rate": 1.6018099329786053e-05, + "loss": 0.4329, + "step": 11583 + }, + { + "epoch": 31.564032697547685, + "grad_norm": 7.509472846984863, + "learning_rate": 1.6017394511414116e-05, + "loss": 0.4271, + "step": 11584 + }, + { + "epoch": 31.56675749318801, + "grad_norm": 8.360748291015625, + "learning_rate": 1.6016689646178906e-05, + "loss": 0.41, + "step": 11585 + }, + { + "epoch": 31.569482288828336, + "grad_norm": 7.341002941131592, + "learning_rate": 1.601598473408591e-05, + "loss": 0.5343, + "step": 11586 + }, + { + "epoch": 31.572207084468666, + "grad_norm": 8.834521293640137, + "learning_rate": 1.601527977514062e-05, + "loss": 0.4105, + "step": 11587 + }, + { + "epoch": 31.57493188010899, + "grad_norm": 6.91571044921875, + "learning_rate": 1.6014574769348526e-05, + "loss": 0.3516, + "step": 11588 + }, + { + "epoch": 31.577656675749317, + "grad_norm": 7.660037040710449, + "learning_rate": 1.6013869716715113e-05, + "loss": 0.4901, + "step": 11589 + }, + { + "epoch": 31.580381471389646, + "grad_norm": 7.215074062347412, + "learning_rate": 1.601316461724588e-05, + "loss": 0.4988, + "step": 11590 + }, + { + "epoch": 31.583106267029972, + "grad_norm": 5.853626251220703, + "learning_rate": 1.6012459470946315e-05, + "loss": 0.3817, + "step": 11591 + }, + { + "epoch": 31.585831062670298, + "grad_norm": 6.667288303375244, + "learning_rate": 1.6011754277821906e-05, + "loss": 0.3326, + "step": 11592 + }, + { + "epoch": 31.588555858310627, + "grad_norm": 7.225183486938477, + "learning_rate": 1.6011049037878145e-05, + "loss": 0.2822, + "step": 11593 + }, + { + "epoch": 31.591280653950953, + "grad_norm": 13.11107063293457, + "learning_rate": 1.6010343751120533e-05, + "loss": 0.4475, + "step": 11594 + }, + { + "epoch": 31.59400544959128, + "grad_norm": 6.232799053192139, + "learning_rate": 1.6009638417554555e-05, + "loss": 0.3852, + "step": 11595 + }, + { + "epoch": 31.59673024523161, + "grad_norm": 7.203550815582275, + "learning_rate": 1.600893303718571e-05, + "loss": 0.4605, + "step": 11596 + }, + { + "epoch": 31.599455040871934, + "grad_norm": 7.108577251434326, + "learning_rate": 1.6008227610019485e-05, + "loss": 0.3255, + "step": 11597 + }, + { + "epoch": 31.60217983651226, + "grad_norm": 6.979862213134766, + "learning_rate": 1.6007522136061378e-05, + "loss": 0.3233, + "step": 11598 + }, + { + "epoch": 31.60490463215259, + "grad_norm": 7.540842533111572, + "learning_rate": 1.600681661531688e-05, + "loss": 0.3895, + "step": 11599 + }, + { + "epoch": 31.607629427792915, + "grad_norm": 7.842855930328369, + "learning_rate": 1.600611104779149e-05, + "loss": 0.3889, + "step": 11600 + }, + { + "epoch": 31.61035422343324, + "grad_norm": 7.594421863555908, + "learning_rate": 1.6005405433490694e-05, + "loss": 0.3911, + "step": 11601 + }, + { + "epoch": 31.61307901907357, + "grad_norm": 5.4124908447265625, + "learning_rate": 1.600469977242e-05, + "loss": 0.5018, + "step": 11602 + }, + { + "epoch": 31.615803814713896, + "grad_norm": 6.882364749908447, + "learning_rate": 1.6003994064584895e-05, + "loss": 0.3772, + "step": 11603 + }, + { + "epoch": 31.618528610354222, + "grad_norm": 8.891324043273926, + "learning_rate": 1.600328830999088e-05, + "loss": 0.3677, + "step": 11604 + }, + { + "epoch": 31.62125340599455, + "grad_norm": 8.092884063720703, + "learning_rate": 1.6002582508643446e-05, + "loss": 0.4644, + "step": 11605 + }, + { + "epoch": 31.623978201634877, + "grad_norm": 13.51522445678711, + "learning_rate": 1.6001876660548098e-05, + "loss": 0.2916, + "step": 11606 + }, + { + "epoch": 31.626702997275203, + "grad_norm": 7.009510040283203, + "learning_rate": 1.6001170765710323e-05, + "loss": 0.4711, + "step": 11607 + }, + { + "epoch": 31.629427792915532, + "grad_norm": 6.411016941070557, + "learning_rate": 1.6000464824135623e-05, + "loss": 0.3018, + "step": 11608 + }, + { + "epoch": 31.632152588555858, + "grad_norm": 8.686745643615723, + "learning_rate": 1.5999758835829497e-05, + "loss": 0.458, + "step": 11609 + }, + { + "epoch": 31.634877384196184, + "grad_norm": 7.0936102867126465, + "learning_rate": 1.599905280079744e-05, + "loss": 0.4555, + "step": 11610 + }, + { + "epoch": 31.637602179836513, + "grad_norm": 5.631973743438721, + "learning_rate": 1.5998346719044956e-05, + "loss": 0.3708, + "step": 11611 + }, + { + "epoch": 31.64032697547684, + "grad_norm": 9.096990585327148, + "learning_rate": 1.5997640590577544e-05, + "loss": 0.4305, + "step": 11612 + }, + { + "epoch": 31.643051771117165, + "grad_norm": 8.056363105773926, + "learning_rate": 1.5996934415400694e-05, + "loss": 0.5111, + "step": 11613 + }, + { + "epoch": 31.645776566757494, + "grad_norm": 7.630584716796875, + "learning_rate": 1.5996228193519914e-05, + "loss": 0.4622, + "step": 11614 + }, + { + "epoch": 31.64850136239782, + "grad_norm": 8.496237754821777, + "learning_rate": 1.5995521924940704e-05, + "loss": 0.3883, + "step": 11615 + }, + { + "epoch": 31.651226158038146, + "grad_norm": 6.984487056732178, + "learning_rate": 1.5994815609668558e-05, + "loss": 0.5494, + "step": 11616 + }, + { + "epoch": 31.653950953678475, + "grad_norm": 8.360382080078125, + "learning_rate": 1.5994109247708983e-05, + "loss": 0.6595, + "step": 11617 + }, + { + "epoch": 31.6566757493188, + "grad_norm": 7.152622222900391, + "learning_rate": 1.5993402839067477e-05, + "loss": 0.3386, + "step": 11618 + }, + { + "epoch": 31.659400544959126, + "grad_norm": 30.050329208374023, + "learning_rate": 1.5992696383749543e-05, + "loss": 0.4098, + "step": 11619 + }, + { + "epoch": 31.662125340599456, + "grad_norm": 6.905817031860352, + "learning_rate": 1.5991989881760687e-05, + "loss": 0.4179, + "step": 11620 + }, + { + "epoch": 31.66485013623978, + "grad_norm": 6.6429572105407715, + "learning_rate": 1.59912833331064e-05, + "loss": 0.563, + "step": 11621 + }, + { + "epoch": 31.667574931880107, + "grad_norm": 7.85490608215332, + "learning_rate": 1.5990576737792192e-05, + "loss": 0.3966, + "step": 11622 + }, + { + "epoch": 31.670299727520437, + "grad_norm": 7.767920017242432, + "learning_rate": 1.598987009582357e-05, + "loss": 0.434, + "step": 11623 + }, + { + "epoch": 31.673024523160763, + "grad_norm": 6.833701133728027, + "learning_rate": 1.598916340720603e-05, + "loss": 0.4659, + "step": 11624 + }, + { + "epoch": 31.67574931880109, + "grad_norm": 7.239294052124023, + "learning_rate": 1.5988456671945078e-05, + "loss": 0.3643, + "step": 11625 + }, + { + "epoch": 31.678474114441418, + "grad_norm": 13.427486419677734, + "learning_rate": 1.598774989004622e-05, + "loss": 0.5385, + "step": 11626 + }, + { + "epoch": 31.681198910081743, + "grad_norm": 6.485818862915039, + "learning_rate": 1.5987043061514953e-05, + "loss": 0.4117, + "step": 11627 + }, + { + "epoch": 31.68392370572207, + "grad_norm": 6.466250419616699, + "learning_rate": 1.598633618635679e-05, + "loss": 0.5883, + "step": 11628 + }, + { + "epoch": 31.6866485013624, + "grad_norm": 6.980894565582275, + "learning_rate": 1.5985629264577237e-05, + "loss": 0.5242, + "step": 11629 + }, + { + "epoch": 31.689373297002724, + "grad_norm": 7.625382423400879, + "learning_rate": 1.5984922296181794e-05, + "loss": 0.5074, + "step": 11630 + }, + { + "epoch": 31.69209809264305, + "grad_norm": 9.570500373840332, + "learning_rate": 1.5984215281175964e-05, + "loss": 0.3946, + "step": 11631 + }, + { + "epoch": 31.69482288828338, + "grad_norm": 6.711041450500488, + "learning_rate": 1.5983508219565264e-05, + "loss": 0.2941, + "step": 11632 + }, + { + "epoch": 31.697547683923705, + "grad_norm": 6.9375104904174805, + "learning_rate": 1.5982801111355195e-05, + "loss": 0.3896, + "step": 11633 + }, + { + "epoch": 31.70027247956403, + "grad_norm": 9.227879524230957, + "learning_rate": 1.598209395655126e-05, + "loss": 0.5455, + "step": 11634 + }, + { + "epoch": 31.70299727520436, + "grad_norm": 7.8122687339782715, + "learning_rate": 1.598138675515897e-05, + "loss": 0.5035, + "step": 11635 + }, + { + "epoch": 31.705722070844686, + "grad_norm": 8.350142478942871, + "learning_rate": 1.5980679507183834e-05, + "loss": 0.4818, + "step": 11636 + }, + { + "epoch": 31.708446866485012, + "grad_norm": 17.139902114868164, + "learning_rate": 1.5979972212631358e-05, + "loss": 0.437, + "step": 11637 + }, + { + "epoch": 31.71117166212534, + "grad_norm": 6.634777545928955, + "learning_rate": 1.597926487150705e-05, + "loss": 0.4443, + "step": 11638 + }, + { + "epoch": 31.713896457765667, + "grad_norm": 8.797743797302246, + "learning_rate": 1.5978557483816423e-05, + "loss": 0.3745, + "step": 11639 + }, + { + "epoch": 31.716621253405993, + "grad_norm": 5.549252510070801, + "learning_rate": 1.5977850049564978e-05, + "loss": 0.4563, + "step": 11640 + }, + { + "epoch": 31.719346049046322, + "grad_norm": 7.894062519073486, + "learning_rate": 1.597714256875823e-05, + "loss": 0.3588, + "step": 11641 + }, + { + "epoch": 31.722070844686648, + "grad_norm": 7.197150707244873, + "learning_rate": 1.597643504140169e-05, + "loss": 0.4125, + "step": 11642 + }, + { + "epoch": 31.724795640326974, + "grad_norm": 7.9397687911987305, + "learning_rate": 1.597572746750087e-05, + "loss": 0.4016, + "step": 11643 + }, + { + "epoch": 31.727520435967303, + "grad_norm": 12.798469543457031, + "learning_rate": 1.597501984706127e-05, + "loss": 0.4362, + "step": 11644 + }, + { + "epoch": 31.73024523160763, + "grad_norm": 7.300980091094971, + "learning_rate": 1.5974312180088407e-05, + "loss": 0.4783, + "step": 11645 + }, + { + "epoch": 31.732970027247955, + "grad_norm": 7.096359729766846, + "learning_rate": 1.5973604466587797e-05, + "loss": 0.4644, + "step": 11646 + }, + { + "epoch": 31.735694822888284, + "grad_norm": 8.164803504943848, + "learning_rate": 1.597289670656495e-05, + "loss": 0.4043, + "step": 11647 + }, + { + "epoch": 31.73841961852861, + "grad_norm": 7.867160797119141, + "learning_rate": 1.5972188900025368e-05, + "loss": 0.4754, + "step": 11648 + }, + { + "epoch": 31.741144414168936, + "grad_norm": 8.261493682861328, + "learning_rate": 1.5971481046974576e-05, + "loss": 0.3015, + "step": 11649 + }, + { + "epoch": 31.743869209809265, + "grad_norm": 15.797551155090332, + "learning_rate": 1.5970773147418084e-05, + "loss": 0.4188, + "step": 11650 + }, + { + "epoch": 31.74659400544959, + "grad_norm": 9.968244552612305, + "learning_rate": 1.59700652013614e-05, + "loss": 0.455, + "step": 11651 + }, + { + "epoch": 31.749318801089917, + "grad_norm": 7.915208339691162, + "learning_rate": 1.5969357208810043e-05, + "loss": 0.378, + "step": 11652 + }, + { + "epoch": 31.752043596730246, + "grad_norm": 10.037928581237793, + "learning_rate": 1.5968649169769518e-05, + "loss": 0.451, + "step": 11653 + }, + { + "epoch": 31.754768392370572, + "grad_norm": 7.658346652984619, + "learning_rate": 1.596794108424535e-05, + "loss": 0.3637, + "step": 11654 + }, + { + "epoch": 31.757493188010898, + "grad_norm": 16.169321060180664, + "learning_rate": 1.5967232952243048e-05, + "loss": 0.4568, + "step": 11655 + }, + { + "epoch": 31.760217983651227, + "grad_norm": 7.466304302215576, + "learning_rate": 1.5966524773768127e-05, + "loss": 0.4997, + "step": 11656 + }, + { + "epoch": 31.762942779291553, + "grad_norm": 8.412617683410645, + "learning_rate": 1.5965816548826104e-05, + "loss": 0.4415, + "step": 11657 + }, + { + "epoch": 31.76566757493188, + "grad_norm": 8.815930366516113, + "learning_rate": 1.5965108277422493e-05, + "loss": 0.372, + "step": 11658 + }, + { + "epoch": 31.768392370572208, + "grad_norm": 9.237602233886719, + "learning_rate": 1.5964399959562812e-05, + "loss": 0.5867, + "step": 11659 + }, + { + "epoch": 31.771117166212534, + "grad_norm": 11.187580108642578, + "learning_rate": 1.5963691595252576e-05, + "loss": 0.3711, + "step": 11660 + }, + { + "epoch": 31.77384196185286, + "grad_norm": 8.331928253173828, + "learning_rate": 1.5962983184497304e-05, + "loss": 0.4207, + "step": 11661 + }, + { + "epoch": 31.77656675749319, + "grad_norm": 7.726268768310547, + "learning_rate": 1.5962274727302506e-05, + "loss": 0.4157, + "step": 11662 + }, + { + "epoch": 31.779291553133515, + "grad_norm": 7.6028594970703125, + "learning_rate": 1.5961566223673707e-05, + "loss": 0.4979, + "step": 11663 + }, + { + "epoch": 31.78201634877384, + "grad_norm": 8.230978012084961, + "learning_rate": 1.5960857673616423e-05, + "loss": 0.3914, + "step": 11664 + }, + { + "epoch": 31.78474114441417, + "grad_norm": 11.412215232849121, + "learning_rate": 1.5960149077136167e-05, + "loss": 0.3205, + "step": 11665 + }, + { + "epoch": 31.787465940054496, + "grad_norm": 7.51002311706543, + "learning_rate": 1.5959440434238465e-05, + "loss": 0.3669, + "step": 11666 + }, + { + "epoch": 31.79019073569482, + "grad_norm": 6.666199684143066, + "learning_rate": 1.5958731744928836e-05, + "loss": 0.3662, + "step": 11667 + }, + { + "epoch": 31.79291553133515, + "grad_norm": 7.396177768707275, + "learning_rate": 1.595802300921279e-05, + "loss": 0.4617, + "step": 11668 + }, + { + "epoch": 31.795640326975477, + "grad_norm": 8.355841636657715, + "learning_rate": 1.5957314227095854e-05, + "loss": 0.4491, + "step": 11669 + }, + { + "epoch": 31.798365122615802, + "grad_norm": 6.12953519821167, + "learning_rate": 1.5956605398583547e-05, + "loss": 0.4865, + "step": 11670 + }, + { + "epoch": 31.80108991825613, + "grad_norm": 8.663213729858398, + "learning_rate": 1.5955896523681392e-05, + "loss": 0.5633, + "step": 11671 + }, + { + "epoch": 31.803814713896458, + "grad_norm": 8.228528022766113, + "learning_rate": 1.5955187602394904e-05, + "loss": 0.4255, + "step": 11672 + }, + { + "epoch": 31.806539509536783, + "grad_norm": 8.043113708496094, + "learning_rate": 1.5954478634729605e-05, + "loss": 0.5658, + "step": 11673 + }, + { + "epoch": 31.809264305177113, + "grad_norm": 8.05732250213623, + "learning_rate": 1.595376962069102e-05, + "loss": 0.4994, + "step": 11674 + }, + { + "epoch": 31.81198910081744, + "grad_norm": 9.802180290222168, + "learning_rate": 1.5953060560284666e-05, + "loss": 0.4033, + "step": 11675 + }, + { + "epoch": 31.814713896457764, + "grad_norm": 9.854981422424316, + "learning_rate": 1.5952351453516076e-05, + "loss": 0.3839, + "step": 11676 + }, + { + "epoch": 31.817438692098094, + "grad_norm": 7.649071216583252, + "learning_rate": 1.5951642300390755e-05, + "loss": 0.5664, + "step": 11677 + }, + { + "epoch": 31.82016348773842, + "grad_norm": 8.393444061279297, + "learning_rate": 1.5950933100914242e-05, + "loss": 0.3582, + "step": 11678 + }, + { + "epoch": 31.822888283378745, + "grad_norm": 6.505215644836426, + "learning_rate": 1.5950223855092047e-05, + "loss": 0.4206, + "step": 11679 + }, + { + "epoch": 31.825613079019075, + "grad_norm": 9.40150260925293, + "learning_rate": 1.5949514562929706e-05, + "loss": 0.5851, + "step": 11680 + }, + { + "epoch": 31.8283378746594, + "grad_norm": 8.124299049377441, + "learning_rate": 1.5948805224432736e-05, + "loss": 0.3621, + "step": 11681 + }, + { + "epoch": 31.831062670299726, + "grad_norm": 12.069969177246094, + "learning_rate": 1.5948095839606657e-05, + "loss": 0.3731, + "step": 11682 + }, + { + "epoch": 31.833787465940055, + "grad_norm": 7.199894428253174, + "learning_rate": 1.5947386408457005e-05, + "loss": 0.3736, + "step": 11683 + }, + { + "epoch": 31.83651226158038, + "grad_norm": 7.235996723175049, + "learning_rate": 1.5946676930989296e-05, + "loss": 0.3235, + "step": 11684 + }, + { + "epoch": 31.839237057220707, + "grad_norm": 13.020691871643066, + "learning_rate": 1.5945967407209062e-05, + "loss": 0.3165, + "step": 11685 + }, + { + "epoch": 31.841961852861036, + "grad_norm": 8.26447868347168, + "learning_rate": 1.5945257837121825e-05, + "loss": 0.3387, + "step": 11686 + }, + { + "epoch": 31.844686648501362, + "grad_norm": 8.25384521484375, + "learning_rate": 1.5944548220733107e-05, + "loss": 0.3323, + "step": 11687 + }, + { + "epoch": 31.847411444141688, + "grad_norm": 7.659300804138184, + "learning_rate": 1.5943838558048442e-05, + "loss": 0.3542, + "step": 11688 + }, + { + "epoch": 31.850136239782017, + "grad_norm": 7.018349647521973, + "learning_rate": 1.594312884907335e-05, + "loss": 0.4067, + "step": 11689 + }, + { + "epoch": 31.852861035422343, + "grad_norm": 9.388994216918945, + "learning_rate": 1.5942419093813365e-05, + "loss": 0.494, + "step": 11690 + }, + { + "epoch": 31.85558583106267, + "grad_norm": 8.678350448608398, + "learning_rate": 1.5941709292274012e-05, + "loss": 0.4118, + "step": 11691 + }, + { + "epoch": 31.858310626703, + "grad_norm": 7.856499195098877, + "learning_rate": 1.594099944446082e-05, + "loss": 0.4857, + "step": 11692 + }, + { + "epoch": 31.861035422343324, + "grad_norm": 8.969182968139648, + "learning_rate": 1.5940289550379312e-05, + "loss": 0.3589, + "step": 11693 + }, + { + "epoch": 31.86376021798365, + "grad_norm": 42.84821319580078, + "learning_rate": 1.5939579610035017e-05, + "loss": 0.5277, + "step": 11694 + }, + { + "epoch": 31.86648501362398, + "grad_norm": 6.726892471313477, + "learning_rate": 1.5938869623433474e-05, + "loss": 0.2977, + "step": 11695 + }, + { + "epoch": 31.869209809264305, + "grad_norm": 7.893887996673584, + "learning_rate": 1.59381595905802e-05, + "loss": 0.3669, + "step": 11696 + }, + { + "epoch": 31.87193460490463, + "grad_norm": 8.389455795288086, + "learning_rate": 1.5937449511480735e-05, + "loss": 0.4604, + "step": 11697 + }, + { + "epoch": 31.87465940054496, + "grad_norm": 7.12132453918457, + "learning_rate": 1.5936739386140602e-05, + "loss": 0.5257, + "step": 11698 + }, + { + "epoch": 31.877384196185286, + "grad_norm": 9.241552352905273, + "learning_rate": 1.593602921456533e-05, + "loss": 0.4019, + "step": 11699 + }, + { + "epoch": 31.88010899182561, + "grad_norm": 8.437087059020996, + "learning_rate": 1.593531899676046e-05, + "loss": 0.3466, + "step": 11700 + }, + { + "epoch": 31.88283378746594, + "grad_norm": 11.758437156677246, + "learning_rate": 1.5934608732731516e-05, + "loss": 0.3138, + "step": 11701 + }, + { + "epoch": 31.885558583106267, + "grad_norm": 7.625300407409668, + "learning_rate": 1.5933898422484026e-05, + "loss": 0.5699, + "step": 11702 + }, + { + "epoch": 31.888283378746593, + "grad_norm": 12.781292915344238, + "learning_rate": 1.593318806602353e-05, + "loss": 0.4352, + "step": 11703 + }, + { + "epoch": 31.891008174386922, + "grad_norm": 9.552247047424316, + "learning_rate": 1.5932477663355554e-05, + "loss": 0.3774, + "step": 11704 + }, + { + "epoch": 31.893732970027248, + "grad_norm": 6.996197700500488, + "learning_rate": 1.593176721448563e-05, + "loss": 0.3453, + "step": 11705 + }, + { + "epoch": 31.896457765667574, + "grad_norm": 16.7490177154541, + "learning_rate": 1.59310567194193e-05, + "loss": 0.3861, + "step": 11706 + }, + { + "epoch": 31.899182561307903, + "grad_norm": 7.065978050231934, + "learning_rate": 1.593034617816209e-05, + "loss": 0.5357, + "step": 11707 + }, + { + "epoch": 31.90190735694823, + "grad_norm": 10.968025207519531, + "learning_rate": 1.592963559071953e-05, + "loss": 0.3481, + "step": 11708 + }, + { + "epoch": 31.904632152588555, + "grad_norm": 12.107632637023926, + "learning_rate": 1.5928924957097166e-05, + "loss": 0.3795, + "step": 11709 + }, + { + "epoch": 31.907356948228884, + "grad_norm": 8.137904167175293, + "learning_rate": 1.5928214277300517e-05, + "loss": 0.4666, + "step": 11710 + }, + { + "epoch": 31.91008174386921, + "grad_norm": 7.665256500244141, + "learning_rate": 1.5927503551335132e-05, + "loss": 0.3523, + "step": 11711 + }, + { + "epoch": 31.912806539509535, + "grad_norm": 8.476051330566406, + "learning_rate": 1.592679277920654e-05, + "loss": 0.454, + "step": 11712 + }, + { + "epoch": 31.915531335149865, + "grad_norm": 8.426595687866211, + "learning_rate": 1.5926081960920276e-05, + "loss": 0.4902, + "step": 11713 + }, + { + "epoch": 31.91825613079019, + "grad_norm": 8.372299194335938, + "learning_rate": 1.5925371096481873e-05, + "loss": 0.4849, + "step": 11714 + }, + { + "epoch": 31.920980926430516, + "grad_norm": 9.851797103881836, + "learning_rate": 1.592466018589687e-05, + "loss": 0.3605, + "step": 11715 + }, + { + "epoch": 31.923705722070846, + "grad_norm": 7.402262210845947, + "learning_rate": 1.592394922917081e-05, + "loss": 0.4611, + "step": 11716 + }, + { + "epoch": 31.92643051771117, + "grad_norm": 8.301385879516602, + "learning_rate": 1.592323822630922e-05, + "loss": 0.4348, + "step": 11717 + }, + { + "epoch": 31.929155313351497, + "grad_norm": 10.224685668945312, + "learning_rate": 1.5922527177317646e-05, + "loss": 0.4246, + "step": 11718 + }, + { + "epoch": 31.931880108991827, + "grad_norm": 7.9992451667785645, + "learning_rate": 1.5921816082201614e-05, + "loss": 0.4367, + "step": 11719 + }, + { + "epoch": 31.934604904632153, + "grad_norm": 9.548096656799316, + "learning_rate": 1.5921104940966675e-05, + "loss": 0.6477, + "step": 11720 + }, + { + "epoch": 31.93732970027248, + "grad_norm": 8.109225273132324, + "learning_rate": 1.592039375361836e-05, + "loss": 0.4449, + "step": 11721 + }, + { + "epoch": 31.940054495912808, + "grad_norm": 8.547680854797363, + "learning_rate": 1.5919682520162208e-05, + "loss": 0.5069, + "step": 11722 + }, + { + "epoch": 31.942779291553133, + "grad_norm": 9.245973587036133, + "learning_rate": 1.591897124060376e-05, + "loss": 0.6393, + "step": 11723 + }, + { + "epoch": 31.94550408719346, + "grad_norm": 11.543919563293457, + "learning_rate": 1.591825991494855e-05, + "loss": 0.3292, + "step": 11724 + }, + { + "epoch": 31.94822888283379, + "grad_norm": 9.651740074157715, + "learning_rate": 1.5917548543202127e-05, + "loss": 0.4369, + "step": 11725 + }, + { + "epoch": 31.950953678474114, + "grad_norm": 12.728254318237305, + "learning_rate": 1.5916837125370025e-05, + "loss": 0.4299, + "step": 11726 + }, + { + "epoch": 31.95367847411444, + "grad_norm": 10.07304859161377, + "learning_rate": 1.5916125661457786e-05, + "loss": 0.4309, + "step": 11727 + }, + { + "epoch": 31.95640326975477, + "grad_norm": 8.557503700256348, + "learning_rate": 1.5915414151470953e-05, + "loss": 0.5154, + "step": 11728 + }, + { + "epoch": 31.959128065395095, + "grad_norm": 9.72024154663086, + "learning_rate": 1.5914702595415062e-05, + "loss": 0.3552, + "step": 11729 + }, + { + "epoch": 31.96185286103542, + "grad_norm": 8.9443998336792, + "learning_rate": 1.5913990993295655e-05, + "loss": 0.4208, + "step": 11730 + }, + { + "epoch": 31.96457765667575, + "grad_norm": 9.49070930480957, + "learning_rate": 1.5913279345118284e-05, + "loss": 0.4914, + "step": 11731 + }, + { + "epoch": 31.967302452316076, + "grad_norm": 7.919051647186279, + "learning_rate": 1.5912567650888476e-05, + "loss": 0.3918, + "step": 11732 + }, + { + "epoch": 31.970027247956402, + "grad_norm": 8.020977973937988, + "learning_rate": 1.5911855910611785e-05, + "loss": 0.519, + "step": 11733 + }, + { + "epoch": 31.97275204359673, + "grad_norm": 7.276769161224365, + "learning_rate": 1.591114412429375e-05, + "loss": 0.4469, + "step": 11734 + }, + { + "epoch": 31.975476839237057, + "grad_norm": 13.29661750793457, + "learning_rate": 1.5910432291939917e-05, + "loss": 0.4273, + "step": 11735 + }, + { + "epoch": 31.978201634877383, + "grad_norm": 7.530263423919678, + "learning_rate": 1.5909720413555826e-05, + "loss": 0.4412, + "step": 11736 + }, + { + "epoch": 31.980926430517712, + "grad_norm": 8.672321319580078, + "learning_rate": 1.590900848914702e-05, + "loss": 0.3605, + "step": 11737 + }, + { + "epoch": 31.983651226158038, + "grad_norm": 8.137622833251953, + "learning_rate": 1.590829651871905e-05, + "loss": 0.4903, + "step": 11738 + }, + { + "epoch": 31.986376021798364, + "grad_norm": 15.847869873046875, + "learning_rate": 1.5907584502277456e-05, + "loss": 0.3915, + "step": 11739 + }, + { + "epoch": 31.989100817438693, + "grad_norm": 6.88349723815918, + "learning_rate": 1.5906872439827782e-05, + "loss": 0.5171, + "step": 11740 + }, + { + "epoch": 31.99182561307902, + "grad_norm": 7.6084160804748535, + "learning_rate": 1.5906160331375577e-05, + "loss": 0.4654, + "step": 11741 + }, + { + "epoch": 31.994550408719345, + "grad_norm": 11.99288558959961, + "learning_rate": 1.5905448176926385e-05, + "loss": 0.3553, + "step": 11742 + }, + { + "epoch": 31.997275204359674, + "grad_norm": 9.274868965148926, + "learning_rate": 1.5904735976485754e-05, + "loss": 0.6314, + "step": 11743 + }, + { + "epoch": 32.0, + "grad_norm": 7.692490100860596, + "learning_rate": 1.5904023730059227e-05, + "loss": 0.5656, + "step": 11744 + }, + { + "epoch": 32.002724795640326, + "grad_norm": 6.655430793762207, + "learning_rate": 1.5903311437652357e-05, + "loss": 0.3511, + "step": 11745 + }, + { + "epoch": 32.00544959128065, + "grad_norm": 7.963028907775879, + "learning_rate": 1.5902599099270686e-05, + "loss": 0.4009, + "step": 11746 + }, + { + "epoch": 32.00817438692098, + "grad_norm": 11.768818855285645, + "learning_rate": 1.5901886714919758e-05, + "loss": 0.275, + "step": 11747 + }, + { + "epoch": 32.01089918256131, + "grad_norm": 7.126332759857178, + "learning_rate": 1.5901174284605132e-05, + "loss": 0.2981, + "step": 11748 + }, + { + "epoch": 32.013623978201636, + "grad_norm": 9.119898796081543, + "learning_rate": 1.590046180833235e-05, + "loss": 0.3867, + "step": 11749 + }, + { + "epoch": 32.01634877384196, + "grad_norm": 6.50003719329834, + "learning_rate": 1.5899749286106957e-05, + "loss": 0.4581, + "step": 11750 + }, + { + "epoch": 32.01907356948229, + "grad_norm": 8.52955436706543, + "learning_rate": 1.5899036717934514e-05, + "loss": 0.3926, + "step": 11751 + }, + { + "epoch": 32.02179836512261, + "grad_norm": 7.3344244956970215, + "learning_rate": 1.5898324103820556e-05, + "loss": 0.3102, + "step": 11752 + }, + { + "epoch": 32.02452316076294, + "grad_norm": 7.1891679763793945, + "learning_rate": 1.5897611443770643e-05, + "loss": 0.3102, + "step": 11753 + }, + { + "epoch": 32.02724795640327, + "grad_norm": 8.859405517578125, + "learning_rate": 1.5896898737790323e-05, + "loss": 0.5104, + "step": 11754 + }, + { + "epoch": 32.0299727520436, + "grad_norm": 7.968280792236328, + "learning_rate": 1.589618598588514e-05, + "loss": 0.4209, + "step": 11755 + }, + { + "epoch": 32.032697547683924, + "grad_norm": 7.986744403839111, + "learning_rate": 1.5895473188060654e-05, + "loss": 0.386, + "step": 11756 + }, + { + "epoch": 32.03542234332425, + "grad_norm": 20.042699813842773, + "learning_rate": 1.5894760344322416e-05, + "loss": 0.3549, + "step": 11757 + }, + { + "epoch": 32.038147138964575, + "grad_norm": 7.735237121582031, + "learning_rate": 1.589404745467597e-05, + "loss": 0.359, + "step": 11758 + }, + { + "epoch": 32.0408719346049, + "grad_norm": 8.201799392700195, + "learning_rate": 1.589333451912687e-05, + "loss": 0.6518, + "step": 11759 + }, + { + "epoch": 32.043596730245234, + "grad_norm": 7.063997268676758, + "learning_rate": 1.5892621537680674e-05, + "loss": 0.2672, + "step": 11760 + }, + { + "epoch": 32.04632152588556, + "grad_norm": 7.970167636871338, + "learning_rate": 1.5891908510342932e-05, + "loss": 0.3202, + "step": 11761 + }, + { + "epoch": 32.049046321525886, + "grad_norm": 7.34511137008667, + "learning_rate": 1.5891195437119193e-05, + "loss": 0.4982, + "step": 11762 + }, + { + "epoch": 32.05177111716621, + "grad_norm": 21.53789710998535, + "learning_rate": 1.5890482318015017e-05, + "loss": 0.3787, + "step": 11763 + }, + { + "epoch": 32.05449591280654, + "grad_norm": 14.992596626281738, + "learning_rate": 1.5889769153035953e-05, + "loss": 0.4414, + "step": 11764 + }, + { + "epoch": 32.05722070844686, + "grad_norm": 8.265618324279785, + "learning_rate": 1.588905594218755e-05, + "loss": 0.3199, + "step": 11765 + }, + { + "epoch": 32.059945504087196, + "grad_norm": 7.635008335113525, + "learning_rate": 1.588834268547538e-05, + "loss": 0.3056, + "step": 11766 + }, + { + "epoch": 32.06267029972752, + "grad_norm": 7.344765663146973, + "learning_rate": 1.588762938290498e-05, + "loss": 0.5309, + "step": 11767 + }, + { + "epoch": 32.06539509536785, + "grad_norm": 9.463160514831543, + "learning_rate": 1.5886916034481914e-05, + "loss": 0.5813, + "step": 11768 + }, + { + "epoch": 32.06811989100817, + "grad_norm": 9.012089729309082, + "learning_rate": 1.5886202640211733e-05, + "loss": 0.5155, + "step": 11769 + }, + { + "epoch": 32.0708446866485, + "grad_norm": 10.00454044342041, + "learning_rate": 1.5885489200099996e-05, + "loss": 0.3176, + "step": 11770 + }, + { + "epoch": 32.073569482288825, + "grad_norm": 7.091330051422119, + "learning_rate": 1.588477571415226e-05, + "loss": 0.3793, + "step": 11771 + }, + { + "epoch": 32.07629427792916, + "grad_norm": 8.165772438049316, + "learning_rate": 1.5884062182374083e-05, + "loss": 0.2841, + "step": 11772 + }, + { + "epoch": 32.079019073569484, + "grad_norm": 8.757858276367188, + "learning_rate": 1.5883348604771013e-05, + "loss": 0.2816, + "step": 11773 + }, + { + "epoch": 32.08174386920981, + "grad_norm": 6.973340034484863, + "learning_rate": 1.5882634981348614e-05, + "loss": 0.4262, + "step": 11774 + }, + { + "epoch": 32.084468664850135, + "grad_norm": 7.131436347961426, + "learning_rate": 1.5881921312112446e-05, + "loss": 0.3938, + "step": 11775 + }, + { + "epoch": 32.08719346049046, + "grad_norm": 8.54784870147705, + "learning_rate": 1.5881207597068065e-05, + "loss": 0.3687, + "step": 11776 + }, + { + "epoch": 32.08991825613079, + "grad_norm": 7.42059850692749, + "learning_rate": 1.5880493836221025e-05, + "loss": 0.3914, + "step": 11777 + }, + { + "epoch": 32.09264305177112, + "grad_norm": 8.61288070678711, + "learning_rate": 1.587978002957689e-05, + "loss": 0.4535, + "step": 11778 + }, + { + "epoch": 32.095367847411445, + "grad_norm": 9.793703079223633, + "learning_rate": 1.587906617714122e-05, + "loss": 0.3553, + "step": 11779 + }, + { + "epoch": 32.09809264305177, + "grad_norm": 7.9810004234313965, + "learning_rate": 1.587835227891957e-05, + "loss": 0.3646, + "step": 11780 + }, + { + "epoch": 32.1008174386921, + "grad_norm": 6.956366062164307, + "learning_rate": 1.58776383349175e-05, + "loss": 0.3989, + "step": 11781 + }, + { + "epoch": 32.10354223433242, + "grad_norm": 9.917304992675781, + "learning_rate": 1.587692434514057e-05, + "loss": 0.3329, + "step": 11782 + }, + { + "epoch": 32.10626702997275, + "grad_norm": 9.136825561523438, + "learning_rate": 1.5876210309594347e-05, + "loss": 0.2871, + "step": 11783 + }, + { + "epoch": 32.10899182561308, + "grad_norm": 7.9324469566345215, + "learning_rate": 1.5875496228284385e-05, + "loss": 0.4206, + "step": 11784 + }, + { + "epoch": 32.11171662125341, + "grad_norm": 17.721887588500977, + "learning_rate": 1.5874782101216246e-05, + "loss": 0.4341, + "step": 11785 + }, + { + "epoch": 32.11444141689373, + "grad_norm": 12.41125202178955, + "learning_rate": 1.5874067928395497e-05, + "loss": 0.4029, + "step": 11786 + }, + { + "epoch": 32.11716621253406, + "grad_norm": 9.059920310974121, + "learning_rate": 1.5873353709827695e-05, + "loss": 0.4584, + "step": 11787 + }, + { + "epoch": 32.119891008174385, + "grad_norm": 9.27950382232666, + "learning_rate": 1.58726394455184e-05, + "loss": 0.3017, + "step": 11788 + }, + { + "epoch": 32.12261580381471, + "grad_norm": 6.377040386199951, + "learning_rate": 1.587192513547318e-05, + "loss": 0.3109, + "step": 11789 + }, + { + "epoch": 32.12534059945504, + "grad_norm": 7.2704243659973145, + "learning_rate": 1.5871210779697598e-05, + "loss": 0.3922, + "step": 11790 + }, + { + "epoch": 32.12806539509537, + "grad_norm": 8.584101676940918, + "learning_rate": 1.587049637819721e-05, + "loss": 0.4524, + "step": 11791 + }, + { + "epoch": 32.130790190735695, + "grad_norm": 12.669682502746582, + "learning_rate": 1.586978193097759e-05, + "loss": 0.4226, + "step": 11792 + }, + { + "epoch": 32.13351498637602, + "grad_norm": 8.62442398071289, + "learning_rate": 1.5869067438044298e-05, + "loss": 0.3394, + "step": 11793 + }, + { + "epoch": 32.13623978201635, + "grad_norm": 7.36232328414917, + "learning_rate": 1.5868352899402895e-05, + "loss": 0.5303, + "step": 11794 + }, + { + "epoch": 32.13896457765667, + "grad_norm": 9.210404396057129, + "learning_rate": 1.5867638315058947e-05, + "loss": 0.6094, + "step": 11795 + }, + { + "epoch": 32.141689373297005, + "grad_norm": 6.262637615203857, + "learning_rate": 1.5866923685018026e-05, + "loss": 0.4605, + "step": 11796 + }, + { + "epoch": 32.14441416893733, + "grad_norm": 13.885269165039062, + "learning_rate": 1.586620900928569e-05, + "loss": 0.3381, + "step": 11797 + }, + { + "epoch": 32.14713896457766, + "grad_norm": 6.554561614990234, + "learning_rate": 1.5865494287867504e-05, + "loss": 0.3335, + "step": 11798 + }, + { + "epoch": 32.14986376021798, + "grad_norm": 7.8454108238220215, + "learning_rate": 1.586477952076904e-05, + "loss": 0.4303, + "step": 11799 + }, + { + "epoch": 32.15258855585831, + "grad_norm": 7.831639289855957, + "learning_rate": 1.586406470799586e-05, + "loss": 0.5651, + "step": 11800 + }, + { + "epoch": 32.155313351498634, + "grad_norm": 12.072447776794434, + "learning_rate": 1.5863349849553533e-05, + "loss": 0.4243, + "step": 11801 + }, + { + "epoch": 32.15803814713897, + "grad_norm": 7.685490608215332, + "learning_rate": 1.5862634945447628e-05, + "loss": 0.3981, + "step": 11802 + }, + { + "epoch": 32.16076294277929, + "grad_norm": 8.947986602783203, + "learning_rate": 1.5861919995683713e-05, + "loss": 0.4612, + "step": 11803 + }, + { + "epoch": 32.16348773841962, + "grad_norm": 10.897587776184082, + "learning_rate": 1.586120500026735e-05, + "loss": 0.3702, + "step": 11804 + }, + { + "epoch": 32.166212534059945, + "grad_norm": 8.40881061553955, + "learning_rate": 1.586048995920411e-05, + "loss": 0.4109, + "step": 11805 + }, + { + "epoch": 32.16893732970027, + "grad_norm": 6.445413112640381, + "learning_rate": 1.5859774872499564e-05, + "loss": 0.3076, + "step": 11806 + }, + { + "epoch": 32.171662125340596, + "grad_norm": 7.084362030029297, + "learning_rate": 1.5859059740159283e-05, + "loss": 0.5631, + "step": 11807 + }, + { + "epoch": 32.17438692098093, + "grad_norm": 6.634472846984863, + "learning_rate": 1.585834456218883e-05, + "loss": 0.2851, + "step": 11808 + }, + { + "epoch": 32.177111716621255, + "grad_norm": 6.578856468200684, + "learning_rate": 1.585762933859378e-05, + "loss": 0.4152, + "step": 11809 + }, + { + "epoch": 32.17983651226158, + "grad_norm": 9.397659301757812, + "learning_rate": 1.58569140693797e-05, + "loss": 0.4192, + "step": 11810 + }, + { + "epoch": 32.182561307901906, + "grad_norm": 6.69155740737915, + "learning_rate": 1.585619875455216e-05, + "loss": 0.306, + "step": 11811 + }, + { + "epoch": 32.18528610354223, + "grad_norm": 7.759404182434082, + "learning_rate": 1.5855483394116734e-05, + "loss": 0.4203, + "step": 11812 + }, + { + "epoch": 32.18801089918256, + "grad_norm": 7.001629829406738, + "learning_rate": 1.5854767988078992e-05, + "loss": 0.3216, + "step": 11813 + }, + { + "epoch": 32.19073569482289, + "grad_norm": 9.282877922058105, + "learning_rate": 1.5854052536444505e-05, + "loss": 0.4682, + "step": 11814 + }, + { + "epoch": 32.19346049046322, + "grad_norm": 7.756398677825928, + "learning_rate": 1.5853337039218846e-05, + "loss": 0.4177, + "step": 11815 + }, + { + "epoch": 32.19618528610354, + "grad_norm": 8.572132110595703, + "learning_rate": 1.5852621496407584e-05, + "loss": 0.4274, + "step": 11816 + }, + { + "epoch": 32.19891008174387, + "grad_norm": 6.335931777954102, + "learning_rate": 1.5851905908016297e-05, + "loss": 0.395, + "step": 11817 + }, + { + "epoch": 32.201634877384194, + "grad_norm": 6.162834167480469, + "learning_rate": 1.5851190274050555e-05, + "loss": 0.3054, + "step": 11818 + }, + { + "epoch": 32.20435967302452, + "grad_norm": 6.942822456359863, + "learning_rate": 1.585047459451593e-05, + "loss": 0.4146, + "step": 11819 + }, + { + "epoch": 32.20708446866485, + "grad_norm": 5.796833038330078, + "learning_rate": 1.5849758869418002e-05, + "loss": 0.2725, + "step": 11820 + }, + { + "epoch": 32.20980926430518, + "grad_norm": 9.037385940551758, + "learning_rate": 1.5849043098762335e-05, + "loss": 0.3282, + "step": 11821 + }, + { + "epoch": 32.212534059945504, + "grad_norm": 9.565847396850586, + "learning_rate": 1.584832728255451e-05, + "loss": 0.4362, + "step": 11822 + }, + { + "epoch": 32.21525885558583, + "grad_norm": 9.69047737121582, + "learning_rate": 1.58476114208001e-05, + "loss": 0.3274, + "step": 11823 + }, + { + "epoch": 32.217983651226156, + "grad_norm": 8.620555877685547, + "learning_rate": 1.584689551350468e-05, + "loss": 0.3643, + "step": 11824 + }, + { + "epoch": 32.22070844686648, + "grad_norm": 9.036141395568848, + "learning_rate": 1.5846179560673825e-05, + "loss": 0.3236, + "step": 11825 + }, + { + "epoch": 32.223433242506815, + "grad_norm": 5.609255313873291, + "learning_rate": 1.5845463562313113e-05, + "loss": 0.4547, + "step": 11826 + }, + { + "epoch": 32.22615803814714, + "grad_norm": 8.770671844482422, + "learning_rate": 1.5844747518428124e-05, + "loss": 0.5427, + "step": 11827 + }, + { + "epoch": 32.228882833787466, + "grad_norm": 11.33442497253418, + "learning_rate": 1.584403142902442e-05, + "loss": 0.4137, + "step": 11828 + }, + { + "epoch": 32.23160762942779, + "grad_norm": 6.859502792358398, + "learning_rate": 1.5843315294107595e-05, + "loss": 0.2459, + "step": 11829 + }, + { + "epoch": 32.23433242506812, + "grad_norm": 7.492730140686035, + "learning_rate": 1.5842599113683216e-05, + "loss": 0.3889, + "step": 11830 + }, + { + "epoch": 32.237057220708444, + "grad_norm": 7.895528316497803, + "learning_rate": 1.5841882887756864e-05, + "loss": 0.4388, + "step": 11831 + }, + { + "epoch": 32.23978201634878, + "grad_norm": 12.864253044128418, + "learning_rate": 1.5841166616334112e-05, + "loss": 0.4497, + "step": 11832 + }, + { + "epoch": 32.2425068119891, + "grad_norm": 6.970122337341309, + "learning_rate": 1.5840450299420548e-05, + "loss": 0.4554, + "step": 11833 + }, + { + "epoch": 32.24523160762943, + "grad_norm": 8.694933891296387, + "learning_rate": 1.5839733937021738e-05, + "loss": 0.2998, + "step": 11834 + }, + { + "epoch": 32.247956403269754, + "grad_norm": 8.716221809387207, + "learning_rate": 1.5839017529143276e-05, + "loss": 0.4441, + "step": 11835 + }, + { + "epoch": 32.25068119891008, + "grad_norm": 6.544258117675781, + "learning_rate": 1.5838301075790726e-05, + "loss": 0.343, + "step": 11836 + }, + { + "epoch": 32.253405994550405, + "grad_norm": 7.905789375305176, + "learning_rate": 1.583758457696968e-05, + "loss": 0.3984, + "step": 11837 + }, + { + "epoch": 32.25613079019074, + "grad_norm": 7.267482757568359, + "learning_rate": 1.5836868032685714e-05, + "loss": 0.3942, + "step": 11838 + }, + { + "epoch": 32.258855585831064, + "grad_norm": 7.333285331726074, + "learning_rate": 1.5836151442944406e-05, + "loss": 0.2985, + "step": 11839 + }, + { + "epoch": 32.26158038147139, + "grad_norm": 7.183562278747559, + "learning_rate": 1.5835434807751337e-05, + "loss": 0.3709, + "step": 11840 + }, + { + "epoch": 32.264305177111716, + "grad_norm": 6.645139217376709, + "learning_rate": 1.583471812711209e-05, + "loss": 0.442, + "step": 11841 + }, + { + "epoch": 32.26702997275204, + "grad_norm": 26.506385803222656, + "learning_rate": 1.583400140103225e-05, + "loss": 0.3225, + "step": 11842 + }, + { + "epoch": 32.26975476839237, + "grad_norm": 25.365419387817383, + "learning_rate": 1.583328462951739e-05, + "loss": 0.4845, + "step": 11843 + }, + { + "epoch": 32.2724795640327, + "grad_norm": 6.552819728851318, + "learning_rate": 1.5832567812573097e-05, + "loss": 0.3095, + "step": 11844 + }, + { + "epoch": 32.275204359673026, + "grad_norm": 7.264756202697754, + "learning_rate": 1.5831850950204955e-05, + "loss": 0.3252, + "step": 11845 + }, + { + "epoch": 32.27792915531335, + "grad_norm": 6.431404113769531, + "learning_rate": 1.5831134042418547e-05, + "loss": 0.4528, + "step": 11846 + }, + { + "epoch": 32.28065395095368, + "grad_norm": 8.371557235717773, + "learning_rate": 1.5830417089219454e-05, + "loss": 0.2578, + "step": 11847 + }, + { + "epoch": 32.283378746594, + "grad_norm": 7.391849517822266, + "learning_rate": 1.582970009061326e-05, + "loss": 0.3527, + "step": 11848 + }, + { + "epoch": 32.28610354223433, + "grad_norm": 8.503427505493164, + "learning_rate": 1.582898304660555e-05, + "loss": 0.2731, + "step": 11849 + }, + { + "epoch": 32.28882833787466, + "grad_norm": 8.949432373046875, + "learning_rate": 1.5828265957201904e-05, + "loss": 0.3873, + "step": 11850 + }, + { + "epoch": 32.29155313351499, + "grad_norm": 6.752440452575684, + "learning_rate": 1.5827548822407912e-05, + "loss": 0.4052, + "step": 11851 + }, + { + "epoch": 32.294277929155314, + "grad_norm": 6.268543243408203, + "learning_rate": 1.582683164222916e-05, + "loss": 0.3759, + "step": 11852 + }, + { + "epoch": 32.29700272479564, + "grad_norm": 6.491923809051514, + "learning_rate": 1.582611441667123e-05, + "loss": 0.3365, + "step": 11853 + }, + { + "epoch": 32.299727520435965, + "grad_norm": 6.925135612487793, + "learning_rate": 1.5825397145739704e-05, + "loss": 0.3329, + "step": 11854 + }, + { + "epoch": 32.30245231607629, + "grad_norm": 7.322439193725586, + "learning_rate": 1.582467982944018e-05, + "loss": 0.4421, + "step": 11855 + }, + { + "epoch": 32.305177111716624, + "grad_norm": 5.905395984649658, + "learning_rate": 1.582396246777823e-05, + "loss": 0.4805, + "step": 11856 + }, + { + "epoch": 32.30790190735695, + "grad_norm": 7.987797260284424, + "learning_rate": 1.582324506075945e-05, + "loss": 0.4595, + "step": 11857 + }, + { + "epoch": 32.310626702997276, + "grad_norm": 8.10444164276123, + "learning_rate": 1.5822527608389428e-05, + "loss": 0.3066, + "step": 11858 + }, + { + "epoch": 32.3133514986376, + "grad_norm": 7.959553241729736, + "learning_rate": 1.5821810110673744e-05, + "loss": 0.2758, + "step": 11859 + }, + { + "epoch": 32.31607629427793, + "grad_norm": 7.548391819000244, + "learning_rate": 1.5821092567617993e-05, + "loss": 0.4469, + "step": 11860 + }, + { + "epoch": 32.31880108991825, + "grad_norm": 6.731222629547119, + "learning_rate": 1.582037497922776e-05, + "loss": 0.4565, + "step": 11861 + }, + { + "epoch": 32.321525885558586, + "grad_norm": 7.5333991050720215, + "learning_rate": 1.581965734550863e-05, + "loss": 0.3308, + "step": 11862 + }, + { + "epoch": 32.32425068119891, + "grad_norm": 13.58120059967041, + "learning_rate": 1.5818939666466203e-05, + "loss": 0.3882, + "step": 11863 + }, + { + "epoch": 32.32697547683924, + "grad_norm": 13.837489128112793, + "learning_rate": 1.5818221942106058e-05, + "loss": 0.3484, + "step": 11864 + }, + { + "epoch": 32.32970027247956, + "grad_norm": 9.037531852722168, + "learning_rate": 1.581750417243379e-05, + "loss": 0.4246, + "step": 11865 + }, + { + "epoch": 32.33242506811989, + "grad_norm": 6.657193660736084, + "learning_rate": 1.5816786357454984e-05, + "loss": 0.3333, + "step": 11866 + }, + { + "epoch": 32.335149863760215, + "grad_norm": 7.076379299163818, + "learning_rate": 1.5816068497175233e-05, + "loss": 0.264, + "step": 11867 + }, + { + "epoch": 32.33787465940055, + "grad_norm": 7.124920845031738, + "learning_rate": 1.5815350591600124e-05, + "loss": 0.4204, + "step": 11868 + }, + { + "epoch": 32.34059945504087, + "grad_norm": 7.654149055480957, + "learning_rate": 1.5814632640735258e-05, + "loss": 0.4473, + "step": 11869 + }, + { + "epoch": 32.3433242506812, + "grad_norm": 9.05989933013916, + "learning_rate": 1.5813914644586218e-05, + "loss": 0.3142, + "step": 11870 + }, + { + "epoch": 32.346049046321525, + "grad_norm": 6.905852794647217, + "learning_rate": 1.5813196603158594e-05, + "loss": 0.4329, + "step": 11871 + }, + { + "epoch": 32.34877384196185, + "grad_norm": 7.0673933029174805, + "learning_rate": 1.581247851645799e-05, + "loss": 0.3491, + "step": 11872 + }, + { + "epoch": 32.35149863760218, + "grad_norm": 7.70352840423584, + "learning_rate": 1.5811760384489983e-05, + "loss": 0.2582, + "step": 11873 + }, + { + "epoch": 32.35422343324251, + "grad_norm": 12.85704517364502, + "learning_rate": 1.581104220726018e-05, + "loss": 0.4186, + "step": 11874 + }, + { + "epoch": 32.356948228882835, + "grad_norm": 8.48851490020752, + "learning_rate": 1.581032398477416e-05, + "loss": 0.3688, + "step": 11875 + }, + { + "epoch": 32.35967302452316, + "grad_norm": 5.9951934814453125, + "learning_rate": 1.580960571703753e-05, + "loss": 0.3363, + "step": 11876 + }, + { + "epoch": 32.36239782016349, + "grad_norm": 6.69450044631958, + "learning_rate": 1.5808887404055876e-05, + "loss": 0.3303, + "step": 11877 + }, + { + "epoch": 32.36512261580381, + "grad_norm": 9.448138236999512, + "learning_rate": 1.580816904583479e-05, + "loss": 0.4879, + "step": 11878 + }, + { + "epoch": 32.36784741144414, + "grad_norm": 6.074221134185791, + "learning_rate": 1.5807450642379874e-05, + "loss": 0.2635, + "step": 11879 + }, + { + "epoch": 32.37057220708447, + "grad_norm": 8.59503173828125, + "learning_rate": 1.580673219369672e-05, + "loss": 0.3106, + "step": 11880 + }, + { + "epoch": 32.3732970027248, + "grad_norm": 9.456225395202637, + "learning_rate": 1.580601369979092e-05, + "loss": 0.42, + "step": 11881 + }, + { + "epoch": 32.37602179836512, + "grad_norm": 6.988005638122559, + "learning_rate": 1.5805295160668075e-05, + "loss": 0.4572, + "step": 11882 + }, + { + "epoch": 32.37874659400545, + "grad_norm": 15.075167655944824, + "learning_rate": 1.5804576576333776e-05, + "loss": 0.3986, + "step": 11883 + }, + { + "epoch": 32.381471389645775, + "grad_norm": 7.345865249633789, + "learning_rate": 1.580385794679362e-05, + "loss": 0.4762, + "step": 11884 + }, + { + "epoch": 32.3841961852861, + "grad_norm": 5.510758876800537, + "learning_rate": 1.580313927205321e-05, + "loss": 0.437, + "step": 11885 + }, + { + "epoch": 32.38692098092643, + "grad_norm": 7.573642253875732, + "learning_rate": 1.5802420552118133e-05, + "loss": 0.3484, + "step": 11886 + }, + { + "epoch": 32.38964577656676, + "grad_norm": 7.1016011238098145, + "learning_rate": 1.5801701786993992e-05, + "loss": 0.5948, + "step": 11887 + }, + { + "epoch": 32.392370572207085, + "grad_norm": 7.032326698303223, + "learning_rate": 1.5800982976686387e-05, + "loss": 0.3499, + "step": 11888 + }, + { + "epoch": 32.39509536784741, + "grad_norm": 7.155482292175293, + "learning_rate": 1.580026412120091e-05, + "loss": 0.4247, + "step": 11889 + }, + { + "epoch": 32.39782016348774, + "grad_norm": 6.175853729248047, + "learning_rate": 1.5799545220543168e-05, + "loss": 0.3085, + "step": 11890 + }, + { + "epoch": 32.40054495912806, + "grad_norm": 9.193768501281738, + "learning_rate": 1.579882627471875e-05, + "loss": 0.33, + "step": 11891 + }, + { + "epoch": 32.403269754768395, + "grad_norm": 7.0792388916015625, + "learning_rate": 1.5798107283733265e-05, + "loss": 0.3567, + "step": 11892 + }, + { + "epoch": 32.40599455040872, + "grad_norm": 6.419934272766113, + "learning_rate": 1.5797388247592304e-05, + "loss": 0.3961, + "step": 11893 + }, + { + "epoch": 32.40871934604905, + "grad_norm": 6.680984973907471, + "learning_rate": 1.5796669166301468e-05, + "loss": 0.4934, + "step": 11894 + }, + { + "epoch": 32.41144414168937, + "grad_norm": 9.507497787475586, + "learning_rate": 1.579595003986636e-05, + "loss": 0.346, + "step": 11895 + }, + { + "epoch": 32.4141689373297, + "grad_norm": 7.483531951904297, + "learning_rate": 1.5795230868292576e-05, + "loss": 0.4828, + "step": 11896 + }, + { + "epoch": 32.416893732970024, + "grad_norm": 6.597445487976074, + "learning_rate": 1.5794511651585725e-05, + "loss": 0.3551, + "step": 11897 + }, + { + "epoch": 32.41961852861036, + "grad_norm": 7.840703964233398, + "learning_rate": 1.5793792389751402e-05, + "loss": 0.3699, + "step": 11898 + }, + { + "epoch": 32.42234332425068, + "grad_norm": 6.960693836212158, + "learning_rate": 1.5793073082795213e-05, + "loss": 0.3769, + "step": 11899 + }, + { + "epoch": 32.42506811989101, + "grad_norm": 12.177355766296387, + "learning_rate": 1.5792353730722757e-05, + "loss": 0.3799, + "step": 11900 + }, + { + "epoch": 32.427792915531334, + "grad_norm": 8.627708435058594, + "learning_rate": 1.5791634333539632e-05, + "loss": 0.4571, + "step": 11901 + }, + { + "epoch": 32.43051771117166, + "grad_norm": 7.5197434425354, + "learning_rate": 1.5790914891251448e-05, + "loss": 0.4738, + "step": 11902 + }, + { + "epoch": 32.433242506811986, + "grad_norm": 9.005895614624023, + "learning_rate": 1.5790195403863808e-05, + "loss": 0.3651, + "step": 11903 + }, + { + "epoch": 32.43596730245232, + "grad_norm": 8.538691520690918, + "learning_rate": 1.578947587138231e-05, + "loss": 0.3392, + "step": 11904 + }, + { + "epoch": 32.438692098092645, + "grad_norm": 7.353978633880615, + "learning_rate": 1.578875629381256e-05, + "loss": 0.3974, + "step": 11905 + }, + { + "epoch": 32.44141689373297, + "grad_norm": 8.60916519165039, + "learning_rate": 1.5788036671160163e-05, + "loss": 0.3304, + "step": 11906 + }, + { + "epoch": 32.444141689373296, + "grad_norm": 6.569250583648682, + "learning_rate": 1.578731700343072e-05, + "loss": 0.4344, + "step": 11907 + }, + { + "epoch": 32.44686648501362, + "grad_norm": 7.190419673919678, + "learning_rate": 1.5786597290629843e-05, + "loss": 0.2899, + "step": 11908 + }, + { + "epoch": 32.44959128065395, + "grad_norm": 7.1112141609191895, + "learning_rate": 1.5785877532763132e-05, + "loss": 0.4316, + "step": 11909 + }, + { + "epoch": 32.45231607629428, + "grad_norm": 6.34969425201416, + "learning_rate": 1.578515772983619e-05, + "loss": 0.3689, + "step": 11910 + }, + { + "epoch": 32.45504087193461, + "grad_norm": 8.304433822631836, + "learning_rate": 1.5784437881854626e-05, + "loss": 0.4647, + "step": 11911 + }, + { + "epoch": 32.45776566757493, + "grad_norm": 27.573606491088867, + "learning_rate": 1.578371798882405e-05, + "loss": 0.4462, + "step": 11912 + }, + { + "epoch": 32.46049046321526, + "grad_norm": 5.862417697906494, + "learning_rate": 1.578299805075006e-05, + "loss": 0.4507, + "step": 11913 + }, + { + "epoch": 32.463215258855584, + "grad_norm": 9.314671516418457, + "learning_rate": 1.5782278067638267e-05, + "loss": 0.4748, + "step": 11914 + }, + { + "epoch": 32.46594005449591, + "grad_norm": 6.722378253936768, + "learning_rate": 1.5781558039494283e-05, + "loss": 0.3104, + "step": 11915 + }, + { + "epoch": 32.46866485013624, + "grad_norm": 8.106048583984375, + "learning_rate": 1.578083796632371e-05, + "loss": 0.4258, + "step": 11916 + }, + { + "epoch": 32.47138964577657, + "grad_norm": 8.299581527709961, + "learning_rate": 1.5780117848132154e-05, + "loss": 0.438, + "step": 11917 + }, + { + "epoch": 32.474114441416894, + "grad_norm": 7.841410160064697, + "learning_rate": 1.5779397684925226e-05, + "loss": 0.3873, + "step": 11918 + }, + { + "epoch": 32.47683923705722, + "grad_norm": 6.277518272399902, + "learning_rate": 1.5778677476708536e-05, + "loss": 0.2712, + "step": 11919 + }, + { + "epoch": 32.479564032697546, + "grad_norm": 6.815647125244141, + "learning_rate": 1.577795722348769e-05, + "loss": 0.2715, + "step": 11920 + }, + { + "epoch": 32.48228882833787, + "grad_norm": 7.107115745544434, + "learning_rate": 1.5777236925268306e-05, + "loss": 0.441, + "step": 11921 + }, + { + "epoch": 32.485013623978205, + "grad_norm": 6.531349182128906, + "learning_rate": 1.577651658205598e-05, + "loss": 0.5261, + "step": 11922 + }, + { + "epoch": 32.48773841961853, + "grad_norm": 6.629528999328613, + "learning_rate": 1.5775796193856332e-05, + "loss": 0.293, + "step": 11923 + }, + { + "epoch": 32.490463215258856, + "grad_norm": 7.79941987991333, + "learning_rate": 1.5775075760674966e-05, + "loss": 0.3395, + "step": 11924 + }, + { + "epoch": 32.49318801089918, + "grad_norm": 7.020432949066162, + "learning_rate": 1.57743552825175e-05, + "loss": 0.4031, + "step": 11925 + }, + { + "epoch": 32.49591280653951, + "grad_norm": 6.841043472290039, + "learning_rate": 1.5773634759389537e-05, + "loss": 0.2846, + "step": 11926 + }, + { + "epoch": 32.49863760217983, + "grad_norm": 7.659816265106201, + "learning_rate": 1.5772914191296697e-05, + "loss": 0.3821, + "step": 11927 + }, + { + "epoch": 32.50136239782017, + "grad_norm": 7.213796138763428, + "learning_rate": 1.577219357824458e-05, + "loss": 0.3698, + "step": 11928 + }, + { + "epoch": 32.50408719346049, + "grad_norm": 5.5160369873046875, + "learning_rate": 1.577147292023881e-05, + "loss": 0.4213, + "step": 11929 + }, + { + "epoch": 32.50681198910082, + "grad_norm": 7.902105808258057, + "learning_rate": 1.5770752217284995e-05, + "loss": 0.4316, + "step": 11930 + }, + { + "epoch": 32.509536784741144, + "grad_norm": 6.753303527832031, + "learning_rate": 1.5770031469388747e-05, + "loss": 0.4515, + "step": 11931 + }, + { + "epoch": 32.51226158038147, + "grad_norm": 7.130935192108154, + "learning_rate": 1.576931067655568e-05, + "loss": 0.3441, + "step": 11932 + }, + { + "epoch": 32.514986376021795, + "grad_norm": 8.129018783569336, + "learning_rate": 1.5768589838791405e-05, + "loss": 0.2713, + "step": 11933 + }, + { + "epoch": 32.51771117166213, + "grad_norm": 7.047908782958984, + "learning_rate": 1.576786895610154e-05, + "loss": 0.3265, + "step": 11934 + }, + { + "epoch": 32.520435967302454, + "grad_norm": 7.914534568786621, + "learning_rate": 1.5767148028491696e-05, + "loss": 0.3427, + "step": 11935 + }, + { + "epoch": 32.52316076294278, + "grad_norm": 11.322606086730957, + "learning_rate": 1.5766427055967488e-05, + "loss": 0.3063, + "step": 11936 + }, + { + "epoch": 32.525885558583106, + "grad_norm": 12.04789924621582, + "learning_rate": 1.5765706038534534e-05, + "loss": 0.4918, + "step": 11937 + }, + { + "epoch": 32.52861035422343, + "grad_norm": 8.268314361572266, + "learning_rate": 1.5764984976198447e-05, + "loss": 0.4151, + "step": 11938 + }, + { + "epoch": 32.53133514986376, + "grad_norm": 5.861069202423096, + "learning_rate": 1.576426386896484e-05, + "loss": 0.3702, + "step": 11939 + }, + { + "epoch": 32.53405994550409, + "grad_norm": 6.333064556121826, + "learning_rate": 1.5763542716839332e-05, + "loss": 0.3506, + "step": 11940 + }, + { + "epoch": 32.536784741144416, + "grad_norm": 8.839204788208008, + "learning_rate": 1.576282151982754e-05, + "loss": 0.3522, + "step": 11941 + }, + { + "epoch": 32.53950953678474, + "grad_norm": 7.407595634460449, + "learning_rate": 1.576210027793508e-05, + "loss": 0.4851, + "step": 11942 + }, + { + "epoch": 32.54223433242507, + "grad_norm": 7.629887580871582, + "learning_rate": 1.5761378991167568e-05, + "loss": 0.4349, + "step": 11943 + }, + { + "epoch": 32.54495912806539, + "grad_norm": 8.962532043457031, + "learning_rate": 1.5760657659530622e-05, + "loss": 0.4535, + "step": 11944 + }, + { + "epoch": 32.54768392370572, + "grad_norm": 6.943212509155273, + "learning_rate": 1.575993628302986e-05, + "loss": 0.4005, + "step": 11945 + }, + { + "epoch": 32.55040871934605, + "grad_norm": 8.85571575164795, + "learning_rate": 1.5759214861670894e-05, + "loss": 0.3887, + "step": 11946 + }, + { + "epoch": 32.55313351498638, + "grad_norm": 7.18424654006958, + "learning_rate": 1.5758493395459353e-05, + "loss": 0.4333, + "step": 11947 + }, + { + "epoch": 32.555858310626704, + "grad_norm": 6.862495422363281, + "learning_rate": 1.5757771884400853e-05, + "loss": 0.3755, + "step": 11948 + }, + { + "epoch": 32.55858310626703, + "grad_norm": 12.841184616088867, + "learning_rate": 1.5757050328501005e-05, + "loss": 0.4854, + "step": 11949 + }, + { + "epoch": 32.561307901907355, + "grad_norm": 6.726277828216553, + "learning_rate": 1.5756328727765443e-05, + "loss": 0.3418, + "step": 11950 + }, + { + "epoch": 32.56403269754768, + "grad_norm": 7.365610122680664, + "learning_rate": 1.575560708219977e-05, + "loss": 0.388, + "step": 11951 + }, + { + "epoch": 32.566757493188014, + "grad_norm": 8.58881664276123, + "learning_rate": 1.5754885391809618e-05, + "loss": 0.5242, + "step": 11952 + }, + { + "epoch": 32.56948228882834, + "grad_norm": 7.2528533935546875, + "learning_rate": 1.5754163656600602e-05, + "loss": 0.3458, + "step": 11953 + }, + { + "epoch": 32.572207084468666, + "grad_norm": 7.158148288726807, + "learning_rate": 1.5753441876578347e-05, + "loss": 0.4552, + "step": 11954 + }, + { + "epoch": 32.57493188010899, + "grad_norm": 8.406827926635742, + "learning_rate": 1.575272005174847e-05, + "loss": 0.3913, + "step": 11955 + }, + { + "epoch": 32.57765667574932, + "grad_norm": 6.260662078857422, + "learning_rate": 1.5751998182116595e-05, + "loss": 0.4446, + "step": 11956 + }, + { + "epoch": 32.58038147138964, + "grad_norm": 6.576188087463379, + "learning_rate": 1.575127626768834e-05, + "loss": 0.4244, + "step": 11957 + }, + { + "epoch": 32.583106267029976, + "grad_norm": 7.728090763092041, + "learning_rate": 1.5750554308469337e-05, + "loss": 0.3572, + "step": 11958 + }, + { + "epoch": 32.5858310626703, + "grad_norm": 10.058018684387207, + "learning_rate": 1.5749832304465197e-05, + "loss": 0.3777, + "step": 11959 + }, + { + "epoch": 32.58855585831063, + "grad_norm": 9.505508422851562, + "learning_rate": 1.574911025568155e-05, + "loss": 0.3886, + "step": 11960 + }, + { + "epoch": 32.59128065395095, + "grad_norm": 10.549141883850098, + "learning_rate": 1.5748388162124017e-05, + "loss": 0.3792, + "step": 11961 + }, + { + "epoch": 32.59400544959128, + "grad_norm": 6.701169490814209, + "learning_rate": 1.5747666023798226e-05, + "loss": 0.3253, + "step": 11962 + }, + { + "epoch": 32.596730245231605, + "grad_norm": 7.991512775421143, + "learning_rate": 1.5746943840709786e-05, + "loss": 0.2688, + "step": 11963 + }, + { + "epoch": 32.59945504087194, + "grad_norm": 7.135027885437012, + "learning_rate": 1.5746221612864342e-05, + "loss": 0.3714, + "step": 11964 + }, + { + "epoch": 32.60217983651226, + "grad_norm": 9.023070335388184, + "learning_rate": 1.5745499340267508e-05, + "loss": 0.5009, + "step": 11965 + }, + { + "epoch": 32.60490463215259, + "grad_norm": 6.113072395324707, + "learning_rate": 1.574477702292491e-05, + "loss": 0.4158, + "step": 11966 + }, + { + "epoch": 32.607629427792915, + "grad_norm": 6.196746349334717, + "learning_rate": 1.574405466084217e-05, + "loss": 0.2893, + "step": 11967 + }, + { + "epoch": 32.61035422343324, + "grad_norm": 7.036569595336914, + "learning_rate": 1.574333225402492e-05, + "loss": 0.3227, + "step": 11968 + }, + { + "epoch": 32.61307901907357, + "grad_norm": 9.898079872131348, + "learning_rate": 1.5742609802478782e-05, + "loss": 0.2725, + "step": 11969 + }, + { + "epoch": 32.6158038147139, + "grad_norm": 9.416449546813965, + "learning_rate": 1.5741887306209383e-05, + "loss": 0.5483, + "step": 11970 + }, + { + "epoch": 32.618528610354225, + "grad_norm": 12.58320426940918, + "learning_rate": 1.574116476522235e-05, + "loss": 0.3538, + "step": 11971 + }, + { + "epoch": 32.62125340599455, + "grad_norm": 9.070144653320312, + "learning_rate": 1.5740442179523315e-05, + "loss": 0.4606, + "step": 11972 + }, + { + "epoch": 32.62397820163488, + "grad_norm": 12.15832805633545, + "learning_rate": 1.5739719549117897e-05, + "loss": 0.3821, + "step": 11973 + }, + { + "epoch": 32.6267029972752, + "grad_norm": 7.7303547859191895, + "learning_rate": 1.5738996874011728e-05, + "loss": 0.3867, + "step": 11974 + }, + { + "epoch": 32.62942779291553, + "grad_norm": 11.707273483276367, + "learning_rate": 1.573827415421044e-05, + "loss": 0.4366, + "step": 11975 + }, + { + "epoch": 32.63215258855586, + "grad_norm": 6.971134662628174, + "learning_rate": 1.5737551389719655e-05, + "loss": 0.4473, + "step": 11976 + }, + { + "epoch": 32.63487738419619, + "grad_norm": 7.204379081726074, + "learning_rate": 1.5736828580545003e-05, + "loss": 0.2962, + "step": 11977 + }, + { + "epoch": 32.63760217983651, + "grad_norm": 7.457752704620361, + "learning_rate": 1.5736105726692117e-05, + "loss": 0.3885, + "step": 11978 + }, + { + "epoch": 32.64032697547684, + "grad_norm": 6.843810081481934, + "learning_rate": 1.5735382828166623e-05, + "loss": 0.5171, + "step": 11979 + }, + { + "epoch": 32.643051771117165, + "grad_norm": 7.744211673736572, + "learning_rate": 1.573465988497415e-05, + "loss": 0.4914, + "step": 11980 + }, + { + "epoch": 32.64577656675749, + "grad_norm": 8.346298217773438, + "learning_rate": 1.5733936897120333e-05, + "loss": 0.3502, + "step": 11981 + }, + { + "epoch": 32.64850136239782, + "grad_norm": 10.77584457397461, + "learning_rate": 1.57332138646108e-05, + "loss": 0.3922, + "step": 11982 + }, + { + "epoch": 32.65122615803815, + "grad_norm": 6.4791693687438965, + "learning_rate": 1.573249078745118e-05, + "loss": 0.4125, + "step": 11983 + }, + { + "epoch": 32.653950953678475, + "grad_norm": 10.286407470703125, + "learning_rate": 1.573176766564711e-05, + "loss": 0.4296, + "step": 11984 + }, + { + "epoch": 32.6566757493188, + "grad_norm": 7.827480316162109, + "learning_rate": 1.5731044499204213e-05, + "loss": 0.4174, + "step": 11985 + }, + { + "epoch": 32.65940054495913, + "grad_norm": 7.769915580749512, + "learning_rate": 1.5730321288128128e-05, + "loss": 0.292, + "step": 11986 + }, + { + "epoch": 32.66212534059945, + "grad_norm": 7.813076972961426, + "learning_rate": 1.5729598032424486e-05, + "loss": 0.4645, + "step": 11987 + }, + { + "epoch": 32.664850136239785, + "grad_norm": 7.816955089569092, + "learning_rate": 1.572887473209892e-05, + "loss": 0.3946, + "step": 11988 + }, + { + "epoch": 32.66757493188011, + "grad_norm": 7.383937835693359, + "learning_rate": 1.572815138715706e-05, + "loss": 0.4445, + "step": 11989 + }, + { + "epoch": 32.67029972752044, + "grad_norm": 11.780363082885742, + "learning_rate": 1.5727427997604545e-05, + "loss": 0.3294, + "step": 11990 + }, + { + "epoch": 32.67302452316076, + "grad_norm": 10.708660125732422, + "learning_rate": 1.5726704563446998e-05, + "loss": 0.2985, + "step": 11991 + }, + { + "epoch": 32.67574931880109, + "grad_norm": 8.770447731018066, + "learning_rate": 1.5725981084690067e-05, + "loss": 0.3227, + "step": 11992 + }, + { + "epoch": 32.678474114441414, + "grad_norm": 8.673264503479004, + "learning_rate": 1.5725257561339375e-05, + "loss": 0.4449, + "step": 11993 + }, + { + "epoch": 32.68119891008175, + "grad_norm": 9.200652122497559, + "learning_rate": 1.5724533993400564e-05, + "loss": 0.3591, + "step": 11994 + }, + { + "epoch": 32.68392370572207, + "grad_norm": 7.240207195281982, + "learning_rate": 1.572381038087927e-05, + "loss": 0.5212, + "step": 11995 + }, + { + "epoch": 32.6866485013624, + "grad_norm": 9.379121780395508, + "learning_rate": 1.5723086723781116e-05, + "loss": 0.3761, + "step": 11996 + }, + { + "epoch": 32.689373297002724, + "grad_norm": 6.244917392730713, + "learning_rate": 1.572236302211175e-05, + "loss": 0.2638, + "step": 11997 + }, + { + "epoch": 32.69209809264305, + "grad_norm": 8.620534896850586, + "learning_rate": 1.5721639275876807e-05, + "loss": 0.3557, + "step": 11998 + }, + { + "epoch": 32.694822888283376, + "grad_norm": 8.94057559967041, + "learning_rate": 1.5720915485081923e-05, + "loss": 0.3119, + "step": 11999 + }, + { + "epoch": 32.69754768392371, + "grad_norm": 15.445932388305664, + "learning_rate": 1.572019164973273e-05, + "loss": 0.3889, + "step": 12000 + }, + { + "epoch": 32.700272479564035, + "grad_norm": 7.084281921386719, + "learning_rate": 1.571946776983487e-05, + "loss": 0.3085, + "step": 12001 + }, + { + "epoch": 32.70299727520436, + "grad_norm": 6.626097679138184, + "learning_rate": 1.571874384539398e-05, + "loss": 0.3419, + "step": 12002 + }, + { + "epoch": 32.705722070844686, + "grad_norm": 6.412007808685303, + "learning_rate": 1.5718019876415696e-05, + "loss": 0.473, + "step": 12003 + }, + { + "epoch": 32.70844686648501, + "grad_norm": 8.777931213378906, + "learning_rate": 1.571729586290566e-05, + "loss": 0.4618, + "step": 12004 + }, + { + "epoch": 32.71117166212534, + "grad_norm": 7.052206039428711, + "learning_rate": 1.5716571804869502e-05, + "loss": 0.3517, + "step": 12005 + }, + { + "epoch": 32.71389645776567, + "grad_norm": 7.550273895263672, + "learning_rate": 1.571584770231287e-05, + "loss": 0.5114, + "step": 12006 + }, + { + "epoch": 32.716621253406, + "grad_norm": 8.385041236877441, + "learning_rate": 1.5715123555241397e-05, + "loss": 0.4684, + "step": 12007 + }, + { + "epoch": 32.71934604904632, + "grad_norm": 7.535192966461182, + "learning_rate": 1.571439936366073e-05, + "loss": 0.5306, + "step": 12008 + }, + { + "epoch": 32.72207084468665, + "grad_norm": 6.882071495056152, + "learning_rate": 1.5713675127576504e-05, + "loss": 0.5009, + "step": 12009 + }, + { + "epoch": 32.724795640326974, + "grad_norm": 9.158919334411621, + "learning_rate": 1.571295084699436e-05, + "loss": 0.4095, + "step": 12010 + }, + { + "epoch": 32.7275204359673, + "grad_norm": 7.361640930175781, + "learning_rate": 1.5712226521919936e-05, + "loss": 0.4253, + "step": 12011 + }, + { + "epoch": 32.73024523160763, + "grad_norm": 7.760611534118652, + "learning_rate": 1.5711502152358878e-05, + "loss": 0.3644, + "step": 12012 + }, + { + "epoch": 32.73297002724796, + "grad_norm": 6.2527756690979, + "learning_rate": 1.5710777738316827e-05, + "loss": 0.3277, + "step": 12013 + }, + { + "epoch": 32.735694822888284, + "grad_norm": 8.708322525024414, + "learning_rate": 1.5710053279799416e-05, + "loss": 0.455, + "step": 12014 + }, + { + "epoch": 32.73841961852861, + "grad_norm": 10.21238899230957, + "learning_rate": 1.5709328776812302e-05, + "loss": 0.4052, + "step": 12015 + }, + { + "epoch": 32.741144414168936, + "grad_norm": 8.482315063476562, + "learning_rate": 1.5708604229361115e-05, + "loss": 0.3911, + "step": 12016 + }, + { + "epoch": 32.74386920980926, + "grad_norm": 7.245648384094238, + "learning_rate": 1.5707879637451502e-05, + "loss": 0.4201, + "step": 12017 + }, + { + "epoch": 32.746594005449595, + "grad_norm": 9.180356979370117, + "learning_rate": 1.5707155001089106e-05, + "loss": 0.4395, + "step": 12018 + }, + { + "epoch": 32.74931880108992, + "grad_norm": 9.307323455810547, + "learning_rate": 1.570643032027957e-05, + "loss": 0.3676, + "step": 12019 + }, + { + "epoch": 32.752043596730246, + "grad_norm": 7.687534809112549, + "learning_rate": 1.570570559502854e-05, + "loss": 0.3707, + "step": 12020 + }, + { + "epoch": 32.75476839237057, + "grad_norm": 6.333620071411133, + "learning_rate": 1.570498082534166e-05, + "loss": 0.4487, + "step": 12021 + }, + { + "epoch": 32.7574931880109, + "grad_norm": 6.845382213592529, + "learning_rate": 1.570425601122457e-05, + "loss": 0.3813, + "step": 12022 + }, + { + "epoch": 32.76021798365122, + "grad_norm": 6.706961154937744, + "learning_rate": 1.5703531152682918e-05, + "loss": 0.466, + "step": 12023 + }, + { + "epoch": 32.762942779291556, + "grad_norm": 8.425186157226562, + "learning_rate": 1.570280624972235e-05, + "loss": 0.4315, + "step": 12024 + }, + { + "epoch": 32.76566757493188, + "grad_norm": 7.779570579528809, + "learning_rate": 1.570208130234851e-05, + "loss": 0.3782, + "step": 12025 + }, + { + "epoch": 32.76839237057221, + "grad_norm": 39.01546096801758, + "learning_rate": 1.5701356310567044e-05, + "loss": 0.3603, + "step": 12026 + }, + { + "epoch": 32.771117166212534, + "grad_norm": 8.052181243896484, + "learning_rate": 1.57006312743836e-05, + "loss": 0.5454, + "step": 12027 + }, + { + "epoch": 32.77384196185286, + "grad_norm": 8.000152587890625, + "learning_rate": 1.569990619380382e-05, + "loss": 0.2993, + "step": 12028 + }, + { + "epoch": 32.776566757493185, + "grad_norm": 8.588805198669434, + "learning_rate": 1.5699181068833355e-05, + "loss": 0.3774, + "step": 12029 + }, + { + "epoch": 32.77929155313352, + "grad_norm": 6.751492023468018, + "learning_rate": 1.5698455899477852e-05, + "loss": 0.3899, + "step": 12030 + }, + { + "epoch": 32.782016348773844, + "grad_norm": 6.409905433654785, + "learning_rate": 1.569773068574296e-05, + "loss": 0.2914, + "step": 12031 + }, + { + "epoch": 32.78474114441417, + "grad_norm": 7.139047145843506, + "learning_rate": 1.5697005427634324e-05, + "loss": 0.331, + "step": 12032 + }, + { + "epoch": 32.787465940054496, + "grad_norm": 6.8841094970703125, + "learning_rate": 1.569628012515759e-05, + "loss": 0.3943, + "step": 12033 + }, + { + "epoch": 32.79019073569482, + "grad_norm": 8.627446174621582, + "learning_rate": 1.5695554778318413e-05, + "loss": 0.534, + "step": 12034 + }, + { + "epoch": 32.79291553133515, + "grad_norm": 7.6862311363220215, + "learning_rate": 1.5694829387122436e-05, + "loss": 0.28, + "step": 12035 + }, + { + "epoch": 32.79564032697548, + "grad_norm": 9.490158081054688, + "learning_rate": 1.5694103951575313e-05, + "loss": 0.4632, + "step": 12036 + }, + { + "epoch": 32.798365122615806, + "grad_norm": 6.376895904541016, + "learning_rate": 1.5693378471682688e-05, + "loss": 0.3123, + "step": 12037 + }, + { + "epoch": 32.80108991825613, + "grad_norm": 8.53414535522461, + "learning_rate": 1.569265294745022e-05, + "loss": 0.5134, + "step": 12038 + }, + { + "epoch": 32.80381471389646, + "grad_norm": 8.084589004516602, + "learning_rate": 1.5691927378883555e-05, + "loss": 0.4007, + "step": 12039 + }, + { + "epoch": 32.80653950953678, + "grad_norm": 9.008152961730957, + "learning_rate": 1.5691201765988336e-05, + "loss": 0.4251, + "step": 12040 + }, + { + "epoch": 32.80926430517711, + "grad_norm": 7.938703536987305, + "learning_rate": 1.5690476108770224e-05, + "loss": 0.5161, + "step": 12041 + }, + { + "epoch": 32.81198910081744, + "grad_norm": 8.03249454498291, + "learning_rate": 1.568975040723487e-05, + "loss": 0.3499, + "step": 12042 + }, + { + "epoch": 32.81471389645777, + "grad_norm": 8.85582447052002, + "learning_rate": 1.568902466138792e-05, + "loss": 0.4211, + "step": 12043 + }, + { + "epoch": 32.817438692098094, + "grad_norm": 7.650516033172607, + "learning_rate": 1.5688298871235028e-05, + "loss": 0.445, + "step": 12044 + }, + { + "epoch": 32.82016348773842, + "grad_norm": 7.037267208099365, + "learning_rate": 1.568757303678185e-05, + "loss": 0.3871, + "step": 12045 + }, + { + "epoch": 32.822888283378745, + "grad_norm": 8.33869743347168, + "learning_rate": 1.5686847158034036e-05, + "loss": 0.4173, + "step": 12046 + }, + { + "epoch": 32.82561307901907, + "grad_norm": 9.3466796875, + "learning_rate": 1.568612123499724e-05, + "loss": 0.4705, + "step": 12047 + }, + { + "epoch": 32.828337874659404, + "grad_norm": 7.2523417472839355, + "learning_rate": 1.5685395267677113e-05, + "loss": 0.4606, + "step": 12048 + }, + { + "epoch": 32.83106267029973, + "grad_norm": 7.06911563873291, + "learning_rate": 1.568466925607931e-05, + "loss": 0.4572, + "step": 12049 + }, + { + "epoch": 32.833787465940055, + "grad_norm": 8.29034423828125, + "learning_rate": 1.5683943200209486e-05, + "loss": 0.347, + "step": 12050 + }, + { + "epoch": 32.83651226158038, + "grad_norm": 7.922194480895996, + "learning_rate": 1.56832171000733e-05, + "loss": 0.4034, + "step": 12051 + }, + { + "epoch": 32.83923705722071, + "grad_norm": 7.565577030181885, + "learning_rate": 1.5682490955676395e-05, + "loss": 0.3679, + "step": 12052 + }, + { + "epoch": 32.84196185286103, + "grad_norm": 8.645038604736328, + "learning_rate": 1.5681764767024435e-05, + "loss": 0.42, + "step": 12053 + }, + { + "epoch": 32.844686648501366, + "grad_norm": 7.09843111038208, + "learning_rate": 1.5681038534123078e-05, + "loss": 0.5084, + "step": 12054 + }, + { + "epoch": 32.84741144414169, + "grad_norm": 8.0593843460083, + "learning_rate": 1.5680312256977974e-05, + "loss": 0.3346, + "step": 12055 + }, + { + "epoch": 32.85013623978202, + "grad_norm": 5.948692798614502, + "learning_rate": 1.5679585935594782e-05, + "loss": 0.493, + "step": 12056 + }, + { + "epoch": 32.85286103542234, + "grad_norm": 6.850461959838867, + "learning_rate": 1.5678859569979154e-05, + "loss": 0.3345, + "step": 12057 + }, + { + "epoch": 32.85558583106267, + "grad_norm": 6.771362781524658, + "learning_rate": 1.5678133160136754e-05, + "loss": 0.4419, + "step": 12058 + }, + { + "epoch": 32.858310626702995, + "grad_norm": 7.2968878746032715, + "learning_rate": 1.5677406706073234e-05, + "loss": 0.3654, + "step": 12059 + }, + { + "epoch": 32.86103542234333, + "grad_norm": 6.3690643310546875, + "learning_rate": 1.5676680207794252e-05, + "loss": 0.3576, + "step": 12060 + }, + { + "epoch": 32.86376021798365, + "grad_norm": 7.52684211730957, + "learning_rate": 1.567595366530547e-05, + "loss": 0.6186, + "step": 12061 + }, + { + "epoch": 32.86648501362398, + "grad_norm": 6.275260925292969, + "learning_rate": 1.567522707861254e-05, + "loss": 0.5436, + "step": 12062 + }, + { + "epoch": 32.869209809264305, + "grad_norm": 7.670266628265381, + "learning_rate": 1.567450044772113e-05, + "loss": 0.5059, + "step": 12063 + }, + { + "epoch": 32.87193460490463, + "grad_norm": 7.877997875213623, + "learning_rate": 1.5673773772636887e-05, + "loss": 0.4254, + "step": 12064 + }, + { + "epoch": 32.87465940054496, + "grad_norm": 7.987328052520752, + "learning_rate": 1.567304705336548e-05, + "loss": 0.3008, + "step": 12065 + }, + { + "epoch": 32.87738419618529, + "grad_norm": 6.786599159240723, + "learning_rate": 1.567232028991256e-05, + "loss": 0.4849, + "step": 12066 + }, + { + "epoch": 32.880108991825615, + "grad_norm": 7.205345630645752, + "learning_rate": 1.5671593482283797e-05, + "loss": 0.3793, + "step": 12067 + }, + { + "epoch": 32.88283378746594, + "grad_norm": 8.275880813598633, + "learning_rate": 1.5670866630484847e-05, + "loss": 0.4988, + "step": 12068 + }, + { + "epoch": 32.88555858310627, + "grad_norm": 6.805363655090332, + "learning_rate": 1.567013973452137e-05, + "loss": 0.3616, + "step": 12069 + }, + { + "epoch": 32.88828337874659, + "grad_norm": 7.106833457946777, + "learning_rate": 1.5669412794399027e-05, + "loss": 0.5326, + "step": 12070 + }, + { + "epoch": 32.89100817438692, + "grad_norm": 9.400209426879883, + "learning_rate": 1.5668685810123477e-05, + "loss": 0.472, + "step": 12071 + }, + { + "epoch": 32.89373297002725, + "grad_norm": 8.801173210144043, + "learning_rate": 1.5667958781700386e-05, + "loss": 0.3932, + "step": 12072 + }, + { + "epoch": 32.89645776566758, + "grad_norm": 7.403770446777344, + "learning_rate": 1.5667231709135414e-05, + "loss": 0.4413, + "step": 12073 + }, + { + "epoch": 32.8991825613079, + "grad_norm": 8.15301513671875, + "learning_rate": 1.5666504592434228e-05, + "loss": 0.313, + "step": 12074 + }, + { + "epoch": 32.90190735694823, + "grad_norm": 8.188809394836426, + "learning_rate": 1.566577743160248e-05, + "loss": 0.4168, + "step": 12075 + }, + { + "epoch": 32.904632152588555, + "grad_norm": 6.774173259735107, + "learning_rate": 1.566505022664584e-05, + "loss": 0.3796, + "step": 12076 + }, + { + "epoch": 32.90735694822888, + "grad_norm": 8.598569869995117, + "learning_rate": 1.5664322977569976e-05, + "loss": 0.4853, + "step": 12077 + }, + { + "epoch": 32.91008174386921, + "grad_norm": 9.037574768066406, + "learning_rate": 1.5663595684380544e-05, + "loss": 0.3386, + "step": 12078 + }, + { + "epoch": 32.91280653950954, + "grad_norm": 8.221321105957031, + "learning_rate": 1.5662868347083213e-05, + "loss": 0.4525, + "step": 12079 + }, + { + "epoch": 32.915531335149865, + "grad_norm": 8.122885704040527, + "learning_rate": 1.5662140965683645e-05, + "loss": 0.511, + "step": 12080 + }, + { + "epoch": 32.91825613079019, + "grad_norm": 12.633194923400879, + "learning_rate": 1.5661413540187504e-05, + "loss": 0.448, + "step": 12081 + }, + { + "epoch": 32.920980926430516, + "grad_norm": 7.939639091491699, + "learning_rate": 1.566068607060046e-05, + "loss": 0.4385, + "step": 12082 + }, + { + "epoch": 32.92370572207084, + "grad_norm": 6.504891395568848, + "learning_rate": 1.565995855692817e-05, + "loss": 0.3574, + "step": 12083 + }, + { + "epoch": 32.926430517711175, + "grad_norm": 7.92395544052124, + "learning_rate": 1.5659230999176307e-05, + "loss": 0.3979, + "step": 12084 + }, + { + "epoch": 32.9291553133515, + "grad_norm": 7.3674635887146, + "learning_rate": 1.5658503397350536e-05, + "loss": 0.5131, + "step": 12085 + }, + { + "epoch": 32.93188010899183, + "grad_norm": 5.609498023986816, + "learning_rate": 1.5657775751456524e-05, + "loss": 0.3665, + "step": 12086 + }, + { + "epoch": 32.93460490463215, + "grad_norm": 11.792949676513672, + "learning_rate": 1.5657048061499932e-05, + "loss": 0.4108, + "step": 12087 + }, + { + "epoch": 32.93732970027248, + "grad_norm": 7.255577087402344, + "learning_rate": 1.5656320327486433e-05, + "loss": 0.37, + "step": 12088 + }, + { + "epoch": 32.940054495912804, + "grad_norm": 17.582035064697266, + "learning_rate": 1.5655592549421695e-05, + "loss": 0.4506, + "step": 12089 + }, + { + "epoch": 32.94277929155314, + "grad_norm": 10.486715316772461, + "learning_rate": 1.565486472731139e-05, + "loss": 0.4735, + "step": 12090 + }, + { + "epoch": 32.94550408719346, + "grad_norm": 7.075913429260254, + "learning_rate": 1.5654136861161174e-05, + "loss": 0.4352, + "step": 12091 + }, + { + "epoch": 32.94822888283379, + "grad_norm": 9.81493091583252, + "learning_rate": 1.5653408950976717e-05, + "loss": 0.3662, + "step": 12092 + }, + { + "epoch": 32.950953678474114, + "grad_norm": 11.64074420928955, + "learning_rate": 1.5652680996763702e-05, + "loss": 0.4028, + "step": 12093 + }, + { + "epoch": 32.95367847411444, + "grad_norm": 6.694557189941406, + "learning_rate": 1.5651952998527786e-05, + "loss": 0.3807, + "step": 12094 + }, + { + "epoch": 32.956403269754766, + "grad_norm": 8.660942077636719, + "learning_rate": 1.5651224956274643e-05, + "loss": 0.3384, + "step": 12095 + }, + { + "epoch": 32.95912806539509, + "grad_norm": 7.801591873168945, + "learning_rate": 1.565049687000994e-05, + "loss": 0.4241, + "step": 12096 + }, + { + "epoch": 32.961852861035425, + "grad_norm": 6.360088348388672, + "learning_rate": 1.5649768739739348e-05, + "loss": 0.5128, + "step": 12097 + }, + { + "epoch": 32.96457765667575, + "grad_norm": 5.70269775390625, + "learning_rate": 1.564904056546854e-05, + "loss": 0.3537, + "step": 12098 + }, + { + "epoch": 32.967302452316076, + "grad_norm": 7.237667560577393, + "learning_rate": 1.564831234720319e-05, + "loss": 0.4069, + "step": 12099 + }, + { + "epoch": 32.9700272479564, + "grad_norm": 9.81737232208252, + "learning_rate": 1.564758408494896e-05, + "loss": 0.5043, + "step": 12100 + }, + { + "epoch": 32.97275204359673, + "grad_norm": 6.362037181854248, + "learning_rate": 1.564685577871153e-05, + "loss": 0.4174, + "step": 12101 + }, + { + "epoch": 32.97547683923706, + "grad_norm": 6.462863922119141, + "learning_rate": 1.564612742849657e-05, + "loss": 0.4637, + "step": 12102 + }, + { + "epoch": 32.97820163487739, + "grad_norm": 12.043787956237793, + "learning_rate": 1.564539903430975e-05, + "loss": 0.4103, + "step": 12103 + }, + { + "epoch": 32.98092643051771, + "grad_norm": 7.939565181732178, + "learning_rate": 1.564467059615674e-05, + "loss": 0.4692, + "step": 12104 + }, + { + "epoch": 32.98365122615804, + "grad_norm": 8.781482696533203, + "learning_rate": 1.564394211404322e-05, + "loss": 0.3722, + "step": 12105 + }, + { + "epoch": 32.986376021798364, + "grad_norm": 8.51310920715332, + "learning_rate": 1.564321358797486e-05, + "loss": 0.4591, + "step": 12106 + }, + { + "epoch": 32.98910081743869, + "grad_norm": 5.838075160980225, + "learning_rate": 1.564248501795734e-05, + "loss": 0.4764, + "step": 12107 + }, + { + "epoch": 32.991825613079016, + "grad_norm": 6.868386745452881, + "learning_rate": 1.564175640399632e-05, + "loss": 0.3613, + "step": 12108 + }, + { + "epoch": 32.99455040871935, + "grad_norm": 6.692442417144775, + "learning_rate": 1.5641027746097484e-05, + "loss": 0.6792, + "step": 12109 + }, + { + "epoch": 32.997275204359674, + "grad_norm": 8.148579597473145, + "learning_rate": 1.564029904426651e-05, + "loss": 0.4401, + "step": 12110 + }, + { + "epoch": 33.0, + "grad_norm": 6.626377105712891, + "learning_rate": 1.5639570298509067e-05, + "loss": 0.2638, + "step": 12111 + }, + { + "epoch": 33.002724795640326, + "grad_norm": 7.323823928833008, + "learning_rate": 1.563884150883083e-05, + "loss": 0.5676, + "step": 12112 + }, + { + "epoch": 33.00544959128065, + "grad_norm": 6.628137588500977, + "learning_rate": 1.563811267523748e-05, + "loss": 0.3055, + "step": 12113 + }, + { + "epoch": 33.00817438692098, + "grad_norm": 10.509965896606445, + "learning_rate": 1.5637383797734685e-05, + "loss": 0.5372, + "step": 12114 + }, + { + "epoch": 33.01089918256131, + "grad_norm": 7.332951068878174, + "learning_rate": 1.5636654876328134e-05, + "loss": 0.3818, + "step": 12115 + }, + { + "epoch": 33.013623978201636, + "grad_norm": 5.587296009063721, + "learning_rate": 1.563592591102349e-05, + "loss": 0.4557, + "step": 12116 + }, + { + "epoch": 33.01634877384196, + "grad_norm": 7.477775573730469, + "learning_rate": 1.5635196901826436e-05, + "loss": 0.6977, + "step": 12117 + }, + { + "epoch": 33.01907356948229, + "grad_norm": 6.747099876403809, + "learning_rate": 1.563446784874265e-05, + "loss": 0.3499, + "step": 12118 + }, + { + "epoch": 33.02179836512261, + "grad_norm": 6.576713562011719, + "learning_rate": 1.5633738751777814e-05, + "loss": 0.3163, + "step": 12119 + }, + { + "epoch": 33.02452316076294, + "grad_norm": 5.987857818603516, + "learning_rate": 1.56330096109376e-05, + "loss": 0.3235, + "step": 12120 + }, + { + "epoch": 33.02724795640327, + "grad_norm": 9.134624481201172, + "learning_rate": 1.5632280426227685e-05, + "loss": 0.5594, + "step": 12121 + }, + { + "epoch": 33.0299727520436, + "grad_norm": 6.8406829833984375, + "learning_rate": 1.5631551197653756e-05, + "loss": 0.3962, + "step": 12122 + }, + { + "epoch": 33.032697547683924, + "grad_norm": 7.628662586212158, + "learning_rate": 1.5630821925221488e-05, + "loss": 0.2757, + "step": 12123 + }, + { + "epoch": 33.03542234332425, + "grad_norm": 6.215722560882568, + "learning_rate": 1.563009260893656e-05, + "loss": 0.3205, + "step": 12124 + }, + { + "epoch": 33.038147138964575, + "grad_norm": 9.666122436523438, + "learning_rate": 1.5629363248804644e-05, + "loss": 0.2663, + "step": 12125 + }, + { + "epoch": 33.0408719346049, + "grad_norm": 6.604397296905518, + "learning_rate": 1.5628633844831436e-05, + "loss": 0.3544, + "step": 12126 + }, + { + "epoch": 33.043596730245234, + "grad_norm": 5.744869232177734, + "learning_rate": 1.5627904397022605e-05, + "loss": 0.4654, + "step": 12127 + }, + { + "epoch": 33.04632152588556, + "grad_norm": 9.151631355285645, + "learning_rate": 1.5627174905383838e-05, + "loss": 0.3775, + "step": 12128 + }, + { + "epoch": 33.049046321525886, + "grad_norm": 7.482045650482178, + "learning_rate": 1.5626445369920816e-05, + "loss": 0.3073, + "step": 12129 + }, + { + "epoch": 33.05177111716621, + "grad_norm": 6.341897487640381, + "learning_rate": 1.5625715790639214e-05, + "loss": 0.3134, + "step": 12130 + }, + { + "epoch": 33.05449591280654, + "grad_norm": 8.26285457611084, + "learning_rate": 1.562498616754472e-05, + "loss": 0.4222, + "step": 12131 + }, + { + "epoch": 33.05722070844686, + "grad_norm": 7.009021282196045, + "learning_rate": 1.5624256500643016e-05, + "loss": 0.3741, + "step": 12132 + }, + { + "epoch": 33.059945504087196, + "grad_norm": 7.427831172943115, + "learning_rate": 1.5623526789939784e-05, + "loss": 0.4128, + "step": 12133 + }, + { + "epoch": 33.06267029972752, + "grad_norm": 5.852236270904541, + "learning_rate": 1.5622797035440703e-05, + "loss": 0.4782, + "step": 12134 + }, + { + "epoch": 33.06539509536785, + "grad_norm": 6.832294940948486, + "learning_rate": 1.5622067237151465e-05, + "loss": 0.2744, + "step": 12135 + }, + { + "epoch": 33.06811989100817, + "grad_norm": 6.296779155731201, + "learning_rate": 1.5621337395077742e-05, + "loss": 0.2502, + "step": 12136 + }, + { + "epoch": 33.0708446866485, + "grad_norm": 9.04610538482666, + "learning_rate": 1.5620607509225227e-05, + "loss": 0.5152, + "step": 12137 + }, + { + "epoch": 33.073569482288825, + "grad_norm": 6.3163909912109375, + "learning_rate": 1.5619877579599604e-05, + "loss": 0.4043, + "step": 12138 + }, + { + "epoch": 33.07629427792916, + "grad_norm": 6.203168869018555, + "learning_rate": 1.5619147606206552e-05, + "loss": 0.4096, + "step": 12139 + }, + { + "epoch": 33.079019073569484, + "grad_norm": 6.571667671203613, + "learning_rate": 1.561841758905176e-05, + "loss": 0.3661, + "step": 12140 + }, + { + "epoch": 33.08174386920981, + "grad_norm": 6.468061447143555, + "learning_rate": 1.5617687528140915e-05, + "loss": 0.4316, + "step": 12141 + }, + { + "epoch": 33.084468664850135, + "grad_norm": 4.98010778427124, + "learning_rate": 1.5616957423479698e-05, + "loss": 0.2972, + "step": 12142 + }, + { + "epoch": 33.08719346049046, + "grad_norm": 7.058682441711426, + "learning_rate": 1.5616227275073796e-05, + "loss": 0.3562, + "step": 12143 + }, + { + "epoch": 33.08991825613079, + "grad_norm": 5.501753807067871, + "learning_rate": 1.56154970829289e-05, + "loss": 0.4178, + "step": 12144 + }, + { + "epoch": 33.09264305177112, + "grad_norm": 6.312686920166016, + "learning_rate": 1.561476684705069e-05, + "loss": 0.2449, + "step": 12145 + }, + { + "epoch": 33.095367847411445, + "grad_norm": 6.514692783355713, + "learning_rate": 1.561403656744486e-05, + "loss": 0.2487, + "step": 12146 + }, + { + "epoch": 33.09809264305177, + "grad_norm": 7.077640056610107, + "learning_rate": 1.5613306244117092e-05, + "loss": 0.4452, + "step": 12147 + }, + { + "epoch": 33.1008174386921, + "grad_norm": 8.67483901977539, + "learning_rate": 1.5612575877073078e-05, + "loss": 0.3589, + "step": 12148 + }, + { + "epoch": 33.10354223433242, + "grad_norm": 5.831808090209961, + "learning_rate": 1.56118454663185e-05, + "loss": 0.3697, + "step": 12149 + }, + { + "epoch": 33.10626702997275, + "grad_norm": 6.515407562255859, + "learning_rate": 1.5611115011859052e-05, + "loss": 0.3438, + "step": 12150 + }, + { + "epoch": 33.10899182561308, + "grad_norm": 8.445128440856934, + "learning_rate": 1.5610384513700422e-05, + "loss": 0.3747, + "step": 12151 + }, + { + "epoch": 33.11171662125341, + "grad_norm": 11.156426429748535, + "learning_rate": 1.5609653971848296e-05, + "loss": 0.3044, + "step": 12152 + }, + { + "epoch": 33.11444141689373, + "grad_norm": 10.229217529296875, + "learning_rate": 1.5608923386308365e-05, + "loss": 0.2704, + "step": 12153 + }, + { + "epoch": 33.11716621253406, + "grad_norm": 6.33029842376709, + "learning_rate": 1.560819275708632e-05, + "loss": 0.3672, + "step": 12154 + }, + { + "epoch": 33.119891008174385, + "grad_norm": 7.576890468597412, + "learning_rate": 1.5607462084187853e-05, + "loss": 0.2351, + "step": 12155 + }, + { + "epoch": 33.12261580381471, + "grad_norm": 7.682079792022705, + "learning_rate": 1.5606731367618647e-05, + "loss": 0.3261, + "step": 12156 + }, + { + "epoch": 33.12534059945504, + "grad_norm": 6.63905668258667, + "learning_rate": 1.5606000607384402e-05, + "loss": 0.3571, + "step": 12157 + }, + { + "epoch": 33.12806539509537, + "grad_norm": 7.063698768615723, + "learning_rate": 1.56052698034908e-05, + "loss": 0.3713, + "step": 12158 + }, + { + "epoch": 33.130790190735695, + "grad_norm": 6.658858299255371, + "learning_rate": 1.5604538955943542e-05, + "loss": 0.3423, + "step": 12159 + }, + { + "epoch": 33.13351498637602, + "grad_norm": 9.059860229492188, + "learning_rate": 1.5603808064748313e-05, + "loss": 0.3508, + "step": 12160 + }, + { + "epoch": 33.13623978201635, + "grad_norm": 7.219796657562256, + "learning_rate": 1.5603077129910805e-05, + "loss": 0.3313, + "step": 12161 + }, + { + "epoch": 33.13896457765667, + "grad_norm": 11.955741882324219, + "learning_rate": 1.5602346151436715e-05, + "loss": 0.3326, + "step": 12162 + }, + { + "epoch": 33.141689373297005, + "grad_norm": 6.73663854598999, + "learning_rate": 1.5601615129331734e-05, + "loss": 0.4324, + "step": 12163 + }, + { + "epoch": 33.14441416893733, + "grad_norm": 6.877493858337402, + "learning_rate": 1.5600884063601554e-05, + "loss": 0.4032, + "step": 12164 + }, + { + "epoch": 33.14713896457766, + "grad_norm": 6.520141124725342, + "learning_rate": 1.560015295425187e-05, + "loss": 0.3725, + "step": 12165 + }, + { + "epoch": 33.14986376021798, + "grad_norm": 6.258823871612549, + "learning_rate": 1.5599421801288373e-05, + "loss": 0.3919, + "step": 12166 + }, + { + "epoch": 33.15258855585831, + "grad_norm": 6.118670463562012, + "learning_rate": 1.5598690604716763e-05, + "loss": 0.3483, + "step": 12167 + }, + { + "epoch": 33.155313351498634, + "grad_norm": 8.57835865020752, + "learning_rate": 1.5597959364542726e-05, + "loss": 0.401, + "step": 12168 + }, + { + "epoch": 33.15803814713897, + "grad_norm": 8.096592903137207, + "learning_rate": 1.559722808077196e-05, + "loss": 0.3821, + "step": 12169 + }, + { + "epoch": 33.16076294277929, + "grad_norm": 6.646443843841553, + "learning_rate": 1.559649675341017e-05, + "loss": 0.3525, + "step": 12170 + }, + { + "epoch": 33.16348773841962, + "grad_norm": 6.403456211090088, + "learning_rate": 1.5595765382463035e-05, + "loss": 0.3165, + "step": 12171 + }, + { + "epoch": 33.166212534059945, + "grad_norm": 6.006011009216309, + "learning_rate": 1.5595033967936264e-05, + "loss": 0.4086, + "step": 12172 + }, + { + "epoch": 33.16893732970027, + "grad_norm": 6.651188850402832, + "learning_rate": 1.5594302509835548e-05, + "loss": 0.4548, + "step": 12173 + }, + { + "epoch": 33.171662125340596, + "grad_norm": 11.389019966125488, + "learning_rate": 1.5593571008166587e-05, + "loss": 0.3697, + "step": 12174 + }, + { + "epoch": 33.17438692098093, + "grad_norm": 5.870072841644287, + "learning_rate": 1.559283946293507e-05, + "loss": 0.2602, + "step": 12175 + }, + { + "epoch": 33.177111716621255, + "grad_norm": 5.876684665679932, + "learning_rate": 1.55921078741467e-05, + "loss": 0.2562, + "step": 12176 + }, + { + "epoch": 33.17983651226158, + "grad_norm": 7.102714538574219, + "learning_rate": 1.5591376241807177e-05, + "loss": 0.3668, + "step": 12177 + }, + { + "epoch": 33.182561307901906, + "grad_norm": 8.703709602355957, + "learning_rate": 1.559064456592219e-05, + "loss": 0.346, + "step": 12178 + }, + { + "epoch": 33.18528610354223, + "grad_norm": 6.849244117736816, + "learning_rate": 1.5589912846497447e-05, + "loss": 0.3544, + "step": 12179 + }, + { + "epoch": 33.18801089918256, + "grad_norm": 5.676214218139648, + "learning_rate": 1.5589181083538646e-05, + "loss": 0.385, + "step": 12180 + }, + { + "epoch": 33.19073569482289, + "grad_norm": 7.680464744567871, + "learning_rate": 1.5588449277051476e-05, + "loss": 0.4911, + "step": 12181 + }, + { + "epoch": 33.19346049046322, + "grad_norm": 8.966886520385742, + "learning_rate": 1.5587717427041645e-05, + "loss": 0.4529, + "step": 12182 + }, + { + "epoch": 33.19618528610354, + "grad_norm": 8.935302734375, + "learning_rate": 1.5586985533514853e-05, + "loss": 0.334, + "step": 12183 + }, + { + "epoch": 33.19891008174387, + "grad_norm": 6.224770545959473, + "learning_rate": 1.5586253596476798e-05, + "loss": 0.3634, + "step": 12184 + }, + { + "epoch": 33.201634877384194, + "grad_norm": 8.594982147216797, + "learning_rate": 1.5585521615933176e-05, + "loss": 0.3778, + "step": 12185 + }, + { + "epoch": 33.20435967302452, + "grad_norm": 6.484743595123291, + "learning_rate": 1.5584789591889693e-05, + "loss": 0.4342, + "step": 12186 + }, + { + "epoch": 33.20708446866485, + "grad_norm": 6.004835605621338, + "learning_rate": 1.5584057524352047e-05, + "loss": 0.2728, + "step": 12187 + }, + { + "epoch": 33.20980926430518, + "grad_norm": 6.681808948516846, + "learning_rate": 1.5583325413325944e-05, + "loss": 0.4458, + "step": 12188 + }, + { + "epoch": 33.212534059945504, + "grad_norm": 7.355443000793457, + "learning_rate": 1.558259325881708e-05, + "loss": 0.6285, + "step": 12189 + }, + { + "epoch": 33.21525885558583, + "grad_norm": 6.397506237030029, + "learning_rate": 1.558186106083116e-05, + "loss": 0.4643, + "step": 12190 + }, + { + "epoch": 33.217983651226156, + "grad_norm": 7.421044826507568, + "learning_rate": 1.5581128819373885e-05, + "loss": 0.3742, + "step": 12191 + }, + { + "epoch": 33.22070844686648, + "grad_norm": 7.265703201293945, + "learning_rate": 1.558039653445096e-05, + "loss": 0.3751, + "step": 12192 + }, + { + "epoch": 33.223433242506815, + "grad_norm": 7.574958801269531, + "learning_rate": 1.5579664206068087e-05, + "loss": 0.2934, + "step": 12193 + }, + { + "epoch": 33.22615803814714, + "grad_norm": 12.124749183654785, + "learning_rate": 1.5578931834230968e-05, + "loss": 0.3745, + "step": 12194 + }, + { + "epoch": 33.228882833787466, + "grad_norm": 8.5874605178833, + "learning_rate": 1.5578199418945304e-05, + "loss": 0.4017, + "step": 12195 + }, + { + "epoch": 33.23160762942779, + "grad_norm": 5.97220516204834, + "learning_rate": 1.5577466960216805e-05, + "loss": 0.2773, + "step": 12196 + }, + { + "epoch": 33.23433242506812, + "grad_norm": 7.527440547943115, + "learning_rate": 1.557673445805117e-05, + "loss": 0.3442, + "step": 12197 + }, + { + "epoch": 33.237057220708444, + "grad_norm": 10.769542694091797, + "learning_rate": 1.5576001912454114e-05, + "loss": 0.3999, + "step": 12198 + }, + { + "epoch": 33.23978201634878, + "grad_norm": 5.666802406311035, + "learning_rate": 1.5575269323431327e-05, + "loss": 0.3604, + "step": 12199 + }, + { + "epoch": 33.2425068119891, + "grad_norm": 7.8562092781066895, + "learning_rate": 1.5574536690988526e-05, + "loss": 0.3625, + "step": 12200 + }, + { + "epoch": 33.24523160762943, + "grad_norm": 7.768949508666992, + "learning_rate": 1.5573804015131414e-05, + "loss": 0.3944, + "step": 12201 + }, + { + "epoch": 33.247956403269754, + "grad_norm": 6.802807807922363, + "learning_rate": 1.5573071295865694e-05, + "loss": 0.2741, + "step": 12202 + }, + { + "epoch": 33.25068119891008, + "grad_norm": 7.93035364151001, + "learning_rate": 1.557233853319707e-05, + "loss": 0.3, + "step": 12203 + }, + { + "epoch": 33.253405994550405, + "grad_norm": 7.202589511871338, + "learning_rate": 1.5571605727131255e-05, + "loss": 0.3619, + "step": 12204 + }, + { + "epoch": 33.25613079019074, + "grad_norm": 9.372316360473633, + "learning_rate": 1.5570872877673958e-05, + "loss": 0.3482, + "step": 12205 + }, + { + "epoch": 33.258855585831064, + "grad_norm": 7.737120628356934, + "learning_rate": 1.5570139984830878e-05, + "loss": 0.2645, + "step": 12206 + }, + { + "epoch": 33.26158038147139, + "grad_norm": 10.476534843444824, + "learning_rate": 1.556940704860773e-05, + "loss": 0.4134, + "step": 12207 + }, + { + "epoch": 33.264305177111716, + "grad_norm": 10.893311500549316, + "learning_rate": 1.5568674069010218e-05, + "loss": 0.4485, + "step": 12208 + }, + { + "epoch": 33.26702997275204, + "grad_norm": 7.452104568481445, + "learning_rate": 1.5567941046044053e-05, + "loss": 0.4108, + "step": 12209 + }, + { + "epoch": 33.26975476839237, + "grad_norm": 6.8772382736206055, + "learning_rate": 1.556720797971494e-05, + "loss": 0.2637, + "step": 12210 + }, + { + "epoch": 33.2724795640327, + "grad_norm": 7.585111618041992, + "learning_rate": 1.556647487002859e-05, + "loss": 0.3127, + "step": 12211 + }, + { + "epoch": 33.275204359673026, + "grad_norm": 11.086917877197266, + "learning_rate": 1.5565741716990714e-05, + "loss": 0.5108, + "step": 12212 + }, + { + "epoch": 33.27792915531335, + "grad_norm": 8.147093772888184, + "learning_rate": 1.556500852060702e-05, + "loss": 0.3434, + "step": 12213 + }, + { + "epoch": 33.28065395095368, + "grad_norm": 7.377264022827148, + "learning_rate": 1.556427528088322e-05, + "loss": 0.4055, + "step": 12214 + }, + { + "epoch": 33.283378746594, + "grad_norm": 6.8624725341796875, + "learning_rate": 1.5563541997825025e-05, + "loss": 0.5069, + "step": 12215 + }, + { + "epoch": 33.28610354223433, + "grad_norm": 9.36638069152832, + "learning_rate": 1.556280867143814e-05, + "loss": 0.425, + "step": 12216 + }, + { + "epoch": 33.28882833787466, + "grad_norm": 5.822850227355957, + "learning_rate": 1.556207530172828e-05, + "loss": 0.3252, + "step": 12217 + }, + { + "epoch": 33.29155313351499, + "grad_norm": 6.872265338897705, + "learning_rate": 1.556134188870116e-05, + "loss": 0.2645, + "step": 12218 + }, + { + "epoch": 33.294277929155314, + "grad_norm": 6.900471210479736, + "learning_rate": 1.5560608432362486e-05, + "loss": 0.2932, + "step": 12219 + }, + { + "epoch": 33.29700272479564, + "grad_norm": 7.023861408233643, + "learning_rate": 1.5559874932717972e-05, + "loss": 0.5451, + "step": 12220 + }, + { + "epoch": 33.299727520435965, + "grad_norm": 8.168889999389648, + "learning_rate": 1.5559141389773334e-05, + "loss": 0.2791, + "step": 12221 + }, + { + "epoch": 33.30245231607629, + "grad_norm": 8.27985954284668, + "learning_rate": 1.555840780353428e-05, + "loss": 0.3385, + "step": 12222 + }, + { + "epoch": 33.305177111716624, + "grad_norm": 6.772516250610352, + "learning_rate": 1.5557674174006525e-05, + "loss": 0.2226, + "step": 12223 + }, + { + "epoch": 33.30790190735695, + "grad_norm": 9.39065933227539, + "learning_rate": 1.5556940501195784e-05, + "loss": 0.2984, + "step": 12224 + }, + { + "epoch": 33.310626702997276, + "grad_norm": 7.225677013397217, + "learning_rate": 1.5556206785107766e-05, + "loss": 0.3233, + "step": 12225 + }, + { + "epoch": 33.3133514986376, + "grad_norm": 6.888895034790039, + "learning_rate": 1.555547302574819e-05, + "loss": 0.3261, + "step": 12226 + }, + { + "epoch": 33.31607629427793, + "grad_norm": 6.585740089416504, + "learning_rate": 1.5554739223122768e-05, + "loss": 0.3632, + "step": 12227 + }, + { + "epoch": 33.31880108991825, + "grad_norm": 6.724668979644775, + "learning_rate": 1.5554005377237217e-05, + "loss": 0.3252, + "step": 12228 + }, + { + "epoch": 33.321525885558586, + "grad_norm": 7.033156394958496, + "learning_rate": 1.5553271488097247e-05, + "loss": 0.3376, + "step": 12229 + }, + { + "epoch": 33.32425068119891, + "grad_norm": 6.2989959716796875, + "learning_rate": 1.5552537555708584e-05, + "loss": 0.4559, + "step": 12230 + }, + { + "epoch": 33.32697547683924, + "grad_norm": 7.348972320556641, + "learning_rate": 1.5551803580076935e-05, + "loss": 0.2397, + "step": 12231 + }, + { + "epoch": 33.32970027247956, + "grad_norm": 6.269176483154297, + "learning_rate": 1.5551069561208018e-05, + "loss": 0.2628, + "step": 12232 + }, + { + "epoch": 33.33242506811989, + "grad_norm": 7.6189093589782715, + "learning_rate": 1.555033549910755e-05, + "loss": 0.3294, + "step": 12233 + }, + { + "epoch": 33.335149863760215, + "grad_norm": 8.982177734375, + "learning_rate": 1.5549601393781244e-05, + "loss": 0.504, + "step": 12234 + }, + { + "epoch": 33.33787465940055, + "grad_norm": 7.15234899520874, + "learning_rate": 1.5548867245234825e-05, + "loss": 0.4194, + "step": 12235 + }, + { + "epoch": 33.34059945504087, + "grad_norm": 5.938183307647705, + "learning_rate": 1.5548133053474004e-05, + "loss": 0.264, + "step": 12236 + }, + { + "epoch": 33.3433242506812, + "grad_norm": 7.6514482498168945, + "learning_rate": 1.5547398818504502e-05, + "loss": 0.4264, + "step": 12237 + }, + { + "epoch": 33.346049046321525, + "grad_norm": 6.497241020202637, + "learning_rate": 1.5546664540332037e-05, + "loss": 0.2015, + "step": 12238 + }, + { + "epoch": 33.34877384196185, + "grad_norm": 6.456487655639648, + "learning_rate": 1.554593021896233e-05, + "loss": 0.257, + "step": 12239 + }, + { + "epoch": 33.35149863760218, + "grad_norm": 7.130777359008789, + "learning_rate": 1.5545195854401095e-05, + "loss": 0.3681, + "step": 12240 + }, + { + "epoch": 33.35422343324251, + "grad_norm": 6.268331050872803, + "learning_rate": 1.5544461446654053e-05, + "loss": 0.2092, + "step": 12241 + }, + { + "epoch": 33.356948228882835, + "grad_norm": 7.931918144226074, + "learning_rate": 1.554372699572692e-05, + "loss": 0.3724, + "step": 12242 + }, + { + "epoch": 33.35967302452316, + "grad_norm": 6.673097610473633, + "learning_rate": 1.5542992501625425e-05, + "loss": 0.3635, + "step": 12243 + }, + { + "epoch": 33.36239782016349, + "grad_norm": 7.56607723236084, + "learning_rate": 1.5542257964355282e-05, + "loss": 0.3472, + "step": 12244 + }, + { + "epoch": 33.36512261580381, + "grad_norm": 5.374823093414307, + "learning_rate": 1.5541523383922206e-05, + "loss": 0.3676, + "step": 12245 + }, + { + "epoch": 33.36784741144414, + "grad_norm": 7.16453218460083, + "learning_rate": 1.554078876033193e-05, + "loss": 0.416, + "step": 12246 + }, + { + "epoch": 33.37057220708447, + "grad_norm": 6.608232498168945, + "learning_rate": 1.5540054093590173e-05, + "loss": 0.4185, + "step": 12247 + }, + { + "epoch": 33.3732970027248, + "grad_norm": 6.824566841125488, + "learning_rate": 1.5539319383702646e-05, + "loss": 0.3732, + "step": 12248 + }, + { + "epoch": 33.37602179836512, + "grad_norm": 6.502536296844482, + "learning_rate": 1.553858463067508e-05, + "loss": 0.3053, + "step": 12249 + }, + { + "epoch": 33.37874659400545, + "grad_norm": 6.010274887084961, + "learning_rate": 1.5537849834513197e-05, + "loss": 0.2581, + "step": 12250 + }, + { + "epoch": 33.381471389645775, + "grad_norm": 7.1450371742248535, + "learning_rate": 1.5537114995222716e-05, + "loss": 0.4281, + "step": 12251 + }, + { + "epoch": 33.3841961852861, + "grad_norm": 6.057378768920898, + "learning_rate": 1.553638011280936e-05, + "loss": 0.4492, + "step": 12252 + }, + { + "epoch": 33.38692098092643, + "grad_norm": 5.5235772132873535, + "learning_rate": 1.553564518727886e-05, + "loss": 0.4549, + "step": 12253 + }, + { + "epoch": 33.38964577656676, + "grad_norm": 5.668849468231201, + "learning_rate": 1.553491021863693e-05, + "loss": 0.2589, + "step": 12254 + }, + { + "epoch": 33.392370572207085, + "grad_norm": 6.622274875640869, + "learning_rate": 1.553417520688929e-05, + "loss": 0.297, + "step": 12255 + }, + { + "epoch": 33.39509536784741, + "grad_norm": 6.553107738494873, + "learning_rate": 1.553344015204168e-05, + "loss": 0.3379, + "step": 12256 + }, + { + "epoch": 33.39782016348774, + "grad_norm": 7.671754360198975, + "learning_rate": 1.5532705054099816e-05, + "loss": 0.4111, + "step": 12257 + }, + { + "epoch": 33.40054495912806, + "grad_norm": 5.965877056121826, + "learning_rate": 1.5531969913069423e-05, + "loss": 0.3313, + "step": 12258 + }, + { + "epoch": 33.403269754768395, + "grad_norm": 10.241011619567871, + "learning_rate": 1.5531234728956227e-05, + "loss": 0.4214, + "step": 12259 + }, + { + "epoch": 33.40599455040872, + "grad_norm": 9.025012969970703, + "learning_rate": 1.553049950176595e-05, + "loss": 0.4389, + "step": 12260 + }, + { + "epoch": 33.40871934604905, + "grad_norm": 6.43281888961792, + "learning_rate": 1.552976423150432e-05, + "loss": 0.3975, + "step": 12261 + }, + { + "epoch": 33.41144414168937, + "grad_norm": 8.139632225036621, + "learning_rate": 1.5529028918177067e-05, + "loss": 0.5136, + "step": 12262 + }, + { + "epoch": 33.4141689373297, + "grad_norm": 7.0361833572387695, + "learning_rate": 1.5528293561789912e-05, + "loss": 0.4117, + "step": 12263 + }, + { + "epoch": 33.416893732970024, + "grad_norm": 7.069800853729248, + "learning_rate": 1.5527558162348588e-05, + "loss": 0.4446, + "step": 12264 + }, + { + "epoch": 33.41961852861036, + "grad_norm": 6.559822082519531, + "learning_rate": 1.5526822719858816e-05, + "loss": 0.3782, + "step": 12265 + }, + { + "epoch": 33.42234332425068, + "grad_norm": 7.176815032958984, + "learning_rate": 1.5526087234326327e-05, + "loss": 0.3492, + "step": 12266 + }, + { + "epoch": 33.42506811989101, + "grad_norm": 6.263866901397705, + "learning_rate": 1.5525351705756852e-05, + "loss": 0.4857, + "step": 12267 + }, + { + "epoch": 33.427792915531334, + "grad_norm": 5.193022727966309, + "learning_rate": 1.552461613415611e-05, + "loss": 0.6106, + "step": 12268 + }, + { + "epoch": 33.43051771117166, + "grad_norm": 6.027821063995361, + "learning_rate": 1.5523880519529838e-05, + "loss": 0.5298, + "step": 12269 + }, + { + "epoch": 33.433242506811986, + "grad_norm": 7.548738956451416, + "learning_rate": 1.5523144861883767e-05, + "loss": 0.4398, + "step": 12270 + }, + { + "epoch": 33.43596730245232, + "grad_norm": 9.499189376831055, + "learning_rate": 1.5522409161223614e-05, + "loss": 0.4428, + "step": 12271 + }, + { + "epoch": 33.438692098092645, + "grad_norm": 7.346479892730713, + "learning_rate": 1.5521673417555117e-05, + "loss": 0.3069, + "step": 12272 + }, + { + "epoch": 33.44141689373297, + "grad_norm": 7.802134037017822, + "learning_rate": 1.552093763088401e-05, + "loss": 0.3533, + "step": 12273 + }, + { + "epoch": 33.444141689373296, + "grad_norm": 6.074779033660889, + "learning_rate": 1.5520201801216017e-05, + "loss": 0.3179, + "step": 12274 + }, + { + "epoch": 33.44686648501362, + "grad_norm": 6.945800304412842, + "learning_rate": 1.551946592855687e-05, + "loss": 0.4674, + "step": 12275 + }, + { + "epoch": 33.44959128065395, + "grad_norm": 5.797735214233398, + "learning_rate": 1.55187300129123e-05, + "loss": 0.5052, + "step": 12276 + }, + { + "epoch": 33.45231607629428, + "grad_norm": 10.462039947509766, + "learning_rate": 1.5517994054288035e-05, + "loss": 0.3609, + "step": 12277 + }, + { + "epoch": 33.45504087193461, + "grad_norm": 6.354482650756836, + "learning_rate": 1.5517258052689813e-05, + "loss": 0.2659, + "step": 12278 + }, + { + "epoch": 33.45776566757493, + "grad_norm": 6.137086868286133, + "learning_rate": 1.5516522008123364e-05, + "loss": 0.29, + "step": 12279 + }, + { + "epoch": 33.46049046321526, + "grad_norm": 6.347009181976318, + "learning_rate": 1.551578592059442e-05, + "loss": 0.307, + "step": 12280 + }, + { + "epoch": 33.463215258855584, + "grad_norm": 19.688533782958984, + "learning_rate": 1.5515049790108705e-05, + "loss": 0.3366, + "step": 12281 + }, + { + "epoch": 33.46594005449591, + "grad_norm": 7.231790065765381, + "learning_rate": 1.5514313616671967e-05, + "loss": 0.4257, + "step": 12282 + }, + { + "epoch": 33.46866485013624, + "grad_norm": 6.826254367828369, + "learning_rate": 1.5513577400289926e-05, + "loss": 0.3163, + "step": 12283 + }, + { + "epoch": 33.47138964577657, + "grad_norm": 6.485746383666992, + "learning_rate": 1.551284114096833e-05, + "loss": 0.2806, + "step": 12284 + }, + { + "epoch": 33.474114441416894, + "grad_norm": 5.880269527435303, + "learning_rate": 1.55121048387129e-05, + "loss": 0.6014, + "step": 12285 + }, + { + "epoch": 33.47683923705722, + "grad_norm": 5.744699954986572, + "learning_rate": 1.5511368493529375e-05, + "loss": 0.3055, + "step": 12286 + }, + { + "epoch": 33.479564032697546, + "grad_norm": 6.363956451416016, + "learning_rate": 1.551063210542349e-05, + "loss": 0.3838, + "step": 12287 + }, + { + "epoch": 33.48228882833787, + "grad_norm": 6.764632701873779, + "learning_rate": 1.5509895674400977e-05, + "loss": 0.3948, + "step": 12288 + }, + { + "epoch": 33.485013623978205, + "grad_norm": 9.482726097106934, + "learning_rate": 1.5509159200467577e-05, + "loss": 0.3629, + "step": 12289 + }, + { + "epoch": 33.48773841961853, + "grad_norm": 9.39960765838623, + "learning_rate": 1.5508422683629022e-05, + "loss": 0.3287, + "step": 12290 + }, + { + "epoch": 33.490463215258856, + "grad_norm": 9.882277488708496, + "learning_rate": 1.5507686123891046e-05, + "loss": 0.3516, + "step": 12291 + }, + { + "epoch": 33.49318801089918, + "grad_norm": 6.911797046661377, + "learning_rate": 1.5506949521259393e-05, + "loss": 0.352, + "step": 12292 + }, + { + "epoch": 33.49591280653951, + "grad_norm": 9.063674926757812, + "learning_rate": 1.550621287573979e-05, + "loss": 0.5132, + "step": 12293 + }, + { + "epoch": 33.49863760217983, + "grad_norm": 8.968364715576172, + "learning_rate": 1.550547618733798e-05, + "loss": 0.5012, + "step": 12294 + }, + { + "epoch": 33.50136239782017, + "grad_norm": 5.682219505310059, + "learning_rate": 1.5504739456059694e-05, + "loss": 0.4999, + "step": 12295 + }, + { + "epoch": 33.50408719346049, + "grad_norm": 6.653972625732422, + "learning_rate": 1.550400268191068e-05, + "loss": 0.2708, + "step": 12296 + }, + { + "epoch": 33.50681198910082, + "grad_norm": 7.9966888427734375, + "learning_rate": 1.5503265864896668e-05, + "loss": 0.33, + "step": 12297 + }, + { + "epoch": 33.509536784741144, + "grad_norm": 6.977714538574219, + "learning_rate": 1.55025290050234e-05, + "loss": 0.3494, + "step": 12298 + }, + { + "epoch": 33.51226158038147, + "grad_norm": 6.731818199157715, + "learning_rate": 1.550179210229661e-05, + "loss": 0.4812, + "step": 12299 + }, + { + "epoch": 33.514986376021795, + "grad_norm": 7.986743927001953, + "learning_rate": 1.5501055156722044e-05, + "loss": 0.4796, + "step": 12300 + }, + { + "epoch": 33.51771117166213, + "grad_norm": 29.076562881469727, + "learning_rate": 1.5500318168305434e-05, + "loss": 0.4885, + "step": 12301 + }, + { + "epoch": 33.520435967302454, + "grad_norm": 12.162221908569336, + "learning_rate": 1.5499581137052527e-05, + "loss": 0.4968, + "step": 12302 + }, + { + "epoch": 33.52316076294278, + "grad_norm": 5.864055156707764, + "learning_rate": 1.5498844062969055e-05, + "loss": 0.2878, + "step": 12303 + }, + { + "epoch": 33.525885558583106, + "grad_norm": 7.06923770904541, + "learning_rate": 1.5498106946060768e-05, + "loss": 0.4002, + "step": 12304 + }, + { + "epoch": 33.52861035422343, + "grad_norm": 8.66711711883545, + "learning_rate": 1.5497369786333398e-05, + "loss": 0.3882, + "step": 12305 + }, + { + "epoch": 33.53133514986376, + "grad_norm": 7.390394687652588, + "learning_rate": 1.5496632583792686e-05, + "loss": 0.416, + "step": 12306 + }, + { + "epoch": 33.53405994550409, + "grad_norm": 10.1567964553833, + "learning_rate": 1.549589533844438e-05, + "loss": 0.3127, + "step": 12307 + }, + { + "epoch": 33.536784741144416, + "grad_norm": 7.279140472412109, + "learning_rate": 1.5495158050294216e-05, + "loss": 0.4403, + "step": 12308 + }, + { + "epoch": 33.53950953678474, + "grad_norm": 7.6444902420043945, + "learning_rate": 1.549442071934794e-05, + "loss": 0.2965, + "step": 12309 + }, + { + "epoch": 33.54223433242507, + "grad_norm": 7.107326984405518, + "learning_rate": 1.549368334561129e-05, + "loss": 0.3421, + "step": 12310 + }, + { + "epoch": 33.54495912806539, + "grad_norm": 6.362401485443115, + "learning_rate": 1.5492945929090015e-05, + "loss": 0.3637, + "step": 12311 + }, + { + "epoch": 33.54768392370572, + "grad_norm": 7.301507472991943, + "learning_rate": 1.549220846978985e-05, + "loss": 0.368, + "step": 12312 + }, + { + "epoch": 33.55040871934605, + "grad_norm": 7.936252117156982, + "learning_rate": 1.549147096771654e-05, + "loss": 0.3716, + "step": 12313 + }, + { + "epoch": 33.55313351498638, + "grad_norm": 6.499980449676514, + "learning_rate": 1.5490733422875836e-05, + "loss": 0.5402, + "step": 12314 + }, + { + "epoch": 33.555858310626704, + "grad_norm": 7.899421215057373, + "learning_rate": 1.5489995835273476e-05, + "loss": 0.3173, + "step": 12315 + }, + { + "epoch": 33.55858310626703, + "grad_norm": 9.74738883972168, + "learning_rate": 1.5489258204915203e-05, + "loss": 0.5145, + "step": 12316 + }, + { + "epoch": 33.561307901907355, + "grad_norm": 8.830711364746094, + "learning_rate": 1.5488520531806767e-05, + "loss": 0.2935, + "step": 12317 + }, + { + "epoch": 33.56403269754768, + "grad_norm": 5.760073661804199, + "learning_rate": 1.5487782815953908e-05, + "loss": 0.3943, + "step": 12318 + }, + { + "epoch": 33.566757493188014, + "grad_norm": 7.559969902038574, + "learning_rate": 1.548704505736237e-05, + "loss": 0.3832, + "step": 12319 + }, + { + "epoch": 33.56948228882834, + "grad_norm": 7.594951629638672, + "learning_rate": 1.5486307256037908e-05, + "loss": 0.4699, + "step": 12320 + }, + { + "epoch": 33.572207084468666, + "grad_norm": 6.055371284484863, + "learning_rate": 1.5485569411986253e-05, + "loss": 0.3524, + "step": 12321 + }, + { + "epoch": 33.57493188010899, + "grad_norm": 7.1531596183776855, + "learning_rate": 1.5484831525213166e-05, + "loss": 0.5202, + "step": 12322 + }, + { + "epoch": 33.57765667574932, + "grad_norm": 6.895809650421143, + "learning_rate": 1.5484093595724388e-05, + "loss": 0.3055, + "step": 12323 + }, + { + "epoch": 33.58038147138964, + "grad_norm": 6.4066057205200195, + "learning_rate": 1.548335562352566e-05, + "loss": 0.2988, + "step": 12324 + }, + { + "epoch": 33.583106267029976, + "grad_norm": 9.409860610961914, + "learning_rate": 1.5482617608622744e-05, + "loss": 0.3773, + "step": 12325 + }, + { + "epoch": 33.5858310626703, + "grad_norm": 7.044551849365234, + "learning_rate": 1.548187955102137e-05, + "loss": 0.3474, + "step": 12326 + }, + { + "epoch": 33.58855585831063, + "grad_norm": 6.563586235046387, + "learning_rate": 1.54811414507273e-05, + "loss": 0.2838, + "step": 12327 + }, + { + "epoch": 33.59128065395095, + "grad_norm": 6.07274055480957, + "learning_rate": 1.5480403307746274e-05, + "loss": 0.3144, + "step": 12328 + }, + { + "epoch": 33.59400544959128, + "grad_norm": 6.972324371337891, + "learning_rate": 1.5479665122084046e-05, + "loss": 0.4146, + "step": 12329 + }, + { + "epoch": 33.596730245231605, + "grad_norm": 7.334195613861084, + "learning_rate": 1.547892689374636e-05, + "loss": 0.368, + "step": 12330 + }, + { + "epoch": 33.59945504087194, + "grad_norm": 6.988025188446045, + "learning_rate": 1.547818862273897e-05, + "loss": 0.2876, + "step": 12331 + }, + { + "epoch": 33.60217983651226, + "grad_norm": 5.555150985717773, + "learning_rate": 1.547745030906762e-05, + "loss": 0.3261, + "step": 12332 + }, + { + "epoch": 33.60490463215259, + "grad_norm": 7.14247989654541, + "learning_rate": 1.5476711952738065e-05, + "loss": 0.4326, + "step": 12333 + }, + { + "epoch": 33.607629427792915, + "grad_norm": 6.2259626388549805, + "learning_rate": 1.547597355375605e-05, + "loss": 0.3841, + "step": 12334 + }, + { + "epoch": 33.61035422343324, + "grad_norm": 6.5841288566589355, + "learning_rate": 1.5475235112127334e-05, + "loss": 0.3844, + "step": 12335 + }, + { + "epoch": 33.61307901907357, + "grad_norm": 7.561180114746094, + "learning_rate": 1.547449662785766e-05, + "loss": 0.3694, + "step": 12336 + }, + { + "epoch": 33.6158038147139, + "grad_norm": 10.145565032958984, + "learning_rate": 1.5473758100952788e-05, + "loss": 0.2518, + "step": 12337 + }, + { + "epoch": 33.618528610354225, + "grad_norm": 7.336001873016357, + "learning_rate": 1.547301953141846e-05, + "loss": 0.3024, + "step": 12338 + }, + { + "epoch": 33.62125340599455, + "grad_norm": 6.709211826324463, + "learning_rate": 1.5472280919260436e-05, + "loss": 0.305, + "step": 12339 + }, + { + "epoch": 33.62397820163488, + "grad_norm": 7.38783073425293, + "learning_rate": 1.547154226448446e-05, + "loss": 0.4097, + "step": 12340 + }, + { + "epoch": 33.6267029972752, + "grad_norm": 7.559239387512207, + "learning_rate": 1.5470803567096286e-05, + "loss": 0.2374, + "step": 12341 + }, + { + "epoch": 33.62942779291553, + "grad_norm": 11.160633087158203, + "learning_rate": 1.5470064827101677e-05, + "loss": 0.4155, + "step": 12342 + }, + { + "epoch": 33.63215258855586, + "grad_norm": 8.600433349609375, + "learning_rate": 1.5469326044506373e-05, + "loss": 0.4086, + "step": 12343 + }, + { + "epoch": 33.63487738419619, + "grad_norm": 8.076839447021484, + "learning_rate": 1.5468587219316136e-05, + "loss": 0.5254, + "step": 12344 + }, + { + "epoch": 33.63760217983651, + "grad_norm": 6.322586536407471, + "learning_rate": 1.5467848351536717e-05, + "loss": 0.487, + "step": 12345 + }, + { + "epoch": 33.64032697547684, + "grad_norm": 7.030972480773926, + "learning_rate": 1.5467109441173876e-05, + "loss": 0.3795, + "step": 12346 + }, + { + "epoch": 33.643051771117165, + "grad_norm": 6.812682628631592, + "learning_rate": 1.5466370488233358e-05, + "loss": 0.4005, + "step": 12347 + }, + { + "epoch": 33.64577656675749, + "grad_norm": 7.285449028015137, + "learning_rate": 1.5465631492720923e-05, + "loss": 0.3118, + "step": 12348 + }, + { + "epoch": 33.64850136239782, + "grad_norm": 7.952854633331299, + "learning_rate": 1.546489245464233e-05, + "loss": 0.3741, + "step": 12349 + }, + { + "epoch": 33.65122615803815, + "grad_norm": 7.379002094268799, + "learning_rate": 1.5464153374003323e-05, + "loss": 0.5068, + "step": 12350 + }, + { + "epoch": 33.653950953678475, + "grad_norm": 7.423781394958496, + "learning_rate": 1.546341425080967e-05, + "loss": 0.4805, + "step": 12351 + }, + { + "epoch": 33.6566757493188, + "grad_norm": 10.176163673400879, + "learning_rate": 1.546267508506712e-05, + "loss": 0.3536, + "step": 12352 + }, + { + "epoch": 33.65940054495913, + "grad_norm": 7.722346782684326, + "learning_rate": 1.5461935876781436e-05, + "loss": 0.4416, + "step": 12353 + }, + { + "epoch": 33.66212534059945, + "grad_norm": 8.772095680236816, + "learning_rate": 1.546119662595837e-05, + "loss": 0.3454, + "step": 12354 + }, + { + "epoch": 33.664850136239785, + "grad_norm": 9.018723487854004, + "learning_rate": 1.546045733260368e-05, + "loss": 0.3676, + "step": 12355 + }, + { + "epoch": 33.66757493188011, + "grad_norm": 8.277616500854492, + "learning_rate": 1.5459717996723124e-05, + "loss": 0.3713, + "step": 12356 + }, + { + "epoch": 33.67029972752044, + "grad_norm": 7.505500793457031, + "learning_rate": 1.545897861832246e-05, + "loss": 0.372, + "step": 12357 + }, + { + "epoch": 33.67302452316076, + "grad_norm": 8.260039329528809, + "learning_rate": 1.5458239197407446e-05, + "loss": 0.3753, + "step": 12358 + }, + { + "epoch": 33.67574931880109, + "grad_norm": 5.778948783874512, + "learning_rate": 1.545749973398384e-05, + "loss": 0.3793, + "step": 12359 + }, + { + "epoch": 33.678474114441414, + "grad_norm": 7.623692512512207, + "learning_rate": 1.5456760228057405e-05, + "loss": 0.2953, + "step": 12360 + }, + { + "epoch": 33.68119891008175, + "grad_norm": 8.117790222167969, + "learning_rate": 1.545602067963389e-05, + "loss": 0.3764, + "step": 12361 + }, + { + "epoch": 33.68392370572207, + "grad_norm": 8.630905151367188, + "learning_rate": 1.5455281088719067e-05, + "loss": 0.306, + "step": 12362 + }, + { + "epoch": 33.6866485013624, + "grad_norm": 7.467883110046387, + "learning_rate": 1.5454541455318693e-05, + "loss": 0.3481, + "step": 12363 + }, + { + "epoch": 33.689373297002724, + "grad_norm": 7.620356559753418, + "learning_rate": 1.545380177943852e-05, + "loss": 0.4457, + "step": 12364 + }, + { + "epoch": 33.69209809264305, + "grad_norm": 8.849483489990234, + "learning_rate": 1.545306206108432e-05, + "loss": 0.3399, + "step": 12365 + }, + { + "epoch": 33.694822888283376, + "grad_norm": 7.455567836761475, + "learning_rate": 1.545232230026184e-05, + "loss": 0.3523, + "step": 12366 + }, + { + "epoch": 33.69754768392371, + "grad_norm": 7.081930637359619, + "learning_rate": 1.5451582496976856e-05, + "loss": 0.3188, + "step": 12367 + }, + { + "epoch": 33.700272479564035, + "grad_norm": 6.795620441436768, + "learning_rate": 1.5450842651235118e-05, + "loss": 0.3658, + "step": 12368 + }, + { + "epoch": 33.70299727520436, + "grad_norm": 7.435014724731445, + "learning_rate": 1.5450102763042395e-05, + "loss": 0.3736, + "step": 12369 + }, + { + "epoch": 33.705722070844686, + "grad_norm": 6.455586910247803, + "learning_rate": 1.5449362832404452e-05, + "loss": 0.3816, + "step": 12370 + }, + { + "epoch": 33.70844686648501, + "grad_norm": 7.806655406951904, + "learning_rate": 1.544862285932704e-05, + "loss": 0.2928, + "step": 12371 + }, + { + "epoch": 33.71117166212534, + "grad_norm": 6.863977432250977, + "learning_rate": 1.5447882843815932e-05, + "loss": 0.4536, + "step": 12372 + }, + { + "epoch": 33.71389645776567, + "grad_norm": 7.690101623535156, + "learning_rate": 1.544714278587689e-05, + "loss": 0.3547, + "step": 12373 + }, + { + "epoch": 33.716621253406, + "grad_norm": 9.301826477050781, + "learning_rate": 1.544640268551567e-05, + "loss": 0.3386, + "step": 12374 + }, + { + "epoch": 33.71934604904632, + "grad_norm": 7.949379920959473, + "learning_rate": 1.5445662542738044e-05, + "loss": 0.407, + "step": 12375 + }, + { + "epoch": 33.72207084468665, + "grad_norm": 7.628628253936768, + "learning_rate": 1.544492235754977e-05, + "loss": 0.2996, + "step": 12376 + }, + { + "epoch": 33.724795640326974, + "grad_norm": 5.911596298217773, + "learning_rate": 1.544418212995662e-05, + "loss": 0.3972, + "step": 12377 + }, + { + "epoch": 33.7275204359673, + "grad_norm": 6.364374160766602, + "learning_rate": 1.5443441859964353e-05, + "loss": 0.3899, + "step": 12378 + }, + { + "epoch": 33.73024523160763, + "grad_norm": 7.083815097808838, + "learning_rate": 1.5442701547578736e-05, + "loss": 0.2889, + "step": 12379 + }, + { + "epoch": 33.73297002724796, + "grad_norm": 7.262183666229248, + "learning_rate": 1.5441961192805538e-05, + "loss": 0.4041, + "step": 12380 + }, + { + "epoch": 33.735694822888284, + "grad_norm": 9.222476959228516, + "learning_rate": 1.5441220795650518e-05, + "loss": 0.2729, + "step": 12381 + }, + { + "epoch": 33.73841961852861, + "grad_norm": 5.661161422729492, + "learning_rate": 1.5440480356119445e-05, + "loss": 0.2729, + "step": 12382 + }, + { + "epoch": 33.741144414168936, + "grad_norm": 6.561127662658691, + "learning_rate": 1.5439739874218087e-05, + "loss": 0.5112, + "step": 12383 + }, + { + "epoch": 33.74386920980926, + "grad_norm": 19.514482498168945, + "learning_rate": 1.543899934995221e-05, + "loss": 0.4377, + "step": 12384 + }, + { + "epoch": 33.746594005449595, + "grad_norm": 7.370982646942139, + "learning_rate": 1.543825878332758e-05, + "loss": 0.4215, + "step": 12385 + }, + { + "epoch": 33.74931880108992, + "grad_norm": 6.5547285079956055, + "learning_rate": 1.5437518174349967e-05, + "loss": 0.3623, + "step": 12386 + }, + { + "epoch": 33.752043596730246, + "grad_norm": 6.507667064666748, + "learning_rate": 1.543677752302514e-05, + "loss": 0.3861, + "step": 12387 + }, + { + "epoch": 33.75476839237057, + "grad_norm": 7.1478986740112305, + "learning_rate": 1.543603682935886e-05, + "loss": 0.4197, + "step": 12388 + }, + { + "epoch": 33.7574931880109, + "grad_norm": 6.728658676147461, + "learning_rate": 1.5435296093356902e-05, + "loss": 0.3558, + "step": 12389 + }, + { + "epoch": 33.76021798365122, + "grad_norm": 7.442631244659424, + "learning_rate": 1.5434555315025034e-05, + "loss": 0.3505, + "step": 12390 + }, + { + "epoch": 33.762942779291556, + "grad_norm": 9.225476264953613, + "learning_rate": 1.543381449436902e-05, + "loss": 0.341, + "step": 12391 + }, + { + "epoch": 33.76566757493188, + "grad_norm": 12.1233491897583, + "learning_rate": 1.5433073631394638e-05, + "loss": 0.3384, + "step": 12392 + }, + { + "epoch": 33.76839237057221, + "grad_norm": 7.165793418884277, + "learning_rate": 1.5432332726107653e-05, + "loss": 0.3573, + "step": 12393 + }, + { + "epoch": 33.771117166212534, + "grad_norm": 7.290248870849609, + "learning_rate": 1.5431591778513835e-05, + "loss": 0.4198, + "step": 12394 + }, + { + "epoch": 33.77384196185286, + "grad_norm": 6.255857467651367, + "learning_rate": 1.5430850788618955e-05, + "loss": 0.4251, + "step": 12395 + }, + { + "epoch": 33.776566757493185, + "grad_norm": 9.753196716308594, + "learning_rate": 1.5430109756428785e-05, + "loss": 0.3881, + "step": 12396 + }, + { + "epoch": 33.77929155313352, + "grad_norm": 7.622660160064697, + "learning_rate": 1.542936868194909e-05, + "loss": 0.3523, + "step": 12397 + }, + { + "epoch": 33.782016348773844, + "grad_norm": 6.863631725311279, + "learning_rate": 1.5428627565185652e-05, + "loss": 0.3501, + "step": 12398 + }, + { + "epoch": 33.78474114441417, + "grad_norm": 7.674832820892334, + "learning_rate": 1.5427886406144235e-05, + "loss": 0.3888, + "step": 12399 + }, + { + "epoch": 33.787465940054496, + "grad_norm": 4.952965259552002, + "learning_rate": 1.5427145204830615e-05, + "loss": 0.3384, + "step": 12400 + }, + { + "epoch": 33.79019073569482, + "grad_norm": 6.492983818054199, + "learning_rate": 1.542640396125056e-05, + "loss": 0.3019, + "step": 12401 + }, + { + "epoch": 33.79291553133515, + "grad_norm": 6.460616111755371, + "learning_rate": 1.5425662675409845e-05, + "loss": 0.3652, + "step": 12402 + }, + { + "epoch": 33.79564032697548, + "grad_norm": 8.286467552185059, + "learning_rate": 1.5424921347314245e-05, + "loss": 0.403, + "step": 12403 + }, + { + "epoch": 33.798365122615806, + "grad_norm": 6.715384006500244, + "learning_rate": 1.5424179976969536e-05, + "loss": 0.408, + "step": 12404 + }, + { + "epoch": 33.80108991825613, + "grad_norm": 9.546368598937988, + "learning_rate": 1.5423438564381484e-05, + "loss": 0.3706, + "step": 12405 + }, + { + "epoch": 33.80381471389646, + "grad_norm": 6.578489780426025, + "learning_rate": 1.5422697109555867e-05, + "loss": 0.3626, + "step": 12406 + }, + { + "epoch": 33.80653950953678, + "grad_norm": 6.979336738586426, + "learning_rate": 1.542195561249846e-05, + "loss": 0.3411, + "step": 12407 + }, + { + "epoch": 33.80926430517711, + "grad_norm": 10.89571762084961, + "learning_rate": 1.5421214073215037e-05, + "loss": 0.4416, + "step": 12408 + }, + { + "epoch": 33.81198910081744, + "grad_norm": 5.769643783569336, + "learning_rate": 1.5420472491711373e-05, + "loss": 0.3075, + "step": 12409 + }, + { + "epoch": 33.81471389645777, + "grad_norm": 7.007720470428467, + "learning_rate": 1.5419730867993245e-05, + "loss": 0.6479, + "step": 12410 + }, + { + "epoch": 33.817438692098094, + "grad_norm": 6.751010894775391, + "learning_rate": 1.5418989202066427e-05, + "loss": 0.3234, + "step": 12411 + }, + { + "epoch": 33.82016348773842, + "grad_norm": 7.3624749183654785, + "learning_rate": 1.5418247493936695e-05, + "loss": 0.2687, + "step": 12412 + }, + { + "epoch": 33.822888283378745, + "grad_norm": 6.650275230407715, + "learning_rate": 1.5417505743609828e-05, + "loss": 0.2815, + "step": 12413 + }, + { + "epoch": 33.82561307901907, + "grad_norm": 6.142333030700684, + "learning_rate": 1.54167639510916e-05, + "loss": 0.4532, + "step": 12414 + }, + { + "epoch": 33.828337874659404, + "grad_norm": 11.933963775634766, + "learning_rate": 1.5416022116387785e-05, + "loss": 0.5086, + "step": 12415 + }, + { + "epoch": 33.83106267029973, + "grad_norm": 7.944046497344971, + "learning_rate": 1.541528023950417e-05, + "loss": 0.4072, + "step": 12416 + }, + { + "epoch": 33.833787465940055, + "grad_norm": 6.637248992919922, + "learning_rate": 1.5414538320446523e-05, + "loss": 0.2994, + "step": 12417 + }, + { + "epoch": 33.83651226158038, + "grad_norm": 7.869789123535156, + "learning_rate": 1.5413796359220622e-05, + "loss": 0.4477, + "step": 12418 + }, + { + "epoch": 33.83923705722071, + "grad_norm": 7.0807342529296875, + "learning_rate": 1.5413054355832257e-05, + "loss": 0.3052, + "step": 12419 + }, + { + "epoch": 33.84196185286103, + "grad_norm": 12.607836723327637, + "learning_rate": 1.541231231028719e-05, + "loss": 0.3612, + "step": 12420 + }, + { + "epoch": 33.844686648501366, + "grad_norm": 7.435271263122559, + "learning_rate": 1.5411570222591217e-05, + "loss": 0.3848, + "step": 12421 + }, + { + "epoch": 33.84741144414169, + "grad_norm": 7.234927177429199, + "learning_rate": 1.5410828092750106e-05, + "loss": 0.3199, + "step": 12422 + }, + { + "epoch": 33.85013623978202, + "grad_norm": 12.723918914794922, + "learning_rate": 1.541008592076964e-05, + "loss": 0.3752, + "step": 12423 + }, + { + "epoch": 33.85286103542234, + "grad_norm": 7.345337390899658, + "learning_rate": 1.5409343706655603e-05, + "loss": 0.3937, + "step": 12424 + }, + { + "epoch": 33.85558583106267, + "grad_norm": 7.744995594024658, + "learning_rate": 1.5408601450413767e-05, + "loss": 0.3183, + "step": 12425 + }, + { + "epoch": 33.858310626702995, + "grad_norm": 5.900259494781494, + "learning_rate": 1.5407859152049915e-05, + "loss": 0.2372, + "step": 12426 + }, + { + "epoch": 33.86103542234333, + "grad_norm": 7.837316036224365, + "learning_rate": 1.5407116811569833e-05, + "loss": 0.4977, + "step": 12427 + }, + { + "epoch": 33.86376021798365, + "grad_norm": 6.400331974029541, + "learning_rate": 1.54063744289793e-05, + "loss": 0.3331, + "step": 12428 + }, + { + "epoch": 33.86648501362398, + "grad_norm": 7.602609634399414, + "learning_rate": 1.5405632004284097e-05, + "loss": 0.4165, + "step": 12429 + }, + { + "epoch": 33.869209809264305, + "grad_norm": 14.240015983581543, + "learning_rate": 1.5404889537490004e-05, + "loss": 0.2772, + "step": 12430 + }, + { + "epoch": 33.87193460490463, + "grad_norm": 6.371674060821533, + "learning_rate": 1.5404147028602804e-05, + "loss": 0.4153, + "step": 12431 + }, + { + "epoch": 33.87465940054496, + "grad_norm": 7.883369445800781, + "learning_rate": 1.5403404477628286e-05, + "loss": 0.2592, + "step": 12432 + }, + { + "epoch": 33.87738419618529, + "grad_norm": 7.574853897094727, + "learning_rate": 1.5402661884572222e-05, + "loss": 0.3174, + "step": 12433 + }, + { + "epoch": 33.880108991825615, + "grad_norm": 7.4124884605407715, + "learning_rate": 1.5401919249440406e-05, + "loss": 0.3696, + "step": 12434 + }, + { + "epoch": 33.88283378746594, + "grad_norm": 6.390591144561768, + "learning_rate": 1.5401176572238615e-05, + "loss": 0.2631, + "step": 12435 + }, + { + "epoch": 33.88555858310627, + "grad_norm": 5.953117370605469, + "learning_rate": 1.5400433852972633e-05, + "loss": 0.3632, + "step": 12436 + }, + { + "epoch": 33.88828337874659, + "grad_norm": 6.461482048034668, + "learning_rate": 1.5399691091648246e-05, + "loss": 0.3871, + "step": 12437 + }, + { + "epoch": 33.89100817438692, + "grad_norm": 8.403675079345703, + "learning_rate": 1.5398948288271242e-05, + "loss": 0.2888, + "step": 12438 + }, + { + "epoch": 33.89373297002725, + "grad_norm": 7.038022518157959, + "learning_rate": 1.53982054428474e-05, + "loss": 0.3359, + "step": 12439 + }, + { + "epoch": 33.89645776566758, + "grad_norm": 6.362793922424316, + "learning_rate": 1.5397462555382508e-05, + "loss": 0.3172, + "step": 12440 + }, + { + "epoch": 33.8991825613079, + "grad_norm": 6.867793560028076, + "learning_rate": 1.539671962588235e-05, + "loss": 0.382, + "step": 12441 + }, + { + "epoch": 33.90190735694823, + "grad_norm": 10.121224403381348, + "learning_rate": 1.5395976654352715e-05, + "loss": 0.3347, + "step": 12442 + }, + { + "epoch": 33.904632152588555, + "grad_norm": 7.618274688720703, + "learning_rate": 1.539523364079939e-05, + "loss": 0.3734, + "step": 12443 + }, + { + "epoch": 33.90735694822888, + "grad_norm": 6.563361167907715, + "learning_rate": 1.5394490585228154e-05, + "loss": 0.2395, + "step": 12444 + }, + { + "epoch": 33.91008174386921, + "grad_norm": 6.725279808044434, + "learning_rate": 1.5393747487644803e-05, + "loss": 0.3066, + "step": 12445 + }, + { + "epoch": 33.91280653950954, + "grad_norm": 5.6815619468688965, + "learning_rate": 1.539300434805512e-05, + "loss": 0.3529, + "step": 12446 + }, + { + "epoch": 33.915531335149865, + "grad_norm": 6.796170234680176, + "learning_rate": 1.5392261166464886e-05, + "loss": 0.3427, + "step": 12447 + }, + { + "epoch": 33.91825613079019, + "grad_norm": 5.836400032043457, + "learning_rate": 1.5391517942879905e-05, + "loss": 0.3239, + "step": 12448 + }, + { + "epoch": 33.920980926430516, + "grad_norm": 6.661625385284424, + "learning_rate": 1.539077467730595e-05, + "loss": 0.4078, + "step": 12449 + }, + { + "epoch": 33.92370572207084, + "grad_norm": 12.549825668334961, + "learning_rate": 1.539003136974882e-05, + "loss": 0.3369, + "step": 12450 + }, + { + "epoch": 33.926430517711175, + "grad_norm": 7.375289440155029, + "learning_rate": 1.538928802021429e-05, + "loss": 0.3853, + "step": 12451 + }, + { + "epoch": 33.9291553133515, + "grad_norm": 9.283988952636719, + "learning_rate": 1.5388544628708166e-05, + "loss": 0.3829, + "step": 12452 + }, + { + "epoch": 33.93188010899183, + "grad_norm": 5.844550132751465, + "learning_rate": 1.5387801195236227e-05, + "loss": 0.3329, + "step": 12453 + }, + { + "epoch": 33.93460490463215, + "grad_norm": 6.188870906829834, + "learning_rate": 1.538705771980427e-05, + "loss": 0.4023, + "step": 12454 + }, + { + "epoch": 33.93732970027248, + "grad_norm": 8.369707107543945, + "learning_rate": 1.5386314202418076e-05, + "loss": 0.3803, + "step": 12455 + }, + { + "epoch": 33.940054495912804, + "grad_norm": 12.039058685302734, + "learning_rate": 1.538557064308344e-05, + "loss": 0.3149, + "step": 12456 + }, + { + "epoch": 33.94277929155314, + "grad_norm": 14.115557670593262, + "learning_rate": 1.5384827041806157e-05, + "loss": 0.4344, + "step": 12457 + }, + { + "epoch": 33.94550408719346, + "grad_norm": 7.214237689971924, + "learning_rate": 1.5384083398592015e-05, + "loss": 0.4768, + "step": 12458 + }, + { + "epoch": 33.94822888283379, + "grad_norm": 7.765081405639648, + "learning_rate": 1.53833397134468e-05, + "loss": 0.3866, + "step": 12459 + }, + { + "epoch": 33.950953678474114, + "grad_norm": 13.63409423828125, + "learning_rate": 1.5382595986376312e-05, + "loss": 0.3347, + "step": 12460 + }, + { + "epoch": 33.95367847411444, + "grad_norm": 6.552498817443848, + "learning_rate": 1.538185221738634e-05, + "loss": 0.3456, + "step": 12461 + }, + { + "epoch": 33.956403269754766, + "grad_norm": 7.624207496643066, + "learning_rate": 1.538110840648267e-05, + "loss": 0.4122, + "step": 12462 + }, + { + "epoch": 33.95912806539509, + "grad_norm": 7.696471691131592, + "learning_rate": 1.5380364553671107e-05, + "loss": 0.4084, + "step": 12463 + }, + { + "epoch": 33.961852861035425, + "grad_norm": 6.774961471557617, + "learning_rate": 1.537962065895744e-05, + "loss": 0.3287, + "step": 12464 + }, + { + "epoch": 33.96457765667575, + "grad_norm": 7.877649307250977, + "learning_rate": 1.5378876722347455e-05, + "loss": 0.5164, + "step": 12465 + }, + { + "epoch": 33.967302452316076, + "grad_norm": 7.891627311706543, + "learning_rate": 1.5378132743846955e-05, + "loss": 0.3705, + "step": 12466 + }, + { + "epoch": 33.9700272479564, + "grad_norm": 9.303549766540527, + "learning_rate": 1.537738872346173e-05, + "loss": 0.292, + "step": 12467 + }, + { + "epoch": 33.97275204359673, + "grad_norm": 7.350878715515137, + "learning_rate": 1.537664466119757e-05, + "loss": 0.3803, + "step": 12468 + }, + { + "epoch": 33.97547683923706, + "grad_norm": 8.583620071411133, + "learning_rate": 1.537590055706028e-05, + "loss": 0.3895, + "step": 12469 + }, + { + "epoch": 33.97820163487739, + "grad_norm": 6.492166042327881, + "learning_rate": 1.5375156411055644e-05, + "loss": 0.3654, + "step": 12470 + }, + { + "epoch": 33.98092643051771, + "grad_norm": 7.747386455535889, + "learning_rate": 1.5374412223189467e-05, + "loss": 0.2872, + "step": 12471 + }, + { + "epoch": 33.98365122615804, + "grad_norm": 5.402212619781494, + "learning_rate": 1.537366799346754e-05, + "loss": 0.4095, + "step": 12472 + }, + { + "epoch": 33.986376021798364, + "grad_norm": 11.660005569458008, + "learning_rate": 1.537292372189566e-05, + "loss": 0.3462, + "step": 12473 + }, + { + "epoch": 33.98910081743869, + "grad_norm": 6.122496128082275, + "learning_rate": 1.5372179408479624e-05, + "loss": 0.2592, + "step": 12474 + }, + { + "epoch": 33.991825613079016, + "grad_norm": 6.724801540374756, + "learning_rate": 1.5371435053225222e-05, + "loss": 0.3505, + "step": 12475 + }, + { + "epoch": 33.99455040871935, + "grad_norm": 5.974119186401367, + "learning_rate": 1.5370690656138265e-05, + "loss": 0.4124, + "step": 12476 + }, + { + "epoch": 33.997275204359674, + "grad_norm": 6.9660820960998535, + "learning_rate": 1.5369946217224536e-05, + "loss": 0.3219, + "step": 12477 + }, + { + "epoch": 34.0, + "grad_norm": 7.865757465362549, + "learning_rate": 1.536920173648984e-05, + "loss": 0.5123, + "step": 12478 + }, + { + "epoch": 34.002724795640326, + "grad_norm": 6.852688789367676, + "learning_rate": 1.5368457213939973e-05, + "loss": 0.2488, + "step": 12479 + }, + { + "epoch": 34.00544959128065, + "grad_norm": 7.923671245574951, + "learning_rate": 1.5367712649580736e-05, + "loss": 0.3334, + "step": 12480 + }, + { + "epoch": 34.00817438692098, + "grad_norm": 6.53236198425293, + "learning_rate": 1.5366968043417926e-05, + "loss": 0.313, + "step": 12481 + }, + { + "epoch": 34.01089918256131, + "grad_norm": 6.657381534576416, + "learning_rate": 1.5366223395457337e-05, + "loss": 0.2969, + "step": 12482 + }, + { + "epoch": 34.013623978201636, + "grad_norm": 6.5685038566589355, + "learning_rate": 1.536547870570478e-05, + "loss": 0.3204, + "step": 12483 + }, + { + "epoch": 34.01634877384196, + "grad_norm": 6.03550386428833, + "learning_rate": 1.5364733974166042e-05, + "loss": 0.3785, + "step": 12484 + }, + { + "epoch": 34.01907356948229, + "grad_norm": 6.594084739685059, + "learning_rate": 1.536398920084693e-05, + "loss": 0.4122, + "step": 12485 + }, + { + "epoch": 34.02179836512261, + "grad_norm": 6.372106075286865, + "learning_rate": 1.5363244385753244e-05, + "loss": 0.2687, + "step": 12486 + }, + { + "epoch": 34.02452316076294, + "grad_norm": 6.909015655517578, + "learning_rate": 1.5362499528890782e-05, + "loss": 0.2734, + "step": 12487 + }, + { + "epoch": 34.02724795640327, + "grad_norm": 39.4537239074707, + "learning_rate": 1.5361754630265347e-05, + "loss": 0.34, + "step": 12488 + }, + { + "epoch": 34.0299727520436, + "grad_norm": 6.2265448570251465, + "learning_rate": 1.5361009689882737e-05, + "loss": 0.2168, + "step": 12489 + }, + { + "epoch": 34.032697547683924, + "grad_norm": 7.566519260406494, + "learning_rate": 1.5360264707748758e-05, + "loss": 0.4664, + "step": 12490 + }, + { + "epoch": 34.03542234332425, + "grad_norm": 6.685686111450195, + "learning_rate": 1.5359519683869207e-05, + "loss": 0.2734, + "step": 12491 + }, + { + "epoch": 34.038147138964575, + "grad_norm": 8.083074569702148, + "learning_rate": 1.5358774618249895e-05, + "loss": 0.4032, + "step": 12492 + }, + { + "epoch": 34.0408719346049, + "grad_norm": 5.474445343017578, + "learning_rate": 1.5358029510896616e-05, + "loss": 0.4359, + "step": 12493 + }, + { + "epoch": 34.043596730245234, + "grad_norm": 8.933283805847168, + "learning_rate": 1.5357284361815178e-05, + "loss": 0.3463, + "step": 12494 + }, + { + "epoch": 34.04632152588556, + "grad_norm": 7.755788803100586, + "learning_rate": 1.535653917101138e-05, + "loss": 0.3312, + "step": 12495 + }, + { + "epoch": 34.049046321525886, + "grad_norm": 8.029553413391113, + "learning_rate": 1.5355793938491025e-05, + "loss": 0.2626, + "step": 12496 + }, + { + "epoch": 34.05177111716621, + "grad_norm": 8.580611228942871, + "learning_rate": 1.535504866425992e-05, + "loss": 0.3463, + "step": 12497 + }, + { + "epoch": 34.05449591280654, + "grad_norm": 9.165595054626465, + "learning_rate": 1.5354303348323873e-05, + "loss": 0.3956, + "step": 12498 + }, + { + "epoch": 34.05722070844686, + "grad_norm": 10.379510879516602, + "learning_rate": 1.5353557990688675e-05, + "loss": 0.3011, + "step": 12499 + }, + { + "epoch": 34.059945504087196, + "grad_norm": 8.267645835876465, + "learning_rate": 1.5352812591360148e-05, + "loss": 0.4059, + "step": 12500 + }, + { + "epoch": 34.06267029972752, + "grad_norm": 6.728059768676758, + "learning_rate": 1.5352067150344084e-05, + "loss": 0.4751, + "step": 12501 + }, + { + "epoch": 34.06539509536785, + "grad_norm": 6.893502712249756, + "learning_rate": 1.5351321667646298e-05, + "loss": 0.3395, + "step": 12502 + }, + { + "epoch": 34.06811989100817, + "grad_norm": 7.514678478240967, + "learning_rate": 1.5350576143272587e-05, + "loss": 0.325, + "step": 12503 + }, + { + "epoch": 34.0708446866485, + "grad_norm": 6.598287105560303, + "learning_rate": 1.534983057722876e-05, + "loss": 0.3159, + "step": 12504 + }, + { + "epoch": 34.073569482288825, + "grad_norm": 8.37763500213623, + "learning_rate": 1.5349084969520628e-05, + "loss": 0.3809, + "step": 12505 + }, + { + "epoch": 34.07629427792916, + "grad_norm": 6.894758701324463, + "learning_rate": 1.5348339320153992e-05, + "loss": 0.3809, + "step": 12506 + }, + { + "epoch": 34.079019073569484, + "grad_norm": 7.859985828399658, + "learning_rate": 1.5347593629134663e-05, + "loss": 0.2865, + "step": 12507 + }, + { + "epoch": 34.08174386920981, + "grad_norm": 7.461994647979736, + "learning_rate": 1.534684789646845e-05, + "loss": 0.3677, + "step": 12508 + }, + { + "epoch": 34.084468664850135, + "grad_norm": 8.27462100982666, + "learning_rate": 1.5346102122161152e-05, + "loss": 0.369, + "step": 12509 + }, + { + "epoch": 34.08719346049046, + "grad_norm": 5.675178050994873, + "learning_rate": 1.5345356306218586e-05, + "loss": 0.3832, + "step": 12510 + }, + { + "epoch": 34.08991825613079, + "grad_norm": 7.228993892669678, + "learning_rate": 1.5344610448646555e-05, + "loss": 0.3028, + "step": 12511 + }, + { + "epoch": 34.09264305177112, + "grad_norm": 8.06761360168457, + "learning_rate": 1.534386454945087e-05, + "loss": 0.4328, + "step": 12512 + }, + { + "epoch": 34.095367847411445, + "grad_norm": 9.210061073303223, + "learning_rate": 1.5343118608637345e-05, + "loss": 0.3381, + "step": 12513 + }, + { + "epoch": 34.09809264305177, + "grad_norm": 7.22993803024292, + "learning_rate": 1.534237262621178e-05, + "loss": 0.425, + "step": 12514 + }, + { + "epoch": 34.1008174386921, + "grad_norm": 7.0670599937438965, + "learning_rate": 1.5341626602179988e-05, + "loss": 0.3392, + "step": 12515 + }, + { + "epoch": 34.10354223433242, + "grad_norm": 7.207448959350586, + "learning_rate": 1.534088053654778e-05, + "loss": 0.4464, + "step": 12516 + }, + { + "epoch": 34.10626702997275, + "grad_norm": 8.390975952148438, + "learning_rate": 1.534013442932097e-05, + "loss": 0.3948, + "step": 12517 + }, + { + "epoch": 34.10899182561308, + "grad_norm": 6.45070743560791, + "learning_rate": 1.533938828050536e-05, + "loss": 0.3434, + "step": 12518 + }, + { + "epoch": 34.11171662125341, + "grad_norm": 6.419523239135742, + "learning_rate": 1.533864209010677e-05, + "loss": 0.4856, + "step": 12519 + }, + { + "epoch": 34.11444141689373, + "grad_norm": 7.4021525382995605, + "learning_rate": 1.5337895858131004e-05, + "loss": 0.3211, + "step": 12520 + }, + { + "epoch": 34.11716621253406, + "grad_norm": 5.476337909698486, + "learning_rate": 1.5337149584583878e-05, + "loss": 0.4803, + "step": 12521 + }, + { + "epoch": 34.119891008174385, + "grad_norm": 7.536069393157959, + "learning_rate": 1.5336403269471202e-05, + "loss": 0.4091, + "step": 12522 + }, + { + "epoch": 34.12261580381471, + "grad_norm": 6.384524345397949, + "learning_rate": 1.533565691279879e-05, + "loss": 0.256, + "step": 12523 + }, + { + "epoch": 34.12534059945504, + "grad_norm": 5.690863132476807, + "learning_rate": 1.5334910514572453e-05, + "loss": 0.2987, + "step": 12524 + }, + { + "epoch": 34.12806539509537, + "grad_norm": 7.242108345031738, + "learning_rate": 1.5334164074798008e-05, + "loss": 0.3978, + "step": 12525 + }, + { + "epoch": 34.130790190735695, + "grad_norm": 7.1291890144348145, + "learning_rate": 1.5333417593481262e-05, + "loss": 0.3231, + "step": 12526 + }, + { + "epoch": 34.13351498637602, + "grad_norm": 5.386416912078857, + "learning_rate": 1.533267107062803e-05, + "loss": 0.4016, + "step": 12527 + }, + { + "epoch": 34.13623978201635, + "grad_norm": 6.721260070800781, + "learning_rate": 1.5331924506244132e-05, + "loss": 0.2899, + "step": 12528 + }, + { + "epoch": 34.13896457765667, + "grad_norm": 10.538313865661621, + "learning_rate": 1.5331177900335372e-05, + "loss": 0.3217, + "step": 12529 + }, + { + "epoch": 34.141689373297005, + "grad_norm": 6.040736675262451, + "learning_rate": 1.5330431252907575e-05, + "loss": 0.2218, + "step": 12530 + }, + { + "epoch": 34.14441416893733, + "grad_norm": 5.292067050933838, + "learning_rate": 1.5329684563966547e-05, + "loss": 0.2944, + "step": 12531 + }, + { + "epoch": 34.14713896457766, + "grad_norm": 6.043910026550293, + "learning_rate": 1.532893783351811e-05, + "loss": 0.3723, + "step": 12532 + }, + { + "epoch": 34.14986376021798, + "grad_norm": 6.5580573081970215, + "learning_rate": 1.5328191061568076e-05, + "loss": 0.2774, + "step": 12533 + }, + { + "epoch": 34.15258855585831, + "grad_norm": 8.724053382873535, + "learning_rate": 1.532744424812226e-05, + "loss": 0.2576, + "step": 12534 + }, + { + "epoch": 34.155313351498634, + "grad_norm": 6.399105548858643, + "learning_rate": 1.5326697393186482e-05, + "loss": 0.4534, + "step": 12535 + }, + { + "epoch": 34.15803814713897, + "grad_norm": 7.29347038269043, + "learning_rate": 1.5325950496766557e-05, + "loss": 0.2491, + "step": 12536 + }, + { + "epoch": 34.16076294277929, + "grad_norm": 7.133385181427002, + "learning_rate": 1.53252035588683e-05, + "loss": 0.3222, + "step": 12537 + }, + { + "epoch": 34.16348773841962, + "grad_norm": 7.860514163970947, + "learning_rate": 1.5324456579497525e-05, + "loss": 0.3557, + "step": 12538 + }, + { + "epoch": 34.166212534059945, + "grad_norm": 6.143589496612549, + "learning_rate": 1.5323709558660057e-05, + "loss": 0.3087, + "step": 12539 + }, + { + "epoch": 34.16893732970027, + "grad_norm": 7.355077743530273, + "learning_rate": 1.5322962496361705e-05, + "loss": 0.5696, + "step": 12540 + }, + { + "epoch": 34.171662125340596, + "grad_norm": 6.451420783996582, + "learning_rate": 1.53222153926083e-05, + "loss": 0.2737, + "step": 12541 + }, + { + "epoch": 34.17438692098093, + "grad_norm": 6.261687278747559, + "learning_rate": 1.532146824740565e-05, + "loss": 0.4085, + "step": 12542 + }, + { + "epoch": 34.177111716621255, + "grad_norm": 6.657192707061768, + "learning_rate": 1.532072106075958e-05, + "loss": 0.3685, + "step": 12543 + }, + { + "epoch": 34.17983651226158, + "grad_norm": 10.220606803894043, + "learning_rate": 1.53199738326759e-05, + "loss": 0.3737, + "step": 12544 + }, + { + "epoch": 34.182561307901906, + "grad_norm": 5.563790321350098, + "learning_rate": 1.5319226563160438e-05, + "loss": 0.3335, + "step": 12545 + }, + { + "epoch": 34.18528610354223, + "grad_norm": 6.351738929748535, + "learning_rate": 1.531847925221901e-05, + "loss": 0.4303, + "step": 12546 + }, + { + "epoch": 34.18801089918256, + "grad_norm": 7.620738506317139, + "learning_rate": 1.5317731899857434e-05, + "loss": 0.3871, + "step": 12547 + }, + { + "epoch": 34.19073569482289, + "grad_norm": 8.398337364196777, + "learning_rate": 1.5316984506081537e-05, + "loss": 0.3358, + "step": 12548 + }, + { + "epoch": 34.19346049046322, + "grad_norm": 6.083836555480957, + "learning_rate": 1.5316237070897134e-05, + "loss": 0.2913, + "step": 12549 + }, + { + "epoch": 34.19618528610354, + "grad_norm": 6.6067681312561035, + "learning_rate": 1.5315489594310048e-05, + "loss": 0.3098, + "step": 12550 + }, + { + "epoch": 34.19891008174387, + "grad_norm": 10.521763801574707, + "learning_rate": 1.53147420763261e-05, + "loss": 0.5455, + "step": 12551 + }, + { + "epoch": 34.201634877384194, + "grad_norm": 6.089521884918213, + "learning_rate": 1.5313994516951112e-05, + "loss": 0.2724, + "step": 12552 + }, + { + "epoch": 34.20435967302452, + "grad_norm": 5.61362361907959, + "learning_rate": 1.5313246916190907e-05, + "loss": 0.3512, + "step": 12553 + }, + { + "epoch": 34.20708446866485, + "grad_norm": 6.106107234954834, + "learning_rate": 1.5312499274051303e-05, + "loss": 0.2629, + "step": 12554 + }, + { + "epoch": 34.20980926430518, + "grad_norm": 6.168601036071777, + "learning_rate": 1.531175159053813e-05, + "loss": 0.3591, + "step": 12555 + }, + { + "epoch": 34.212534059945504, + "grad_norm": 6.565435886383057, + "learning_rate": 1.5311003865657204e-05, + "loss": 0.3029, + "step": 12556 + }, + { + "epoch": 34.21525885558583, + "grad_norm": 6.768796443939209, + "learning_rate": 1.531025609941435e-05, + "loss": 0.2982, + "step": 12557 + }, + { + "epoch": 34.217983651226156, + "grad_norm": 9.92309856414795, + "learning_rate": 1.5309508291815395e-05, + "loss": 0.2703, + "step": 12558 + }, + { + "epoch": 34.22070844686648, + "grad_norm": 6.509314060211182, + "learning_rate": 1.530876044286616e-05, + "loss": 0.344, + "step": 12559 + }, + { + "epoch": 34.223433242506815, + "grad_norm": 6.4309234619140625, + "learning_rate": 1.5308012552572466e-05, + "loss": 0.3406, + "step": 12560 + }, + { + "epoch": 34.22615803814714, + "grad_norm": 6.504822731018066, + "learning_rate": 1.5307264620940145e-05, + "loss": 0.3438, + "step": 12561 + }, + { + "epoch": 34.228882833787466, + "grad_norm": 7.467302322387695, + "learning_rate": 1.5306516647975014e-05, + "loss": 0.3404, + "step": 12562 + }, + { + "epoch": 34.23160762942779, + "grad_norm": 7.2365288734436035, + "learning_rate": 1.5305768633682906e-05, + "loss": 0.3845, + "step": 12563 + }, + { + "epoch": 34.23433242506812, + "grad_norm": 6.837965965270996, + "learning_rate": 1.530502057806964e-05, + "loss": 0.2961, + "step": 12564 + }, + { + "epoch": 34.237057220708444, + "grad_norm": 6.4085774421691895, + "learning_rate": 1.5304272481141045e-05, + "loss": 0.1936, + "step": 12565 + }, + { + "epoch": 34.23978201634878, + "grad_norm": 6.5254130363464355, + "learning_rate": 1.5303524342902948e-05, + "loss": 0.2939, + "step": 12566 + }, + { + "epoch": 34.2425068119891, + "grad_norm": 7.245466709136963, + "learning_rate": 1.5302776163361173e-05, + "loss": 0.3392, + "step": 12567 + }, + { + "epoch": 34.24523160762943, + "grad_norm": 11.342859268188477, + "learning_rate": 1.530202794252155e-05, + "loss": 0.4028, + "step": 12568 + }, + { + "epoch": 34.247956403269754, + "grad_norm": 8.174638748168945, + "learning_rate": 1.5301279680389902e-05, + "loss": 0.33, + "step": 12569 + }, + { + "epoch": 34.25068119891008, + "grad_norm": 5.684847354888916, + "learning_rate": 1.530053137697206e-05, + "loss": 0.2464, + "step": 12570 + }, + { + "epoch": 34.253405994550405, + "grad_norm": 5.457337379455566, + "learning_rate": 1.5299783032273848e-05, + "loss": 0.4058, + "step": 12571 + }, + { + "epoch": 34.25613079019074, + "grad_norm": 6.069042205810547, + "learning_rate": 1.5299034646301097e-05, + "loss": 0.2861, + "step": 12572 + }, + { + "epoch": 34.258855585831064, + "grad_norm": 6.74777364730835, + "learning_rate": 1.5298286219059634e-05, + "loss": 0.2883, + "step": 12573 + }, + { + "epoch": 34.26158038147139, + "grad_norm": 6.886902809143066, + "learning_rate": 1.5297537750555286e-05, + "loss": 0.3531, + "step": 12574 + }, + { + "epoch": 34.264305177111716, + "grad_norm": 7.231983184814453, + "learning_rate": 1.529678924079389e-05, + "loss": 0.2516, + "step": 12575 + }, + { + "epoch": 34.26702997275204, + "grad_norm": 8.084550857543945, + "learning_rate": 1.5296040689781267e-05, + "loss": 0.2573, + "step": 12576 + }, + { + "epoch": 34.26975476839237, + "grad_norm": 8.349410057067871, + "learning_rate": 1.529529209752325e-05, + "loss": 0.3591, + "step": 12577 + }, + { + "epoch": 34.2724795640327, + "grad_norm": 5.445027828216553, + "learning_rate": 1.529454346402567e-05, + "loss": 0.3697, + "step": 12578 + }, + { + "epoch": 34.275204359673026, + "grad_norm": 12.19077205657959, + "learning_rate": 1.529379478929436e-05, + "loss": 0.4547, + "step": 12579 + }, + { + "epoch": 34.27792915531335, + "grad_norm": 6.323980808258057, + "learning_rate": 1.5293046073335137e-05, + "loss": 0.352, + "step": 12580 + }, + { + "epoch": 34.28065395095368, + "grad_norm": 7.025436878204346, + "learning_rate": 1.529229731615385e-05, + "loss": 0.293, + "step": 12581 + }, + { + "epoch": 34.283378746594, + "grad_norm": 7.498295783996582, + "learning_rate": 1.529154851775631e-05, + "loss": 0.264, + "step": 12582 + }, + { + "epoch": 34.28610354223433, + "grad_norm": 6.7955780029296875, + "learning_rate": 1.529079967814837e-05, + "loss": 0.3305, + "step": 12583 + }, + { + "epoch": 34.28882833787466, + "grad_norm": 7.907827377319336, + "learning_rate": 1.529005079733585e-05, + "loss": 0.3605, + "step": 12584 + }, + { + "epoch": 34.29155313351499, + "grad_norm": 7.189267158508301, + "learning_rate": 1.528930187532459e-05, + "loss": 0.3698, + "step": 12585 + }, + { + "epoch": 34.294277929155314, + "grad_norm": 8.38147258758545, + "learning_rate": 1.528855291212041e-05, + "loss": 0.435, + "step": 12586 + }, + { + "epoch": 34.29700272479564, + "grad_norm": 6.848021507263184, + "learning_rate": 1.5287803907729154e-05, + "loss": 0.349, + "step": 12587 + }, + { + "epoch": 34.299727520435965, + "grad_norm": 5.953732490539551, + "learning_rate": 1.5287054862156648e-05, + "loss": 0.3755, + "step": 12588 + }, + { + "epoch": 34.30245231607629, + "grad_norm": 6.992973804473877, + "learning_rate": 1.5286305775408732e-05, + "loss": 0.4518, + "step": 12589 + }, + { + "epoch": 34.305177111716624, + "grad_norm": 6.778861999511719, + "learning_rate": 1.5285556647491237e-05, + "loss": 0.3205, + "step": 12590 + }, + { + "epoch": 34.30790190735695, + "grad_norm": 6.7751078605651855, + "learning_rate": 1.5284807478409994e-05, + "loss": 0.2394, + "step": 12591 + }, + { + "epoch": 34.310626702997276, + "grad_norm": 6.508416175842285, + "learning_rate": 1.528405826817084e-05, + "loss": 0.3088, + "step": 12592 + }, + { + "epoch": 34.3133514986376, + "grad_norm": 6.094081878662109, + "learning_rate": 1.5283309016779615e-05, + "loss": 0.3897, + "step": 12593 + }, + { + "epoch": 34.31607629427793, + "grad_norm": 6.154423713684082, + "learning_rate": 1.5282559724242145e-05, + "loss": 0.2567, + "step": 12594 + }, + { + "epoch": 34.31880108991825, + "grad_norm": 6.5120038986206055, + "learning_rate": 1.5281810390564274e-05, + "loss": 0.3162, + "step": 12595 + }, + { + "epoch": 34.321525885558586, + "grad_norm": 6.46196985244751, + "learning_rate": 1.528106101575183e-05, + "loss": 0.3739, + "step": 12596 + }, + { + "epoch": 34.32425068119891, + "grad_norm": 7.718747615814209, + "learning_rate": 1.5280311599810654e-05, + "loss": 0.2753, + "step": 12597 + }, + { + "epoch": 34.32697547683924, + "grad_norm": 5.9966816902160645, + "learning_rate": 1.527956214274658e-05, + "loss": 0.3034, + "step": 12598 + }, + { + "epoch": 34.32970027247956, + "grad_norm": 6.607402801513672, + "learning_rate": 1.527881264456545e-05, + "loss": 0.2888, + "step": 12599 + }, + { + "epoch": 34.33242506811989, + "grad_norm": 6.733821392059326, + "learning_rate": 1.5278063105273094e-05, + "loss": 0.3195, + "step": 12600 + }, + { + "epoch": 34.335149863760215, + "grad_norm": 7.093853950500488, + "learning_rate": 1.527731352487535e-05, + "loss": 0.3503, + "step": 12601 + }, + { + "epoch": 34.33787465940055, + "grad_norm": 6.891481399536133, + "learning_rate": 1.5276563903378064e-05, + "loss": 0.3297, + "step": 12602 + }, + { + "epoch": 34.34059945504087, + "grad_norm": 11.526920318603516, + "learning_rate": 1.5275814240787064e-05, + "loss": 0.3038, + "step": 12603 + }, + { + "epoch": 34.3433242506812, + "grad_norm": 5.182687282562256, + "learning_rate": 1.527506453710819e-05, + "loss": 0.4803, + "step": 12604 + }, + { + "epoch": 34.346049046321525, + "grad_norm": 6.055121421813965, + "learning_rate": 1.527431479234729e-05, + "loss": 0.3439, + "step": 12605 + }, + { + "epoch": 34.34877384196185, + "grad_norm": 7.062063694000244, + "learning_rate": 1.527356500651019e-05, + "loss": 0.4901, + "step": 12606 + }, + { + "epoch": 34.35149863760218, + "grad_norm": 6.244130611419678, + "learning_rate": 1.5272815179602743e-05, + "loss": 0.3791, + "step": 12607 + }, + { + "epoch": 34.35422343324251, + "grad_norm": 7.249322891235352, + "learning_rate": 1.5272065311630773e-05, + "loss": 0.2953, + "step": 12608 + }, + { + "epoch": 34.356948228882835, + "grad_norm": 5.700298309326172, + "learning_rate": 1.5271315402600132e-05, + "loss": 0.2553, + "step": 12609 + }, + { + "epoch": 34.35967302452316, + "grad_norm": 6.6068267822265625, + "learning_rate": 1.5270565452516656e-05, + "loss": 0.3201, + "step": 12610 + }, + { + "epoch": 34.36239782016349, + "grad_norm": 8.201449394226074, + "learning_rate": 1.5269815461386187e-05, + "loss": 0.2877, + "step": 12611 + }, + { + "epoch": 34.36512261580381, + "grad_norm": 5.591947555541992, + "learning_rate": 1.5269065429214563e-05, + "loss": 0.2398, + "step": 12612 + }, + { + "epoch": 34.36784741144414, + "grad_norm": 11.065263748168945, + "learning_rate": 1.5268315356007624e-05, + "loss": 0.2484, + "step": 12613 + }, + { + "epoch": 34.37057220708447, + "grad_norm": 6.8644490242004395, + "learning_rate": 1.526756524177122e-05, + "loss": 0.3565, + "step": 12614 + }, + { + "epoch": 34.3732970027248, + "grad_norm": 8.553791046142578, + "learning_rate": 1.5266815086511187e-05, + "loss": 0.392, + "step": 12615 + }, + { + "epoch": 34.37602179836512, + "grad_norm": 5.286713600158691, + "learning_rate": 1.5266064890233363e-05, + "loss": 0.3876, + "step": 12616 + }, + { + "epoch": 34.37874659400545, + "grad_norm": 5.502371311187744, + "learning_rate": 1.52653146529436e-05, + "loss": 0.2347, + "step": 12617 + }, + { + "epoch": 34.381471389645775, + "grad_norm": 15.500739097595215, + "learning_rate": 1.5264564374647732e-05, + "loss": 0.523, + "step": 12618 + }, + { + "epoch": 34.3841961852861, + "grad_norm": 5.708557605743408, + "learning_rate": 1.526381405535161e-05, + "loss": 0.4802, + "step": 12619 + }, + { + "epoch": 34.38692098092643, + "grad_norm": 7.145052433013916, + "learning_rate": 1.5263063695061072e-05, + "loss": 0.3866, + "step": 12620 + }, + { + "epoch": 34.38964577656676, + "grad_norm": 6.679152488708496, + "learning_rate": 1.526231329378196e-05, + "loss": 0.3762, + "step": 12621 + }, + { + "epoch": 34.392370572207085, + "grad_norm": 6.710231304168701, + "learning_rate": 1.5261562851520127e-05, + "loss": 0.4016, + "step": 12622 + }, + { + "epoch": 34.39509536784741, + "grad_norm": 7.736103534698486, + "learning_rate": 1.526081236828141e-05, + "loss": 0.2979, + "step": 12623 + }, + { + "epoch": 34.39782016348774, + "grad_norm": 5.453094005584717, + "learning_rate": 1.5260061844071655e-05, + "loss": 0.2635, + "step": 12624 + }, + { + "epoch": 34.40054495912806, + "grad_norm": 6.7206292152404785, + "learning_rate": 1.5259311278896706e-05, + "loss": 0.449, + "step": 12625 + }, + { + "epoch": 34.403269754768395, + "grad_norm": 6.7119221687316895, + "learning_rate": 1.525856067276241e-05, + "loss": 0.3656, + "step": 12626 + }, + { + "epoch": 34.40599455040872, + "grad_norm": 7.327425479888916, + "learning_rate": 1.5257810025674613e-05, + "loss": 0.2811, + "step": 12627 + }, + { + "epoch": 34.40871934604905, + "grad_norm": 9.062700271606445, + "learning_rate": 1.5257059337639164e-05, + "loss": 0.3171, + "step": 12628 + }, + { + "epoch": 34.41144414168937, + "grad_norm": 6.503924369812012, + "learning_rate": 1.5256308608661904e-05, + "loss": 0.2482, + "step": 12629 + }, + { + "epoch": 34.4141689373297, + "grad_norm": 7.556908130645752, + "learning_rate": 1.5255557838748683e-05, + "loss": 0.2938, + "step": 12630 + }, + { + "epoch": 34.416893732970024, + "grad_norm": 5.482861042022705, + "learning_rate": 1.5254807027905342e-05, + "loss": 0.2621, + "step": 12631 + }, + { + "epoch": 34.41961852861036, + "grad_norm": 8.334380149841309, + "learning_rate": 1.5254056176137742e-05, + "loss": 0.3419, + "step": 12632 + }, + { + "epoch": 34.42234332425068, + "grad_norm": 8.406848907470703, + "learning_rate": 1.5253305283451714e-05, + "loss": 0.369, + "step": 12633 + }, + { + "epoch": 34.42506811989101, + "grad_norm": 7.206605434417725, + "learning_rate": 1.5252554349853114e-05, + "loss": 0.3595, + "step": 12634 + }, + { + "epoch": 34.427792915531334, + "grad_norm": 5.960251331329346, + "learning_rate": 1.5251803375347792e-05, + "loss": 0.2827, + "step": 12635 + }, + { + "epoch": 34.43051771117166, + "grad_norm": 11.61844253540039, + "learning_rate": 1.5251052359941593e-05, + "loss": 0.4728, + "step": 12636 + }, + { + "epoch": 34.433242506811986, + "grad_norm": 7.506865978240967, + "learning_rate": 1.5250301303640368e-05, + "loss": 0.3216, + "step": 12637 + }, + { + "epoch": 34.43596730245232, + "grad_norm": 11.855709075927734, + "learning_rate": 1.5249550206449968e-05, + "loss": 0.398, + "step": 12638 + }, + { + "epoch": 34.438692098092645, + "grad_norm": 6.202294826507568, + "learning_rate": 1.5248799068376236e-05, + "loss": 0.4269, + "step": 12639 + }, + { + "epoch": 34.44141689373297, + "grad_norm": 7.376853942871094, + "learning_rate": 1.5248047889425026e-05, + "loss": 0.4138, + "step": 12640 + }, + { + "epoch": 34.444141689373296, + "grad_norm": 6.544391632080078, + "learning_rate": 1.5247296669602189e-05, + "loss": 0.3949, + "step": 12641 + }, + { + "epoch": 34.44686648501362, + "grad_norm": 6.126943111419678, + "learning_rate": 1.5246545408913575e-05, + "loss": 0.262, + "step": 12642 + }, + { + "epoch": 34.44959128065395, + "grad_norm": 6.744805812835693, + "learning_rate": 1.5245794107365034e-05, + "loss": 0.308, + "step": 12643 + }, + { + "epoch": 34.45231607629428, + "grad_norm": 8.80776309967041, + "learning_rate": 1.5245042764962416e-05, + "loss": 0.4443, + "step": 12644 + }, + { + "epoch": 34.45504087193461, + "grad_norm": 6.651944637298584, + "learning_rate": 1.5244291381711574e-05, + "loss": 0.2739, + "step": 12645 + }, + { + "epoch": 34.45776566757493, + "grad_norm": 6.812028884887695, + "learning_rate": 1.5243539957618363e-05, + "loss": 0.4237, + "step": 12646 + }, + { + "epoch": 34.46049046321526, + "grad_norm": 12.600976943969727, + "learning_rate": 1.5242788492688628e-05, + "loss": 0.4821, + "step": 12647 + }, + { + "epoch": 34.463215258855584, + "grad_norm": 21.884811401367188, + "learning_rate": 1.5242036986928225e-05, + "loss": 0.3579, + "step": 12648 + }, + { + "epoch": 34.46594005449591, + "grad_norm": 7.988901615142822, + "learning_rate": 1.5241285440343008e-05, + "loss": 0.3257, + "step": 12649 + }, + { + "epoch": 34.46866485013624, + "grad_norm": 7.309326171875, + "learning_rate": 1.524053385293883e-05, + "loss": 0.3538, + "step": 12650 + }, + { + "epoch": 34.47138964577657, + "grad_norm": 8.580944061279297, + "learning_rate": 1.5239782224721537e-05, + "loss": 0.4138, + "step": 12651 + }, + { + "epoch": 34.474114441416894, + "grad_norm": 7.301868438720703, + "learning_rate": 1.5239030555696995e-05, + "loss": 0.2907, + "step": 12652 + }, + { + "epoch": 34.47683923705722, + "grad_norm": 16.115550994873047, + "learning_rate": 1.5238278845871048e-05, + "loss": 0.4512, + "step": 12653 + }, + { + "epoch": 34.479564032697546, + "grad_norm": 6.847012996673584, + "learning_rate": 1.5237527095249558e-05, + "loss": 0.3115, + "step": 12654 + }, + { + "epoch": 34.48228882833787, + "grad_norm": 11.58302116394043, + "learning_rate": 1.5236775303838371e-05, + "loss": 0.3449, + "step": 12655 + }, + { + "epoch": 34.485013623978205, + "grad_norm": 10.742802619934082, + "learning_rate": 1.5236023471643352e-05, + "loss": 0.2906, + "step": 12656 + }, + { + "epoch": 34.48773841961853, + "grad_norm": 7.742465972900391, + "learning_rate": 1.5235271598670345e-05, + "loss": 0.5452, + "step": 12657 + }, + { + "epoch": 34.490463215258856, + "grad_norm": 7.01248025894165, + "learning_rate": 1.5234519684925215e-05, + "loss": 0.3445, + "step": 12658 + }, + { + "epoch": 34.49318801089918, + "grad_norm": 11.43049144744873, + "learning_rate": 1.5233767730413811e-05, + "loss": 0.261, + "step": 12659 + }, + { + "epoch": 34.49591280653951, + "grad_norm": 6.926109313964844, + "learning_rate": 1.5233015735141995e-05, + "loss": 0.3703, + "step": 12660 + }, + { + "epoch": 34.49863760217983, + "grad_norm": 6.705916881561279, + "learning_rate": 1.5232263699115616e-05, + "loss": 0.4207, + "step": 12661 + }, + { + "epoch": 34.50136239782017, + "grad_norm": 6.926370620727539, + "learning_rate": 1.5231511622340543e-05, + "loss": 0.2558, + "step": 12662 + }, + { + "epoch": 34.50408719346049, + "grad_norm": 7.000466823577881, + "learning_rate": 1.523075950482262e-05, + "loss": 0.4001, + "step": 12663 + }, + { + "epoch": 34.50681198910082, + "grad_norm": 7.390921592712402, + "learning_rate": 1.5230007346567717e-05, + "loss": 0.2559, + "step": 12664 + }, + { + "epoch": 34.509536784741144, + "grad_norm": 7.2458343505859375, + "learning_rate": 1.5229255147581678e-05, + "loss": 0.5916, + "step": 12665 + }, + { + "epoch": 34.51226158038147, + "grad_norm": 7.20648717880249, + "learning_rate": 1.5228502907870373e-05, + "loss": 0.375, + "step": 12666 + }, + { + "epoch": 34.514986376021795, + "grad_norm": 13.891578674316406, + "learning_rate": 1.5227750627439652e-05, + "loss": 0.5149, + "step": 12667 + }, + { + "epoch": 34.51771117166213, + "grad_norm": 8.530945777893066, + "learning_rate": 1.522699830629538e-05, + "loss": 0.4329, + "step": 12668 + }, + { + "epoch": 34.520435967302454, + "grad_norm": 6.637569427490234, + "learning_rate": 1.522624594444341e-05, + "loss": 0.3663, + "step": 12669 + }, + { + "epoch": 34.52316076294278, + "grad_norm": 9.173357963562012, + "learning_rate": 1.5225493541889609e-05, + "loss": 0.3019, + "step": 12670 + }, + { + "epoch": 34.525885558583106, + "grad_norm": 10.640692710876465, + "learning_rate": 1.522474109863983e-05, + "loss": 0.3535, + "step": 12671 + }, + { + "epoch": 34.52861035422343, + "grad_norm": 8.41413688659668, + "learning_rate": 1.5223988614699939e-05, + "loss": 0.4613, + "step": 12672 + }, + { + "epoch": 34.53133514986376, + "grad_norm": 8.539817810058594, + "learning_rate": 1.5223236090075788e-05, + "loss": 0.3545, + "step": 12673 + }, + { + "epoch": 34.53405994550409, + "grad_norm": 6.650314807891846, + "learning_rate": 1.5222483524773246e-05, + "loss": 0.4908, + "step": 12674 + }, + { + "epoch": 34.536784741144416, + "grad_norm": 7.6259331703186035, + "learning_rate": 1.5221730918798168e-05, + "loss": 0.4193, + "step": 12675 + }, + { + "epoch": 34.53950953678474, + "grad_norm": 7.47517204284668, + "learning_rate": 1.522097827215642e-05, + "loss": 0.312, + "step": 12676 + }, + { + "epoch": 34.54223433242507, + "grad_norm": 8.829288482666016, + "learning_rate": 1.5220225584853858e-05, + "loss": 0.419, + "step": 12677 + }, + { + "epoch": 34.54495912806539, + "grad_norm": 6.424598217010498, + "learning_rate": 1.5219472856896348e-05, + "loss": 0.2655, + "step": 12678 + }, + { + "epoch": 34.54768392370572, + "grad_norm": 7.619609355926514, + "learning_rate": 1.5218720088289753e-05, + "loss": 0.2967, + "step": 12679 + }, + { + "epoch": 34.55040871934605, + "grad_norm": 5.812038898468018, + "learning_rate": 1.5217967279039933e-05, + "loss": 0.4395, + "step": 12680 + }, + { + "epoch": 34.55313351498638, + "grad_norm": 7.461119174957275, + "learning_rate": 1.5217214429152752e-05, + "loss": 0.3044, + "step": 12681 + }, + { + "epoch": 34.555858310626704, + "grad_norm": 6.197144031524658, + "learning_rate": 1.5216461538634076e-05, + "loss": 0.3132, + "step": 12682 + }, + { + "epoch": 34.55858310626703, + "grad_norm": 7.825538158416748, + "learning_rate": 1.521570860748976e-05, + "loss": 0.3924, + "step": 12683 + }, + { + "epoch": 34.561307901907355, + "grad_norm": 8.52588176727295, + "learning_rate": 1.5214955635725677e-05, + "loss": 0.5195, + "step": 12684 + }, + { + "epoch": 34.56403269754768, + "grad_norm": 7.078782081604004, + "learning_rate": 1.5214202623347687e-05, + "loss": 0.2614, + "step": 12685 + }, + { + "epoch": 34.566757493188014, + "grad_norm": 7.565918922424316, + "learning_rate": 1.521344957036165e-05, + "loss": 0.3388, + "step": 12686 + }, + { + "epoch": 34.56948228882834, + "grad_norm": 6.790742874145508, + "learning_rate": 1.5212696476773441e-05, + "loss": 0.2745, + "step": 12687 + }, + { + "epoch": 34.572207084468666, + "grad_norm": 8.860798835754395, + "learning_rate": 1.5211943342588918e-05, + "loss": 0.4206, + "step": 12688 + }, + { + "epoch": 34.57493188010899, + "grad_norm": 9.137691497802734, + "learning_rate": 1.521119016781395e-05, + "loss": 0.4454, + "step": 12689 + }, + { + "epoch": 34.57765667574932, + "grad_norm": 12.674605369567871, + "learning_rate": 1.5210436952454398e-05, + "loss": 0.4881, + "step": 12690 + }, + { + "epoch": 34.58038147138964, + "grad_norm": 6.639235019683838, + "learning_rate": 1.5209683696516129e-05, + "loss": 0.2416, + "step": 12691 + }, + { + "epoch": 34.583106267029976, + "grad_norm": 8.917923927307129, + "learning_rate": 1.5208930400005016e-05, + "loss": 0.3309, + "step": 12692 + }, + { + "epoch": 34.5858310626703, + "grad_norm": 9.904099464416504, + "learning_rate": 1.5208177062926916e-05, + "loss": 0.2929, + "step": 12693 + }, + { + "epoch": 34.58855585831063, + "grad_norm": 7.763059616088867, + "learning_rate": 1.5207423685287704e-05, + "loss": 0.3746, + "step": 12694 + }, + { + "epoch": 34.59128065395095, + "grad_norm": 6.761361122131348, + "learning_rate": 1.5206670267093242e-05, + "loss": 0.2741, + "step": 12695 + }, + { + "epoch": 34.59400544959128, + "grad_norm": 10.17188835144043, + "learning_rate": 1.5205916808349401e-05, + "loss": 0.2814, + "step": 12696 + }, + { + "epoch": 34.596730245231605, + "grad_norm": 7.0764594078063965, + "learning_rate": 1.5205163309062048e-05, + "loss": 0.3881, + "step": 12697 + }, + { + "epoch": 34.59945504087194, + "grad_norm": 8.067386627197266, + "learning_rate": 1.5204409769237048e-05, + "loss": 0.3437, + "step": 12698 + }, + { + "epoch": 34.60217983651226, + "grad_norm": 11.958366394042969, + "learning_rate": 1.5203656188880276e-05, + "loss": 0.3264, + "step": 12699 + }, + { + "epoch": 34.60490463215259, + "grad_norm": 6.704128742218018, + "learning_rate": 1.5202902567997592e-05, + "loss": 0.3314, + "step": 12700 + }, + { + "epoch": 34.607629427792915, + "grad_norm": 7.999274730682373, + "learning_rate": 1.5202148906594874e-05, + "loss": 0.3633, + "step": 12701 + }, + { + "epoch": 34.61035422343324, + "grad_norm": 10.331748962402344, + "learning_rate": 1.5201395204677986e-05, + "loss": 0.4229, + "step": 12702 + }, + { + "epoch": 34.61307901907357, + "grad_norm": 5.908962726593018, + "learning_rate": 1.5200641462252802e-05, + "loss": 0.242, + "step": 12703 + }, + { + "epoch": 34.6158038147139, + "grad_norm": 9.226425170898438, + "learning_rate": 1.5199887679325185e-05, + "loss": 0.3636, + "step": 12704 + }, + { + "epoch": 34.618528610354225, + "grad_norm": 8.724287986755371, + "learning_rate": 1.5199133855901013e-05, + "loss": 0.3567, + "step": 12705 + }, + { + "epoch": 34.62125340599455, + "grad_norm": 9.33549976348877, + "learning_rate": 1.5198379991986154e-05, + "loss": 0.5277, + "step": 12706 + }, + { + "epoch": 34.62397820163488, + "grad_norm": 7.487105369567871, + "learning_rate": 1.519762608758648e-05, + "loss": 0.4089, + "step": 12707 + }, + { + "epoch": 34.6267029972752, + "grad_norm": 6.3186750411987305, + "learning_rate": 1.5196872142707859e-05, + "loss": 0.2189, + "step": 12708 + }, + { + "epoch": 34.62942779291553, + "grad_norm": 13.810160636901855, + "learning_rate": 1.5196118157356168e-05, + "loss": 0.4644, + "step": 12709 + }, + { + "epoch": 34.63215258855586, + "grad_norm": 7.9806413650512695, + "learning_rate": 1.5195364131537273e-05, + "loss": 0.363, + "step": 12710 + }, + { + "epoch": 34.63487738419619, + "grad_norm": 7.039987564086914, + "learning_rate": 1.5194610065257052e-05, + "loss": 0.3934, + "step": 12711 + }, + { + "epoch": 34.63760217983651, + "grad_norm": 6.936146259307861, + "learning_rate": 1.519385595852137e-05, + "loss": 0.3399, + "step": 12712 + }, + { + "epoch": 34.64032697547684, + "grad_norm": 6.270376205444336, + "learning_rate": 1.519310181133611e-05, + "loss": 0.4134, + "step": 12713 + }, + { + "epoch": 34.643051771117165, + "grad_norm": 7.317523956298828, + "learning_rate": 1.5192347623707138e-05, + "loss": 0.4918, + "step": 12714 + }, + { + "epoch": 34.64577656675749, + "grad_norm": 7.332164764404297, + "learning_rate": 1.5191593395640331e-05, + "loss": 0.331, + "step": 12715 + }, + { + "epoch": 34.64850136239782, + "grad_norm": 6.766537189483643, + "learning_rate": 1.5190839127141562e-05, + "loss": 0.5164, + "step": 12716 + }, + { + "epoch": 34.65122615803815, + "grad_norm": 8.445927619934082, + "learning_rate": 1.5190084818216705e-05, + "loss": 0.3835, + "step": 12717 + }, + { + "epoch": 34.653950953678475, + "grad_norm": 7.979760646820068, + "learning_rate": 1.5189330468871633e-05, + "loss": 0.2907, + "step": 12718 + }, + { + "epoch": 34.6566757493188, + "grad_norm": 10.70372486114502, + "learning_rate": 1.5188576079112225e-05, + "loss": 0.3962, + "step": 12719 + }, + { + "epoch": 34.65940054495913, + "grad_norm": 11.06981086730957, + "learning_rate": 1.5187821648944348e-05, + "loss": 0.2766, + "step": 12720 + }, + { + "epoch": 34.66212534059945, + "grad_norm": 6.434134483337402, + "learning_rate": 1.5187067178373887e-05, + "loss": 0.3264, + "step": 12721 + }, + { + "epoch": 34.664850136239785, + "grad_norm": 7.828649044036865, + "learning_rate": 1.5186312667406712e-05, + "loss": 0.3538, + "step": 12722 + }, + { + "epoch": 34.66757493188011, + "grad_norm": 6.914149761199951, + "learning_rate": 1.5185558116048704e-05, + "loss": 0.2717, + "step": 12723 + }, + { + "epoch": 34.67029972752044, + "grad_norm": 12.35200309753418, + "learning_rate": 1.5184803524305733e-05, + "loss": 0.2907, + "step": 12724 + }, + { + "epoch": 34.67302452316076, + "grad_norm": 9.508199691772461, + "learning_rate": 1.5184048892183683e-05, + "loss": 0.2726, + "step": 12725 + }, + { + "epoch": 34.67574931880109, + "grad_norm": 7.7572712898254395, + "learning_rate": 1.5183294219688423e-05, + "loss": 0.2978, + "step": 12726 + }, + { + "epoch": 34.678474114441414, + "grad_norm": 5.914263725280762, + "learning_rate": 1.5182539506825837e-05, + "loss": 0.3403, + "step": 12727 + }, + { + "epoch": 34.68119891008175, + "grad_norm": 7.788616180419922, + "learning_rate": 1.5181784753601797e-05, + "loss": 0.4465, + "step": 12728 + }, + { + "epoch": 34.68392370572207, + "grad_norm": 5.874246120452881, + "learning_rate": 1.5181029960022187e-05, + "loss": 0.3644, + "step": 12729 + }, + { + "epoch": 34.6866485013624, + "grad_norm": 11.232590675354004, + "learning_rate": 1.518027512609288e-05, + "loss": 0.3675, + "step": 12730 + }, + { + "epoch": 34.689373297002724, + "grad_norm": 6.877134323120117, + "learning_rate": 1.5179520251819758e-05, + "loss": 0.2774, + "step": 12731 + }, + { + "epoch": 34.69209809264305, + "grad_norm": 22.318862915039062, + "learning_rate": 1.51787653372087e-05, + "loss": 0.3995, + "step": 12732 + }, + { + "epoch": 34.694822888283376, + "grad_norm": 6.460038185119629, + "learning_rate": 1.5178010382265586e-05, + "loss": 0.2565, + "step": 12733 + }, + { + "epoch": 34.69754768392371, + "grad_norm": 7.191373825073242, + "learning_rate": 1.517725538699629e-05, + "loss": 0.3623, + "step": 12734 + }, + { + "epoch": 34.700272479564035, + "grad_norm": 6.409982681274414, + "learning_rate": 1.51765003514067e-05, + "loss": 0.3607, + "step": 12735 + }, + { + "epoch": 34.70299727520436, + "grad_norm": 6.087721347808838, + "learning_rate": 1.5175745275502686e-05, + "loss": 0.3006, + "step": 12736 + }, + { + "epoch": 34.705722070844686, + "grad_norm": 16.11115264892578, + "learning_rate": 1.5174990159290137e-05, + "loss": 0.3904, + "step": 12737 + }, + { + "epoch": 34.70844686648501, + "grad_norm": 8.521676063537598, + "learning_rate": 1.5174235002774933e-05, + "loss": 0.4363, + "step": 12738 + }, + { + "epoch": 34.71117166212534, + "grad_norm": 7.016096591949463, + "learning_rate": 1.5173479805962954e-05, + "loss": 0.2871, + "step": 12739 + }, + { + "epoch": 34.71389645776567, + "grad_norm": 8.119922637939453, + "learning_rate": 1.5172724568860075e-05, + "loss": 0.4052, + "step": 12740 + }, + { + "epoch": 34.716621253406, + "grad_norm": 10.564770698547363, + "learning_rate": 1.517196929147219e-05, + "loss": 0.351, + "step": 12741 + }, + { + "epoch": 34.71934604904632, + "grad_norm": 5.689218521118164, + "learning_rate": 1.517121397380517e-05, + "loss": 0.3754, + "step": 12742 + }, + { + "epoch": 34.72207084468665, + "grad_norm": 7.102179050445557, + "learning_rate": 1.5170458615864906e-05, + "loss": 0.4146, + "step": 12743 + }, + { + "epoch": 34.724795640326974, + "grad_norm": 7.624054908752441, + "learning_rate": 1.5169703217657274e-05, + "loss": 0.4538, + "step": 12744 + }, + { + "epoch": 34.7275204359673, + "grad_norm": 8.589566230773926, + "learning_rate": 1.5168947779188163e-05, + "loss": 0.5319, + "step": 12745 + }, + { + "epoch": 34.73024523160763, + "grad_norm": 6.940329074859619, + "learning_rate": 1.5168192300463447e-05, + "loss": 0.3917, + "step": 12746 + }, + { + "epoch": 34.73297002724796, + "grad_norm": 6.856508731842041, + "learning_rate": 1.516743678148902e-05, + "loss": 0.4256, + "step": 12747 + }, + { + "epoch": 34.735694822888284, + "grad_norm": 6.467329978942871, + "learning_rate": 1.516668122227076e-05, + "loss": 0.3243, + "step": 12748 + }, + { + "epoch": 34.73841961852861, + "grad_norm": 12.759373664855957, + "learning_rate": 1.5165925622814554e-05, + "loss": 0.241, + "step": 12749 + }, + { + "epoch": 34.741144414168936, + "grad_norm": 6.045810222625732, + "learning_rate": 1.5165169983126287e-05, + "loss": 0.2975, + "step": 12750 + }, + { + "epoch": 34.74386920980926, + "grad_norm": 25.1729736328125, + "learning_rate": 1.516441430321184e-05, + "loss": 0.3225, + "step": 12751 + }, + { + "epoch": 34.746594005449595, + "grad_norm": 7.094336032867432, + "learning_rate": 1.5163658583077103e-05, + "loss": 0.2514, + "step": 12752 + }, + { + "epoch": 34.74931880108992, + "grad_norm": 12.75036334991455, + "learning_rate": 1.5162902822727956e-05, + "loss": 0.3227, + "step": 12753 + }, + { + "epoch": 34.752043596730246, + "grad_norm": 9.665423393249512, + "learning_rate": 1.5162147022170288e-05, + "loss": 0.3798, + "step": 12754 + }, + { + "epoch": 34.75476839237057, + "grad_norm": 8.1179838180542, + "learning_rate": 1.5161391181409987e-05, + "loss": 0.3344, + "step": 12755 + }, + { + "epoch": 34.7574931880109, + "grad_norm": 25.28486442565918, + "learning_rate": 1.5160635300452936e-05, + "loss": 0.3, + "step": 12756 + }, + { + "epoch": 34.76021798365122, + "grad_norm": 8.724785804748535, + "learning_rate": 1.5159879379305028e-05, + "loss": 0.3551, + "step": 12757 + }, + { + "epoch": 34.762942779291556, + "grad_norm": 7.74306058883667, + "learning_rate": 1.515912341797214e-05, + "loss": 0.3218, + "step": 12758 + }, + { + "epoch": 34.76566757493188, + "grad_norm": 7.537326335906982, + "learning_rate": 1.515836741646017e-05, + "loss": 0.3193, + "step": 12759 + }, + { + "epoch": 34.76839237057221, + "grad_norm": 6.181797504425049, + "learning_rate": 1.5157611374774997e-05, + "loss": 0.4611, + "step": 12760 + }, + { + "epoch": 34.771117166212534, + "grad_norm": 7.308982849121094, + "learning_rate": 1.5156855292922512e-05, + "loss": 0.29, + "step": 12761 + }, + { + "epoch": 34.77384196185286, + "grad_norm": 9.729423522949219, + "learning_rate": 1.5156099170908605e-05, + "loss": 0.4969, + "step": 12762 + }, + { + "epoch": 34.776566757493185, + "grad_norm": 7.62312650680542, + "learning_rate": 1.5155343008739162e-05, + "loss": 0.3237, + "step": 12763 + }, + { + "epoch": 34.77929155313352, + "grad_norm": 7.187760353088379, + "learning_rate": 1.5154586806420078e-05, + "loss": 0.3556, + "step": 12764 + }, + { + "epoch": 34.782016348773844, + "grad_norm": 7.4792561531066895, + "learning_rate": 1.5153830563957232e-05, + "loss": 0.4765, + "step": 12765 + }, + { + "epoch": 34.78474114441417, + "grad_norm": 8.713623046875, + "learning_rate": 1.5153074281356523e-05, + "loss": 0.3162, + "step": 12766 + }, + { + "epoch": 34.787465940054496, + "grad_norm": 6.846462726593018, + "learning_rate": 1.5152317958623836e-05, + "loss": 0.3005, + "step": 12767 + }, + { + "epoch": 34.79019073569482, + "grad_norm": 7.01962423324585, + "learning_rate": 1.5151561595765066e-05, + "loss": 0.267, + "step": 12768 + }, + { + "epoch": 34.79291553133515, + "grad_norm": 8.18949031829834, + "learning_rate": 1.5150805192786097e-05, + "loss": 0.297, + "step": 12769 + }, + { + "epoch": 34.79564032697548, + "grad_norm": 7.413372039794922, + "learning_rate": 1.5150048749692822e-05, + "loss": 0.3751, + "step": 12770 + }, + { + "epoch": 34.798365122615806, + "grad_norm": 10.343478202819824, + "learning_rate": 1.5149292266491133e-05, + "loss": 0.3061, + "step": 12771 + }, + { + "epoch": 34.80108991825613, + "grad_norm": 6.774062633514404, + "learning_rate": 1.5148535743186928e-05, + "loss": 0.498, + "step": 12772 + }, + { + "epoch": 34.80381471389646, + "grad_norm": 6.852293491363525, + "learning_rate": 1.5147779179786084e-05, + "loss": 0.3989, + "step": 12773 + }, + { + "epoch": 34.80653950953678, + "grad_norm": 21.525096893310547, + "learning_rate": 1.5147022576294506e-05, + "loss": 0.4672, + "step": 12774 + }, + { + "epoch": 34.80926430517711, + "grad_norm": 9.819718360900879, + "learning_rate": 1.514626593271808e-05, + "loss": 0.3227, + "step": 12775 + }, + { + "epoch": 34.81198910081744, + "grad_norm": 7.6693572998046875, + "learning_rate": 1.5145509249062702e-05, + "loss": 0.2576, + "step": 12776 + }, + { + "epoch": 34.81471389645777, + "grad_norm": 6.69463586807251, + "learning_rate": 1.5144752525334264e-05, + "loss": 0.3507, + "step": 12777 + }, + { + "epoch": 34.817438692098094, + "grad_norm": 8.588858604431152, + "learning_rate": 1.5143995761538657e-05, + "loss": 0.4889, + "step": 12778 + }, + { + "epoch": 34.82016348773842, + "grad_norm": 10.772705078125, + "learning_rate": 1.5143238957681776e-05, + "loss": 0.3785, + "step": 12779 + }, + { + "epoch": 34.822888283378745, + "grad_norm": 6.9552154541015625, + "learning_rate": 1.5142482113769519e-05, + "loss": 0.4968, + "step": 12780 + }, + { + "epoch": 34.82561307901907, + "grad_norm": 6.593571662902832, + "learning_rate": 1.5141725229807773e-05, + "loss": 0.3855, + "step": 12781 + }, + { + "epoch": 34.828337874659404, + "grad_norm": 7.897350311279297, + "learning_rate": 1.5140968305802438e-05, + "loss": 0.2631, + "step": 12782 + }, + { + "epoch": 34.83106267029973, + "grad_norm": 7.923161506652832, + "learning_rate": 1.5140211341759408e-05, + "loss": 0.287, + "step": 12783 + }, + { + "epoch": 34.833787465940055, + "grad_norm": 7.426450729370117, + "learning_rate": 1.5139454337684577e-05, + "loss": 0.3377, + "step": 12784 + }, + { + "epoch": 34.83651226158038, + "grad_norm": 7.1171088218688965, + "learning_rate": 1.5138697293583842e-05, + "loss": 0.3357, + "step": 12785 + }, + { + "epoch": 34.83923705722071, + "grad_norm": 8.326007843017578, + "learning_rate": 1.5137940209463095e-05, + "loss": 0.3349, + "step": 12786 + }, + { + "epoch": 34.84196185286103, + "grad_norm": 6.74309778213501, + "learning_rate": 1.5137183085328237e-05, + "loss": 0.3382, + "step": 12787 + }, + { + "epoch": 34.844686648501366, + "grad_norm": 7.596869468688965, + "learning_rate": 1.5136425921185162e-05, + "loss": 0.4407, + "step": 12788 + }, + { + "epoch": 34.84741144414169, + "grad_norm": 9.84290885925293, + "learning_rate": 1.5135668717039767e-05, + "loss": 0.4174, + "step": 12789 + }, + { + "epoch": 34.85013623978202, + "grad_norm": 8.881937980651855, + "learning_rate": 1.513491147289795e-05, + "loss": 0.3128, + "step": 12790 + }, + { + "epoch": 34.85286103542234, + "grad_norm": 7.489529609680176, + "learning_rate": 1.5134154188765608e-05, + "loss": 0.2996, + "step": 12791 + }, + { + "epoch": 34.85558583106267, + "grad_norm": 5.962601661682129, + "learning_rate": 1.513339686464864e-05, + "loss": 0.2526, + "step": 12792 + }, + { + "epoch": 34.858310626702995, + "grad_norm": 5.978816509246826, + "learning_rate": 1.513263950055294e-05, + "loss": 0.3769, + "step": 12793 + }, + { + "epoch": 34.86103542234333, + "grad_norm": 7.779540538787842, + "learning_rate": 1.5131882096484409e-05, + "loss": 0.3186, + "step": 12794 + }, + { + "epoch": 34.86376021798365, + "grad_norm": 9.456623077392578, + "learning_rate": 1.5131124652448943e-05, + "loss": 0.3513, + "step": 12795 + }, + { + "epoch": 34.86648501362398, + "grad_norm": 7.130842208862305, + "learning_rate": 1.5130367168452449e-05, + "loss": 0.4387, + "step": 12796 + }, + { + "epoch": 34.869209809264305, + "grad_norm": 6.189455986022949, + "learning_rate": 1.5129609644500813e-05, + "loss": 0.4162, + "step": 12797 + }, + { + "epoch": 34.87193460490463, + "grad_norm": 7.358476161956787, + "learning_rate": 1.5128852080599949e-05, + "loss": 0.2995, + "step": 12798 + }, + { + "epoch": 34.87465940054496, + "grad_norm": 6.125901222229004, + "learning_rate": 1.5128094476755747e-05, + "loss": 0.457, + "step": 12799 + }, + { + "epoch": 34.87738419618529, + "grad_norm": 5.849795818328857, + "learning_rate": 1.5127336832974111e-05, + "loss": 0.4403, + "step": 12800 + }, + { + "epoch": 34.880108991825615, + "grad_norm": 6.29843807220459, + "learning_rate": 1.512657914926094e-05, + "loss": 0.2894, + "step": 12801 + }, + { + "epoch": 34.88283378746594, + "grad_norm": 7.504866600036621, + "learning_rate": 1.5125821425622137e-05, + "loss": 0.4162, + "step": 12802 + }, + { + "epoch": 34.88555858310627, + "grad_norm": 7.649609565734863, + "learning_rate": 1.5125063662063602e-05, + "loss": 0.5047, + "step": 12803 + }, + { + "epoch": 34.88828337874659, + "grad_norm": 6.444530010223389, + "learning_rate": 1.5124305858591238e-05, + "loss": 0.4594, + "step": 12804 + }, + { + "epoch": 34.89100817438692, + "grad_norm": 9.201496124267578, + "learning_rate": 1.5123548015210941e-05, + "loss": 0.315, + "step": 12805 + }, + { + "epoch": 34.89373297002725, + "grad_norm": 9.123472213745117, + "learning_rate": 1.5122790131928615e-05, + "loss": 0.3701, + "step": 12806 + }, + { + "epoch": 34.89645776566758, + "grad_norm": 7.393870830535889, + "learning_rate": 1.5122032208750168e-05, + "loss": 0.3359, + "step": 12807 + }, + { + "epoch": 34.8991825613079, + "grad_norm": 8.265925407409668, + "learning_rate": 1.51212742456815e-05, + "loss": 0.3147, + "step": 12808 + }, + { + "epoch": 34.90190735694823, + "grad_norm": 6.999871253967285, + "learning_rate": 1.5120516242728508e-05, + "loss": 0.3462, + "step": 12809 + }, + { + "epoch": 34.904632152588555, + "grad_norm": 9.759187698364258, + "learning_rate": 1.5119758199897106e-05, + "loss": 0.4647, + "step": 12810 + }, + { + "epoch": 34.90735694822888, + "grad_norm": 12.058571815490723, + "learning_rate": 1.511900011719319e-05, + "loss": 0.4572, + "step": 12811 + }, + { + "epoch": 34.91008174386921, + "grad_norm": 5.392372131347656, + "learning_rate": 1.5118241994622666e-05, + "loss": 0.3235, + "step": 12812 + }, + { + "epoch": 34.91280653950954, + "grad_norm": 6.347375869750977, + "learning_rate": 1.5117483832191438e-05, + "loss": 0.2578, + "step": 12813 + }, + { + "epoch": 34.915531335149865, + "grad_norm": 5.794153690338135, + "learning_rate": 1.5116725629905408e-05, + "loss": 0.4393, + "step": 12814 + }, + { + "epoch": 34.91825613079019, + "grad_norm": 7.6299028396606445, + "learning_rate": 1.5115967387770484e-05, + "loss": 0.2598, + "step": 12815 + }, + { + "epoch": 34.920980926430516, + "grad_norm": 6.074033260345459, + "learning_rate": 1.5115209105792574e-05, + "loss": 0.2385, + "step": 12816 + }, + { + "epoch": 34.92370572207084, + "grad_norm": 7.3379411697387695, + "learning_rate": 1.5114450783977579e-05, + "loss": 0.4849, + "step": 12817 + }, + { + "epoch": 34.926430517711175, + "grad_norm": 8.817684173583984, + "learning_rate": 1.5113692422331406e-05, + "loss": 0.446, + "step": 12818 + }, + { + "epoch": 34.9291553133515, + "grad_norm": 6.351326942443848, + "learning_rate": 1.511293402085996e-05, + "loss": 0.4822, + "step": 12819 + }, + { + "epoch": 34.93188010899183, + "grad_norm": 14.489463806152344, + "learning_rate": 1.5112175579569149e-05, + "loss": 0.3636, + "step": 12820 + }, + { + "epoch": 34.93460490463215, + "grad_norm": 7.836480617523193, + "learning_rate": 1.5111417098464879e-05, + "loss": 0.3438, + "step": 12821 + }, + { + "epoch": 34.93732970027248, + "grad_norm": 7.352789878845215, + "learning_rate": 1.5110658577553058e-05, + "loss": 0.5103, + "step": 12822 + }, + { + "epoch": 34.940054495912804, + "grad_norm": 6.39596700668335, + "learning_rate": 1.510990001683959e-05, + "loss": 0.2738, + "step": 12823 + }, + { + "epoch": 34.94277929155314, + "grad_norm": 6.166970729827881, + "learning_rate": 1.5109141416330386e-05, + "loss": 0.3428, + "step": 12824 + }, + { + "epoch": 34.94550408719346, + "grad_norm": 5.944089889526367, + "learning_rate": 1.5108382776031354e-05, + "loss": 0.4155, + "step": 12825 + }, + { + "epoch": 34.94822888283379, + "grad_norm": 6.506803512573242, + "learning_rate": 1.51076240959484e-05, + "loss": 0.294, + "step": 12826 + }, + { + "epoch": 34.950953678474114, + "grad_norm": 7.878262519836426, + "learning_rate": 1.5106865376087437e-05, + "loss": 0.4139, + "step": 12827 + }, + { + "epoch": 34.95367847411444, + "grad_norm": 7.29544734954834, + "learning_rate": 1.5106106616454371e-05, + "loss": 0.3418, + "step": 12828 + }, + { + "epoch": 34.956403269754766, + "grad_norm": 6.37436580657959, + "learning_rate": 1.5105347817055106e-05, + "loss": 0.3661, + "step": 12829 + }, + { + "epoch": 34.95912806539509, + "grad_norm": 6.1794633865356445, + "learning_rate": 1.510458897789556e-05, + "loss": 0.434, + "step": 12830 + }, + { + "epoch": 34.961852861035425, + "grad_norm": 7.422924518585205, + "learning_rate": 1.5103830098981637e-05, + "loss": 0.3311, + "step": 12831 + }, + { + "epoch": 34.96457765667575, + "grad_norm": 6.644876480102539, + "learning_rate": 1.5103071180319254e-05, + "loss": 0.337, + "step": 12832 + }, + { + "epoch": 34.967302452316076, + "grad_norm": 7.06466007232666, + "learning_rate": 1.510231222191431e-05, + "loss": 0.3248, + "step": 12833 + }, + { + "epoch": 34.9700272479564, + "grad_norm": 6.119283676147461, + "learning_rate": 1.5101553223772728e-05, + "loss": 0.2797, + "step": 12834 + }, + { + "epoch": 34.97275204359673, + "grad_norm": 8.348386764526367, + "learning_rate": 1.5100794185900411e-05, + "loss": 0.3005, + "step": 12835 + }, + { + "epoch": 34.97547683923706, + "grad_norm": 6.874670505523682, + "learning_rate": 1.5100035108303278e-05, + "loss": 0.4833, + "step": 12836 + }, + { + "epoch": 34.97820163487739, + "grad_norm": 6.618953227996826, + "learning_rate": 1.509927599098723e-05, + "loss": 0.2442, + "step": 12837 + }, + { + "epoch": 34.98092643051771, + "grad_norm": 10.766705513000488, + "learning_rate": 1.5098516833958187e-05, + "loss": 0.3206, + "step": 12838 + }, + { + "epoch": 34.98365122615804, + "grad_norm": 9.001296997070312, + "learning_rate": 1.509775763722206e-05, + "loss": 0.4433, + "step": 12839 + }, + { + "epoch": 34.986376021798364, + "grad_norm": 8.988316535949707, + "learning_rate": 1.5096998400784756e-05, + "loss": 0.4554, + "step": 12840 + }, + { + "epoch": 34.98910081743869, + "grad_norm": 6.756176948547363, + "learning_rate": 1.5096239124652197e-05, + "loss": 0.2471, + "step": 12841 + }, + { + "epoch": 34.991825613079016, + "grad_norm": 7.477931022644043, + "learning_rate": 1.5095479808830292e-05, + "loss": 0.7057, + "step": 12842 + }, + { + "epoch": 34.99455040871935, + "grad_norm": 9.176545143127441, + "learning_rate": 1.5094720453324952e-05, + "loss": 0.3825, + "step": 12843 + }, + { + "epoch": 34.997275204359674, + "grad_norm": 7.517789363861084, + "learning_rate": 1.5093961058142095e-05, + "loss": 0.4518, + "step": 12844 + }, + { + "epoch": 35.0, + "grad_norm": 6.629086017608643, + "learning_rate": 1.5093201623287631e-05, + "loss": 0.3144, + "step": 12845 + }, + { + "epoch": 35.002724795640326, + "grad_norm": 5.785049915313721, + "learning_rate": 1.509244214876748e-05, + "loss": 0.4406, + "step": 12846 + }, + { + "epoch": 35.00544959128065, + "grad_norm": 5.573185443878174, + "learning_rate": 1.5091682634587547e-05, + "loss": 0.3493, + "step": 12847 + }, + { + "epoch": 35.00817438692098, + "grad_norm": 7.0667548179626465, + "learning_rate": 1.509092308075376e-05, + "loss": 0.3315, + "step": 12848 + }, + { + "epoch": 35.01089918256131, + "grad_norm": 8.357725143432617, + "learning_rate": 1.5090163487272027e-05, + "loss": 0.3625, + "step": 12849 + }, + { + "epoch": 35.013623978201636, + "grad_norm": 5.935133457183838, + "learning_rate": 1.5089403854148261e-05, + "loss": 0.2876, + "step": 12850 + }, + { + "epoch": 35.01634877384196, + "grad_norm": 7.409773826599121, + "learning_rate": 1.5088644181388386e-05, + "loss": 0.191, + "step": 12851 + }, + { + "epoch": 35.01907356948229, + "grad_norm": 6.038036823272705, + "learning_rate": 1.508788446899831e-05, + "loss": 0.4126, + "step": 12852 + }, + { + "epoch": 35.02179836512261, + "grad_norm": 5.311971187591553, + "learning_rate": 1.5087124716983956e-05, + "loss": 0.2346, + "step": 12853 + }, + { + "epoch": 35.02452316076294, + "grad_norm": 8.31474494934082, + "learning_rate": 1.5086364925351238e-05, + "loss": 0.2484, + "step": 12854 + }, + { + "epoch": 35.02724795640327, + "grad_norm": 6.290774822235107, + "learning_rate": 1.5085605094106072e-05, + "loss": 0.374, + "step": 12855 + }, + { + "epoch": 35.0299727520436, + "grad_norm": 6.906851768493652, + "learning_rate": 1.5084845223254381e-05, + "loss": 0.2697, + "step": 12856 + }, + { + "epoch": 35.032697547683924, + "grad_norm": 6.9600982666015625, + "learning_rate": 1.5084085312802075e-05, + "loss": 0.2094, + "step": 12857 + }, + { + "epoch": 35.03542234332425, + "grad_norm": 8.362553596496582, + "learning_rate": 1.5083325362755077e-05, + "loss": 0.3174, + "step": 12858 + }, + { + "epoch": 35.038147138964575, + "grad_norm": 6.994814872741699, + "learning_rate": 1.5082565373119307e-05, + "loss": 0.2646, + "step": 12859 + }, + { + "epoch": 35.0408719346049, + "grad_norm": 5.494656562805176, + "learning_rate": 1.508180534390068e-05, + "loss": 0.3244, + "step": 12860 + }, + { + "epoch": 35.043596730245234, + "grad_norm": 6.103918552398682, + "learning_rate": 1.5081045275105117e-05, + "loss": 0.3241, + "step": 12861 + }, + { + "epoch": 35.04632152588556, + "grad_norm": 5.130848407745361, + "learning_rate": 1.5080285166738535e-05, + "loss": 0.3754, + "step": 12862 + }, + { + "epoch": 35.049046321525886, + "grad_norm": 5.91086483001709, + "learning_rate": 1.5079525018806856e-05, + "loss": 0.2361, + "step": 12863 + }, + { + "epoch": 35.05177111716621, + "grad_norm": 5.534972667694092, + "learning_rate": 1.5078764831316002e-05, + "loss": 0.2357, + "step": 12864 + }, + { + "epoch": 35.05449591280654, + "grad_norm": 13.435774803161621, + "learning_rate": 1.507800460427189e-05, + "loss": 0.3418, + "step": 12865 + }, + { + "epoch": 35.05722070844686, + "grad_norm": 6.177347660064697, + "learning_rate": 1.5077244337680439e-05, + "loss": 0.2652, + "step": 12866 + }, + { + "epoch": 35.059945504087196, + "grad_norm": 5.603326320648193, + "learning_rate": 1.5076484031547578e-05, + "loss": 0.5273, + "step": 12867 + }, + { + "epoch": 35.06267029972752, + "grad_norm": 7.058253765106201, + "learning_rate": 1.5075723685879218e-05, + "loss": 0.3388, + "step": 12868 + }, + { + "epoch": 35.06539509536785, + "grad_norm": 6.102175235748291, + "learning_rate": 1.5074963300681286e-05, + "loss": 0.2981, + "step": 12869 + }, + { + "epoch": 35.06811989100817, + "grad_norm": 5.3113203048706055, + "learning_rate": 1.5074202875959704e-05, + "loss": 0.2601, + "step": 12870 + }, + { + "epoch": 35.0708446866485, + "grad_norm": 5.491559028625488, + "learning_rate": 1.5073442411720397e-05, + "loss": 0.4017, + "step": 12871 + }, + { + "epoch": 35.073569482288825, + "grad_norm": 7.598811626434326, + "learning_rate": 1.5072681907969277e-05, + "loss": 0.3106, + "step": 12872 + }, + { + "epoch": 35.07629427792916, + "grad_norm": 9.770064353942871, + "learning_rate": 1.5071921364712278e-05, + "loss": 0.2632, + "step": 12873 + }, + { + "epoch": 35.079019073569484, + "grad_norm": 9.12311840057373, + "learning_rate": 1.5071160781955316e-05, + "loss": 0.3592, + "step": 12874 + }, + { + "epoch": 35.08174386920981, + "grad_norm": 6.149101734161377, + "learning_rate": 1.5070400159704317e-05, + "loss": 0.3208, + "step": 12875 + }, + { + "epoch": 35.084468664850135, + "grad_norm": 5.999884128570557, + "learning_rate": 1.5069639497965205e-05, + "loss": 0.2534, + "step": 12876 + }, + { + "epoch": 35.08719346049046, + "grad_norm": 8.41357421875, + "learning_rate": 1.5068878796743907e-05, + "loss": 0.3031, + "step": 12877 + }, + { + "epoch": 35.08991825613079, + "grad_norm": 7.803460597991943, + "learning_rate": 1.5068118056046342e-05, + "loss": 0.2934, + "step": 12878 + }, + { + "epoch": 35.09264305177112, + "grad_norm": 13.252748489379883, + "learning_rate": 1.5067357275878438e-05, + "loss": 0.3236, + "step": 12879 + }, + { + "epoch": 35.095367847411445, + "grad_norm": 5.52808141708374, + "learning_rate": 1.5066596456246116e-05, + "loss": 0.2805, + "step": 12880 + }, + { + "epoch": 35.09809264305177, + "grad_norm": 6.531493663787842, + "learning_rate": 1.5065835597155305e-05, + "loss": 0.3039, + "step": 12881 + }, + { + "epoch": 35.1008174386921, + "grad_norm": 6.289060592651367, + "learning_rate": 1.506507469861193e-05, + "loss": 0.2648, + "step": 12882 + }, + { + "epoch": 35.10354223433242, + "grad_norm": 5.346847057342529, + "learning_rate": 1.5064313760621913e-05, + "loss": 0.1923, + "step": 12883 + }, + { + "epoch": 35.10626702997275, + "grad_norm": 6.987293243408203, + "learning_rate": 1.5063552783191186e-05, + "loss": 0.3647, + "step": 12884 + }, + { + "epoch": 35.10899182561308, + "grad_norm": 6.071861267089844, + "learning_rate": 1.5062791766325676e-05, + "loss": 0.2628, + "step": 12885 + }, + { + "epoch": 35.11171662125341, + "grad_norm": 6.821843147277832, + "learning_rate": 1.5062030710031304e-05, + "loss": 0.2214, + "step": 12886 + }, + { + "epoch": 35.11444141689373, + "grad_norm": 6.0386643409729, + "learning_rate": 1.5061269614314e-05, + "loss": 0.3656, + "step": 12887 + }, + { + "epoch": 35.11716621253406, + "grad_norm": 12.071297645568848, + "learning_rate": 1.506050847917969e-05, + "loss": 0.2701, + "step": 12888 + }, + { + "epoch": 35.119891008174385, + "grad_norm": 8.566832542419434, + "learning_rate": 1.5059747304634304e-05, + "loss": 0.4954, + "step": 12889 + }, + { + "epoch": 35.12261580381471, + "grad_norm": 6.731941223144531, + "learning_rate": 1.5058986090683767e-05, + "loss": 0.4046, + "step": 12890 + }, + { + "epoch": 35.12534059945504, + "grad_norm": 5.576921463012695, + "learning_rate": 1.5058224837334012e-05, + "loss": 0.3425, + "step": 12891 + }, + { + "epoch": 35.12806539509537, + "grad_norm": 7.817747592926025, + "learning_rate": 1.505746354459096e-05, + "loss": 0.3054, + "step": 12892 + }, + { + "epoch": 35.130790190735695, + "grad_norm": 5.836747646331787, + "learning_rate": 1.5056702212460547e-05, + "loss": 0.1724, + "step": 12893 + }, + { + "epoch": 35.13351498637602, + "grad_norm": 7.261024475097656, + "learning_rate": 1.5055940840948702e-05, + "loss": 0.2533, + "step": 12894 + }, + { + "epoch": 35.13623978201635, + "grad_norm": 6.892082691192627, + "learning_rate": 1.5055179430061354e-05, + "loss": 0.3005, + "step": 12895 + }, + { + "epoch": 35.13896457765667, + "grad_norm": 11.652900695800781, + "learning_rate": 1.5054417979804426e-05, + "loss": 0.2771, + "step": 12896 + }, + { + "epoch": 35.141689373297005, + "grad_norm": 6.214851379394531, + "learning_rate": 1.5053656490183856e-05, + "loss": 0.2691, + "step": 12897 + }, + { + "epoch": 35.14441416893733, + "grad_norm": 9.134818077087402, + "learning_rate": 1.5052894961205573e-05, + "loss": 0.3449, + "step": 12898 + }, + { + "epoch": 35.14713896457766, + "grad_norm": 6.546474933624268, + "learning_rate": 1.5052133392875505e-05, + "loss": 0.1782, + "step": 12899 + }, + { + "epoch": 35.14986376021798, + "grad_norm": 6.9917988777160645, + "learning_rate": 1.5051371785199585e-05, + "loss": 0.3135, + "step": 12900 + }, + { + "epoch": 35.15258855585831, + "grad_norm": 6.644484043121338, + "learning_rate": 1.5050610138183746e-05, + "loss": 0.3666, + "step": 12901 + }, + { + "epoch": 35.155313351498634, + "grad_norm": 5.416781902313232, + "learning_rate": 1.5049848451833912e-05, + "loss": 0.2019, + "step": 12902 + }, + { + "epoch": 35.15803814713897, + "grad_norm": 8.030413627624512, + "learning_rate": 1.5049086726156028e-05, + "loss": 0.2774, + "step": 12903 + }, + { + "epoch": 35.16076294277929, + "grad_norm": 6.396627902984619, + "learning_rate": 1.5048324961156016e-05, + "loss": 0.267, + "step": 12904 + }, + { + "epoch": 35.16348773841962, + "grad_norm": 5.942184925079346, + "learning_rate": 1.5047563156839812e-05, + "loss": 0.2117, + "step": 12905 + }, + { + "epoch": 35.166212534059945, + "grad_norm": 6.416858196258545, + "learning_rate": 1.5046801313213349e-05, + "loss": 0.3, + "step": 12906 + }, + { + "epoch": 35.16893732970027, + "grad_norm": 6.120514869689941, + "learning_rate": 1.5046039430282559e-05, + "loss": 0.4378, + "step": 12907 + }, + { + "epoch": 35.171662125340596, + "grad_norm": 8.632964134216309, + "learning_rate": 1.5045277508053376e-05, + "loss": 0.236, + "step": 12908 + }, + { + "epoch": 35.17438692098093, + "grad_norm": 7.408965110778809, + "learning_rate": 1.5044515546531733e-05, + "loss": 0.3813, + "step": 12909 + }, + { + "epoch": 35.177111716621255, + "grad_norm": 7.03118371963501, + "learning_rate": 1.5043753545723568e-05, + "loss": 0.2874, + "step": 12910 + }, + { + "epoch": 35.17983651226158, + "grad_norm": 7.311297416687012, + "learning_rate": 1.5042991505634812e-05, + "loss": 0.3885, + "step": 12911 + }, + { + "epoch": 35.182561307901906, + "grad_norm": 6.356116771697998, + "learning_rate": 1.50422294262714e-05, + "loss": 0.2529, + "step": 12912 + }, + { + "epoch": 35.18528610354223, + "grad_norm": 7.108633041381836, + "learning_rate": 1.5041467307639268e-05, + "loss": 0.2782, + "step": 12913 + }, + { + "epoch": 35.18801089918256, + "grad_norm": 47.94351577758789, + "learning_rate": 1.504070514974435e-05, + "loss": 0.3183, + "step": 12914 + }, + { + "epoch": 35.19073569482289, + "grad_norm": 5.8043365478515625, + "learning_rate": 1.5039942952592585e-05, + "loss": 0.2344, + "step": 12915 + }, + { + "epoch": 35.19346049046322, + "grad_norm": 9.831428527832031, + "learning_rate": 1.5039180716189903e-05, + "loss": 0.2695, + "step": 12916 + }, + { + "epoch": 35.19618528610354, + "grad_norm": 6.711259365081787, + "learning_rate": 1.5038418440542247e-05, + "loss": 0.2715, + "step": 12917 + }, + { + "epoch": 35.19891008174387, + "grad_norm": 7.609066009521484, + "learning_rate": 1.5037656125655543e-05, + "loss": 0.468, + "step": 12918 + }, + { + "epoch": 35.201634877384194, + "grad_norm": 6.482602119445801, + "learning_rate": 1.5036893771535743e-05, + "loss": 0.4118, + "step": 12919 + }, + { + "epoch": 35.20435967302452, + "grad_norm": 8.60822868347168, + "learning_rate": 1.5036131378188774e-05, + "loss": 0.4206, + "step": 12920 + }, + { + "epoch": 35.20708446866485, + "grad_norm": 7.4198689460754395, + "learning_rate": 1.5035368945620578e-05, + "loss": 0.332, + "step": 12921 + }, + { + "epoch": 35.20980926430518, + "grad_norm": 7.01581335067749, + "learning_rate": 1.503460647383709e-05, + "loss": 0.3773, + "step": 12922 + }, + { + "epoch": 35.212534059945504, + "grad_norm": 7.587332725524902, + "learning_rate": 1.5033843962844246e-05, + "loss": 0.3295, + "step": 12923 + }, + { + "epoch": 35.21525885558583, + "grad_norm": 10.930032730102539, + "learning_rate": 1.503308141264799e-05, + "loss": 0.6685, + "step": 12924 + }, + { + "epoch": 35.217983651226156, + "grad_norm": 6.387872695922852, + "learning_rate": 1.5032318823254257e-05, + "loss": 0.3438, + "step": 12925 + }, + { + "epoch": 35.22070844686648, + "grad_norm": 11.000805854797363, + "learning_rate": 1.5031556194668988e-05, + "loss": 0.3216, + "step": 12926 + }, + { + "epoch": 35.223433242506815, + "grad_norm": 12.715154647827148, + "learning_rate": 1.5030793526898118e-05, + "loss": 0.2976, + "step": 12927 + }, + { + "epoch": 35.22615803814714, + "grad_norm": 6.091267108917236, + "learning_rate": 1.5030030819947592e-05, + "loss": 0.3266, + "step": 12928 + }, + { + "epoch": 35.228882833787466, + "grad_norm": 7.640657901763916, + "learning_rate": 1.5029268073823349e-05, + "loss": 0.4821, + "step": 12929 + }, + { + "epoch": 35.23160762942779, + "grad_norm": 25.278005599975586, + "learning_rate": 1.5028505288531325e-05, + "loss": 0.2789, + "step": 12930 + }, + { + "epoch": 35.23433242506812, + "grad_norm": 9.08450984954834, + "learning_rate": 1.5027742464077468e-05, + "loss": 0.3575, + "step": 12931 + }, + { + "epoch": 35.237057220708444, + "grad_norm": 18.064441680908203, + "learning_rate": 1.502697960046771e-05, + "loss": 0.5448, + "step": 12932 + }, + { + "epoch": 35.23978201634878, + "grad_norm": 9.034799575805664, + "learning_rate": 1.5026216697708002e-05, + "loss": 0.425, + "step": 12933 + }, + { + "epoch": 35.2425068119891, + "grad_norm": 9.033137321472168, + "learning_rate": 1.5025453755804275e-05, + "loss": 0.4044, + "step": 12934 + }, + { + "epoch": 35.24523160762943, + "grad_norm": 6.852743625640869, + "learning_rate": 1.5024690774762478e-05, + "loss": 0.2435, + "step": 12935 + }, + { + "epoch": 35.247956403269754, + "grad_norm": 6.676074981689453, + "learning_rate": 1.5023927754588551e-05, + "loss": 0.2675, + "step": 12936 + }, + { + "epoch": 35.25068119891008, + "grad_norm": 5.360869884490967, + "learning_rate": 1.5023164695288435e-05, + "loss": 0.4157, + "step": 12937 + }, + { + "epoch": 35.253405994550405, + "grad_norm": 7.680437088012695, + "learning_rate": 1.502240159686808e-05, + "loss": 0.3692, + "step": 12938 + }, + { + "epoch": 35.25613079019074, + "grad_norm": 8.144967079162598, + "learning_rate": 1.5021638459333417e-05, + "loss": 0.3655, + "step": 12939 + }, + { + "epoch": 35.258855585831064, + "grad_norm": 7.062442779541016, + "learning_rate": 1.5020875282690392e-05, + "loss": 0.2522, + "step": 12940 + }, + { + "epoch": 35.26158038147139, + "grad_norm": 7.588070869445801, + "learning_rate": 1.502011206694496e-05, + "loss": 0.3133, + "step": 12941 + }, + { + "epoch": 35.264305177111716, + "grad_norm": 5.228339195251465, + "learning_rate": 1.5019348812103052e-05, + "loss": 0.276, + "step": 12942 + }, + { + "epoch": 35.26702997275204, + "grad_norm": 7.7266411781311035, + "learning_rate": 1.501858551817062e-05, + "loss": 0.2988, + "step": 12943 + }, + { + "epoch": 35.26975476839237, + "grad_norm": 9.450374603271484, + "learning_rate": 1.5017822185153602e-05, + "loss": 0.3086, + "step": 12944 + }, + { + "epoch": 35.2724795640327, + "grad_norm": 8.649518966674805, + "learning_rate": 1.5017058813057948e-05, + "loss": 0.4817, + "step": 12945 + }, + { + "epoch": 35.275204359673026, + "grad_norm": 7.016547679901123, + "learning_rate": 1.5016295401889602e-05, + "loss": 0.5093, + "step": 12946 + }, + { + "epoch": 35.27792915531335, + "grad_norm": 15.65822982788086, + "learning_rate": 1.501553195165451e-05, + "loss": 0.2648, + "step": 12947 + }, + { + "epoch": 35.28065395095368, + "grad_norm": 7.363132953643799, + "learning_rate": 1.5014768462358613e-05, + "loss": 0.3209, + "step": 12948 + }, + { + "epoch": 35.283378746594, + "grad_norm": 8.958174705505371, + "learning_rate": 1.5014004934007864e-05, + "loss": 0.3528, + "step": 12949 + }, + { + "epoch": 35.28610354223433, + "grad_norm": 6.925446033477783, + "learning_rate": 1.5013241366608202e-05, + "loss": 0.2886, + "step": 12950 + }, + { + "epoch": 35.28882833787466, + "grad_norm": 6.035683631896973, + "learning_rate": 1.5012477760165581e-05, + "loss": 0.2489, + "step": 12951 + }, + { + "epoch": 35.29155313351499, + "grad_norm": 7.717945575714111, + "learning_rate": 1.5011714114685942e-05, + "loss": 0.5134, + "step": 12952 + }, + { + "epoch": 35.294277929155314, + "grad_norm": 6.433282375335693, + "learning_rate": 1.5010950430175237e-05, + "loss": 0.2674, + "step": 12953 + }, + { + "epoch": 35.29700272479564, + "grad_norm": 7.275332450866699, + "learning_rate": 1.5010186706639412e-05, + "loss": 0.3405, + "step": 12954 + }, + { + "epoch": 35.299727520435965, + "grad_norm": 6.948375225067139, + "learning_rate": 1.5009422944084411e-05, + "loss": 0.3185, + "step": 12955 + }, + { + "epoch": 35.30245231607629, + "grad_norm": 9.078147888183594, + "learning_rate": 1.500865914251619e-05, + "loss": 0.4474, + "step": 12956 + }, + { + "epoch": 35.305177111716624, + "grad_norm": 7.218676567077637, + "learning_rate": 1.500789530194069e-05, + "loss": 0.3599, + "step": 12957 + }, + { + "epoch": 35.30790190735695, + "grad_norm": 8.05556869506836, + "learning_rate": 1.5007131422363864e-05, + "loss": 0.4174, + "step": 12958 + }, + { + "epoch": 35.310626702997276, + "grad_norm": 8.176007270812988, + "learning_rate": 1.5006367503791657e-05, + "loss": 0.3093, + "step": 12959 + }, + { + "epoch": 35.3133514986376, + "grad_norm": 8.308642387390137, + "learning_rate": 1.5005603546230024e-05, + "loss": 0.2853, + "step": 12960 + }, + { + "epoch": 35.31607629427793, + "grad_norm": 7.603718280792236, + "learning_rate": 1.5004839549684907e-05, + "loss": 0.2453, + "step": 12961 + }, + { + "epoch": 35.31880108991825, + "grad_norm": 8.311637878417969, + "learning_rate": 1.5004075514162264e-05, + "loss": 0.3121, + "step": 12962 + }, + { + "epoch": 35.321525885558586, + "grad_norm": 6.768898963928223, + "learning_rate": 1.5003311439668041e-05, + "loss": 0.3403, + "step": 12963 + }, + { + "epoch": 35.32425068119891, + "grad_norm": 9.002680778503418, + "learning_rate": 1.5002547326208193e-05, + "loss": 0.3454, + "step": 12964 + }, + { + "epoch": 35.32697547683924, + "grad_norm": 6.46567964553833, + "learning_rate": 1.5001783173788661e-05, + "loss": 0.2999, + "step": 12965 + }, + { + "epoch": 35.32970027247956, + "grad_norm": 8.28508472442627, + "learning_rate": 1.5001018982415407e-05, + "loss": 0.2375, + "step": 12966 + }, + { + "epoch": 35.33242506811989, + "grad_norm": 7.745180130004883, + "learning_rate": 1.5000254752094376e-05, + "loss": 0.3192, + "step": 12967 + }, + { + "epoch": 35.335149863760215, + "grad_norm": 6.4640913009643555, + "learning_rate": 1.4999490482831526e-05, + "loss": 0.3266, + "step": 12968 + }, + { + "epoch": 35.33787465940055, + "grad_norm": 6.967803001403809, + "learning_rate": 1.49987261746328e-05, + "loss": 0.2811, + "step": 12969 + }, + { + "epoch": 35.34059945504087, + "grad_norm": 6.355371952056885, + "learning_rate": 1.4997961827504156e-05, + "loss": 0.5119, + "step": 12970 + }, + { + "epoch": 35.3433242506812, + "grad_norm": 6.229894638061523, + "learning_rate": 1.499719744145155e-05, + "loss": 0.48, + "step": 12971 + }, + { + "epoch": 35.346049046321525, + "grad_norm": 6.700027942657471, + "learning_rate": 1.499643301648093e-05, + "loss": 0.3835, + "step": 12972 + }, + { + "epoch": 35.34877384196185, + "grad_norm": 6.299387454986572, + "learning_rate": 1.4995668552598249e-05, + "loss": 0.3477, + "step": 12973 + }, + { + "epoch": 35.35149863760218, + "grad_norm": 7.223231315612793, + "learning_rate": 1.4994904049809463e-05, + "loss": 0.3934, + "step": 12974 + }, + { + "epoch": 35.35422343324251, + "grad_norm": 6.085124969482422, + "learning_rate": 1.4994139508120524e-05, + "loss": 0.3353, + "step": 12975 + }, + { + "epoch": 35.356948228882835, + "grad_norm": 9.593476295471191, + "learning_rate": 1.499337492753739e-05, + "loss": 0.4173, + "step": 12976 + }, + { + "epoch": 35.35967302452316, + "grad_norm": 7.308346748352051, + "learning_rate": 1.4992610308066008e-05, + "loss": 0.3616, + "step": 12977 + }, + { + "epoch": 35.36239782016349, + "grad_norm": 8.746541976928711, + "learning_rate": 1.499184564971234e-05, + "loss": 0.3167, + "step": 12978 + }, + { + "epoch": 35.36512261580381, + "grad_norm": 8.048002243041992, + "learning_rate": 1.4991080952482337e-05, + "loss": 0.2381, + "step": 12979 + }, + { + "epoch": 35.36784741144414, + "grad_norm": 7.211552619934082, + "learning_rate": 1.4990316216381961e-05, + "loss": 0.2842, + "step": 12980 + }, + { + "epoch": 35.37057220708447, + "grad_norm": 6.82273530960083, + "learning_rate": 1.4989551441417159e-05, + "loss": 0.4873, + "step": 12981 + }, + { + "epoch": 35.3732970027248, + "grad_norm": 7.440096378326416, + "learning_rate": 1.4988786627593891e-05, + "loss": 0.428, + "step": 12982 + }, + { + "epoch": 35.37602179836512, + "grad_norm": 6.173402309417725, + "learning_rate": 1.4988021774918116e-05, + "loss": 0.3199, + "step": 12983 + }, + { + "epoch": 35.37874659400545, + "grad_norm": 7.369758605957031, + "learning_rate": 1.4987256883395786e-05, + "loss": 0.2651, + "step": 12984 + }, + { + "epoch": 35.381471389645775, + "grad_norm": 6.719857692718506, + "learning_rate": 1.498649195303286e-05, + "loss": 0.4166, + "step": 12985 + }, + { + "epoch": 35.3841961852861, + "grad_norm": 7.939483642578125, + "learning_rate": 1.4985726983835296e-05, + "loss": 0.3062, + "step": 12986 + }, + { + "epoch": 35.38692098092643, + "grad_norm": 8.635056495666504, + "learning_rate": 1.498496197580905e-05, + "loss": 0.3906, + "step": 12987 + }, + { + "epoch": 35.38964577656676, + "grad_norm": 5.695560455322266, + "learning_rate": 1.498419692896008e-05, + "loss": 0.2885, + "step": 12988 + }, + { + "epoch": 35.392370572207085, + "grad_norm": 12.678315162658691, + "learning_rate": 1.4983431843294345e-05, + "loss": 0.2282, + "step": 12989 + }, + { + "epoch": 35.39509536784741, + "grad_norm": 5.157857894897461, + "learning_rate": 1.4982666718817804e-05, + "loss": 0.2074, + "step": 12990 + }, + { + "epoch": 35.39782016348774, + "grad_norm": 7.161243438720703, + "learning_rate": 1.4981901555536414e-05, + "loss": 0.4799, + "step": 12991 + }, + { + "epoch": 35.40054495912806, + "grad_norm": 6.926211833953857, + "learning_rate": 1.4981136353456135e-05, + "loss": 0.3473, + "step": 12992 + }, + { + "epoch": 35.403269754768395, + "grad_norm": 5.929111003875732, + "learning_rate": 1.4980371112582927e-05, + "loss": 0.2735, + "step": 12993 + }, + { + "epoch": 35.40599455040872, + "grad_norm": 7.072702884674072, + "learning_rate": 1.497960583292275e-05, + "loss": 0.3306, + "step": 12994 + }, + { + "epoch": 35.40871934604905, + "grad_norm": 9.228020668029785, + "learning_rate": 1.497884051448156e-05, + "loss": 0.3293, + "step": 12995 + }, + { + "epoch": 35.41144414168937, + "grad_norm": 7.056519031524658, + "learning_rate": 1.4978075157265324e-05, + "loss": 0.3887, + "step": 12996 + }, + { + "epoch": 35.4141689373297, + "grad_norm": 5.909057140350342, + "learning_rate": 1.4977309761279997e-05, + "loss": 0.2881, + "step": 12997 + }, + { + "epoch": 35.416893732970024, + "grad_norm": 8.001152038574219, + "learning_rate": 1.4976544326531542e-05, + "loss": 0.3256, + "step": 12998 + }, + { + "epoch": 35.41961852861036, + "grad_norm": 7.966976642608643, + "learning_rate": 1.497577885302592e-05, + "loss": 0.3325, + "step": 12999 + }, + { + "epoch": 35.42234332425068, + "grad_norm": 7.403523921966553, + "learning_rate": 1.4975013340769094e-05, + "loss": 0.2838, + "step": 13000 + }, + { + "epoch": 35.42506811989101, + "grad_norm": 8.983705520629883, + "learning_rate": 1.497424778976702e-05, + "loss": 0.2521, + "step": 13001 + }, + { + "epoch": 35.427792915531334, + "grad_norm": 16.565153121948242, + "learning_rate": 1.4973482200025669e-05, + "loss": 0.395, + "step": 13002 + }, + { + "epoch": 35.43051771117166, + "grad_norm": 8.130942344665527, + "learning_rate": 1.4972716571550996e-05, + "loss": 0.3645, + "step": 13003 + }, + { + "epoch": 35.433242506811986, + "grad_norm": 6.450094223022461, + "learning_rate": 1.4971950904348966e-05, + "loss": 0.2584, + "step": 13004 + }, + { + "epoch": 35.43596730245232, + "grad_norm": 14.972867012023926, + "learning_rate": 1.4971185198425544e-05, + "loss": 0.3554, + "step": 13005 + }, + { + "epoch": 35.438692098092645, + "grad_norm": 8.811211585998535, + "learning_rate": 1.497041945378669e-05, + "loss": 0.4207, + "step": 13006 + }, + { + "epoch": 35.44141689373297, + "grad_norm": 10.867773056030273, + "learning_rate": 1.4969653670438372e-05, + "loss": 0.2978, + "step": 13007 + }, + { + "epoch": 35.444141689373296, + "grad_norm": 7.401322841644287, + "learning_rate": 1.496888784838655e-05, + "loss": 0.4389, + "step": 13008 + }, + { + "epoch": 35.44686648501362, + "grad_norm": 9.335734367370605, + "learning_rate": 1.4968121987637188e-05, + "loss": 0.4746, + "step": 13009 + }, + { + "epoch": 35.44959128065395, + "grad_norm": 12.53529167175293, + "learning_rate": 1.4967356088196252e-05, + "loss": 0.3506, + "step": 13010 + }, + { + "epoch": 35.45231607629428, + "grad_norm": 8.071320533752441, + "learning_rate": 1.496659015006971e-05, + "loss": 0.2522, + "step": 13011 + }, + { + "epoch": 35.45504087193461, + "grad_norm": 7.37003755569458, + "learning_rate": 1.4965824173263519e-05, + "loss": 0.2563, + "step": 13012 + }, + { + "epoch": 35.45776566757493, + "grad_norm": 6.280857563018799, + "learning_rate": 1.4965058157783651e-05, + "loss": 0.2775, + "step": 13013 + }, + { + "epoch": 35.46049046321526, + "grad_norm": 7.227498531341553, + "learning_rate": 1.4964292103636072e-05, + "loss": 0.3485, + "step": 13014 + }, + { + "epoch": 35.463215258855584, + "grad_norm": 7.105706691741943, + "learning_rate": 1.496352601082674e-05, + "loss": 0.3675, + "step": 13015 + }, + { + "epoch": 35.46594005449591, + "grad_norm": 7.031396865844727, + "learning_rate": 1.4962759879361635e-05, + "loss": 0.2964, + "step": 13016 + }, + { + "epoch": 35.46866485013624, + "grad_norm": 7.706293106079102, + "learning_rate": 1.4961993709246709e-05, + "loss": 0.4787, + "step": 13017 + }, + { + "epoch": 35.47138964577657, + "grad_norm": 6.265936374664307, + "learning_rate": 1.496122750048794e-05, + "loss": 0.2879, + "step": 13018 + }, + { + "epoch": 35.474114441416894, + "grad_norm": 9.70106315612793, + "learning_rate": 1.496046125309129e-05, + "loss": 0.3036, + "step": 13019 + }, + { + "epoch": 35.47683923705722, + "grad_norm": 9.175358772277832, + "learning_rate": 1.4959694967062727e-05, + "loss": 0.4707, + "step": 13020 + }, + { + "epoch": 35.479564032697546, + "grad_norm": 9.831436157226562, + "learning_rate": 1.4958928642408219e-05, + "loss": 0.3326, + "step": 13021 + }, + { + "epoch": 35.48228882833787, + "grad_norm": 18.738372802734375, + "learning_rate": 1.4958162279133734e-05, + "loss": 0.3783, + "step": 13022 + }, + { + "epoch": 35.485013623978205, + "grad_norm": 7.148810863494873, + "learning_rate": 1.4957395877245242e-05, + "loss": 0.4752, + "step": 13023 + }, + { + "epoch": 35.48773841961853, + "grad_norm": 8.935877799987793, + "learning_rate": 1.4956629436748712e-05, + "loss": 0.2694, + "step": 13024 + }, + { + "epoch": 35.490463215258856, + "grad_norm": 7.80535888671875, + "learning_rate": 1.4955862957650108e-05, + "loss": 0.4427, + "step": 13025 + }, + { + "epoch": 35.49318801089918, + "grad_norm": 8.087099075317383, + "learning_rate": 1.4955096439955404e-05, + "loss": 0.37, + "step": 13026 + }, + { + "epoch": 35.49591280653951, + "grad_norm": 6.996232032775879, + "learning_rate": 1.4954329883670569e-05, + "loss": 0.4202, + "step": 13027 + }, + { + "epoch": 35.49863760217983, + "grad_norm": 5.583734512329102, + "learning_rate": 1.4953563288801571e-05, + "loss": 0.3756, + "step": 13028 + }, + { + "epoch": 35.50136239782017, + "grad_norm": 12.677495002746582, + "learning_rate": 1.4952796655354383e-05, + "loss": 0.3509, + "step": 13029 + }, + { + "epoch": 35.50408719346049, + "grad_norm": 7.13171911239624, + "learning_rate": 1.4952029983334973e-05, + "loss": 0.2833, + "step": 13030 + }, + { + "epoch": 35.50681198910082, + "grad_norm": 9.175862312316895, + "learning_rate": 1.4951263272749313e-05, + "loss": 0.4503, + "step": 13031 + }, + { + "epoch": 35.509536784741144, + "grad_norm": 40.1395149230957, + "learning_rate": 1.4950496523603373e-05, + "loss": 0.2751, + "step": 13032 + }, + { + "epoch": 35.51226158038147, + "grad_norm": 8.28769588470459, + "learning_rate": 1.4949729735903127e-05, + "loss": 0.3824, + "step": 13033 + }, + { + "epoch": 35.514986376021795, + "grad_norm": 8.487380027770996, + "learning_rate": 1.4948962909654545e-05, + "loss": 0.3179, + "step": 13034 + }, + { + "epoch": 35.51771117166213, + "grad_norm": 8.022058486938477, + "learning_rate": 1.4948196044863599e-05, + "loss": 0.3322, + "step": 13035 + }, + { + "epoch": 35.520435967302454, + "grad_norm": 7.599024295806885, + "learning_rate": 1.4947429141536262e-05, + "loss": 0.5132, + "step": 13036 + }, + { + "epoch": 35.52316076294278, + "grad_norm": 6.896925926208496, + "learning_rate": 1.4946662199678503e-05, + "loss": 0.4443, + "step": 13037 + }, + { + "epoch": 35.525885558583106, + "grad_norm": 7.097535133361816, + "learning_rate": 1.49458952192963e-05, + "loss": 0.3708, + "step": 13038 + }, + { + "epoch": 35.52861035422343, + "grad_norm": 7.393113613128662, + "learning_rate": 1.4945128200395627e-05, + "loss": 0.4984, + "step": 13039 + }, + { + "epoch": 35.53133514986376, + "grad_norm": 16.788925170898438, + "learning_rate": 1.494436114298245e-05, + "loss": 0.339, + "step": 13040 + }, + { + "epoch": 35.53405994550409, + "grad_norm": 6.135458469390869, + "learning_rate": 1.4943594047062752e-05, + "loss": 0.3078, + "step": 13041 + }, + { + "epoch": 35.536784741144416, + "grad_norm": 22.487558364868164, + "learning_rate": 1.4942826912642501e-05, + "loss": 0.3701, + "step": 13042 + }, + { + "epoch": 35.53950953678474, + "grad_norm": 5.258029937744141, + "learning_rate": 1.4942059739727674e-05, + "loss": 0.2841, + "step": 13043 + }, + { + "epoch": 35.54223433242507, + "grad_norm": 6.1360039710998535, + "learning_rate": 1.4941292528324243e-05, + "loss": 0.4158, + "step": 13044 + }, + { + "epoch": 35.54495912806539, + "grad_norm": 17.92101287841797, + "learning_rate": 1.4940525278438185e-05, + "loss": 0.2211, + "step": 13045 + }, + { + "epoch": 35.54768392370572, + "grad_norm": 5.610847473144531, + "learning_rate": 1.4939757990075477e-05, + "loss": 0.3317, + "step": 13046 + }, + { + "epoch": 35.55040871934605, + "grad_norm": 7.047835826873779, + "learning_rate": 1.4938990663242088e-05, + "loss": 0.3626, + "step": 13047 + }, + { + "epoch": 35.55313351498638, + "grad_norm": 8.515892028808594, + "learning_rate": 1.4938223297944002e-05, + "loss": 0.4571, + "step": 13048 + }, + { + "epoch": 35.555858310626704, + "grad_norm": 8.290979385375977, + "learning_rate": 1.4937455894187194e-05, + "loss": 0.282, + "step": 13049 + }, + { + "epoch": 35.55858310626703, + "grad_norm": 8.804868698120117, + "learning_rate": 1.4936688451977634e-05, + "loss": 0.2292, + "step": 13050 + }, + { + "epoch": 35.561307901907355, + "grad_norm": 9.756802558898926, + "learning_rate": 1.4935920971321307e-05, + "loss": 0.4769, + "step": 13051 + }, + { + "epoch": 35.56403269754768, + "grad_norm": 9.684371948242188, + "learning_rate": 1.4935153452224182e-05, + "loss": 0.2839, + "step": 13052 + }, + { + "epoch": 35.566757493188014, + "grad_norm": 7.277624130249023, + "learning_rate": 1.4934385894692247e-05, + "loss": 0.3809, + "step": 13053 + }, + { + "epoch": 35.56948228882834, + "grad_norm": 7.828587055206299, + "learning_rate": 1.493361829873147e-05, + "loss": 0.3798, + "step": 13054 + }, + { + "epoch": 35.572207084468666, + "grad_norm": 6.445404052734375, + "learning_rate": 1.493285066434783e-05, + "loss": 0.4615, + "step": 13055 + }, + { + "epoch": 35.57493188010899, + "grad_norm": 8.173526763916016, + "learning_rate": 1.493208299154731e-05, + "loss": 0.3491, + "step": 13056 + }, + { + "epoch": 35.57765667574932, + "grad_norm": 13.190991401672363, + "learning_rate": 1.4931315280335888e-05, + "loss": 0.3542, + "step": 13057 + }, + { + "epoch": 35.58038147138964, + "grad_norm": 8.441964149475098, + "learning_rate": 1.4930547530719539e-05, + "loss": 0.2137, + "step": 13058 + }, + { + "epoch": 35.583106267029976, + "grad_norm": 15.430624008178711, + "learning_rate": 1.4929779742704246e-05, + "loss": 0.4155, + "step": 13059 + }, + { + "epoch": 35.5858310626703, + "grad_norm": 9.153474807739258, + "learning_rate": 1.4929011916295986e-05, + "loss": 0.2364, + "step": 13060 + }, + { + "epoch": 35.58855585831063, + "grad_norm": 8.394576072692871, + "learning_rate": 1.4928244051500742e-05, + "loss": 0.277, + "step": 13061 + }, + { + "epoch": 35.59128065395095, + "grad_norm": 6.277867317199707, + "learning_rate": 1.4927476148324488e-05, + "loss": 0.3002, + "step": 13062 + }, + { + "epoch": 35.59400544959128, + "grad_norm": 6.191000938415527, + "learning_rate": 1.4926708206773213e-05, + "loss": 0.4512, + "step": 13063 + }, + { + "epoch": 35.596730245231605, + "grad_norm": 6.844345569610596, + "learning_rate": 1.4925940226852889e-05, + "loss": 0.4242, + "step": 13064 + }, + { + "epoch": 35.59945504087194, + "grad_norm": 6.637400150299072, + "learning_rate": 1.4925172208569502e-05, + "loss": 0.3007, + "step": 13065 + }, + { + "epoch": 35.60217983651226, + "grad_norm": 14.81370735168457, + "learning_rate": 1.4924404151929033e-05, + "loss": 0.4465, + "step": 13066 + }, + { + "epoch": 35.60490463215259, + "grad_norm": 9.97683048248291, + "learning_rate": 1.4923636056937466e-05, + "loss": 0.2724, + "step": 13067 + }, + { + "epoch": 35.607629427792915, + "grad_norm": 28.20574378967285, + "learning_rate": 1.4922867923600774e-05, + "loss": 0.3198, + "step": 13068 + }, + { + "epoch": 35.61035422343324, + "grad_norm": 8.994606971740723, + "learning_rate": 1.492209975192495e-05, + "loss": 0.3557, + "step": 13069 + }, + { + "epoch": 35.61307901907357, + "grad_norm": 7.081641674041748, + "learning_rate": 1.492133154191597e-05, + "loss": 0.3023, + "step": 13070 + }, + { + "epoch": 35.6158038147139, + "grad_norm": 7.818090915679932, + "learning_rate": 1.4920563293579817e-05, + "loss": 0.4968, + "step": 13071 + }, + { + "epoch": 35.618528610354225, + "grad_norm": 6.1535162925720215, + "learning_rate": 1.4919795006922475e-05, + "loss": 0.2741, + "step": 13072 + }, + { + "epoch": 35.62125340599455, + "grad_norm": 7.111542701721191, + "learning_rate": 1.491902668194993e-05, + "loss": 0.3892, + "step": 13073 + }, + { + "epoch": 35.62397820163488, + "grad_norm": 12.075234413146973, + "learning_rate": 1.491825831866816e-05, + "loss": 0.2781, + "step": 13074 + }, + { + "epoch": 35.6267029972752, + "grad_norm": 7.627728462219238, + "learning_rate": 1.4917489917083157e-05, + "loss": 0.3509, + "step": 13075 + }, + { + "epoch": 35.62942779291553, + "grad_norm": 6.458619594573975, + "learning_rate": 1.49167214772009e-05, + "loss": 0.3506, + "step": 13076 + }, + { + "epoch": 35.63215258855586, + "grad_norm": 7.432330131530762, + "learning_rate": 1.4915952999027371e-05, + "loss": 0.359, + "step": 13077 + }, + { + "epoch": 35.63487738419619, + "grad_norm": 6.9332146644592285, + "learning_rate": 1.4915184482568562e-05, + "loss": 0.3243, + "step": 13078 + }, + { + "epoch": 35.63760217983651, + "grad_norm": 6.224339008331299, + "learning_rate": 1.4914415927830455e-05, + "loss": 0.3245, + "step": 13079 + }, + { + "epoch": 35.64032697547684, + "grad_norm": 7.042000770568848, + "learning_rate": 1.491364733481903e-05, + "loss": 0.4737, + "step": 13080 + }, + { + "epoch": 35.643051771117165, + "grad_norm": 6.224331855773926, + "learning_rate": 1.4912878703540281e-05, + "loss": 0.2442, + "step": 13081 + }, + { + "epoch": 35.64577656675749, + "grad_norm": 7.393121719360352, + "learning_rate": 1.4912110034000189e-05, + "loss": 0.403, + "step": 13082 + }, + { + "epoch": 35.64850136239782, + "grad_norm": 11.491524696350098, + "learning_rate": 1.4911341326204744e-05, + "loss": 0.2932, + "step": 13083 + }, + { + "epoch": 35.65122615803815, + "grad_norm": 5.53161096572876, + "learning_rate": 1.491057258015993e-05, + "loss": 0.2961, + "step": 13084 + }, + { + "epoch": 35.653950953678475, + "grad_norm": 8.468855857849121, + "learning_rate": 1.4909803795871738e-05, + "loss": 0.2301, + "step": 13085 + }, + { + "epoch": 35.6566757493188, + "grad_norm": 5.951993942260742, + "learning_rate": 1.4909034973346148e-05, + "loss": 0.3076, + "step": 13086 + }, + { + "epoch": 35.65940054495913, + "grad_norm": 7.281175136566162, + "learning_rate": 1.4908266112589154e-05, + "loss": 0.5266, + "step": 13087 + }, + { + "epoch": 35.66212534059945, + "grad_norm": 6.1608428955078125, + "learning_rate": 1.4907497213606738e-05, + "loss": 0.4055, + "step": 13088 + }, + { + "epoch": 35.664850136239785, + "grad_norm": 9.514596939086914, + "learning_rate": 1.4906728276404897e-05, + "loss": 0.3609, + "step": 13089 + }, + { + "epoch": 35.66757493188011, + "grad_norm": 8.773531913757324, + "learning_rate": 1.4905959300989607e-05, + "loss": 0.4261, + "step": 13090 + }, + { + "epoch": 35.67029972752044, + "grad_norm": 10.161262512207031, + "learning_rate": 1.4905190287366868e-05, + "loss": 0.305, + "step": 13091 + }, + { + "epoch": 35.67302452316076, + "grad_norm": 7.274245262145996, + "learning_rate": 1.4904421235542666e-05, + "loss": 0.2856, + "step": 13092 + }, + { + "epoch": 35.67574931880109, + "grad_norm": 6.7615227699279785, + "learning_rate": 1.4903652145522989e-05, + "loss": 0.3203, + "step": 13093 + }, + { + "epoch": 35.678474114441414, + "grad_norm": 5.8968095779418945, + "learning_rate": 1.4902883017313825e-05, + "loss": 0.3685, + "step": 13094 + }, + { + "epoch": 35.68119891008175, + "grad_norm": 8.771279335021973, + "learning_rate": 1.4902113850921169e-05, + "loss": 0.4639, + "step": 13095 + }, + { + "epoch": 35.68392370572207, + "grad_norm": 6.069421291351318, + "learning_rate": 1.4901344646351006e-05, + "loss": 0.2535, + "step": 13096 + }, + { + "epoch": 35.6866485013624, + "grad_norm": 6.342672348022461, + "learning_rate": 1.4900575403609328e-05, + "loss": 0.2945, + "step": 13097 + }, + { + "epoch": 35.689373297002724, + "grad_norm": 6.845711708068848, + "learning_rate": 1.4899806122702127e-05, + "loss": 0.4431, + "step": 13098 + }, + { + "epoch": 35.69209809264305, + "grad_norm": 7.4353814125061035, + "learning_rate": 1.4899036803635393e-05, + "loss": 0.4305, + "step": 13099 + }, + { + "epoch": 35.694822888283376, + "grad_norm": 7.208191871643066, + "learning_rate": 1.489826744641512e-05, + "loss": 0.2509, + "step": 13100 + }, + { + "epoch": 35.69754768392371, + "grad_norm": 7.7229156494140625, + "learning_rate": 1.4897498051047297e-05, + "loss": 0.2904, + "step": 13101 + }, + { + "epoch": 35.700272479564035, + "grad_norm": 6.398213863372803, + "learning_rate": 1.4896728617537914e-05, + "loss": 0.5042, + "step": 13102 + }, + { + "epoch": 35.70299727520436, + "grad_norm": 19.481176376342773, + "learning_rate": 1.489595914589297e-05, + "loss": 0.3272, + "step": 13103 + }, + { + "epoch": 35.705722070844686, + "grad_norm": 7.918393611907959, + "learning_rate": 1.4895189636118453e-05, + "loss": 0.3833, + "step": 13104 + }, + { + "epoch": 35.70844686648501, + "grad_norm": 6.956137657165527, + "learning_rate": 1.4894420088220356e-05, + "loss": 0.3163, + "step": 13105 + }, + { + "epoch": 35.71117166212534, + "grad_norm": 8.419601440429688, + "learning_rate": 1.4893650502204673e-05, + "loss": 0.311, + "step": 13106 + }, + { + "epoch": 35.71389645776567, + "grad_norm": 6.122564315795898, + "learning_rate": 1.4892880878077396e-05, + "loss": 0.5188, + "step": 13107 + }, + { + "epoch": 35.716621253406, + "grad_norm": 14.754682540893555, + "learning_rate": 1.4892111215844523e-05, + "loss": 0.2638, + "step": 13108 + }, + { + "epoch": 35.71934604904632, + "grad_norm": 8.965763092041016, + "learning_rate": 1.489134151551204e-05, + "loss": 0.4526, + "step": 13109 + }, + { + "epoch": 35.72207084468665, + "grad_norm": 7.389782428741455, + "learning_rate": 1.4890571777085954e-05, + "loss": 0.2732, + "step": 13110 + }, + { + "epoch": 35.724795640326974, + "grad_norm": 6.4090118408203125, + "learning_rate": 1.4889802000572247e-05, + "loss": 0.3694, + "step": 13111 + }, + { + "epoch": 35.7275204359673, + "grad_norm": 7.850404739379883, + "learning_rate": 1.4889032185976922e-05, + "loss": 0.3446, + "step": 13112 + }, + { + "epoch": 35.73024523160763, + "grad_norm": 7.053712844848633, + "learning_rate": 1.4888262333305971e-05, + "loss": 0.3712, + "step": 13113 + }, + { + "epoch": 35.73297002724796, + "grad_norm": 15.967446327209473, + "learning_rate": 1.488749244256539e-05, + "loss": 0.4603, + "step": 13114 + }, + { + "epoch": 35.735694822888284, + "grad_norm": 9.032360076904297, + "learning_rate": 1.4886722513761176e-05, + "loss": 0.3412, + "step": 13115 + }, + { + "epoch": 35.73841961852861, + "grad_norm": 6.181352138519287, + "learning_rate": 1.4885952546899323e-05, + "loss": 0.3625, + "step": 13116 + }, + { + "epoch": 35.741144414168936, + "grad_norm": 6.852163314819336, + "learning_rate": 1.4885182541985827e-05, + "loss": 0.3344, + "step": 13117 + }, + { + "epoch": 35.74386920980926, + "grad_norm": 6.599365711212158, + "learning_rate": 1.4884412499026693e-05, + "loss": 0.3532, + "step": 13118 + }, + { + "epoch": 35.746594005449595, + "grad_norm": 9.913313865661621, + "learning_rate": 1.4883642418027906e-05, + "loss": 0.3358, + "step": 13119 + }, + { + "epoch": 35.74931880108992, + "grad_norm": 7.836754322052002, + "learning_rate": 1.4882872298995472e-05, + "loss": 0.3151, + "step": 13120 + }, + { + "epoch": 35.752043596730246, + "grad_norm": 6.892861843109131, + "learning_rate": 1.4882102141935381e-05, + "loss": 0.2828, + "step": 13121 + }, + { + "epoch": 35.75476839237057, + "grad_norm": 6.486696243286133, + "learning_rate": 1.4881331946853643e-05, + "loss": 0.3953, + "step": 13122 + }, + { + "epoch": 35.7574931880109, + "grad_norm": 8.368975639343262, + "learning_rate": 1.4880561713756243e-05, + "loss": 0.3417, + "step": 13123 + }, + { + "epoch": 35.76021798365122, + "grad_norm": 6.539047718048096, + "learning_rate": 1.4879791442649188e-05, + "loss": 0.3057, + "step": 13124 + }, + { + "epoch": 35.762942779291556, + "grad_norm": 6.887070655822754, + "learning_rate": 1.4879021133538471e-05, + "loss": 0.4626, + "step": 13125 + }, + { + "epoch": 35.76566757493188, + "grad_norm": 5.815514087677002, + "learning_rate": 1.4878250786430099e-05, + "loss": 0.2421, + "step": 13126 + }, + { + "epoch": 35.76839237057221, + "grad_norm": 9.211060523986816, + "learning_rate": 1.4877480401330065e-05, + "loss": 0.4502, + "step": 13127 + }, + { + "epoch": 35.771117166212534, + "grad_norm": 11.286864280700684, + "learning_rate": 1.4876709978244372e-05, + "loss": 0.3573, + "step": 13128 + }, + { + "epoch": 35.77384196185286, + "grad_norm": 11.223306655883789, + "learning_rate": 1.4875939517179016e-05, + "loss": 0.3916, + "step": 13129 + }, + { + "epoch": 35.776566757493185, + "grad_norm": 12.014117240905762, + "learning_rate": 1.4875169018140003e-05, + "loss": 0.3492, + "step": 13130 + }, + { + "epoch": 35.77929155313352, + "grad_norm": 7.441474914550781, + "learning_rate": 1.4874398481133327e-05, + "loss": 0.4038, + "step": 13131 + }, + { + "epoch": 35.782016348773844, + "grad_norm": 12.697399139404297, + "learning_rate": 1.4873627906164997e-05, + "loss": 0.2928, + "step": 13132 + }, + { + "epoch": 35.78474114441417, + "grad_norm": 8.545955657958984, + "learning_rate": 1.4872857293241002e-05, + "loss": 0.2599, + "step": 13133 + }, + { + "epoch": 35.787465940054496, + "grad_norm": 10.86761474609375, + "learning_rate": 1.487208664236736e-05, + "loss": 0.1661, + "step": 13134 + }, + { + "epoch": 35.79019073569482, + "grad_norm": 9.067625045776367, + "learning_rate": 1.487131595355006e-05, + "loss": 0.3055, + "step": 13135 + }, + { + "epoch": 35.79291553133515, + "grad_norm": 7.21870231628418, + "learning_rate": 1.487054522679511e-05, + "loss": 0.3204, + "step": 13136 + }, + { + "epoch": 35.79564032697548, + "grad_norm": 6.984853744506836, + "learning_rate": 1.4869774462108506e-05, + "loss": 0.2603, + "step": 13137 + }, + { + "epoch": 35.798365122615806, + "grad_norm": 6.351567268371582, + "learning_rate": 1.4869003659496262e-05, + "loss": 0.2962, + "step": 13138 + }, + { + "epoch": 35.80108991825613, + "grad_norm": 8.221277236938477, + "learning_rate": 1.4868232818964368e-05, + "loss": 0.3925, + "step": 13139 + }, + { + "epoch": 35.80381471389646, + "grad_norm": 6.445461273193359, + "learning_rate": 1.4867461940518836e-05, + "loss": 0.2764, + "step": 13140 + }, + { + "epoch": 35.80653950953678, + "grad_norm": 10.9315185546875, + "learning_rate": 1.4866691024165665e-05, + "loss": 0.3392, + "step": 13141 + }, + { + "epoch": 35.80926430517711, + "grad_norm": 7.6769890785217285, + "learning_rate": 1.4865920069910865e-05, + "loss": 0.4421, + "step": 13142 + }, + { + "epoch": 35.81198910081744, + "grad_norm": 6.350608825683594, + "learning_rate": 1.4865149077760435e-05, + "loss": 0.3172, + "step": 13143 + }, + { + "epoch": 35.81471389645777, + "grad_norm": 7.1840291023254395, + "learning_rate": 1.486437804772038e-05, + "loss": 0.3192, + "step": 13144 + }, + { + "epoch": 35.817438692098094, + "grad_norm": 6.86708402633667, + "learning_rate": 1.4863606979796703e-05, + "loss": 0.3418, + "step": 13145 + }, + { + "epoch": 35.82016348773842, + "grad_norm": 7.209695339202881, + "learning_rate": 1.4862835873995416e-05, + "loss": 0.2687, + "step": 13146 + }, + { + "epoch": 35.822888283378745, + "grad_norm": 6.7395524978637695, + "learning_rate": 1.4862064730322516e-05, + "loss": 0.2544, + "step": 13147 + }, + { + "epoch": 35.82561307901907, + "grad_norm": 7.084775447845459, + "learning_rate": 1.4861293548784016e-05, + "loss": 0.2883, + "step": 13148 + }, + { + "epoch": 35.828337874659404, + "grad_norm": 9.86668872833252, + "learning_rate": 1.4860522329385914e-05, + "loss": 0.3532, + "step": 13149 + }, + { + "epoch": 35.83106267029973, + "grad_norm": 8.076080322265625, + "learning_rate": 1.485975107213422e-05, + "loss": 0.3002, + "step": 13150 + }, + { + "epoch": 35.833787465940055, + "grad_norm": 6.871728897094727, + "learning_rate": 1.4858979777034943e-05, + "loss": 0.2149, + "step": 13151 + }, + { + "epoch": 35.83651226158038, + "grad_norm": 6.7171759605407715, + "learning_rate": 1.4858208444094092e-05, + "loss": 0.3418, + "step": 13152 + }, + { + "epoch": 35.83923705722071, + "grad_norm": 7.652675151824951, + "learning_rate": 1.4857437073317665e-05, + "loss": 0.4183, + "step": 13153 + }, + { + "epoch": 35.84196185286103, + "grad_norm": 8.919107437133789, + "learning_rate": 1.4856665664711676e-05, + "loss": 0.3783, + "step": 13154 + }, + { + "epoch": 35.844686648501366, + "grad_norm": 12.379136085510254, + "learning_rate": 1.485589421828213e-05, + "loss": 0.4065, + "step": 13155 + }, + { + "epoch": 35.84741144414169, + "grad_norm": 8.966519355773926, + "learning_rate": 1.4855122734035037e-05, + "loss": 0.3304, + "step": 13156 + }, + { + "epoch": 35.85013623978202, + "grad_norm": 6.137722969055176, + "learning_rate": 1.4854351211976403e-05, + "loss": 0.3392, + "step": 13157 + }, + { + "epoch": 35.85286103542234, + "grad_norm": 7.204695701599121, + "learning_rate": 1.485357965211224e-05, + "loss": 0.4766, + "step": 13158 + }, + { + "epoch": 35.85558583106267, + "grad_norm": 5.848073482513428, + "learning_rate": 1.4852808054448553e-05, + "loss": 0.3183, + "step": 13159 + }, + { + "epoch": 35.858310626702995, + "grad_norm": 6.540821552276611, + "learning_rate": 1.4852036418991356e-05, + "loss": 0.2634, + "step": 13160 + }, + { + "epoch": 35.86103542234333, + "grad_norm": 7.086192607879639, + "learning_rate": 1.4851264745746653e-05, + "loss": 0.2425, + "step": 13161 + }, + { + "epoch": 35.86376021798365, + "grad_norm": 7.513698577880859, + "learning_rate": 1.4850493034720457e-05, + "loss": 0.2538, + "step": 13162 + }, + { + "epoch": 35.86648501362398, + "grad_norm": 9.127217292785645, + "learning_rate": 1.4849721285918777e-05, + "loss": 0.3346, + "step": 13163 + }, + { + "epoch": 35.869209809264305, + "grad_norm": 6.7912373542785645, + "learning_rate": 1.4848949499347625e-05, + "loss": 0.2762, + "step": 13164 + }, + { + "epoch": 35.87193460490463, + "grad_norm": 8.182476997375488, + "learning_rate": 1.4848177675013009e-05, + "loss": 0.2885, + "step": 13165 + }, + { + "epoch": 35.87465940054496, + "grad_norm": 7.489778518676758, + "learning_rate": 1.4847405812920943e-05, + "loss": 0.6197, + "step": 13166 + }, + { + "epoch": 35.87738419618529, + "grad_norm": 7.308894157409668, + "learning_rate": 1.4846633913077432e-05, + "loss": 0.2206, + "step": 13167 + }, + { + "epoch": 35.880108991825615, + "grad_norm": 7.15823221206665, + "learning_rate": 1.4845861975488495e-05, + "loss": 0.402, + "step": 13168 + }, + { + "epoch": 35.88283378746594, + "grad_norm": 5.423677444458008, + "learning_rate": 1.4845090000160142e-05, + "loss": 0.3098, + "step": 13169 + }, + { + "epoch": 35.88555858310627, + "grad_norm": 6.926116466522217, + "learning_rate": 1.4844317987098384e-05, + "loss": 0.2586, + "step": 13170 + }, + { + "epoch": 35.88828337874659, + "grad_norm": 6.592591762542725, + "learning_rate": 1.4843545936309233e-05, + "loss": 0.2909, + "step": 13171 + }, + { + "epoch": 35.89100817438692, + "grad_norm": 6.371806621551514, + "learning_rate": 1.4842773847798703e-05, + "loss": 0.3787, + "step": 13172 + }, + { + "epoch": 35.89373297002725, + "grad_norm": 6.53985595703125, + "learning_rate": 1.4842001721572804e-05, + "loss": 0.2646, + "step": 13173 + }, + { + "epoch": 35.89645776566758, + "grad_norm": 7.660606384277344, + "learning_rate": 1.4841229557637553e-05, + "loss": 0.3408, + "step": 13174 + }, + { + "epoch": 35.8991825613079, + "grad_norm": 9.842541694641113, + "learning_rate": 1.4840457355998963e-05, + "loss": 0.3557, + "step": 13175 + }, + { + "epoch": 35.90190735694823, + "grad_norm": 8.344846725463867, + "learning_rate": 1.4839685116663042e-05, + "loss": 0.2732, + "step": 13176 + }, + { + "epoch": 35.904632152588555, + "grad_norm": 5.782425880432129, + "learning_rate": 1.4838912839635813e-05, + "loss": 0.2045, + "step": 13177 + }, + { + "epoch": 35.90735694822888, + "grad_norm": 8.65829086303711, + "learning_rate": 1.4838140524923286e-05, + "loss": 0.3608, + "step": 13178 + }, + { + "epoch": 35.91008174386921, + "grad_norm": 7.713167667388916, + "learning_rate": 1.4837368172531477e-05, + "loss": 0.4244, + "step": 13179 + }, + { + "epoch": 35.91280653950954, + "grad_norm": 5.795069694519043, + "learning_rate": 1.4836595782466401e-05, + "loss": 0.462, + "step": 13180 + }, + { + "epoch": 35.915531335149865, + "grad_norm": 6.473036766052246, + "learning_rate": 1.4835823354734072e-05, + "loss": 0.366, + "step": 13181 + }, + { + "epoch": 35.91825613079019, + "grad_norm": 7.549315929412842, + "learning_rate": 1.4835050889340506e-05, + "loss": 0.3901, + "step": 13182 + }, + { + "epoch": 35.920980926430516, + "grad_norm": 8.299123764038086, + "learning_rate": 1.4834278386291718e-05, + "loss": 0.3112, + "step": 13183 + }, + { + "epoch": 35.92370572207084, + "grad_norm": 9.232878684997559, + "learning_rate": 1.4833505845593725e-05, + "loss": 0.4068, + "step": 13184 + }, + { + "epoch": 35.926430517711175, + "grad_norm": 7.171113967895508, + "learning_rate": 1.4832733267252545e-05, + "loss": 0.2828, + "step": 13185 + }, + { + "epoch": 35.9291553133515, + "grad_norm": 7.342721939086914, + "learning_rate": 1.4831960651274196e-05, + "loss": 0.2781, + "step": 13186 + }, + { + "epoch": 35.93188010899183, + "grad_norm": 7.980126857757568, + "learning_rate": 1.4831187997664691e-05, + "loss": 0.4585, + "step": 13187 + }, + { + "epoch": 35.93460490463215, + "grad_norm": 10.442893028259277, + "learning_rate": 1.4830415306430051e-05, + "loss": 0.5404, + "step": 13188 + }, + { + "epoch": 35.93732970027248, + "grad_norm": 7.508268356323242, + "learning_rate": 1.4829642577576289e-05, + "loss": 0.3302, + "step": 13189 + }, + { + "epoch": 35.940054495912804, + "grad_norm": 6.966134071350098, + "learning_rate": 1.482886981110943e-05, + "loss": 0.3431, + "step": 13190 + }, + { + "epoch": 35.94277929155314, + "grad_norm": 7.196403503417969, + "learning_rate": 1.4828097007035484e-05, + "loss": 0.3547, + "step": 13191 + }, + { + "epoch": 35.94550408719346, + "grad_norm": 7.072295188903809, + "learning_rate": 1.4827324165360478e-05, + "loss": 0.3083, + "step": 13192 + }, + { + "epoch": 35.94822888283379, + "grad_norm": 7.4165802001953125, + "learning_rate": 1.4826551286090425e-05, + "loss": 0.5513, + "step": 13193 + }, + { + "epoch": 35.950953678474114, + "grad_norm": 6.74781608581543, + "learning_rate": 1.4825778369231344e-05, + "loss": 0.2412, + "step": 13194 + }, + { + "epoch": 35.95367847411444, + "grad_norm": 7.24605131149292, + "learning_rate": 1.482500541478926e-05, + "loss": 0.45, + "step": 13195 + }, + { + "epoch": 35.956403269754766, + "grad_norm": 6.660770416259766, + "learning_rate": 1.4824232422770185e-05, + "loss": 0.3214, + "step": 13196 + }, + { + "epoch": 35.95912806539509, + "grad_norm": 11.896281242370605, + "learning_rate": 1.4823459393180147e-05, + "loss": 0.3054, + "step": 13197 + }, + { + "epoch": 35.961852861035425, + "grad_norm": 6.343620300292969, + "learning_rate": 1.482268632602516e-05, + "loss": 0.3669, + "step": 13198 + }, + { + "epoch": 35.96457765667575, + "grad_norm": 5.846088886260986, + "learning_rate": 1.4821913221311249e-05, + "loss": 0.315, + "step": 13199 + }, + { + "epoch": 35.967302452316076, + "grad_norm": 6.030350685119629, + "learning_rate": 1.482114007904443e-05, + "loss": 0.3785, + "step": 13200 + }, + { + "epoch": 35.9700272479564, + "grad_norm": 5.9081549644470215, + "learning_rate": 1.4820366899230729e-05, + "loss": 0.2973, + "step": 13201 + }, + { + "epoch": 35.97275204359673, + "grad_norm": 8.589384078979492, + "learning_rate": 1.4819593681876168e-05, + "loss": 0.4471, + "step": 13202 + }, + { + "epoch": 35.97547683923706, + "grad_norm": 9.04414176940918, + "learning_rate": 1.4818820426986763e-05, + "loss": 0.3004, + "step": 13203 + }, + { + "epoch": 35.97820163487739, + "grad_norm": 5.686853885650635, + "learning_rate": 1.481804713456854e-05, + "loss": 0.3357, + "step": 13204 + }, + { + "epoch": 35.98092643051771, + "grad_norm": 6.3393330574035645, + "learning_rate": 1.4817273804627526e-05, + "loss": 0.4384, + "step": 13205 + }, + { + "epoch": 35.98365122615804, + "grad_norm": 8.94064998626709, + "learning_rate": 1.4816500437169735e-05, + "loss": 0.4419, + "step": 13206 + }, + { + "epoch": 35.986376021798364, + "grad_norm": 6.159207820892334, + "learning_rate": 1.4815727032201192e-05, + "loss": 0.3942, + "step": 13207 + }, + { + "epoch": 35.98910081743869, + "grad_norm": 8.340045928955078, + "learning_rate": 1.4814953589727922e-05, + "loss": 0.2921, + "step": 13208 + }, + { + "epoch": 35.991825613079016, + "grad_norm": 9.072864532470703, + "learning_rate": 1.4814180109755954e-05, + "loss": 0.3489, + "step": 13209 + }, + { + "epoch": 35.99455040871935, + "grad_norm": 5.044756889343262, + "learning_rate": 1.4813406592291298e-05, + "loss": 0.4151, + "step": 13210 + }, + { + "epoch": 35.997275204359674, + "grad_norm": 7.601471424102783, + "learning_rate": 1.4812633037339992e-05, + "loss": 0.4428, + "step": 13211 + }, + { + "epoch": 36.0, + "grad_norm": 5.451930046081543, + "learning_rate": 1.4811859444908053e-05, + "loss": 0.5436, + "step": 13212 + }, + { + "epoch": 36.002724795640326, + "grad_norm": 8.351494789123535, + "learning_rate": 1.4811085815001507e-05, + "loss": 0.3569, + "step": 13213 + }, + { + "epoch": 36.00544959128065, + "grad_norm": 6.551837921142578, + "learning_rate": 1.481031214762638e-05, + "loss": 0.2808, + "step": 13214 + }, + { + "epoch": 36.00817438692098, + "grad_norm": 5.7202863693237305, + "learning_rate": 1.4809538442788698e-05, + "loss": 0.3351, + "step": 13215 + }, + { + "epoch": 36.01089918256131, + "grad_norm": 8.296695709228516, + "learning_rate": 1.4808764700494482e-05, + "loss": 0.3342, + "step": 13216 + }, + { + "epoch": 36.013623978201636, + "grad_norm": 5.594487190246582, + "learning_rate": 1.4807990920749766e-05, + "loss": 0.3683, + "step": 13217 + }, + { + "epoch": 36.01634877384196, + "grad_norm": 8.664252281188965, + "learning_rate": 1.4807217103560567e-05, + "loss": 0.3099, + "step": 13218 + }, + { + "epoch": 36.01907356948229, + "grad_norm": 7.050753593444824, + "learning_rate": 1.4806443248932917e-05, + "loss": 0.4896, + "step": 13219 + }, + { + "epoch": 36.02179836512261, + "grad_norm": 6.4368438720703125, + "learning_rate": 1.4805669356872843e-05, + "loss": 0.3148, + "step": 13220 + }, + { + "epoch": 36.02452316076294, + "grad_norm": 7.973339557647705, + "learning_rate": 1.4804895427386371e-05, + "loss": 0.3784, + "step": 13221 + }, + { + "epoch": 36.02724795640327, + "grad_norm": 7.606378555297852, + "learning_rate": 1.4804121460479528e-05, + "loss": 0.2506, + "step": 13222 + }, + { + "epoch": 36.0299727520436, + "grad_norm": 7.317055702209473, + "learning_rate": 1.4803347456158341e-05, + "loss": 0.4169, + "step": 13223 + }, + { + "epoch": 36.032697547683924, + "grad_norm": 6.236683368682861, + "learning_rate": 1.4802573414428837e-05, + "loss": 0.2888, + "step": 13224 + }, + { + "epoch": 36.03542234332425, + "grad_norm": 7.838255405426025, + "learning_rate": 1.4801799335297052e-05, + "loss": 0.2142, + "step": 13225 + }, + { + "epoch": 36.038147138964575, + "grad_norm": 5.358719348907471, + "learning_rate": 1.4801025218769001e-05, + "loss": 0.2151, + "step": 13226 + }, + { + "epoch": 36.0408719346049, + "grad_norm": 8.163990020751953, + "learning_rate": 1.4800251064850723e-05, + "loss": 0.4248, + "step": 13227 + }, + { + "epoch": 36.043596730245234, + "grad_norm": 9.340973854064941, + "learning_rate": 1.4799476873548244e-05, + "loss": 0.2144, + "step": 13228 + }, + { + "epoch": 36.04632152588556, + "grad_norm": 5.8173322677612305, + "learning_rate": 1.4798702644867596e-05, + "loss": 0.3967, + "step": 13229 + }, + { + "epoch": 36.049046321525886, + "grad_norm": 5.602415561676025, + "learning_rate": 1.47979283788148e-05, + "loss": 0.2408, + "step": 13230 + }, + { + "epoch": 36.05177111716621, + "grad_norm": 5.840487957000732, + "learning_rate": 1.4797154075395899e-05, + "loss": 0.2478, + "step": 13231 + }, + { + "epoch": 36.05449591280654, + "grad_norm": 6.682070732116699, + "learning_rate": 1.4796379734616912e-05, + "loss": 0.2356, + "step": 13232 + }, + { + "epoch": 36.05722070844686, + "grad_norm": 5.006386756896973, + "learning_rate": 1.4795605356483877e-05, + "loss": 0.3284, + "step": 13233 + }, + { + "epoch": 36.059945504087196, + "grad_norm": 7.425999641418457, + "learning_rate": 1.479483094100282e-05, + "loss": 0.5058, + "step": 13234 + }, + { + "epoch": 36.06267029972752, + "grad_norm": 6.135932445526123, + "learning_rate": 1.4794056488179776e-05, + "loss": 0.2256, + "step": 13235 + }, + { + "epoch": 36.06539509536785, + "grad_norm": 21.26055908203125, + "learning_rate": 1.479328199802077e-05, + "loss": 0.2314, + "step": 13236 + }, + { + "epoch": 36.06811989100817, + "grad_norm": 5.896805763244629, + "learning_rate": 1.4792507470531842e-05, + "loss": 0.3028, + "step": 13237 + }, + { + "epoch": 36.0708446866485, + "grad_norm": 8.05986213684082, + "learning_rate": 1.4791732905719019e-05, + "loss": 0.3826, + "step": 13238 + }, + { + "epoch": 36.073569482288825, + "grad_norm": 6.583298683166504, + "learning_rate": 1.4790958303588334e-05, + "loss": 0.2308, + "step": 13239 + }, + { + "epoch": 36.07629427792916, + "grad_norm": 5.833327293395996, + "learning_rate": 1.4790183664145821e-05, + "loss": 0.278, + "step": 13240 + }, + { + "epoch": 36.079019073569484, + "grad_norm": 6.4417924880981445, + "learning_rate": 1.4789408987397512e-05, + "loss": 0.4019, + "step": 13241 + }, + { + "epoch": 36.08174386920981, + "grad_norm": 8.08556842803955, + "learning_rate": 1.4788634273349439e-05, + "loss": 0.3405, + "step": 13242 + }, + { + "epoch": 36.084468664850135, + "grad_norm": 20.261943817138672, + "learning_rate": 1.4787859522007638e-05, + "loss": 0.3115, + "step": 13243 + }, + { + "epoch": 36.08719346049046, + "grad_norm": 5.491735458374023, + "learning_rate": 1.4787084733378138e-05, + "loss": 0.25, + "step": 13244 + }, + { + "epoch": 36.08991825613079, + "grad_norm": 5.954740524291992, + "learning_rate": 1.4786309907466975e-05, + "loss": 0.2966, + "step": 13245 + }, + { + "epoch": 36.09264305177112, + "grad_norm": 7.659736156463623, + "learning_rate": 1.4785535044280189e-05, + "loss": 0.2715, + "step": 13246 + }, + { + "epoch": 36.095367847411445, + "grad_norm": 5.393923759460449, + "learning_rate": 1.478476014382381e-05, + "loss": 0.2464, + "step": 13247 + }, + { + "epoch": 36.09809264305177, + "grad_norm": 6.913016319274902, + "learning_rate": 1.4783985206103868e-05, + "loss": 0.3614, + "step": 13248 + }, + { + "epoch": 36.1008174386921, + "grad_norm": 5.978140830993652, + "learning_rate": 1.4783210231126411e-05, + "loss": 0.2519, + "step": 13249 + }, + { + "epoch": 36.10354223433242, + "grad_norm": 6.325464725494385, + "learning_rate": 1.4782435218897459e-05, + "loss": 0.2686, + "step": 13250 + }, + { + "epoch": 36.10626702997275, + "grad_norm": 5.510571479797363, + "learning_rate": 1.478166016942306e-05, + "loss": 0.1749, + "step": 13251 + }, + { + "epoch": 36.10899182561308, + "grad_norm": 12.347222328186035, + "learning_rate": 1.4780885082709242e-05, + "loss": 0.3969, + "step": 13252 + }, + { + "epoch": 36.11171662125341, + "grad_norm": 7.096447944641113, + "learning_rate": 1.4780109958762049e-05, + "loss": 0.331, + "step": 13253 + }, + { + "epoch": 36.11444141689373, + "grad_norm": 6.075213432312012, + "learning_rate": 1.4779334797587508e-05, + "loss": 0.2931, + "step": 13254 + }, + { + "epoch": 36.11716621253406, + "grad_norm": 6.677272319793701, + "learning_rate": 1.4778559599191668e-05, + "loss": 0.2206, + "step": 13255 + }, + { + "epoch": 36.119891008174385, + "grad_norm": 8.224448204040527, + "learning_rate": 1.4777784363580553e-05, + "loss": 0.4144, + "step": 13256 + }, + { + "epoch": 36.12261580381471, + "grad_norm": 22.851787567138672, + "learning_rate": 1.4777009090760213e-05, + "loss": 0.3081, + "step": 13257 + }, + { + "epoch": 36.12534059945504, + "grad_norm": 6.327375888824463, + "learning_rate": 1.4776233780736677e-05, + "loss": 0.184, + "step": 13258 + }, + { + "epoch": 36.12806539509537, + "grad_norm": 6.861517429351807, + "learning_rate": 1.4775458433515988e-05, + "loss": 0.2499, + "step": 13259 + }, + { + "epoch": 36.130790190735695, + "grad_norm": 5.776194095611572, + "learning_rate": 1.477468304910418e-05, + "loss": 0.2825, + "step": 13260 + }, + { + "epoch": 36.13351498637602, + "grad_norm": 6.355883598327637, + "learning_rate": 1.4773907627507296e-05, + "loss": 0.2797, + "step": 13261 + }, + { + "epoch": 36.13623978201635, + "grad_norm": 7.135884761810303, + "learning_rate": 1.4773132168731372e-05, + "loss": 0.2202, + "step": 13262 + }, + { + "epoch": 36.13896457765667, + "grad_norm": 5.922659397125244, + "learning_rate": 1.4772356672782448e-05, + "loss": 0.4088, + "step": 13263 + }, + { + "epoch": 36.141689373297005, + "grad_norm": 4.835375785827637, + "learning_rate": 1.4771581139666564e-05, + "loss": 0.3039, + "step": 13264 + }, + { + "epoch": 36.14441416893733, + "grad_norm": 5.040340900421143, + "learning_rate": 1.4770805569389762e-05, + "loss": 0.3017, + "step": 13265 + }, + { + "epoch": 36.14713896457766, + "grad_norm": 6.48061466217041, + "learning_rate": 1.4770029961958075e-05, + "loss": 0.3271, + "step": 13266 + }, + { + "epoch": 36.14986376021798, + "grad_norm": 6.813900947570801, + "learning_rate": 1.4769254317377553e-05, + "loss": 0.2408, + "step": 13267 + }, + { + "epoch": 36.15258855585831, + "grad_norm": 4.941844940185547, + "learning_rate": 1.476847863565423e-05, + "loss": 0.3785, + "step": 13268 + }, + { + "epoch": 36.155313351498634, + "grad_norm": 7.042545318603516, + "learning_rate": 1.4767702916794149e-05, + "loss": 0.3079, + "step": 13269 + }, + { + "epoch": 36.15803814713897, + "grad_norm": 5.209319114685059, + "learning_rate": 1.476692716080335e-05, + "loss": 0.2709, + "step": 13270 + }, + { + "epoch": 36.16076294277929, + "grad_norm": 5.897314548492432, + "learning_rate": 1.4766151367687875e-05, + "loss": 0.2773, + "step": 13271 + }, + { + "epoch": 36.16348773841962, + "grad_norm": 6.35041618347168, + "learning_rate": 1.476537553745377e-05, + "loss": 0.6002, + "step": 13272 + }, + { + "epoch": 36.166212534059945, + "grad_norm": 6.693200588226318, + "learning_rate": 1.476459967010707e-05, + "loss": 0.2687, + "step": 13273 + }, + { + "epoch": 36.16893732970027, + "grad_norm": 6.460749626159668, + "learning_rate": 1.4763823765653824e-05, + "loss": 0.3471, + "step": 13274 + }, + { + "epoch": 36.171662125340596, + "grad_norm": 8.597285270690918, + "learning_rate": 1.476304782410007e-05, + "loss": 0.357, + "step": 13275 + }, + { + "epoch": 36.17438692098093, + "grad_norm": 6.624594211578369, + "learning_rate": 1.4762271845451852e-05, + "loss": 0.2743, + "step": 13276 + }, + { + "epoch": 36.177111716621255, + "grad_norm": 4.66386079788208, + "learning_rate": 1.4761495829715219e-05, + "loss": 0.3172, + "step": 13277 + }, + { + "epoch": 36.17983651226158, + "grad_norm": 5.907938003540039, + "learning_rate": 1.4760719776896205e-05, + "loss": 0.3369, + "step": 13278 + }, + { + "epoch": 36.182561307901906, + "grad_norm": 6.306649684906006, + "learning_rate": 1.4759943687000858e-05, + "loss": 0.4182, + "step": 13279 + }, + { + "epoch": 36.18528610354223, + "grad_norm": 5.4794230461120605, + "learning_rate": 1.4759167560035226e-05, + "loss": 0.2356, + "step": 13280 + }, + { + "epoch": 36.18801089918256, + "grad_norm": 6.161020755767822, + "learning_rate": 1.475839139600535e-05, + "loss": 0.3469, + "step": 13281 + }, + { + "epoch": 36.19073569482289, + "grad_norm": 7.272459030151367, + "learning_rate": 1.4757615194917274e-05, + "loss": 0.3511, + "step": 13282 + }, + { + "epoch": 36.19346049046322, + "grad_norm": 5.768618106842041, + "learning_rate": 1.4756838956777043e-05, + "loss": 0.2256, + "step": 13283 + }, + { + "epoch": 36.19618528610354, + "grad_norm": 5.862088680267334, + "learning_rate": 1.4756062681590706e-05, + "loss": 0.286, + "step": 13284 + }, + { + "epoch": 36.19891008174387, + "grad_norm": 4.525655269622803, + "learning_rate": 1.4755286369364301e-05, + "loss": 0.3037, + "step": 13285 + }, + { + "epoch": 36.201634877384194, + "grad_norm": 6.0322113037109375, + "learning_rate": 1.4754510020103883e-05, + "loss": 0.2969, + "step": 13286 + }, + { + "epoch": 36.20435967302452, + "grad_norm": 6.035339832305908, + "learning_rate": 1.4753733633815492e-05, + "loss": 0.2284, + "step": 13287 + }, + { + "epoch": 36.20708446866485, + "grad_norm": 5.587437629699707, + "learning_rate": 1.4752957210505179e-05, + "loss": 0.185, + "step": 13288 + }, + { + "epoch": 36.20980926430518, + "grad_norm": 5.474676132202148, + "learning_rate": 1.4752180750178986e-05, + "loss": 0.2577, + "step": 13289 + }, + { + "epoch": 36.212534059945504, + "grad_norm": 7.268446922302246, + "learning_rate": 1.4751404252842962e-05, + "loss": 0.3511, + "step": 13290 + }, + { + "epoch": 36.21525885558583, + "grad_norm": 7.861775875091553, + "learning_rate": 1.4750627718503156e-05, + "loss": 0.3217, + "step": 13291 + }, + { + "epoch": 36.217983651226156, + "grad_norm": 5.511539459228516, + "learning_rate": 1.4749851147165615e-05, + "loss": 0.3541, + "step": 13292 + }, + { + "epoch": 36.22070844686648, + "grad_norm": 6.481141567230225, + "learning_rate": 1.4749074538836384e-05, + "loss": 0.2819, + "step": 13293 + }, + { + "epoch": 36.223433242506815, + "grad_norm": 5.233092784881592, + "learning_rate": 1.4748297893521515e-05, + "loss": 0.3057, + "step": 13294 + }, + { + "epoch": 36.22615803814714, + "grad_norm": 5.9000115394592285, + "learning_rate": 1.4747521211227054e-05, + "loss": 0.3302, + "step": 13295 + }, + { + "epoch": 36.228882833787466, + "grad_norm": 6.1863694190979, + "learning_rate": 1.4746744491959049e-05, + "loss": 0.341, + "step": 13296 + }, + { + "epoch": 36.23160762942779, + "grad_norm": 7.300392150878906, + "learning_rate": 1.4745967735723552e-05, + "loss": 0.3684, + "step": 13297 + }, + { + "epoch": 36.23433242506812, + "grad_norm": 5.948448181152344, + "learning_rate": 1.4745190942526613e-05, + "loss": 0.3226, + "step": 13298 + }, + { + "epoch": 36.237057220708444, + "grad_norm": 5.368710041046143, + "learning_rate": 1.4744414112374274e-05, + "loss": 0.3194, + "step": 13299 + }, + { + "epoch": 36.23978201634878, + "grad_norm": 5.769564151763916, + "learning_rate": 1.4743637245272598e-05, + "loss": 0.2969, + "step": 13300 + }, + { + "epoch": 36.2425068119891, + "grad_norm": 6.390039920806885, + "learning_rate": 1.4742860341227622e-05, + "loss": 0.2234, + "step": 13301 + }, + { + "epoch": 36.24523160762943, + "grad_norm": 5.80669641494751, + "learning_rate": 1.4742083400245406e-05, + "loss": 0.3753, + "step": 13302 + }, + { + "epoch": 36.247956403269754, + "grad_norm": 6.172638416290283, + "learning_rate": 1.4741306422331995e-05, + "loss": 0.2963, + "step": 13303 + }, + { + "epoch": 36.25068119891008, + "grad_norm": 6.281661510467529, + "learning_rate": 1.4740529407493444e-05, + "loss": 0.2376, + "step": 13304 + }, + { + "epoch": 36.253405994550405, + "grad_norm": 6.107354164123535, + "learning_rate": 1.4739752355735799e-05, + "loss": 0.3358, + "step": 13305 + }, + { + "epoch": 36.25613079019074, + "grad_norm": 6.2487969398498535, + "learning_rate": 1.4738975267065118e-05, + "loss": 0.3114, + "step": 13306 + }, + { + "epoch": 36.258855585831064, + "grad_norm": 6.440620422363281, + "learning_rate": 1.473819814148745e-05, + "loss": 0.2623, + "step": 13307 + }, + { + "epoch": 36.26158038147139, + "grad_norm": 6.070278167724609, + "learning_rate": 1.473742097900885e-05, + "loss": 0.29, + "step": 13308 + }, + { + "epoch": 36.264305177111716, + "grad_norm": 6.380928039550781, + "learning_rate": 1.4736643779635362e-05, + "loss": 0.2677, + "step": 13309 + }, + { + "epoch": 36.26702997275204, + "grad_norm": 5.88615083694458, + "learning_rate": 1.473586654337305e-05, + "loss": 0.3181, + "step": 13310 + }, + { + "epoch": 36.26975476839237, + "grad_norm": 4.7790327072143555, + "learning_rate": 1.4735089270227958e-05, + "loss": 0.3222, + "step": 13311 + }, + { + "epoch": 36.2724795640327, + "grad_norm": 5.748852252960205, + "learning_rate": 1.4734311960206147e-05, + "loss": 0.3753, + "step": 13312 + }, + { + "epoch": 36.275204359673026, + "grad_norm": 6.661259174346924, + "learning_rate": 1.473353461331366e-05, + "loss": 0.3835, + "step": 13313 + }, + { + "epoch": 36.27792915531335, + "grad_norm": 5.821951389312744, + "learning_rate": 1.4732757229556565e-05, + "loss": 0.2562, + "step": 13314 + }, + { + "epoch": 36.28065395095368, + "grad_norm": 6.301092624664307, + "learning_rate": 1.4731979808940906e-05, + "loss": 0.3367, + "step": 13315 + }, + { + "epoch": 36.283378746594, + "grad_norm": 7.271420001983643, + "learning_rate": 1.4731202351472741e-05, + "loss": 0.3906, + "step": 13316 + }, + { + "epoch": 36.28610354223433, + "grad_norm": 6.201592445373535, + "learning_rate": 1.4730424857158123e-05, + "loss": 0.2709, + "step": 13317 + }, + { + "epoch": 36.28882833787466, + "grad_norm": 8.571123123168945, + "learning_rate": 1.472964732600311e-05, + "loss": 0.2953, + "step": 13318 + }, + { + "epoch": 36.29155313351499, + "grad_norm": 4.723077297210693, + "learning_rate": 1.4728869758013758e-05, + "loss": 0.2857, + "step": 13319 + }, + { + "epoch": 36.294277929155314, + "grad_norm": 6.588447570800781, + "learning_rate": 1.4728092153196119e-05, + "loss": 0.2544, + "step": 13320 + }, + { + "epoch": 36.29700272479564, + "grad_norm": 5.947713851928711, + "learning_rate": 1.4727314511556248e-05, + "loss": 0.5516, + "step": 13321 + }, + { + "epoch": 36.299727520435965, + "grad_norm": 5.802780628204346, + "learning_rate": 1.4726536833100204e-05, + "loss": 0.3207, + "step": 13322 + }, + { + "epoch": 36.30245231607629, + "grad_norm": 7.036726474761963, + "learning_rate": 1.4725759117834045e-05, + "loss": 0.2175, + "step": 13323 + }, + { + "epoch": 36.305177111716624, + "grad_norm": 5.762254238128662, + "learning_rate": 1.4724981365763826e-05, + "loss": 0.3055, + "step": 13324 + }, + { + "epoch": 36.30790190735695, + "grad_norm": 6.607092380523682, + "learning_rate": 1.4724203576895604e-05, + "loss": 0.2481, + "step": 13325 + }, + { + "epoch": 36.310626702997276, + "grad_norm": 7.0382914543151855, + "learning_rate": 1.4723425751235436e-05, + "loss": 0.273, + "step": 13326 + }, + { + "epoch": 36.3133514986376, + "grad_norm": 5.677168846130371, + "learning_rate": 1.4722647888789382e-05, + "loss": 0.2465, + "step": 13327 + }, + { + "epoch": 36.31607629427793, + "grad_norm": 5.887604713439941, + "learning_rate": 1.4721869989563495e-05, + "loss": 0.1993, + "step": 13328 + }, + { + "epoch": 36.31880108991825, + "grad_norm": 5.209313869476318, + "learning_rate": 1.472109205356384e-05, + "loss": 0.2846, + "step": 13329 + }, + { + "epoch": 36.321525885558586, + "grad_norm": 5.660128593444824, + "learning_rate": 1.4720314080796469e-05, + "loss": 0.4316, + "step": 13330 + }, + { + "epoch": 36.32425068119891, + "grad_norm": 5.628818035125732, + "learning_rate": 1.4719536071267443e-05, + "loss": 0.1807, + "step": 13331 + }, + { + "epoch": 36.32697547683924, + "grad_norm": 7.614799499511719, + "learning_rate": 1.4718758024982827e-05, + "loss": 0.2442, + "step": 13332 + }, + { + "epoch": 36.32970027247956, + "grad_norm": 6.920741081237793, + "learning_rate": 1.4717979941948672e-05, + "loss": 0.2404, + "step": 13333 + }, + { + "epoch": 36.33242506811989, + "grad_norm": 6.268089771270752, + "learning_rate": 1.4717201822171043e-05, + "loss": 0.2939, + "step": 13334 + }, + { + "epoch": 36.335149863760215, + "grad_norm": 7.400482654571533, + "learning_rate": 1.4716423665655995e-05, + "loss": 0.2523, + "step": 13335 + }, + { + "epoch": 36.33787465940055, + "grad_norm": 6.6051506996154785, + "learning_rate": 1.4715645472409594e-05, + "loss": 0.4303, + "step": 13336 + }, + { + "epoch": 36.34059945504087, + "grad_norm": 5.198501110076904, + "learning_rate": 1.4714867242437896e-05, + "loss": 0.2853, + "step": 13337 + }, + { + "epoch": 36.3433242506812, + "grad_norm": 7.610172271728516, + "learning_rate": 1.4714088975746967e-05, + "loss": 0.2253, + "step": 13338 + }, + { + "epoch": 36.346049046321525, + "grad_norm": 5.972766876220703, + "learning_rate": 1.471331067234286e-05, + "loss": 0.3062, + "step": 13339 + }, + { + "epoch": 36.34877384196185, + "grad_norm": 5.427735805511475, + "learning_rate": 1.4712532332231644e-05, + "loss": 0.2979, + "step": 13340 + }, + { + "epoch": 36.35149863760218, + "grad_norm": 5.4658684730529785, + "learning_rate": 1.4711753955419376e-05, + "loss": 0.2765, + "step": 13341 + }, + { + "epoch": 36.35422343324251, + "grad_norm": 9.625960350036621, + "learning_rate": 1.4710975541912122e-05, + "loss": 0.2669, + "step": 13342 + }, + { + "epoch": 36.356948228882835, + "grad_norm": 6.750884532928467, + "learning_rate": 1.471019709171594e-05, + "loss": 0.2986, + "step": 13343 + }, + { + "epoch": 36.35967302452316, + "grad_norm": 8.63830852508545, + "learning_rate": 1.4709418604836898e-05, + "loss": 0.4565, + "step": 13344 + }, + { + "epoch": 36.36239782016349, + "grad_norm": 6.362757205963135, + "learning_rate": 1.4708640081281054e-05, + "loss": 0.2891, + "step": 13345 + }, + { + "epoch": 36.36512261580381, + "grad_norm": 6.810002326965332, + "learning_rate": 1.4707861521054471e-05, + "loss": 0.1971, + "step": 13346 + }, + { + "epoch": 36.36784741144414, + "grad_norm": 5.628415107727051, + "learning_rate": 1.4707082924163216e-05, + "loss": 0.3101, + "step": 13347 + }, + { + "epoch": 36.37057220708447, + "grad_norm": 6.321719169616699, + "learning_rate": 1.470630429061335e-05, + "loss": 0.2809, + "step": 13348 + }, + { + "epoch": 36.3732970027248, + "grad_norm": 9.022990226745605, + "learning_rate": 1.4705525620410936e-05, + "loss": 0.2779, + "step": 13349 + }, + { + "epoch": 36.37602179836512, + "grad_norm": 13.800345420837402, + "learning_rate": 1.4704746913562043e-05, + "loss": 0.2912, + "step": 13350 + }, + { + "epoch": 36.37874659400545, + "grad_norm": 7.537498950958252, + "learning_rate": 1.470396817007273e-05, + "loss": 0.2954, + "step": 13351 + }, + { + "epoch": 36.381471389645775, + "grad_norm": 5.671634197235107, + "learning_rate": 1.4703189389949066e-05, + "loss": 0.2158, + "step": 13352 + }, + { + "epoch": 36.3841961852861, + "grad_norm": 6.502307891845703, + "learning_rate": 1.4702410573197112e-05, + "loss": 0.3534, + "step": 13353 + }, + { + "epoch": 36.38692098092643, + "grad_norm": 5.736046314239502, + "learning_rate": 1.4701631719822937e-05, + "loss": 0.3752, + "step": 13354 + }, + { + "epoch": 36.38964577656676, + "grad_norm": 5.479292869567871, + "learning_rate": 1.4700852829832605e-05, + "loss": 0.221, + "step": 13355 + }, + { + "epoch": 36.392370572207085, + "grad_norm": 5.3284196853637695, + "learning_rate": 1.4700073903232184e-05, + "loss": 0.2644, + "step": 13356 + }, + { + "epoch": 36.39509536784741, + "grad_norm": 5.863639831542969, + "learning_rate": 1.469929494002774e-05, + "loss": 0.395, + "step": 13357 + }, + { + "epoch": 36.39782016348774, + "grad_norm": 6.0642523765563965, + "learning_rate": 1.4698515940225333e-05, + "loss": 0.2675, + "step": 13358 + }, + { + "epoch": 36.40054495912806, + "grad_norm": 7.674149513244629, + "learning_rate": 1.4697736903831041e-05, + "loss": 0.2501, + "step": 13359 + }, + { + "epoch": 36.403269754768395, + "grad_norm": 6.642250061035156, + "learning_rate": 1.4696957830850922e-05, + "loss": 0.3921, + "step": 13360 + }, + { + "epoch": 36.40599455040872, + "grad_norm": 8.71288776397705, + "learning_rate": 1.4696178721291048e-05, + "loss": 0.3495, + "step": 13361 + }, + { + "epoch": 36.40871934604905, + "grad_norm": 8.118603706359863, + "learning_rate": 1.4695399575157483e-05, + "loss": 0.357, + "step": 13362 + }, + { + "epoch": 36.41144414168937, + "grad_norm": 7.166381359100342, + "learning_rate": 1.4694620392456299e-05, + "loss": 0.2482, + "step": 13363 + }, + { + "epoch": 36.4141689373297, + "grad_norm": 6.337353229522705, + "learning_rate": 1.4693841173193562e-05, + "loss": 0.2439, + "step": 13364 + }, + { + "epoch": 36.416893732970024, + "grad_norm": 5.224032402038574, + "learning_rate": 1.469306191737534e-05, + "loss": 0.306, + "step": 13365 + }, + { + "epoch": 36.41961852861036, + "grad_norm": 6.916603088378906, + "learning_rate": 1.4692282625007703e-05, + "loss": 0.3333, + "step": 13366 + }, + { + "epoch": 36.42234332425068, + "grad_norm": 10.736503601074219, + "learning_rate": 1.4691503296096721e-05, + "loss": 0.3271, + "step": 13367 + }, + { + "epoch": 36.42506811989101, + "grad_norm": 6.419002056121826, + "learning_rate": 1.4690723930648463e-05, + "loss": 0.2392, + "step": 13368 + }, + { + "epoch": 36.427792915531334, + "grad_norm": 6.702088832855225, + "learning_rate": 1.4689944528668997e-05, + "loss": 0.2708, + "step": 13369 + }, + { + "epoch": 36.43051771117166, + "grad_norm": 6.408752918243408, + "learning_rate": 1.4689165090164395e-05, + "loss": 0.2514, + "step": 13370 + }, + { + "epoch": 36.433242506811986, + "grad_norm": 6.2014617919921875, + "learning_rate": 1.4688385615140726e-05, + "loss": 0.2501, + "step": 13371 + }, + { + "epoch": 36.43596730245232, + "grad_norm": 8.093091011047363, + "learning_rate": 1.4687606103604057e-05, + "loss": 0.3111, + "step": 13372 + }, + { + "epoch": 36.438692098092645, + "grad_norm": 7.146554946899414, + "learning_rate": 1.4686826555560468e-05, + "loss": 0.435, + "step": 13373 + }, + { + "epoch": 36.44141689373297, + "grad_norm": 5.736241817474365, + "learning_rate": 1.468604697101602e-05, + "loss": 0.2479, + "step": 13374 + }, + { + "epoch": 36.444141689373296, + "grad_norm": 5.841864585876465, + "learning_rate": 1.468526734997679e-05, + "loss": 0.2032, + "step": 13375 + }, + { + "epoch": 36.44686648501362, + "grad_norm": 6.242249965667725, + "learning_rate": 1.468448769244885e-05, + "loss": 0.2147, + "step": 13376 + }, + { + "epoch": 36.44959128065395, + "grad_norm": 5.7653303146362305, + "learning_rate": 1.4683707998438273e-05, + "loss": 0.3541, + "step": 13377 + }, + { + "epoch": 36.45231607629428, + "grad_norm": 6.387267589569092, + "learning_rate": 1.4682928267951124e-05, + "loss": 0.2736, + "step": 13378 + }, + { + "epoch": 36.45504087193461, + "grad_norm": 6.599924087524414, + "learning_rate": 1.4682148500993486e-05, + "loss": 0.4249, + "step": 13379 + }, + { + "epoch": 36.45776566757493, + "grad_norm": 5.238255500793457, + "learning_rate": 1.4681368697571421e-05, + "loss": 0.2681, + "step": 13380 + }, + { + "epoch": 36.46049046321526, + "grad_norm": 5.064724922180176, + "learning_rate": 1.4680588857691009e-05, + "loss": 0.3273, + "step": 13381 + }, + { + "epoch": 36.463215258855584, + "grad_norm": 6.155890464782715, + "learning_rate": 1.4679808981358319e-05, + "loss": 0.1873, + "step": 13382 + }, + { + "epoch": 36.46594005449591, + "grad_norm": 5.978591442108154, + "learning_rate": 1.4679029068579432e-05, + "loss": 0.3087, + "step": 13383 + }, + { + "epoch": 36.46866485013624, + "grad_norm": 5.726358890533447, + "learning_rate": 1.4678249119360415e-05, + "loss": 0.3177, + "step": 13384 + }, + { + "epoch": 36.47138964577657, + "grad_norm": 5.267200469970703, + "learning_rate": 1.4677469133707346e-05, + "loss": 0.3525, + "step": 13385 + }, + { + "epoch": 36.474114441416894, + "grad_norm": 5.896948337554932, + "learning_rate": 1.4676689111626294e-05, + "loss": 0.3116, + "step": 13386 + }, + { + "epoch": 36.47683923705722, + "grad_norm": 5.342823505401611, + "learning_rate": 1.4675909053123342e-05, + "loss": 0.2621, + "step": 13387 + }, + { + "epoch": 36.479564032697546, + "grad_norm": 5.99827241897583, + "learning_rate": 1.4675128958204559e-05, + "loss": 0.2905, + "step": 13388 + }, + { + "epoch": 36.48228882833787, + "grad_norm": 5.374172210693359, + "learning_rate": 1.4674348826876024e-05, + "loss": 0.4813, + "step": 13389 + }, + { + "epoch": 36.485013623978205, + "grad_norm": 5.049845218658447, + "learning_rate": 1.4673568659143806e-05, + "loss": 0.2846, + "step": 13390 + }, + { + "epoch": 36.48773841961853, + "grad_norm": 5.735440731048584, + "learning_rate": 1.4672788455013988e-05, + "loss": 0.2975, + "step": 13391 + }, + { + "epoch": 36.490463215258856, + "grad_norm": 5.560763835906982, + "learning_rate": 1.4672008214492643e-05, + "loss": 0.3355, + "step": 13392 + }, + { + "epoch": 36.49318801089918, + "grad_norm": 7.372814655303955, + "learning_rate": 1.4671227937585853e-05, + "loss": 0.3286, + "step": 13393 + }, + { + "epoch": 36.49591280653951, + "grad_norm": 11.579628944396973, + "learning_rate": 1.4670447624299685e-05, + "loss": 0.1994, + "step": 13394 + }, + { + "epoch": 36.49863760217983, + "grad_norm": 5.694832801818848, + "learning_rate": 1.4669667274640227e-05, + "loss": 0.249, + "step": 13395 + }, + { + "epoch": 36.50136239782017, + "grad_norm": 7.621641159057617, + "learning_rate": 1.4668886888613545e-05, + "loss": 0.5377, + "step": 13396 + }, + { + "epoch": 36.50408719346049, + "grad_norm": 5.279268741607666, + "learning_rate": 1.4668106466225724e-05, + "loss": 0.3796, + "step": 13397 + }, + { + "epoch": 36.50681198910082, + "grad_norm": 5.475941181182861, + "learning_rate": 1.466732600748284e-05, + "loss": 0.2565, + "step": 13398 + }, + { + "epoch": 36.509536784741144, + "grad_norm": 5.412313461303711, + "learning_rate": 1.4666545512390971e-05, + "loss": 0.3062, + "step": 13399 + }, + { + "epoch": 36.51226158038147, + "grad_norm": 6.111344337463379, + "learning_rate": 1.4665764980956196e-05, + "loss": 0.5159, + "step": 13400 + }, + { + "epoch": 36.514986376021795, + "grad_norm": 6.7449564933776855, + "learning_rate": 1.4664984413184595e-05, + "loss": 0.3046, + "step": 13401 + }, + { + "epoch": 36.51771117166213, + "grad_norm": 6.346858501434326, + "learning_rate": 1.4664203809082242e-05, + "loss": 0.3814, + "step": 13402 + }, + { + "epoch": 36.520435967302454, + "grad_norm": 5.561699867248535, + "learning_rate": 1.4663423168655224e-05, + "loss": 0.3898, + "step": 13403 + }, + { + "epoch": 36.52316076294278, + "grad_norm": 7.484636306762695, + "learning_rate": 1.4662642491909613e-05, + "loss": 0.2744, + "step": 13404 + }, + { + "epoch": 36.525885558583106, + "grad_norm": 7.572459697723389, + "learning_rate": 1.4661861778851495e-05, + "loss": 0.3589, + "step": 13405 + }, + { + "epoch": 36.52861035422343, + "grad_norm": 5.904122352600098, + "learning_rate": 1.4661081029486947e-05, + "loss": 0.2995, + "step": 13406 + }, + { + "epoch": 36.53133514986376, + "grad_norm": 6.616388320922852, + "learning_rate": 1.466030024382205e-05, + "loss": 0.3282, + "step": 13407 + }, + { + "epoch": 36.53405994550409, + "grad_norm": 9.58329963684082, + "learning_rate": 1.4659519421862882e-05, + "loss": 0.3186, + "step": 13408 + }, + { + "epoch": 36.536784741144416, + "grad_norm": 4.5477705001831055, + "learning_rate": 1.4658738563615528e-05, + "loss": 0.3818, + "step": 13409 + }, + { + "epoch": 36.53950953678474, + "grad_norm": 6.984385013580322, + "learning_rate": 1.4657957669086068e-05, + "loss": 0.2544, + "step": 13410 + }, + { + "epoch": 36.54223433242507, + "grad_norm": 6.979449272155762, + "learning_rate": 1.4657176738280587e-05, + "loss": 0.4612, + "step": 13411 + }, + { + "epoch": 36.54495912806539, + "grad_norm": 9.876516342163086, + "learning_rate": 1.4656395771205159e-05, + "loss": 0.2459, + "step": 13412 + }, + { + "epoch": 36.54768392370572, + "grad_norm": 8.801257133483887, + "learning_rate": 1.4655614767865874e-05, + "loss": 0.2674, + "step": 13413 + }, + { + "epoch": 36.55040871934605, + "grad_norm": 5.759488105773926, + "learning_rate": 1.4654833728268809e-05, + "loss": 0.2815, + "step": 13414 + }, + { + "epoch": 36.55313351498638, + "grad_norm": 6.719549179077148, + "learning_rate": 1.465405265242005e-05, + "loss": 0.2354, + "step": 13415 + }, + { + "epoch": 36.555858310626704, + "grad_norm": 5.147261619567871, + "learning_rate": 1.4653271540325678e-05, + "loss": 0.2369, + "step": 13416 + }, + { + "epoch": 36.55858310626703, + "grad_norm": 4.3034892082214355, + "learning_rate": 1.4652490391991776e-05, + "loss": 0.3875, + "step": 13417 + }, + { + "epoch": 36.561307901907355, + "grad_norm": 5.992101192474365, + "learning_rate": 1.4651709207424427e-05, + "loss": 0.2996, + "step": 13418 + }, + { + "epoch": 36.56403269754768, + "grad_norm": 7.512600421905518, + "learning_rate": 1.4650927986629721e-05, + "loss": 0.304, + "step": 13419 + }, + { + "epoch": 36.566757493188014, + "grad_norm": 8.687450408935547, + "learning_rate": 1.4650146729613735e-05, + "loss": 0.315, + "step": 13420 + }, + { + "epoch": 36.56948228882834, + "grad_norm": 8.934673309326172, + "learning_rate": 1.4649365436382557e-05, + "loss": 0.2188, + "step": 13421 + }, + { + "epoch": 36.572207084468666, + "grad_norm": 7.995282173156738, + "learning_rate": 1.464858410694227e-05, + "loss": 0.3398, + "step": 13422 + }, + { + "epoch": 36.57493188010899, + "grad_norm": 6.303302764892578, + "learning_rate": 1.464780274129896e-05, + "loss": 0.6181, + "step": 13423 + }, + { + "epoch": 36.57765667574932, + "grad_norm": 5.564570903778076, + "learning_rate": 1.464702133945871e-05, + "loss": 0.3231, + "step": 13424 + }, + { + "epoch": 36.58038147138964, + "grad_norm": 5.620957851409912, + "learning_rate": 1.4646239901427608e-05, + "loss": 0.2775, + "step": 13425 + }, + { + "epoch": 36.583106267029976, + "grad_norm": 7.0095744132995605, + "learning_rate": 1.464545842721174e-05, + "loss": 0.3576, + "step": 13426 + }, + { + "epoch": 36.5858310626703, + "grad_norm": 6.371780872344971, + "learning_rate": 1.4644676916817191e-05, + "loss": 0.3585, + "step": 13427 + }, + { + "epoch": 36.58855585831063, + "grad_norm": 6.885015964508057, + "learning_rate": 1.4643895370250048e-05, + "loss": 0.232, + "step": 13428 + }, + { + "epoch": 36.59128065395095, + "grad_norm": 6.714498996734619, + "learning_rate": 1.4643113787516398e-05, + "loss": 0.1946, + "step": 13429 + }, + { + "epoch": 36.59400544959128, + "grad_norm": 5.592657566070557, + "learning_rate": 1.4642332168622326e-05, + "loss": 0.3248, + "step": 13430 + }, + { + "epoch": 36.596730245231605, + "grad_norm": 5.791368007659912, + "learning_rate": 1.4641550513573922e-05, + "loss": 0.1738, + "step": 13431 + }, + { + "epoch": 36.59945504087194, + "grad_norm": 6.553666591644287, + "learning_rate": 1.464076882237727e-05, + "loss": 0.3313, + "step": 13432 + }, + { + "epoch": 36.60217983651226, + "grad_norm": 5.692700386047363, + "learning_rate": 1.4639987095038462e-05, + "loss": 0.2475, + "step": 13433 + }, + { + "epoch": 36.60490463215259, + "grad_norm": 6.713046073913574, + "learning_rate": 1.4639205331563582e-05, + "loss": 0.2303, + "step": 13434 + }, + { + "epoch": 36.607629427792915, + "grad_norm": 6.671408176422119, + "learning_rate": 1.4638423531958719e-05, + "loss": 0.3086, + "step": 13435 + }, + { + "epoch": 36.61035422343324, + "grad_norm": 7.590618133544922, + "learning_rate": 1.4637641696229967e-05, + "loss": 0.2469, + "step": 13436 + }, + { + "epoch": 36.61307901907357, + "grad_norm": 6.4383087158203125, + "learning_rate": 1.4636859824383406e-05, + "loss": 0.1952, + "step": 13437 + }, + { + "epoch": 36.6158038147139, + "grad_norm": 6.405405044555664, + "learning_rate": 1.4636077916425133e-05, + "loss": 0.2763, + "step": 13438 + }, + { + "epoch": 36.618528610354225, + "grad_norm": 6.324481010437012, + "learning_rate": 1.4635295972361235e-05, + "loss": 0.3177, + "step": 13439 + }, + { + "epoch": 36.62125340599455, + "grad_norm": 6.219964027404785, + "learning_rate": 1.4634513992197798e-05, + "loss": 0.2487, + "step": 13440 + }, + { + "epoch": 36.62397820163488, + "grad_norm": 7.315922737121582, + "learning_rate": 1.463373197594092e-05, + "loss": 0.2831, + "step": 13441 + }, + { + "epoch": 36.6267029972752, + "grad_norm": 6.487116813659668, + "learning_rate": 1.4632949923596681e-05, + "loss": 0.3255, + "step": 13442 + }, + { + "epoch": 36.62942779291553, + "grad_norm": 11.113147735595703, + "learning_rate": 1.4632167835171177e-05, + "loss": 0.2622, + "step": 13443 + }, + { + "epoch": 36.63215258855586, + "grad_norm": 5.978334903717041, + "learning_rate": 1.4631385710670505e-05, + "loss": 0.4852, + "step": 13444 + }, + { + "epoch": 36.63487738419619, + "grad_norm": 5.589931488037109, + "learning_rate": 1.4630603550100747e-05, + "loss": 0.3033, + "step": 13445 + }, + { + "epoch": 36.63760217983651, + "grad_norm": 5.926933288574219, + "learning_rate": 1.4629821353467997e-05, + "loss": 0.2702, + "step": 13446 + }, + { + "epoch": 36.64032697547684, + "grad_norm": 10.75122356414795, + "learning_rate": 1.4629039120778345e-05, + "loss": 0.2697, + "step": 13447 + }, + { + "epoch": 36.643051771117165, + "grad_norm": 7.649288654327393, + "learning_rate": 1.462825685203789e-05, + "loss": 0.2147, + "step": 13448 + }, + { + "epoch": 36.64577656675749, + "grad_norm": 7.236257076263428, + "learning_rate": 1.4627474547252718e-05, + "loss": 0.3286, + "step": 13449 + }, + { + "epoch": 36.64850136239782, + "grad_norm": 7.800262928009033, + "learning_rate": 1.462669220642892e-05, + "loss": 0.2531, + "step": 13450 + }, + { + "epoch": 36.65122615803815, + "grad_norm": 6.149899005889893, + "learning_rate": 1.4625909829572596e-05, + "loss": 0.2659, + "step": 13451 + }, + { + "epoch": 36.653950953678475, + "grad_norm": 10.267043113708496, + "learning_rate": 1.4625127416689834e-05, + "loss": 0.3417, + "step": 13452 + }, + { + "epoch": 36.6566757493188, + "grad_norm": 7.2573652267456055, + "learning_rate": 1.4624344967786729e-05, + "loss": 0.2353, + "step": 13453 + }, + { + "epoch": 36.65940054495913, + "grad_norm": 7.371579170227051, + "learning_rate": 1.4623562482869373e-05, + "loss": 0.3017, + "step": 13454 + }, + { + "epoch": 36.66212534059945, + "grad_norm": 5.899842262268066, + "learning_rate": 1.462277996194386e-05, + "loss": 0.321, + "step": 13455 + }, + { + "epoch": 36.664850136239785, + "grad_norm": 7.154221534729004, + "learning_rate": 1.462199740501629e-05, + "loss": 0.257, + "step": 13456 + }, + { + "epoch": 36.66757493188011, + "grad_norm": 7.6316118240356445, + "learning_rate": 1.462121481209275e-05, + "loss": 0.4272, + "step": 13457 + }, + { + "epoch": 36.67029972752044, + "grad_norm": 6.10270881652832, + "learning_rate": 1.4620432183179339e-05, + "loss": 0.3264, + "step": 13458 + }, + { + "epoch": 36.67302452316076, + "grad_norm": 7.653482913970947, + "learning_rate": 1.461964951828215e-05, + "loss": 0.3745, + "step": 13459 + }, + { + "epoch": 36.67574931880109, + "grad_norm": 6.101099014282227, + "learning_rate": 1.4618866817407276e-05, + "loss": 0.2604, + "step": 13460 + }, + { + "epoch": 36.678474114441414, + "grad_norm": 5.745018482208252, + "learning_rate": 1.4618084080560819e-05, + "loss": 0.2885, + "step": 13461 + }, + { + "epoch": 36.68119891008175, + "grad_norm": 6.850214004516602, + "learning_rate": 1.4617301307748872e-05, + "loss": 0.2923, + "step": 13462 + }, + { + "epoch": 36.68392370572207, + "grad_norm": 6.942055702209473, + "learning_rate": 1.461651849897753e-05, + "loss": 0.2498, + "step": 13463 + }, + { + "epoch": 36.6866485013624, + "grad_norm": 6.727579116821289, + "learning_rate": 1.4615735654252894e-05, + "loss": 0.2479, + "step": 13464 + }, + { + "epoch": 36.689373297002724, + "grad_norm": 5.656120300292969, + "learning_rate": 1.4614952773581052e-05, + "loss": 0.3414, + "step": 13465 + }, + { + "epoch": 36.69209809264305, + "grad_norm": 8.685868263244629, + "learning_rate": 1.461416985696811e-05, + "loss": 0.335, + "step": 13466 + }, + { + "epoch": 36.694822888283376, + "grad_norm": 7.29338264465332, + "learning_rate": 1.4613386904420161e-05, + "loss": 0.3169, + "step": 13467 + }, + { + "epoch": 36.69754768392371, + "grad_norm": 7.772313117980957, + "learning_rate": 1.4612603915943302e-05, + "loss": 0.422, + "step": 13468 + }, + { + "epoch": 36.700272479564035, + "grad_norm": 6.467717170715332, + "learning_rate": 1.4611820891543632e-05, + "loss": 0.2767, + "step": 13469 + }, + { + "epoch": 36.70299727520436, + "grad_norm": 11.327056884765625, + "learning_rate": 1.461103783122725e-05, + "loss": 0.2394, + "step": 13470 + }, + { + "epoch": 36.705722070844686, + "grad_norm": 6.666938781738281, + "learning_rate": 1.4610254735000254e-05, + "loss": 0.2871, + "step": 13471 + }, + { + "epoch": 36.70844686648501, + "grad_norm": 5.195796489715576, + "learning_rate": 1.4609471602868743e-05, + "loss": 0.4612, + "step": 13472 + }, + { + "epoch": 36.71117166212534, + "grad_norm": 6.200788974761963, + "learning_rate": 1.4608688434838816e-05, + "loss": 0.4299, + "step": 13473 + }, + { + "epoch": 36.71389645776567, + "grad_norm": 6.3313140869140625, + "learning_rate": 1.460790523091657e-05, + "loss": 0.3321, + "step": 13474 + }, + { + "epoch": 36.716621253406, + "grad_norm": 6.990638732910156, + "learning_rate": 1.4607121991108109e-05, + "loss": 0.2406, + "step": 13475 + }, + { + "epoch": 36.71934604904632, + "grad_norm": 6.073096752166748, + "learning_rate": 1.4606338715419528e-05, + "loss": 0.1578, + "step": 13476 + }, + { + "epoch": 36.72207084468665, + "grad_norm": 8.439026832580566, + "learning_rate": 1.4605555403856928e-05, + "loss": 0.3236, + "step": 13477 + }, + { + "epoch": 36.724795640326974, + "grad_norm": 5.879141330718994, + "learning_rate": 1.4604772056426412e-05, + "loss": 0.2809, + "step": 13478 + }, + { + "epoch": 36.7275204359673, + "grad_norm": 5.959609031677246, + "learning_rate": 1.460398867313408e-05, + "loss": 0.3346, + "step": 13479 + }, + { + "epoch": 36.73024523160763, + "grad_norm": 7.834115982055664, + "learning_rate": 1.4603205253986034e-05, + "loss": 0.358, + "step": 13480 + }, + { + "epoch": 36.73297002724796, + "grad_norm": 10.48446273803711, + "learning_rate": 1.4602421798988371e-05, + "loss": 0.39, + "step": 13481 + }, + { + "epoch": 36.735694822888284, + "grad_norm": 5.4694366455078125, + "learning_rate": 1.4601638308147196e-05, + "loss": 0.2053, + "step": 13482 + }, + { + "epoch": 36.73841961852861, + "grad_norm": 6.326745986938477, + "learning_rate": 1.4600854781468611e-05, + "loss": 0.2877, + "step": 13483 + }, + { + "epoch": 36.741144414168936, + "grad_norm": 7.83394193649292, + "learning_rate": 1.4600071218958718e-05, + "loss": 0.2609, + "step": 13484 + }, + { + "epoch": 36.74386920980926, + "grad_norm": 6.081604957580566, + "learning_rate": 1.4599287620623612e-05, + "loss": 0.2216, + "step": 13485 + }, + { + "epoch": 36.746594005449595, + "grad_norm": 6.674520969390869, + "learning_rate": 1.4598503986469408e-05, + "loss": 0.3105, + "step": 13486 + }, + { + "epoch": 36.74931880108992, + "grad_norm": 13.587553977966309, + "learning_rate": 1.4597720316502201e-05, + "loss": 0.3659, + "step": 13487 + }, + { + "epoch": 36.752043596730246, + "grad_norm": 5.815481662750244, + "learning_rate": 1.4596936610728098e-05, + "loss": 0.2341, + "step": 13488 + }, + { + "epoch": 36.75476839237057, + "grad_norm": 6.632508754730225, + "learning_rate": 1.4596152869153199e-05, + "loss": 0.2267, + "step": 13489 + }, + { + "epoch": 36.7574931880109, + "grad_norm": 14.098983764648438, + "learning_rate": 1.459536909178361e-05, + "loss": 0.3257, + "step": 13490 + }, + { + "epoch": 36.76021798365122, + "grad_norm": 6.832345485687256, + "learning_rate": 1.4594585278625435e-05, + "loss": 0.2021, + "step": 13491 + }, + { + "epoch": 36.762942779291556, + "grad_norm": 6.347101211547852, + "learning_rate": 1.4593801429684778e-05, + "loss": 0.4977, + "step": 13492 + }, + { + "epoch": 36.76566757493188, + "grad_norm": 6.067656993865967, + "learning_rate": 1.4593017544967741e-05, + "loss": 0.3394, + "step": 13493 + }, + { + "epoch": 36.76839237057221, + "grad_norm": 6.473677635192871, + "learning_rate": 1.4592233624480432e-05, + "loss": 0.2516, + "step": 13494 + }, + { + "epoch": 36.771117166212534, + "grad_norm": 6.269806385040283, + "learning_rate": 1.4591449668228954e-05, + "loss": 0.3989, + "step": 13495 + }, + { + "epoch": 36.77384196185286, + "grad_norm": 6.156412124633789, + "learning_rate": 1.4590665676219416e-05, + "loss": 0.2751, + "step": 13496 + }, + { + "epoch": 36.776566757493185, + "grad_norm": 5.466747760772705, + "learning_rate": 1.458988164845792e-05, + "loss": 0.2327, + "step": 13497 + }, + { + "epoch": 36.77929155313352, + "grad_norm": 6.75571346282959, + "learning_rate": 1.4589097584950576e-05, + "loss": 0.2463, + "step": 13498 + }, + { + "epoch": 36.782016348773844, + "grad_norm": 7.74921178817749, + "learning_rate": 1.4588313485703484e-05, + "loss": 0.1803, + "step": 13499 + }, + { + "epoch": 36.78474114441417, + "grad_norm": 6.87742805480957, + "learning_rate": 1.4587529350722758e-05, + "loss": 0.3144, + "step": 13500 + }, + { + "epoch": 36.787465940054496, + "grad_norm": 6.258539199829102, + "learning_rate": 1.4586745180014498e-05, + "loss": 0.291, + "step": 13501 + }, + { + "epoch": 36.79019073569482, + "grad_norm": 6.405124664306641, + "learning_rate": 1.4585960973584819e-05, + "loss": 0.2778, + "step": 13502 + }, + { + "epoch": 36.79291553133515, + "grad_norm": 6.355350494384766, + "learning_rate": 1.4585176731439816e-05, + "loss": 0.5846, + "step": 13503 + }, + { + "epoch": 36.79564032697548, + "grad_norm": 6.275414943695068, + "learning_rate": 1.458439245358561e-05, + "loss": 0.2856, + "step": 13504 + }, + { + "epoch": 36.798365122615806, + "grad_norm": 6.55458402633667, + "learning_rate": 1.4583608140028301e-05, + "loss": 0.4235, + "step": 13505 + }, + { + "epoch": 36.80108991825613, + "grad_norm": 6.362923622131348, + "learning_rate": 1.4582823790774001e-05, + "loss": 0.1937, + "step": 13506 + }, + { + "epoch": 36.80381471389646, + "grad_norm": 6.119221210479736, + "learning_rate": 1.4582039405828813e-05, + "loss": 0.2638, + "step": 13507 + }, + { + "epoch": 36.80653950953678, + "grad_norm": 6.98737907409668, + "learning_rate": 1.4581254985198854e-05, + "loss": 0.4198, + "step": 13508 + }, + { + "epoch": 36.80926430517711, + "grad_norm": 8.595921516418457, + "learning_rate": 1.4580470528890227e-05, + "loss": 0.3013, + "step": 13509 + }, + { + "epoch": 36.81198910081744, + "grad_norm": 6.572314739227295, + "learning_rate": 1.4579686036909043e-05, + "loss": 0.2438, + "step": 13510 + }, + { + "epoch": 36.81471389645777, + "grad_norm": 6.793776035308838, + "learning_rate": 1.457890150926141e-05, + "loss": 0.3829, + "step": 13511 + }, + { + "epoch": 36.817438692098094, + "grad_norm": 7.48348331451416, + "learning_rate": 1.457811694595344e-05, + "loss": 0.3203, + "step": 13512 + }, + { + "epoch": 36.82016348773842, + "grad_norm": 8.285489082336426, + "learning_rate": 1.4577332346991244e-05, + "loss": 0.3666, + "step": 13513 + }, + { + "epoch": 36.822888283378745, + "grad_norm": 5.748161792755127, + "learning_rate": 1.4576547712380931e-05, + "loss": 0.2483, + "step": 13514 + }, + { + "epoch": 36.82561307901907, + "grad_norm": 8.75537395477295, + "learning_rate": 1.457576304212861e-05, + "loss": 0.4648, + "step": 13515 + }, + { + "epoch": 36.828337874659404, + "grad_norm": 6.129855632781982, + "learning_rate": 1.4574978336240396e-05, + "loss": 0.3243, + "step": 13516 + }, + { + "epoch": 36.83106267029973, + "grad_norm": 6.249845504760742, + "learning_rate": 1.4574193594722394e-05, + "loss": 0.4031, + "step": 13517 + }, + { + "epoch": 36.833787465940055, + "grad_norm": 13.521490097045898, + "learning_rate": 1.4573408817580723e-05, + "loss": 0.2516, + "step": 13518 + }, + { + "epoch": 36.83651226158038, + "grad_norm": 8.591753959655762, + "learning_rate": 1.457262400482149e-05, + "loss": 0.3831, + "step": 13519 + }, + { + "epoch": 36.83923705722071, + "grad_norm": 9.518485069274902, + "learning_rate": 1.4571839156450809e-05, + "loss": 0.3139, + "step": 13520 + }, + { + "epoch": 36.84196185286103, + "grad_norm": 7.928452491760254, + "learning_rate": 1.4571054272474791e-05, + "loss": 0.3539, + "step": 13521 + }, + { + "epoch": 36.844686648501366, + "grad_norm": 6.2169294357299805, + "learning_rate": 1.457026935289955e-05, + "loss": 0.2234, + "step": 13522 + }, + { + "epoch": 36.84741144414169, + "grad_norm": 5.923735618591309, + "learning_rate": 1.45694843977312e-05, + "loss": 0.2801, + "step": 13523 + }, + { + "epoch": 36.85013623978202, + "grad_norm": 6.010656833648682, + "learning_rate": 1.456869940697585e-05, + "loss": 0.2323, + "step": 13524 + }, + { + "epoch": 36.85286103542234, + "grad_norm": 6.384903430938721, + "learning_rate": 1.4567914380639617e-05, + "loss": 0.3567, + "step": 13525 + }, + { + "epoch": 36.85558583106267, + "grad_norm": 6.307415962219238, + "learning_rate": 1.4567129318728614e-05, + "loss": 0.2615, + "step": 13526 + }, + { + "epoch": 36.858310626702995, + "grad_norm": 5.263106346130371, + "learning_rate": 1.4566344221248957e-05, + "loss": 0.3254, + "step": 13527 + }, + { + "epoch": 36.86103542234333, + "grad_norm": 8.703821182250977, + "learning_rate": 1.4565559088206753e-05, + "loss": 0.2455, + "step": 13528 + }, + { + "epoch": 36.86376021798365, + "grad_norm": 7.47613000869751, + "learning_rate": 1.4564773919608125e-05, + "loss": 0.3584, + "step": 13529 + }, + { + "epoch": 36.86648501362398, + "grad_norm": 5.817327499389648, + "learning_rate": 1.4563988715459185e-05, + "loss": 0.2518, + "step": 13530 + }, + { + "epoch": 36.869209809264305, + "grad_norm": 6.253386974334717, + "learning_rate": 1.4563203475766048e-05, + "loss": 0.3105, + "step": 13531 + }, + { + "epoch": 36.87193460490463, + "grad_norm": 6.917342662811279, + "learning_rate": 1.4562418200534827e-05, + "loss": 0.3243, + "step": 13532 + }, + { + "epoch": 36.87465940054496, + "grad_norm": 9.005016326904297, + "learning_rate": 1.4561632889771642e-05, + "loss": 0.2649, + "step": 13533 + }, + { + "epoch": 36.87738419618529, + "grad_norm": 6.099979400634766, + "learning_rate": 1.4560847543482605e-05, + "loss": 0.4409, + "step": 13534 + }, + { + "epoch": 36.880108991825615, + "grad_norm": 6.624093532562256, + "learning_rate": 1.4560062161673838e-05, + "loss": 0.3391, + "step": 13535 + }, + { + "epoch": 36.88283378746594, + "grad_norm": 5.857081413269043, + "learning_rate": 1.455927674435145e-05, + "loss": 0.3004, + "step": 13536 + }, + { + "epoch": 36.88555858310627, + "grad_norm": 6.330967426300049, + "learning_rate": 1.4558491291521561e-05, + "loss": 0.2773, + "step": 13537 + }, + { + "epoch": 36.88828337874659, + "grad_norm": 6.213892459869385, + "learning_rate": 1.455770580319029e-05, + "loss": 0.4926, + "step": 13538 + }, + { + "epoch": 36.89100817438692, + "grad_norm": 6.335833549499512, + "learning_rate": 1.4556920279363754e-05, + "loss": 0.404, + "step": 13539 + }, + { + "epoch": 36.89373297002725, + "grad_norm": 7.174566745758057, + "learning_rate": 1.4556134720048066e-05, + "loss": 0.3728, + "step": 13540 + }, + { + "epoch": 36.89645776566758, + "grad_norm": 12.14997673034668, + "learning_rate": 1.4555349125249353e-05, + "loss": 0.357, + "step": 13541 + }, + { + "epoch": 36.8991825613079, + "grad_norm": 5.641149997711182, + "learning_rate": 1.4554563494973721e-05, + "loss": 0.5276, + "step": 13542 + }, + { + "epoch": 36.90190735694823, + "grad_norm": 7.460294723510742, + "learning_rate": 1.45537778292273e-05, + "loss": 0.229, + "step": 13543 + }, + { + "epoch": 36.904632152588555, + "grad_norm": 5.240541458129883, + "learning_rate": 1.4552992128016202e-05, + "loss": 0.337, + "step": 13544 + }, + { + "epoch": 36.90735694822888, + "grad_norm": 7.271333694458008, + "learning_rate": 1.4552206391346548e-05, + "loss": 0.521, + "step": 13545 + }, + { + "epoch": 36.91008174386921, + "grad_norm": 5.819964408874512, + "learning_rate": 1.4551420619224455e-05, + "loss": 0.322, + "step": 13546 + }, + { + "epoch": 36.91280653950954, + "grad_norm": 6.316477298736572, + "learning_rate": 1.4550634811656048e-05, + "loss": 0.3957, + "step": 13547 + }, + { + "epoch": 36.915531335149865, + "grad_norm": 7.788074016571045, + "learning_rate": 1.4549848968647441e-05, + "loss": 0.2825, + "step": 13548 + }, + { + "epoch": 36.91825613079019, + "grad_norm": 6.44636869430542, + "learning_rate": 1.454906309020476e-05, + "loss": 0.3064, + "step": 13549 + }, + { + "epoch": 36.920980926430516, + "grad_norm": 7.1698832511901855, + "learning_rate": 1.4548277176334121e-05, + "loss": 0.3694, + "step": 13550 + }, + { + "epoch": 36.92370572207084, + "grad_norm": 7.369454860687256, + "learning_rate": 1.4547491227041643e-05, + "loss": 0.3172, + "step": 13551 + }, + { + "epoch": 36.926430517711175, + "grad_norm": 5.6260271072387695, + "learning_rate": 1.4546705242333452e-05, + "loss": 0.3223, + "step": 13552 + }, + { + "epoch": 36.9291553133515, + "grad_norm": 6.899228096008301, + "learning_rate": 1.4545919222215668e-05, + "loss": 0.5161, + "step": 13553 + }, + { + "epoch": 36.93188010899183, + "grad_norm": 5.509049892425537, + "learning_rate": 1.4545133166694408e-05, + "loss": 0.3986, + "step": 13554 + }, + { + "epoch": 36.93460490463215, + "grad_norm": 5.448057174682617, + "learning_rate": 1.45443470757758e-05, + "loss": 0.2816, + "step": 13555 + }, + { + "epoch": 36.93732970027248, + "grad_norm": 6.382065296173096, + "learning_rate": 1.4543560949465963e-05, + "loss": 0.2829, + "step": 13556 + }, + { + "epoch": 36.940054495912804, + "grad_norm": 5.697299003601074, + "learning_rate": 1.4542774787771019e-05, + "loss": 0.2551, + "step": 13557 + }, + { + "epoch": 36.94277929155314, + "grad_norm": 6.731752872467041, + "learning_rate": 1.4541988590697089e-05, + "loss": 0.3117, + "step": 13558 + }, + { + "epoch": 36.94550408719346, + "grad_norm": 6.797028541564941, + "learning_rate": 1.4541202358250301e-05, + "loss": 0.2345, + "step": 13559 + }, + { + "epoch": 36.94822888283379, + "grad_norm": 6.267938613891602, + "learning_rate": 1.4540416090436775e-05, + "loss": 0.3517, + "step": 13560 + }, + { + "epoch": 36.950953678474114, + "grad_norm": 7.315567493438721, + "learning_rate": 1.4539629787262635e-05, + "loss": 0.3029, + "step": 13561 + }, + { + "epoch": 36.95367847411444, + "grad_norm": 5.532219409942627, + "learning_rate": 1.4538843448734001e-05, + "loss": 0.3416, + "step": 13562 + }, + { + "epoch": 36.956403269754766, + "grad_norm": 6.393294334411621, + "learning_rate": 1.4538057074857004e-05, + "loss": 0.4073, + "step": 13563 + }, + { + "epoch": 36.95912806539509, + "grad_norm": 6.493333339691162, + "learning_rate": 1.4537270665637762e-05, + "loss": 0.2682, + "step": 13564 + }, + { + "epoch": 36.961852861035425, + "grad_norm": 6.927456378936768, + "learning_rate": 1.4536484221082403e-05, + "loss": 0.2459, + "step": 13565 + }, + { + "epoch": 36.96457765667575, + "grad_norm": 5.922084808349609, + "learning_rate": 1.453569774119705e-05, + "loss": 0.3593, + "step": 13566 + }, + { + "epoch": 36.967302452316076, + "grad_norm": 5.5476884841918945, + "learning_rate": 1.4534911225987832e-05, + "loss": 0.4234, + "step": 13567 + }, + { + "epoch": 36.9700272479564, + "grad_norm": 6.00234842300415, + "learning_rate": 1.4534124675460868e-05, + "loss": 0.3124, + "step": 13568 + }, + { + "epoch": 36.97275204359673, + "grad_norm": 7.949798583984375, + "learning_rate": 1.453333808962229e-05, + "loss": 0.3183, + "step": 13569 + }, + { + "epoch": 36.97547683923706, + "grad_norm": 12.44044017791748, + "learning_rate": 1.4532551468478217e-05, + "loss": 0.3472, + "step": 13570 + }, + { + "epoch": 36.97820163487739, + "grad_norm": 5.803534030914307, + "learning_rate": 1.4531764812034781e-05, + "loss": 0.3768, + "step": 13571 + }, + { + "epoch": 36.98092643051771, + "grad_norm": 6.589306354522705, + "learning_rate": 1.4530978120298108e-05, + "loss": 0.2889, + "step": 13572 + }, + { + "epoch": 36.98365122615804, + "grad_norm": 7.242832183837891, + "learning_rate": 1.4530191393274322e-05, + "loss": 0.2752, + "step": 13573 + }, + { + "epoch": 36.986376021798364, + "grad_norm": 10.549457550048828, + "learning_rate": 1.452940463096955e-05, + "loss": 0.2005, + "step": 13574 + }, + { + "epoch": 36.98910081743869, + "grad_norm": 8.42289924621582, + "learning_rate": 1.4528617833389925e-05, + "loss": 0.3764, + "step": 13575 + }, + { + "epoch": 36.991825613079016, + "grad_norm": 5.723546981811523, + "learning_rate": 1.4527831000541564e-05, + "loss": 0.3205, + "step": 13576 + }, + { + "epoch": 36.99455040871935, + "grad_norm": 7.526780605316162, + "learning_rate": 1.4527044132430605e-05, + "loss": 0.4643, + "step": 13577 + }, + { + "epoch": 36.997275204359674, + "grad_norm": 5.826638698577881, + "learning_rate": 1.452625722906317e-05, + "loss": 0.3167, + "step": 13578 + }, + { + "epoch": 37.0, + "grad_norm": 6.392323970794678, + "learning_rate": 1.4525470290445392e-05, + "loss": 0.2362, + "step": 13579 + }, + { + "epoch": 37.002724795640326, + "grad_norm": 5.40487003326416, + "learning_rate": 1.4524683316583392e-05, + "loss": 0.3614, + "step": 13580 + }, + { + "epoch": 37.00544959128065, + "grad_norm": 6.00352668762207, + "learning_rate": 1.4523896307483308e-05, + "loss": 0.3345, + "step": 13581 + }, + { + "epoch": 37.00817438692098, + "grad_norm": 5.279332160949707, + "learning_rate": 1.4523109263151262e-05, + "loss": 0.2882, + "step": 13582 + }, + { + "epoch": 37.01089918256131, + "grad_norm": 5.116689682006836, + "learning_rate": 1.4522322183593392e-05, + "loss": 0.2096, + "step": 13583 + }, + { + "epoch": 37.013623978201636, + "grad_norm": 5.397965908050537, + "learning_rate": 1.4521535068815817e-05, + "loss": 0.3013, + "step": 13584 + }, + { + "epoch": 37.01634877384196, + "grad_norm": 10.295614242553711, + "learning_rate": 1.4520747918824676e-05, + "loss": 0.2728, + "step": 13585 + }, + { + "epoch": 37.01907356948229, + "grad_norm": 6.142119884490967, + "learning_rate": 1.4519960733626093e-05, + "loss": 0.2662, + "step": 13586 + }, + { + "epoch": 37.02179836512261, + "grad_norm": 5.42104434967041, + "learning_rate": 1.4519173513226203e-05, + "loss": 0.255, + "step": 13587 + }, + { + "epoch": 37.02452316076294, + "grad_norm": 6.4026618003845215, + "learning_rate": 1.4518386257631135e-05, + "loss": 0.2265, + "step": 13588 + }, + { + "epoch": 37.02724795640327, + "grad_norm": 5.611619472503662, + "learning_rate": 1.4517598966847019e-05, + "loss": 0.3412, + "step": 13589 + }, + { + "epoch": 37.0299727520436, + "grad_norm": 5.409390926361084, + "learning_rate": 1.4516811640879988e-05, + "loss": 0.2619, + "step": 13590 + }, + { + "epoch": 37.032697547683924, + "grad_norm": 4.898901462554932, + "learning_rate": 1.4516024279736177e-05, + "loss": 0.3071, + "step": 13591 + }, + { + "epoch": 37.03542234332425, + "grad_norm": 5.6210479736328125, + "learning_rate": 1.4515236883421708e-05, + "loss": 0.1871, + "step": 13592 + }, + { + "epoch": 37.038147138964575, + "grad_norm": 5.9645161628723145, + "learning_rate": 1.4514449451942725e-05, + "loss": 0.3825, + "step": 13593 + }, + { + "epoch": 37.0408719346049, + "grad_norm": 5.265384674072266, + "learning_rate": 1.4513661985305351e-05, + "loss": 0.3369, + "step": 13594 + }, + { + "epoch": 37.043596730245234, + "grad_norm": 6.3180832862854, + "learning_rate": 1.4512874483515727e-05, + "loss": 0.3513, + "step": 13595 + }, + { + "epoch": 37.04632152588556, + "grad_norm": 5.28624153137207, + "learning_rate": 1.4512086946579977e-05, + "loss": 0.4906, + "step": 13596 + }, + { + "epoch": 37.049046321525886, + "grad_norm": 5.494368553161621, + "learning_rate": 1.4511299374504242e-05, + "loss": 0.3748, + "step": 13597 + }, + { + "epoch": 37.05177111716621, + "grad_norm": 6.383624076843262, + "learning_rate": 1.4510511767294653e-05, + "loss": 0.1972, + "step": 13598 + }, + { + "epoch": 37.05449591280654, + "grad_norm": 7.064739227294922, + "learning_rate": 1.4509724124957341e-05, + "loss": 0.2488, + "step": 13599 + }, + { + "epoch": 37.05722070844686, + "grad_norm": 5.792699337005615, + "learning_rate": 1.4508936447498442e-05, + "loss": 0.2599, + "step": 13600 + }, + { + "epoch": 37.059945504087196, + "grad_norm": 6.29413366317749, + "learning_rate": 1.4508148734924095e-05, + "loss": 0.2135, + "step": 13601 + }, + { + "epoch": 37.06267029972752, + "grad_norm": 11.314350128173828, + "learning_rate": 1.4507360987240429e-05, + "loss": 0.2141, + "step": 13602 + }, + { + "epoch": 37.06539509536785, + "grad_norm": 6.594211101531982, + "learning_rate": 1.450657320445358e-05, + "loss": 0.4008, + "step": 13603 + }, + { + "epoch": 37.06811989100817, + "grad_norm": 6.072294235229492, + "learning_rate": 1.4505785386569686e-05, + "loss": 0.2754, + "step": 13604 + }, + { + "epoch": 37.0708446866485, + "grad_norm": 7.498562812805176, + "learning_rate": 1.4504997533594881e-05, + "loss": 0.2602, + "step": 13605 + }, + { + "epoch": 37.073569482288825, + "grad_norm": 7.032705307006836, + "learning_rate": 1.4504209645535294e-05, + "loss": 0.259, + "step": 13606 + }, + { + "epoch": 37.07629427792916, + "grad_norm": 6.204941749572754, + "learning_rate": 1.450342172239707e-05, + "loss": 0.2395, + "step": 13607 + }, + { + "epoch": 37.079019073569484, + "grad_norm": 6.8277907371521, + "learning_rate": 1.4502633764186346e-05, + "loss": 0.3278, + "step": 13608 + }, + { + "epoch": 37.08174386920981, + "grad_norm": 5.717363357543945, + "learning_rate": 1.4501845770909253e-05, + "loss": 0.2976, + "step": 13609 + }, + { + "epoch": 37.084468664850135, + "grad_norm": 4.983062267303467, + "learning_rate": 1.4501057742571931e-05, + "loss": 0.2898, + "step": 13610 + }, + { + "epoch": 37.08719346049046, + "grad_norm": 6.429154396057129, + "learning_rate": 1.4500269679180513e-05, + "loss": 0.4847, + "step": 13611 + }, + { + "epoch": 37.08991825613079, + "grad_norm": 5.963826656341553, + "learning_rate": 1.4499481580741144e-05, + "loss": 0.2522, + "step": 13612 + }, + { + "epoch": 37.09264305177112, + "grad_norm": 6.59958028793335, + "learning_rate": 1.4498693447259956e-05, + "loss": 0.3997, + "step": 13613 + }, + { + "epoch": 37.095367847411445, + "grad_norm": 4.506076812744141, + "learning_rate": 1.4497905278743086e-05, + "loss": 0.2088, + "step": 13614 + }, + { + "epoch": 37.09809264305177, + "grad_norm": 6.12763786315918, + "learning_rate": 1.4497117075196677e-05, + "loss": 0.2474, + "step": 13615 + }, + { + "epoch": 37.1008174386921, + "grad_norm": 7.154154300689697, + "learning_rate": 1.4496328836626863e-05, + "loss": 0.3685, + "step": 13616 + }, + { + "epoch": 37.10354223433242, + "grad_norm": 6.3774285316467285, + "learning_rate": 1.4495540563039785e-05, + "loss": 0.2685, + "step": 13617 + }, + { + "epoch": 37.10626702997275, + "grad_norm": 4.6779279708862305, + "learning_rate": 1.4494752254441585e-05, + "loss": 0.2375, + "step": 13618 + }, + { + "epoch": 37.10899182561308, + "grad_norm": 5.380875110626221, + "learning_rate": 1.4493963910838393e-05, + "loss": 0.391, + "step": 13619 + }, + { + "epoch": 37.11171662125341, + "grad_norm": 5.728816986083984, + "learning_rate": 1.4493175532236361e-05, + "loss": 0.2866, + "step": 13620 + }, + { + "epoch": 37.11444141689373, + "grad_norm": 5.909167289733887, + "learning_rate": 1.4492387118641618e-05, + "loss": 0.2805, + "step": 13621 + }, + { + "epoch": 37.11716621253406, + "grad_norm": 5.537550926208496, + "learning_rate": 1.4491598670060312e-05, + "loss": 0.3844, + "step": 13622 + }, + { + "epoch": 37.119891008174385, + "grad_norm": 5.119868278503418, + "learning_rate": 1.4490810186498577e-05, + "loss": 0.2268, + "step": 13623 + }, + { + "epoch": 37.12261580381471, + "grad_norm": 7.367032051086426, + "learning_rate": 1.4490021667962556e-05, + "loss": 0.2613, + "step": 13624 + }, + { + "epoch": 37.12534059945504, + "grad_norm": 5.83549690246582, + "learning_rate": 1.4489233114458394e-05, + "loss": 0.3523, + "step": 13625 + }, + { + "epoch": 37.12806539509537, + "grad_norm": 5.785162448883057, + "learning_rate": 1.448844452599223e-05, + "loss": 0.3449, + "step": 13626 + }, + { + "epoch": 37.130790190735695, + "grad_norm": 5.571055889129639, + "learning_rate": 1.4487655902570201e-05, + "loss": 0.3671, + "step": 13627 + }, + { + "epoch": 37.13351498637602, + "grad_norm": 6.009766578674316, + "learning_rate": 1.4486867244198455e-05, + "loss": 0.3368, + "step": 13628 + }, + { + "epoch": 37.13623978201635, + "grad_norm": 6.343024730682373, + "learning_rate": 1.4486078550883129e-05, + "loss": 0.2497, + "step": 13629 + }, + { + "epoch": 37.13896457765667, + "grad_norm": 5.5884599685668945, + "learning_rate": 1.448528982263037e-05, + "loss": 0.224, + "step": 13630 + }, + { + "epoch": 37.141689373297005, + "grad_norm": 5.679103851318359, + "learning_rate": 1.4484501059446317e-05, + "loss": 0.3214, + "step": 13631 + }, + { + "epoch": 37.14441416893733, + "grad_norm": 4.739778518676758, + "learning_rate": 1.4483712261337113e-05, + "loss": 0.3524, + "step": 13632 + }, + { + "epoch": 37.14713896457766, + "grad_norm": 8.464988708496094, + "learning_rate": 1.4482923428308904e-05, + "loss": 0.4272, + "step": 13633 + }, + { + "epoch": 37.14986376021798, + "grad_norm": 5.842249870300293, + "learning_rate": 1.448213456036783e-05, + "loss": 0.2496, + "step": 13634 + }, + { + "epoch": 37.15258855585831, + "grad_norm": 5.07939338684082, + "learning_rate": 1.4481345657520036e-05, + "loss": 0.4718, + "step": 13635 + }, + { + "epoch": 37.155313351498634, + "grad_norm": 6.1155595779418945, + "learning_rate": 1.4480556719771671e-05, + "loss": 0.2461, + "step": 13636 + }, + { + "epoch": 37.15803814713897, + "grad_norm": 7.305619239807129, + "learning_rate": 1.447976774712887e-05, + "loss": 0.1876, + "step": 13637 + }, + { + "epoch": 37.16076294277929, + "grad_norm": 5.101131916046143, + "learning_rate": 1.4478978739597781e-05, + "loss": 0.2981, + "step": 13638 + }, + { + "epoch": 37.16348773841962, + "grad_norm": 6.35480260848999, + "learning_rate": 1.4478189697184553e-05, + "loss": 0.1937, + "step": 13639 + }, + { + "epoch": 37.166212534059945, + "grad_norm": 4.870874881744385, + "learning_rate": 1.4477400619895326e-05, + "loss": 0.1893, + "step": 13640 + }, + { + "epoch": 37.16893732970027, + "grad_norm": 5.622579574584961, + "learning_rate": 1.4476611507736244e-05, + "loss": 0.2455, + "step": 13641 + }, + { + "epoch": 37.171662125340596, + "grad_norm": 6.2390947341918945, + "learning_rate": 1.4475822360713463e-05, + "loss": 0.3851, + "step": 13642 + }, + { + "epoch": 37.17438692098093, + "grad_norm": 7.213648319244385, + "learning_rate": 1.4475033178833116e-05, + "loss": 0.2074, + "step": 13643 + }, + { + "epoch": 37.177111716621255, + "grad_norm": 5.573960304260254, + "learning_rate": 1.4474243962101357e-05, + "loss": 0.2524, + "step": 13644 + }, + { + "epoch": 37.17983651226158, + "grad_norm": 6.93544340133667, + "learning_rate": 1.4473454710524328e-05, + "loss": 0.2539, + "step": 13645 + }, + { + "epoch": 37.182561307901906, + "grad_norm": 6.557056903839111, + "learning_rate": 1.447266542410818e-05, + "loss": 0.2092, + "step": 13646 + }, + { + "epoch": 37.18528610354223, + "grad_norm": 6.192226409912109, + "learning_rate": 1.4471876102859057e-05, + "loss": 0.2141, + "step": 13647 + }, + { + "epoch": 37.18801089918256, + "grad_norm": 6.104713439941406, + "learning_rate": 1.4471086746783108e-05, + "loss": 0.3153, + "step": 13648 + }, + { + "epoch": 37.19073569482289, + "grad_norm": 6.464320182800293, + "learning_rate": 1.4470297355886476e-05, + "loss": 0.2886, + "step": 13649 + }, + { + "epoch": 37.19346049046322, + "grad_norm": 6.354846954345703, + "learning_rate": 1.4469507930175313e-05, + "loss": 0.2008, + "step": 13650 + }, + { + "epoch": 37.19618528610354, + "grad_norm": 6.795820236206055, + "learning_rate": 1.4468718469655766e-05, + "loss": 0.2286, + "step": 13651 + }, + { + "epoch": 37.19891008174387, + "grad_norm": 6.503321647644043, + "learning_rate": 1.4467928974333987e-05, + "loss": 0.3454, + "step": 13652 + }, + { + "epoch": 37.201634877384194, + "grad_norm": 5.964447975158691, + "learning_rate": 1.4467139444216117e-05, + "loss": 0.3126, + "step": 13653 + }, + { + "epoch": 37.20435967302452, + "grad_norm": 5.265637397766113, + "learning_rate": 1.446634987930831e-05, + "loss": 0.2384, + "step": 13654 + }, + { + "epoch": 37.20708446866485, + "grad_norm": 5.736026287078857, + "learning_rate": 1.4465560279616714e-05, + "loss": 0.1817, + "step": 13655 + }, + { + "epoch": 37.20980926430518, + "grad_norm": 6.372326850891113, + "learning_rate": 1.446477064514748e-05, + "loss": 0.2786, + "step": 13656 + }, + { + "epoch": 37.212534059945504, + "grad_norm": 9.852974891662598, + "learning_rate": 1.4463980975906753e-05, + "loss": 0.293, + "step": 13657 + }, + { + "epoch": 37.21525885558583, + "grad_norm": 5.008190631866455, + "learning_rate": 1.4463191271900686e-05, + "loss": 0.1955, + "step": 13658 + }, + { + "epoch": 37.217983651226156, + "grad_norm": 5.530735015869141, + "learning_rate": 1.4462401533135429e-05, + "loss": 0.2639, + "step": 13659 + }, + { + "epoch": 37.22070844686648, + "grad_norm": 6.269716739654541, + "learning_rate": 1.4461611759617134e-05, + "loss": 0.1737, + "step": 13660 + }, + { + "epoch": 37.223433242506815, + "grad_norm": 6.597443580627441, + "learning_rate": 1.446082195135195e-05, + "loss": 0.3604, + "step": 13661 + }, + { + "epoch": 37.22615803814714, + "grad_norm": 7.4416375160217285, + "learning_rate": 1.4460032108346029e-05, + "loss": 0.3043, + "step": 13662 + }, + { + "epoch": 37.228882833787466, + "grad_norm": 6.190356731414795, + "learning_rate": 1.445924223060552e-05, + "loss": 0.4641, + "step": 13663 + }, + { + "epoch": 37.23160762942779, + "grad_norm": 5.487213134765625, + "learning_rate": 1.4458452318136575e-05, + "loss": 0.2169, + "step": 13664 + }, + { + "epoch": 37.23433242506812, + "grad_norm": 7.421302795410156, + "learning_rate": 1.4457662370945348e-05, + "loss": 0.2897, + "step": 13665 + }, + { + "epoch": 37.237057220708444, + "grad_norm": 6.267577171325684, + "learning_rate": 1.445687238903799e-05, + "loss": 0.3732, + "step": 13666 + }, + { + "epoch": 37.23978201634878, + "grad_norm": 5.17593240737915, + "learning_rate": 1.4456082372420652e-05, + "loss": 0.3845, + "step": 13667 + }, + { + "epoch": 37.2425068119891, + "grad_norm": 4.650514602661133, + "learning_rate": 1.4455292321099492e-05, + "loss": 0.4111, + "step": 13668 + }, + { + "epoch": 37.24523160762943, + "grad_norm": 5.345720291137695, + "learning_rate": 1.4454502235080654e-05, + "loss": 0.2173, + "step": 13669 + }, + { + "epoch": 37.247956403269754, + "grad_norm": 5.987113952636719, + "learning_rate": 1.44537121143703e-05, + "loss": 0.3471, + "step": 13670 + }, + { + "epoch": 37.25068119891008, + "grad_norm": 5.843854904174805, + "learning_rate": 1.4452921958974578e-05, + "loss": 0.2214, + "step": 13671 + }, + { + "epoch": 37.253405994550405, + "grad_norm": 6.542635917663574, + "learning_rate": 1.4452131768899641e-05, + "loss": 0.2692, + "step": 13672 + }, + { + "epoch": 37.25613079019074, + "grad_norm": 12.215797424316406, + "learning_rate": 1.4451341544151647e-05, + "loss": 0.3048, + "step": 13673 + }, + { + "epoch": 37.258855585831064, + "grad_norm": 6.043381214141846, + "learning_rate": 1.4450551284736748e-05, + "loss": 0.3226, + "step": 13674 + }, + { + "epoch": 37.26158038147139, + "grad_norm": 6.124060153961182, + "learning_rate": 1.4449760990661098e-05, + "loss": 0.2841, + "step": 13675 + }, + { + "epoch": 37.264305177111716, + "grad_norm": 5.762239456176758, + "learning_rate": 1.4448970661930854e-05, + "loss": 0.2475, + "step": 13676 + }, + { + "epoch": 37.26702997275204, + "grad_norm": 6.271738052368164, + "learning_rate": 1.4448180298552168e-05, + "loss": 0.2762, + "step": 13677 + }, + { + "epoch": 37.26975476839237, + "grad_norm": 5.748197555541992, + "learning_rate": 1.4447389900531199e-05, + "loss": 0.2891, + "step": 13678 + }, + { + "epoch": 37.2724795640327, + "grad_norm": 5.341134071350098, + "learning_rate": 1.44465994678741e-05, + "loss": 0.2315, + "step": 13679 + }, + { + "epoch": 37.275204359673026, + "grad_norm": 6.73088264465332, + "learning_rate": 1.4445809000587027e-05, + "loss": 0.3155, + "step": 13680 + }, + { + "epoch": 37.27792915531335, + "grad_norm": 10.141463279724121, + "learning_rate": 1.4445018498676135e-05, + "loss": 0.4325, + "step": 13681 + }, + { + "epoch": 37.28065395095368, + "grad_norm": 6.6343207359313965, + "learning_rate": 1.4444227962147586e-05, + "loss": 0.4275, + "step": 13682 + }, + { + "epoch": 37.283378746594, + "grad_norm": 6.762706756591797, + "learning_rate": 1.4443437391007531e-05, + "loss": 0.2278, + "step": 13683 + }, + { + "epoch": 37.28610354223433, + "grad_norm": 6.540870189666748, + "learning_rate": 1.4442646785262126e-05, + "loss": 0.4446, + "step": 13684 + }, + { + "epoch": 37.28882833787466, + "grad_norm": 5.8193206787109375, + "learning_rate": 1.4441856144917535e-05, + "loss": 0.4615, + "step": 13685 + }, + { + "epoch": 37.29155313351499, + "grad_norm": 5.472895622253418, + "learning_rate": 1.4441065469979908e-05, + "loss": 0.3626, + "step": 13686 + }, + { + "epoch": 37.294277929155314, + "grad_norm": 5.899320602416992, + "learning_rate": 1.4440274760455406e-05, + "loss": 0.3423, + "step": 13687 + }, + { + "epoch": 37.29700272479564, + "grad_norm": 6.971601486206055, + "learning_rate": 1.443948401635019e-05, + "loss": 0.2655, + "step": 13688 + }, + { + "epoch": 37.299727520435965, + "grad_norm": 5.75792932510376, + "learning_rate": 1.4438693237670412e-05, + "loss": 0.3479, + "step": 13689 + }, + { + "epoch": 37.30245231607629, + "grad_norm": 5.564891815185547, + "learning_rate": 1.4437902424422236e-05, + "loss": 0.468, + "step": 13690 + }, + { + "epoch": 37.305177111716624, + "grad_norm": 5.492071628570557, + "learning_rate": 1.443711157661182e-05, + "loss": 0.2078, + "step": 13691 + }, + { + "epoch": 37.30790190735695, + "grad_norm": 4.296332359313965, + "learning_rate": 1.4436320694245318e-05, + "loss": 0.1584, + "step": 13692 + }, + { + "epoch": 37.310626702997276, + "grad_norm": 4.209894180297852, + "learning_rate": 1.4435529777328895e-05, + "loss": 0.1995, + "step": 13693 + }, + { + "epoch": 37.3133514986376, + "grad_norm": 5.265773296356201, + "learning_rate": 1.443473882586871e-05, + "loss": 0.2421, + "step": 13694 + }, + { + "epoch": 37.31607629427793, + "grad_norm": 4.542918682098389, + "learning_rate": 1.4433947839870924e-05, + "loss": 0.2087, + "step": 13695 + }, + { + "epoch": 37.31880108991825, + "grad_norm": 9.200000762939453, + "learning_rate": 1.443315681934169e-05, + "loss": 0.2547, + "step": 13696 + }, + { + "epoch": 37.321525885558586, + "grad_norm": 6.090592861175537, + "learning_rate": 1.4432365764287175e-05, + "loss": 0.325, + "step": 13697 + }, + { + "epoch": 37.32425068119891, + "grad_norm": 6.258579730987549, + "learning_rate": 1.4431574674713538e-05, + "loss": 0.312, + "step": 13698 + }, + { + "epoch": 37.32697547683924, + "grad_norm": 5.172791004180908, + "learning_rate": 1.443078355062694e-05, + "loss": 0.1498, + "step": 13699 + }, + { + "epoch": 37.32970027247956, + "grad_norm": 5.496511459350586, + "learning_rate": 1.4429992392033545e-05, + "loss": 0.4258, + "step": 13700 + }, + { + "epoch": 37.33242506811989, + "grad_norm": 6.028332710266113, + "learning_rate": 1.4429201198939508e-05, + "loss": 0.2749, + "step": 13701 + }, + { + "epoch": 37.335149863760215, + "grad_norm": 7.874242305755615, + "learning_rate": 1.4428409971350994e-05, + "loss": 0.2789, + "step": 13702 + }, + { + "epoch": 37.33787465940055, + "grad_norm": 5.639641284942627, + "learning_rate": 1.442761870927417e-05, + "loss": 0.1975, + "step": 13703 + }, + { + "epoch": 37.34059945504087, + "grad_norm": 6.8148884773254395, + "learning_rate": 1.4426827412715192e-05, + "loss": 0.3941, + "step": 13704 + }, + { + "epoch": 37.3433242506812, + "grad_norm": 8.138447761535645, + "learning_rate": 1.4426036081680223e-05, + "loss": 0.2075, + "step": 13705 + }, + { + "epoch": 37.346049046321525, + "grad_norm": 5.802258014678955, + "learning_rate": 1.4425244716175431e-05, + "loss": 0.4133, + "step": 13706 + }, + { + "epoch": 37.34877384196185, + "grad_norm": 8.083141326904297, + "learning_rate": 1.4424453316206974e-05, + "loss": 0.3503, + "step": 13707 + }, + { + "epoch": 37.35149863760218, + "grad_norm": 4.53306770324707, + "learning_rate": 1.4423661881781014e-05, + "loss": 0.1835, + "step": 13708 + }, + { + "epoch": 37.35422343324251, + "grad_norm": 6.26450777053833, + "learning_rate": 1.442287041290372e-05, + "loss": 0.3317, + "step": 13709 + }, + { + "epoch": 37.356948228882835, + "grad_norm": 5.232570648193359, + "learning_rate": 1.4422078909581253e-05, + "loss": 0.25, + "step": 13710 + }, + { + "epoch": 37.35967302452316, + "grad_norm": 5.264657974243164, + "learning_rate": 1.4421287371819781e-05, + "loss": 0.2209, + "step": 13711 + }, + { + "epoch": 37.36239782016349, + "grad_norm": 5.533340930938721, + "learning_rate": 1.442049579962546e-05, + "loss": 0.2596, + "step": 13712 + }, + { + "epoch": 37.36512261580381, + "grad_norm": 6.200746059417725, + "learning_rate": 1.4419704193004464e-05, + "loss": 0.2444, + "step": 13713 + }, + { + "epoch": 37.36784741144414, + "grad_norm": 6.443899631500244, + "learning_rate": 1.4418912551962953e-05, + "loss": 0.2205, + "step": 13714 + }, + { + "epoch": 37.37057220708447, + "grad_norm": 7.062668323516846, + "learning_rate": 1.4418120876507093e-05, + "loss": 0.1915, + "step": 13715 + }, + { + "epoch": 37.3732970027248, + "grad_norm": 7.006562232971191, + "learning_rate": 1.441732916664305e-05, + "loss": 0.333, + "step": 13716 + }, + { + "epoch": 37.37602179836512, + "grad_norm": 6.008820533752441, + "learning_rate": 1.441653742237699e-05, + "loss": 0.3147, + "step": 13717 + }, + { + "epoch": 37.37874659400545, + "grad_norm": 6.851540565490723, + "learning_rate": 1.4415745643715075e-05, + "loss": 0.2743, + "step": 13718 + }, + { + "epoch": 37.381471389645775, + "grad_norm": 5.677096843719482, + "learning_rate": 1.4414953830663478e-05, + "loss": 0.4421, + "step": 13719 + }, + { + "epoch": 37.3841961852861, + "grad_norm": 5.402856349945068, + "learning_rate": 1.4414161983228362e-05, + "loss": 0.297, + "step": 13720 + }, + { + "epoch": 37.38692098092643, + "grad_norm": 4.693260192871094, + "learning_rate": 1.4413370101415898e-05, + "loss": 0.189, + "step": 13721 + }, + { + "epoch": 37.38964577656676, + "grad_norm": 7.506068706512451, + "learning_rate": 1.4412578185232246e-05, + "loss": 0.435, + "step": 13722 + }, + { + "epoch": 37.392370572207085, + "grad_norm": 6.2235283851623535, + "learning_rate": 1.441178623468358e-05, + "loss": 0.3595, + "step": 13723 + }, + { + "epoch": 37.39509536784741, + "grad_norm": 6.36119270324707, + "learning_rate": 1.441099424977606e-05, + "loss": 0.2841, + "step": 13724 + }, + { + "epoch": 37.39782016348774, + "grad_norm": 5.588457107543945, + "learning_rate": 1.4410202230515865e-05, + "loss": 0.162, + "step": 13725 + }, + { + "epoch": 37.40054495912806, + "grad_norm": 5.098292827606201, + "learning_rate": 1.440941017690915e-05, + "loss": 0.1873, + "step": 13726 + }, + { + "epoch": 37.403269754768395, + "grad_norm": 7.046430587768555, + "learning_rate": 1.4408618088962096e-05, + "loss": 0.3149, + "step": 13727 + }, + { + "epoch": 37.40599455040872, + "grad_norm": 5.249959468841553, + "learning_rate": 1.4407825966680862e-05, + "loss": 0.2182, + "step": 13728 + }, + { + "epoch": 37.40871934604905, + "grad_norm": 9.688139915466309, + "learning_rate": 1.4407033810071624e-05, + "loss": 0.2852, + "step": 13729 + }, + { + "epoch": 37.41144414168937, + "grad_norm": 4.626587867736816, + "learning_rate": 1.4406241619140549e-05, + "loss": 0.1972, + "step": 13730 + }, + { + "epoch": 37.4141689373297, + "grad_norm": 5.785120964050293, + "learning_rate": 1.4405449393893807e-05, + "loss": 0.2773, + "step": 13731 + }, + { + "epoch": 37.416893732970024, + "grad_norm": 6.856450080871582, + "learning_rate": 1.4404657134337562e-05, + "loss": 0.2383, + "step": 13732 + }, + { + "epoch": 37.41961852861036, + "grad_norm": 5.6097259521484375, + "learning_rate": 1.4403864840477994e-05, + "loss": 0.4141, + "step": 13733 + }, + { + "epoch": 37.42234332425068, + "grad_norm": 8.284987449645996, + "learning_rate": 1.4403072512321266e-05, + "loss": 0.2511, + "step": 13734 + }, + { + "epoch": 37.42506811989101, + "grad_norm": 8.898246765136719, + "learning_rate": 1.440228014987355e-05, + "loss": 0.2932, + "step": 13735 + }, + { + "epoch": 37.427792915531334, + "grad_norm": 5.818563461303711, + "learning_rate": 1.440148775314102e-05, + "loss": 0.2899, + "step": 13736 + }, + { + "epoch": 37.43051771117166, + "grad_norm": 5.395720481872559, + "learning_rate": 1.4400695322129846e-05, + "loss": 0.3019, + "step": 13737 + }, + { + "epoch": 37.433242506811986, + "grad_norm": 5.264636039733887, + "learning_rate": 1.4399902856846195e-05, + "loss": 0.2049, + "step": 13738 + }, + { + "epoch": 37.43596730245232, + "grad_norm": 6.397223949432373, + "learning_rate": 1.4399110357296244e-05, + "loss": 0.3132, + "step": 13739 + }, + { + "epoch": 37.438692098092645, + "grad_norm": 5.450150489807129, + "learning_rate": 1.4398317823486164e-05, + "loss": 0.2116, + "step": 13740 + }, + { + "epoch": 37.44141689373297, + "grad_norm": 5.349878311157227, + "learning_rate": 1.4397525255422125e-05, + "loss": 0.2759, + "step": 13741 + }, + { + "epoch": 37.444141689373296, + "grad_norm": 7.868896961212158, + "learning_rate": 1.4396732653110302e-05, + "loss": 0.2057, + "step": 13742 + }, + { + "epoch": 37.44686648501362, + "grad_norm": 10.411602973937988, + "learning_rate": 1.4395940016556867e-05, + "loss": 0.2873, + "step": 13743 + }, + { + "epoch": 37.44959128065395, + "grad_norm": 7.2601542472839355, + "learning_rate": 1.4395147345767988e-05, + "loss": 0.4367, + "step": 13744 + }, + { + "epoch": 37.45231607629428, + "grad_norm": 5.517092227935791, + "learning_rate": 1.4394354640749848e-05, + "loss": 0.2008, + "step": 13745 + }, + { + "epoch": 37.45504087193461, + "grad_norm": 8.747833251953125, + "learning_rate": 1.4393561901508613e-05, + "loss": 0.2881, + "step": 13746 + }, + { + "epoch": 37.45776566757493, + "grad_norm": 5.685414791107178, + "learning_rate": 1.439276912805046e-05, + "loss": 0.2178, + "step": 13747 + }, + { + "epoch": 37.46049046321526, + "grad_norm": 5.122185230255127, + "learning_rate": 1.4391976320381562e-05, + "loss": 0.166, + "step": 13748 + }, + { + "epoch": 37.463215258855584, + "grad_norm": 7.064228057861328, + "learning_rate": 1.4391183478508098e-05, + "loss": 0.2955, + "step": 13749 + }, + { + "epoch": 37.46594005449591, + "grad_norm": 7.867053031921387, + "learning_rate": 1.4390390602436232e-05, + "loss": 0.2117, + "step": 13750 + }, + { + "epoch": 37.46866485013624, + "grad_norm": 5.2257466316223145, + "learning_rate": 1.438959769217215e-05, + "loss": 0.3257, + "step": 13751 + }, + { + "epoch": 37.47138964577657, + "grad_norm": 6.032914638519287, + "learning_rate": 1.4388804747722018e-05, + "loss": 0.2724, + "step": 13752 + }, + { + "epoch": 37.474114441416894, + "grad_norm": 5.87555456161499, + "learning_rate": 1.4388011769092018e-05, + "loss": 0.2836, + "step": 13753 + }, + { + "epoch": 37.47683923705722, + "grad_norm": 5.952106952667236, + "learning_rate": 1.4387218756288323e-05, + "loss": 0.3994, + "step": 13754 + }, + { + "epoch": 37.479564032697546, + "grad_norm": 6.191522598266602, + "learning_rate": 1.4386425709317113e-05, + "loss": 0.2023, + "step": 13755 + }, + { + "epoch": 37.48228882833787, + "grad_norm": 6.224193096160889, + "learning_rate": 1.4385632628184558e-05, + "loss": 0.2334, + "step": 13756 + }, + { + "epoch": 37.485013623978205, + "grad_norm": 7.023881912231445, + "learning_rate": 1.4384839512896837e-05, + "loss": 0.2537, + "step": 13757 + }, + { + "epoch": 37.48773841961853, + "grad_norm": 6.266427516937256, + "learning_rate": 1.4384046363460129e-05, + "loss": 0.2319, + "step": 13758 + }, + { + "epoch": 37.490463215258856, + "grad_norm": 6.77350378036499, + "learning_rate": 1.4383253179880607e-05, + "loss": 0.5074, + "step": 13759 + }, + { + "epoch": 37.49318801089918, + "grad_norm": 5.959731101989746, + "learning_rate": 1.4382459962164452e-05, + "loss": 0.2427, + "step": 13760 + }, + { + "epoch": 37.49591280653951, + "grad_norm": 6.488434314727783, + "learning_rate": 1.4381666710317837e-05, + "loss": 0.2007, + "step": 13761 + }, + { + "epoch": 37.49863760217983, + "grad_norm": 7.6190185546875, + "learning_rate": 1.4380873424346945e-05, + "loss": 0.2081, + "step": 13762 + }, + { + "epoch": 37.50136239782017, + "grad_norm": 8.222481727600098, + "learning_rate": 1.438008010425795e-05, + "loss": 0.3317, + "step": 13763 + }, + { + "epoch": 37.50408719346049, + "grad_norm": 7.253337860107422, + "learning_rate": 1.4379286750057033e-05, + "loss": 0.2043, + "step": 13764 + }, + { + "epoch": 37.50681198910082, + "grad_norm": 18.86480140686035, + "learning_rate": 1.4378493361750374e-05, + "loss": 0.3537, + "step": 13765 + }, + { + "epoch": 37.509536784741144, + "grad_norm": 6.140002250671387, + "learning_rate": 1.4377699939344148e-05, + "loss": 0.2787, + "step": 13766 + }, + { + "epoch": 37.51226158038147, + "grad_norm": 6.517630100250244, + "learning_rate": 1.4376906482844534e-05, + "loss": 0.2522, + "step": 13767 + }, + { + "epoch": 37.514986376021795, + "grad_norm": 5.6096649169921875, + "learning_rate": 1.4376112992257714e-05, + "loss": 0.2505, + "step": 13768 + }, + { + "epoch": 37.51771117166213, + "grad_norm": 6.280866622924805, + "learning_rate": 1.4375319467589868e-05, + "loss": 0.3471, + "step": 13769 + }, + { + "epoch": 37.520435967302454, + "grad_norm": 5.432213306427002, + "learning_rate": 1.4374525908847175e-05, + "loss": 0.24, + "step": 13770 + }, + { + "epoch": 37.52316076294278, + "grad_norm": 6.034014701843262, + "learning_rate": 1.4373732316035813e-05, + "loss": 0.2612, + "step": 13771 + }, + { + "epoch": 37.525885558583106, + "grad_norm": 5.9695000648498535, + "learning_rate": 1.4372938689161969e-05, + "loss": 0.3268, + "step": 13772 + }, + { + "epoch": 37.52861035422343, + "grad_norm": 6.036328315734863, + "learning_rate": 1.4372145028231814e-05, + "loss": 0.2262, + "step": 13773 + }, + { + "epoch": 37.53133514986376, + "grad_norm": 5.686705112457275, + "learning_rate": 1.4371351333251535e-05, + "loss": 0.2376, + "step": 13774 + }, + { + "epoch": 37.53405994550409, + "grad_norm": 6.202902793884277, + "learning_rate": 1.4370557604227316e-05, + "loss": 0.3719, + "step": 13775 + }, + { + "epoch": 37.536784741144416, + "grad_norm": 6.547354698181152, + "learning_rate": 1.4369763841165331e-05, + "loss": 0.2327, + "step": 13776 + }, + { + "epoch": 37.53950953678474, + "grad_norm": 12.354787826538086, + "learning_rate": 1.4368970044071768e-05, + "loss": 0.2022, + "step": 13777 + }, + { + "epoch": 37.54223433242507, + "grad_norm": 4.935760974884033, + "learning_rate": 1.4368176212952807e-05, + "loss": 0.2329, + "step": 13778 + }, + { + "epoch": 37.54495912806539, + "grad_norm": 6.330197811126709, + "learning_rate": 1.4367382347814628e-05, + "loss": 0.226, + "step": 13779 + }, + { + "epoch": 37.54768392370572, + "grad_norm": 5.834701061248779, + "learning_rate": 1.436658844866342e-05, + "loss": 0.3147, + "step": 13780 + }, + { + "epoch": 37.55040871934605, + "grad_norm": 5.683170795440674, + "learning_rate": 1.4365794515505359e-05, + "loss": 0.2083, + "step": 13781 + }, + { + "epoch": 37.55313351498638, + "grad_norm": 7.662569046020508, + "learning_rate": 1.4365000548346633e-05, + "loss": 0.3043, + "step": 13782 + }, + { + "epoch": 37.555858310626704, + "grad_norm": 6.115015506744385, + "learning_rate": 1.436420654719342e-05, + "loss": 0.2692, + "step": 13783 + }, + { + "epoch": 37.55858310626703, + "grad_norm": 7.078417778015137, + "learning_rate": 1.4363412512051908e-05, + "loss": 0.228, + "step": 13784 + }, + { + "epoch": 37.561307901907355, + "grad_norm": 6.246332168579102, + "learning_rate": 1.436261844292828e-05, + "loss": 0.3627, + "step": 13785 + }, + { + "epoch": 37.56403269754768, + "grad_norm": 6.897421836853027, + "learning_rate": 1.4361824339828718e-05, + "loss": 0.3459, + "step": 13786 + }, + { + "epoch": 37.566757493188014, + "grad_norm": 6.10270357131958, + "learning_rate": 1.4361030202759412e-05, + "loss": 0.3805, + "step": 13787 + }, + { + "epoch": 37.56948228882834, + "grad_norm": 6.087770938873291, + "learning_rate": 1.4360236031726543e-05, + "loss": 0.2395, + "step": 13788 + }, + { + "epoch": 37.572207084468666, + "grad_norm": 5.868922233581543, + "learning_rate": 1.4359441826736294e-05, + "loss": 0.3105, + "step": 13789 + }, + { + "epoch": 37.57493188010899, + "grad_norm": 6.516274452209473, + "learning_rate": 1.4358647587794851e-05, + "loss": 0.285, + "step": 13790 + }, + { + "epoch": 37.57765667574932, + "grad_norm": 6.568358898162842, + "learning_rate": 1.4357853314908403e-05, + "loss": 0.2906, + "step": 13791 + }, + { + "epoch": 37.58038147138964, + "grad_norm": 5.451956272125244, + "learning_rate": 1.4357059008083133e-05, + "loss": 0.3814, + "step": 13792 + }, + { + "epoch": 37.583106267029976, + "grad_norm": 6.1217427253723145, + "learning_rate": 1.4356264667325231e-05, + "loss": 0.2633, + "step": 13793 + }, + { + "epoch": 37.5858310626703, + "grad_norm": 5.793474197387695, + "learning_rate": 1.4355470292640879e-05, + "loss": 0.3409, + "step": 13794 + }, + { + "epoch": 37.58855585831063, + "grad_norm": 7.553661823272705, + "learning_rate": 1.4354675884036257e-05, + "loss": 0.3251, + "step": 13795 + }, + { + "epoch": 37.59128065395095, + "grad_norm": 5.576457500457764, + "learning_rate": 1.4353881441517568e-05, + "loss": 0.3749, + "step": 13796 + }, + { + "epoch": 37.59400544959128, + "grad_norm": 4.476280212402344, + "learning_rate": 1.4353086965090985e-05, + "loss": 0.2102, + "step": 13797 + }, + { + "epoch": 37.596730245231605, + "grad_norm": 5.663008689880371, + "learning_rate": 1.4352292454762705e-05, + "loss": 0.2438, + "step": 13798 + }, + { + "epoch": 37.59945504087194, + "grad_norm": 7.217907428741455, + "learning_rate": 1.435149791053891e-05, + "loss": 0.296, + "step": 13799 + }, + { + "epoch": 37.60217983651226, + "grad_norm": 6.813621997833252, + "learning_rate": 1.4350703332425791e-05, + "loss": 0.3095, + "step": 13800 + }, + { + "epoch": 37.60490463215259, + "grad_norm": 6.3153815269470215, + "learning_rate": 1.4349908720429531e-05, + "loss": 0.4815, + "step": 13801 + }, + { + "epoch": 37.607629427792915, + "grad_norm": 6.94346809387207, + "learning_rate": 1.4349114074556326e-05, + "loss": 0.3065, + "step": 13802 + }, + { + "epoch": 37.61035422343324, + "grad_norm": 6.070793151855469, + "learning_rate": 1.4348319394812355e-05, + "loss": 0.227, + "step": 13803 + }, + { + "epoch": 37.61307901907357, + "grad_norm": 9.789314270019531, + "learning_rate": 1.4347524681203817e-05, + "loss": 0.2587, + "step": 13804 + }, + { + "epoch": 37.6158038147139, + "grad_norm": 5.945764064788818, + "learning_rate": 1.4346729933736894e-05, + "loss": 0.3088, + "step": 13805 + }, + { + "epoch": 37.618528610354225, + "grad_norm": 5.794508457183838, + "learning_rate": 1.434593515241778e-05, + "loss": 0.3408, + "step": 13806 + }, + { + "epoch": 37.62125340599455, + "grad_norm": 5.566441059112549, + "learning_rate": 1.4345140337252663e-05, + "loss": 0.412, + "step": 13807 + }, + { + "epoch": 37.62397820163488, + "grad_norm": 5.600670337677002, + "learning_rate": 1.4344345488247733e-05, + "loss": 0.2984, + "step": 13808 + }, + { + "epoch": 37.6267029972752, + "grad_norm": 6.36623477935791, + "learning_rate": 1.4343550605409178e-05, + "loss": 0.374, + "step": 13809 + }, + { + "epoch": 37.62942779291553, + "grad_norm": 7.658454895019531, + "learning_rate": 1.4342755688743192e-05, + "loss": 0.2512, + "step": 13810 + }, + { + "epoch": 37.63215258855586, + "grad_norm": 6.459691524505615, + "learning_rate": 1.4341960738255965e-05, + "loss": 0.3131, + "step": 13811 + }, + { + "epoch": 37.63487738419619, + "grad_norm": 5.796911239624023, + "learning_rate": 1.4341165753953688e-05, + "loss": 0.2245, + "step": 13812 + }, + { + "epoch": 37.63760217983651, + "grad_norm": 6.59001350402832, + "learning_rate": 1.4340370735842548e-05, + "loss": 0.3234, + "step": 13813 + }, + { + "epoch": 37.64032697547684, + "grad_norm": 5.7899370193481445, + "learning_rate": 1.4339575683928746e-05, + "loss": 0.2126, + "step": 13814 + }, + { + "epoch": 37.643051771117165, + "grad_norm": 5.424726963043213, + "learning_rate": 1.4338780598218465e-05, + "loss": 0.3813, + "step": 13815 + }, + { + "epoch": 37.64577656675749, + "grad_norm": 6.8555989265441895, + "learning_rate": 1.4337985478717902e-05, + "loss": 0.2491, + "step": 13816 + }, + { + "epoch": 37.64850136239782, + "grad_norm": 7.039730548858643, + "learning_rate": 1.4337190325433246e-05, + "loss": 0.2726, + "step": 13817 + }, + { + "epoch": 37.65122615803815, + "grad_norm": 5.639499664306641, + "learning_rate": 1.4336395138370694e-05, + "loss": 0.2294, + "step": 13818 + }, + { + "epoch": 37.653950953678475, + "grad_norm": 6.956472873687744, + "learning_rate": 1.4335599917536432e-05, + "loss": 0.252, + "step": 13819 + }, + { + "epoch": 37.6566757493188, + "grad_norm": 10.79681396484375, + "learning_rate": 1.4334804662936661e-05, + "loss": 0.3697, + "step": 13820 + }, + { + "epoch": 37.65940054495913, + "grad_norm": 6.606871128082275, + "learning_rate": 1.4334009374577566e-05, + "loss": 0.2361, + "step": 13821 + }, + { + "epoch": 37.66212534059945, + "grad_norm": 6.776033401489258, + "learning_rate": 1.433321405246535e-05, + "loss": 0.2047, + "step": 13822 + }, + { + "epoch": 37.664850136239785, + "grad_norm": 6.886871814727783, + "learning_rate": 1.43324186966062e-05, + "loss": 0.2916, + "step": 13823 + }, + { + "epoch": 37.66757493188011, + "grad_norm": 5.7386040687561035, + "learning_rate": 1.4331623307006316e-05, + "loss": 0.2835, + "step": 13824 + }, + { + "epoch": 37.67029972752044, + "grad_norm": 7.095458030700684, + "learning_rate": 1.4330827883671885e-05, + "loss": 0.258, + "step": 13825 + }, + { + "epoch": 37.67302452316076, + "grad_norm": 9.257341384887695, + "learning_rate": 1.433003242660911e-05, + "loss": 0.3476, + "step": 13826 + }, + { + "epoch": 37.67574931880109, + "grad_norm": 11.596256256103516, + "learning_rate": 1.432923693582418e-05, + "loss": 0.287, + "step": 13827 + }, + { + "epoch": 37.678474114441414, + "grad_norm": 4.983880043029785, + "learning_rate": 1.4328441411323292e-05, + "loss": 0.3643, + "step": 13828 + }, + { + "epoch": 37.68119891008175, + "grad_norm": 8.73643970489502, + "learning_rate": 1.432764585311264e-05, + "loss": 0.2546, + "step": 13829 + }, + { + "epoch": 37.68392370572207, + "grad_norm": 14.080904960632324, + "learning_rate": 1.4326850261198422e-05, + "loss": 0.4435, + "step": 13830 + }, + { + "epoch": 37.6866485013624, + "grad_norm": 7.07788610458374, + "learning_rate": 1.4326054635586833e-05, + "loss": 0.1955, + "step": 13831 + }, + { + "epoch": 37.689373297002724, + "grad_norm": 6.612051486968994, + "learning_rate": 1.4325258976284073e-05, + "loss": 0.346, + "step": 13832 + }, + { + "epoch": 37.69209809264305, + "grad_norm": 8.311551094055176, + "learning_rate": 1.4324463283296332e-05, + "loss": 0.235, + "step": 13833 + }, + { + "epoch": 37.694822888283376, + "grad_norm": 6.00632381439209, + "learning_rate": 1.4323667556629812e-05, + "loss": 0.2324, + "step": 13834 + }, + { + "epoch": 37.69754768392371, + "grad_norm": 24.169116973876953, + "learning_rate": 1.4322871796290707e-05, + "loss": 0.3493, + "step": 13835 + }, + { + "epoch": 37.700272479564035, + "grad_norm": 5.777043342590332, + "learning_rate": 1.4322076002285216e-05, + "loss": 0.3258, + "step": 13836 + }, + { + "epoch": 37.70299727520436, + "grad_norm": 7.018303871154785, + "learning_rate": 1.4321280174619538e-05, + "loss": 0.351, + "step": 13837 + }, + { + "epoch": 37.705722070844686, + "grad_norm": 8.782502174377441, + "learning_rate": 1.4320484313299865e-05, + "loss": 0.2552, + "step": 13838 + }, + { + "epoch": 37.70844686648501, + "grad_norm": 7.098335266113281, + "learning_rate": 1.43196884183324e-05, + "loss": 0.2238, + "step": 13839 + }, + { + "epoch": 37.71117166212534, + "grad_norm": 5.654666900634766, + "learning_rate": 1.4318892489723345e-05, + "loss": 0.3625, + "step": 13840 + }, + { + "epoch": 37.71389645776567, + "grad_norm": 6.63136625289917, + "learning_rate": 1.431809652747889e-05, + "loss": 0.2601, + "step": 13841 + }, + { + "epoch": 37.716621253406, + "grad_norm": 15.09497356414795, + "learning_rate": 1.4317300531605241e-05, + "loss": 0.4105, + "step": 13842 + }, + { + "epoch": 37.71934604904632, + "grad_norm": 8.670364379882812, + "learning_rate": 1.4316504502108592e-05, + "loss": 0.3698, + "step": 13843 + }, + { + "epoch": 37.72207084468665, + "grad_norm": 7.739365577697754, + "learning_rate": 1.4315708438995148e-05, + "loss": 0.2654, + "step": 13844 + }, + { + "epoch": 37.724795640326974, + "grad_norm": 7.329006195068359, + "learning_rate": 1.4314912342271103e-05, + "loss": 0.3591, + "step": 13845 + }, + { + "epoch": 37.7275204359673, + "grad_norm": 5.840755462646484, + "learning_rate": 1.431411621194266e-05, + "loss": 0.2794, + "step": 13846 + }, + { + "epoch": 37.73024523160763, + "grad_norm": 5.9024200439453125, + "learning_rate": 1.431332004801602e-05, + "loss": 0.26, + "step": 13847 + }, + { + "epoch": 37.73297002724796, + "grad_norm": 7.745482921600342, + "learning_rate": 1.431252385049738e-05, + "loss": 0.2239, + "step": 13848 + }, + { + "epoch": 37.735694822888284, + "grad_norm": 7.3622145652771, + "learning_rate": 1.4311727619392944e-05, + "loss": 0.3758, + "step": 13849 + }, + { + "epoch": 37.73841961852861, + "grad_norm": 10.321468353271484, + "learning_rate": 1.4310931354708913e-05, + "loss": 0.4225, + "step": 13850 + }, + { + "epoch": 37.741144414168936, + "grad_norm": 6.619589328765869, + "learning_rate": 1.4310135056451486e-05, + "loss": 0.3065, + "step": 13851 + }, + { + "epoch": 37.74386920980926, + "grad_norm": 7.6803483963012695, + "learning_rate": 1.4309338724626869e-05, + "loss": 0.6291, + "step": 13852 + }, + { + "epoch": 37.746594005449595, + "grad_norm": 6.695158958435059, + "learning_rate": 1.4308542359241257e-05, + "loss": 0.4344, + "step": 13853 + }, + { + "epoch": 37.74931880108992, + "grad_norm": 11.790595054626465, + "learning_rate": 1.4307745960300858e-05, + "loss": 0.3157, + "step": 13854 + }, + { + "epoch": 37.752043596730246, + "grad_norm": 7.67926549911499, + "learning_rate": 1.430694952781187e-05, + "loss": 0.2043, + "step": 13855 + }, + { + "epoch": 37.75476839237057, + "grad_norm": 5.822719097137451, + "learning_rate": 1.43061530617805e-05, + "loss": 0.2033, + "step": 13856 + }, + { + "epoch": 37.7574931880109, + "grad_norm": 7.06847620010376, + "learning_rate": 1.4305356562212947e-05, + "loss": 0.2908, + "step": 13857 + }, + { + "epoch": 37.76021798365122, + "grad_norm": 5.968804836273193, + "learning_rate": 1.4304560029115415e-05, + "loss": 0.2198, + "step": 13858 + }, + { + "epoch": 37.762942779291556, + "grad_norm": 8.030414581298828, + "learning_rate": 1.4303763462494112e-05, + "loss": 0.2816, + "step": 13859 + }, + { + "epoch": 37.76566757493188, + "grad_norm": 10.792121887207031, + "learning_rate": 1.4302966862355235e-05, + "loss": 0.2744, + "step": 13860 + }, + { + "epoch": 37.76839237057221, + "grad_norm": 7.105438709259033, + "learning_rate": 1.4302170228704987e-05, + "loss": 0.2207, + "step": 13861 + }, + { + "epoch": 37.771117166212534, + "grad_norm": 5.91572904586792, + "learning_rate": 1.430137356154958e-05, + "loss": 0.1683, + "step": 13862 + }, + { + "epoch": 37.77384196185286, + "grad_norm": 6.855401515960693, + "learning_rate": 1.4300576860895215e-05, + "loss": 0.3463, + "step": 13863 + }, + { + "epoch": 37.776566757493185, + "grad_norm": 6.339083671569824, + "learning_rate": 1.4299780126748091e-05, + "loss": 0.2751, + "step": 13864 + }, + { + "epoch": 37.77929155313352, + "grad_norm": 6.983968257904053, + "learning_rate": 1.4298983359114422e-05, + "loss": 0.565, + "step": 13865 + }, + { + "epoch": 37.782016348773844, + "grad_norm": 7.245323657989502, + "learning_rate": 1.4298186558000406e-05, + "loss": 0.3568, + "step": 13866 + }, + { + "epoch": 37.78474114441417, + "grad_norm": 6.835300445556641, + "learning_rate": 1.4297389723412256e-05, + "loss": 0.3072, + "step": 13867 + }, + { + "epoch": 37.787465940054496, + "grad_norm": 5.132641792297363, + "learning_rate": 1.429659285535617e-05, + "loss": 0.2679, + "step": 13868 + }, + { + "epoch": 37.79019073569482, + "grad_norm": 18.43865394592285, + "learning_rate": 1.4295795953838358e-05, + "loss": 0.284, + "step": 13869 + }, + { + "epoch": 37.79291553133515, + "grad_norm": 5.493300914764404, + "learning_rate": 1.4294999018865023e-05, + "loss": 0.4596, + "step": 13870 + }, + { + "epoch": 37.79564032697548, + "grad_norm": 6.84777307510376, + "learning_rate": 1.4294202050442379e-05, + "loss": 0.4657, + "step": 13871 + }, + { + "epoch": 37.798365122615806, + "grad_norm": 5.2925124168396, + "learning_rate": 1.4293405048576623e-05, + "loss": 0.2627, + "step": 13872 + }, + { + "epoch": 37.80108991825613, + "grad_norm": 6.45269250869751, + "learning_rate": 1.4292608013273968e-05, + "loss": 0.1688, + "step": 13873 + }, + { + "epoch": 37.80381471389646, + "grad_norm": 5.663297176361084, + "learning_rate": 1.4291810944540619e-05, + "loss": 0.3882, + "step": 13874 + }, + { + "epoch": 37.80653950953678, + "grad_norm": 5.370720863342285, + "learning_rate": 1.4291013842382785e-05, + "loss": 0.4996, + "step": 13875 + }, + { + "epoch": 37.80926430517711, + "grad_norm": 7.206972122192383, + "learning_rate": 1.4290216706806675e-05, + "loss": 0.23, + "step": 13876 + }, + { + "epoch": 37.81198910081744, + "grad_norm": 7.181276321411133, + "learning_rate": 1.4289419537818494e-05, + "loss": 0.3261, + "step": 13877 + }, + { + "epoch": 37.81471389645777, + "grad_norm": 6.361824035644531, + "learning_rate": 1.4288622335424452e-05, + "loss": 0.3921, + "step": 13878 + }, + { + "epoch": 37.817438692098094, + "grad_norm": 6.072926998138428, + "learning_rate": 1.4287825099630759e-05, + "loss": 0.2404, + "step": 13879 + }, + { + "epoch": 37.82016348773842, + "grad_norm": 6.359704494476318, + "learning_rate": 1.4287027830443618e-05, + "loss": 0.2664, + "step": 13880 + }, + { + "epoch": 37.822888283378745, + "grad_norm": 5.395126819610596, + "learning_rate": 1.4286230527869245e-05, + "loss": 0.1834, + "step": 13881 + }, + { + "epoch": 37.82561307901907, + "grad_norm": 5.825087070465088, + "learning_rate": 1.4285433191913845e-05, + "loss": 0.2545, + "step": 13882 + }, + { + "epoch": 37.828337874659404, + "grad_norm": 6.945882797241211, + "learning_rate": 1.4284635822583632e-05, + "loss": 0.3561, + "step": 13883 + }, + { + "epoch": 37.83106267029973, + "grad_norm": 6.538568019866943, + "learning_rate": 1.428383841988481e-05, + "loss": 0.2595, + "step": 13884 + }, + { + "epoch": 37.833787465940055, + "grad_norm": 5.49812650680542, + "learning_rate": 1.4283040983823594e-05, + "loss": 0.2719, + "step": 13885 + }, + { + "epoch": 37.83651226158038, + "grad_norm": 7.490963459014893, + "learning_rate": 1.4282243514406192e-05, + "loss": 0.3662, + "step": 13886 + }, + { + "epoch": 37.83923705722071, + "grad_norm": 5.736569881439209, + "learning_rate": 1.4281446011638818e-05, + "loss": 0.3821, + "step": 13887 + }, + { + "epoch": 37.84196185286103, + "grad_norm": 6.814878463745117, + "learning_rate": 1.4280648475527676e-05, + "loss": 0.3307, + "step": 13888 + }, + { + "epoch": 37.844686648501366, + "grad_norm": 7.027327537536621, + "learning_rate": 1.4279850906078984e-05, + "loss": 0.3086, + "step": 13889 + }, + { + "epoch": 37.84741144414169, + "grad_norm": 5.297640323638916, + "learning_rate": 1.427905330329895e-05, + "loss": 0.3211, + "step": 13890 + }, + { + "epoch": 37.85013623978202, + "grad_norm": 5.85853385925293, + "learning_rate": 1.4278255667193785e-05, + "loss": 0.2456, + "step": 13891 + }, + { + "epoch": 37.85286103542234, + "grad_norm": 8.093560218811035, + "learning_rate": 1.4277457997769707e-05, + "loss": 0.2427, + "step": 13892 + }, + { + "epoch": 37.85558583106267, + "grad_norm": 5.991091728210449, + "learning_rate": 1.427666029503292e-05, + "loss": 0.2615, + "step": 13893 + }, + { + "epoch": 37.858310626702995, + "grad_norm": 5.490238666534424, + "learning_rate": 1.4275862558989642e-05, + "loss": 0.2807, + "step": 13894 + }, + { + "epoch": 37.86103542234333, + "grad_norm": 5.897800445556641, + "learning_rate": 1.4275064789646085e-05, + "loss": 0.2792, + "step": 13895 + }, + { + "epoch": 37.86376021798365, + "grad_norm": 5.740957260131836, + "learning_rate": 1.4274266987008459e-05, + "loss": 0.3357, + "step": 13896 + }, + { + "epoch": 37.86648501362398, + "grad_norm": 5.91965389251709, + "learning_rate": 1.427346915108298e-05, + "loss": 0.4214, + "step": 13897 + }, + { + "epoch": 37.869209809264305, + "grad_norm": 6.701809883117676, + "learning_rate": 1.4272671281875857e-05, + "loss": 0.3539, + "step": 13898 + }, + { + "epoch": 37.87193460490463, + "grad_norm": 5.178858280181885, + "learning_rate": 1.4271873379393314e-05, + "loss": 0.3049, + "step": 13899 + }, + { + "epoch": 37.87465940054496, + "grad_norm": 6.695412635803223, + "learning_rate": 1.4271075443641552e-05, + "loss": 0.2471, + "step": 13900 + }, + { + "epoch": 37.87738419618529, + "grad_norm": 6.38279390335083, + "learning_rate": 1.4270277474626799e-05, + "loss": 0.4324, + "step": 13901 + }, + { + "epoch": 37.880108991825615, + "grad_norm": 5.44714879989624, + "learning_rate": 1.4269479472355259e-05, + "loss": 0.2364, + "step": 13902 + }, + { + "epoch": 37.88283378746594, + "grad_norm": 6.585297584533691, + "learning_rate": 1.4268681436833149e-05, + "loss": 0.2476, + "step": 13903 + }, + { + "epoch": 37.88555858310627, + "grad_norm": 5.468698024749756, + "learning_rate": 1.4267883368066688e-05, + "loss": 0.2676, + "step": 13904 + }, + { + "epoch": 37.88828337874659, + "grad_norm": 6.195644378662109, + "learning_rate": 1.4267085266062088e-05, + "loss": 0.2874, + "step": 13905 + }, + { + "epoch": 37.89100817438692, + "grad_norm": 9.75532341003418, + "learning_rate": 1.4266287130825564e-05, + "loss": 0.3411, + "step": 13906 + }, + { + "epoch": 37.89373297002725, + "grad_norm": 5.855805397033691, + "learning_rate": 1.4265488962363334e-05, + "loss": 0.2052, + "step": 13907 + }, + { + "epoch": 37.89645776566758, + "grad_norm": 7.247859954833984, + "learning_rate": 1.4264690760681613e-05, + "loss": 0.4378, + "step": 13908 + }, + { + "epoch": 37.8991825613079, + "grad_norm": 6.3888654708862305, + "learning_rate": 1.4263892525786617e-05, + "loss": 0.3044, + "step": 13909 + }, + { + "epoch": 37.90190735694823, + "grad_norm": 6.496111869812012, + "learning_rate": 1.4263094257684564e-05, + "loss": 0.4275, + "step": 13910 + }, + { + "epoch": 37.904632152588555, + "grad_norm": 6.1391825675964355, + "learning_rate": 1.426229595638167e-05, + "loss": 0.2492, + "step": 13911 + }, + { + "epoch": 37.90735694822888, + "grad_norm": 11.097859382629395, + "learning_rate": 1.4261497621884152e-05, + "loss": 0.2425, + "step": 13912 + }, + { + "epoch": 37.91008174386921, + "grad_norm": 5.487829685211182, + "learning_rate": 1.4260699254198231e-05, + "loss": 0.2703, + "step": 13913 + }, + { + "epoch": 37.91280653950954, + "grad_norm": 6.309706211090088, + "learning_rate": 1.4259900853330116e-05, + "loss": 0.2534, + "step": 13914 + }, + { + "epoch": 37.915531335149865, + "grad_norm": 6.878724575042725, + "learning_rate": 1.4259102419286035e-05, + "loss": 0.2386, + "step": 13915 + }, + { + "epoch": 37.91825613079019, + "grad_norm": 5.6779985427856445, + "learning_rate": 1.4258303952072197e-05, + "loss": 0.3365, + "step": 13916 + }, + { + "epoch": 37.920980926430516, + "grad_norm": 6.016035079956055, + "learning_rate": 1.4257505451694826e-05, + "loss": 0.2068, + "step": 13917 + }, + { + "epoch": 37.92370572207084, + "grad_norm": 5.624186992645264, + "learning_rate": 1.4256706918160142e-05, + "loss": 0.3402, + "step": 13918 + }, + { + "epoch": 37.926430517711175, + "grad_norm": 6.045122146606445, + "learning_rate": 1.4255908351474358e-05, + "loss": 0.195, + "step": 13919 + }, + { + "epoch": 37.9291553133515, + "grad_norm": 7.068624973297119, + "learning_rate": 1.4255109751643698e-05, + "loss": 0.2797, + "step": 13920 + }, + { + "epoch": 37.93188010899183, + "grad_norm": 5.509274959564209, + "learning_rate": 1.4254311118674385e-05, + "loss": 0.3661, + "step": 13921 + }, + { + "epoch": 37.93460490463215, + "grad_norm": 6.219267845153809, + "learning_rate": 1.4253512452572629e-05, + "loss": 0.1712, + "step": 13922 + }, + { + "epoch": 37.93732970027248, + "grad_norm": 5.982593059539795, + "learning_rate": 1.4252713753344656e-05, + "loss": 0.33, + "step": 13923 + }, + { + "epoch": 37.940054495912804, + "grad_norm": 9.742803573608398, + "learning_rate": 1.4251915020996686e-05, + "loss": 0.3737, + "step": 13924 + }, + { + "epoch": 37.94277929155314, + "grad_norm": 5.775113105773926, + "learning_rate": 1.4251116255534936e-05, + "loss": 0.3099, + "step": 13925 + }, + { + "epoch": 37.94550408719346, + "grad_norm": 7.870527744293213, + "learning_rate": 1.425031745696563e-05, + "loss": 0.1759, + "step": 13926 + }, + { + "epoch": 37.94822888283379, + "grad_norm": 9.597245216369629, + "learning_rate": 1.4249518625294991e-05, + "loss": 0.3413, + "step": 13927 + }, + { + "epoch": 37.950953678474114, + "grad_norm": 5.649352073669434, + "learning_rate": 1.4248719760529235e-05, + "loss": 0.3091, + "step": 13928 + }, + { + "epoch": 37.95367847411444, + "grad_norm": 6.283723831176758, + "learning_rate": 1.4247920862674589e-05, + "loss": 0.3779, + "step": 13929 + }, + { + "epoch": 37.956403269754766, + "grad_norm": 7.923952579498291, + "learning_rate": 1.4247121931737269e-05, + "loss": 0.4114, + "step": 13930 + }, + { + "epoch": 37.95912806539509, + "grad_norm": 7.428585529327393, + "learning_rate": 1.4246322967723502e-05, + "loss": 0.1706, + "step": 13931 + }, + { + "epoch": 37.961852861035425, + "grad_norm": 5.831275939941406, + "learning_rate": 1.424552397063951e-05, + "loss": 0.4125, + "step": 13932 + }, + { + "epoch": 37.96457765667575, + "grad_norm": 6.238661766052246, + "learning_rate": 1.424472494049151e-05, + "loss": 0.2897, + "step": 13933 + }, + { + "epoch": 37.967302452316076, + "grad_norm": 6.399302959442139, + "learning_rate": 1.4243925877285731e-05, + "loss": 0.369, + "step": 13934 + }, + { + "epoch": 37.9700272479564, + "grad_norm": 7.374026298522949, + "learning_rate": 1.4243126781028393e-05, + "loss": 0.3454, + "step": 13935 + }, + { + "epoch": 37.97275204359673, + "grad_norm": 6.311505317687988, + "learning_rate": 1.424232765172572e-05, + "loss": 0.2968, + "step": 13936 + }, + { + "epoch": 37.97547683923706, + "grad_norm": 7.2645955085754395, + "learning_rate": 1.4241528489383938e-05, + "loss": 0.2826, + "step": 13937 + }, + { + "epoch": 37.97820163487739, + "grad_norm": 6.588016986846924, + "learning_rate": 1.4240729294009268e-05, + "loss": 0.2749, + "step": 13938 + }, + { + "epoch": 37.98092643051771, + "grad_norm": 7.065012454986572, + "learning_rate": 1.4239930065607934e-05, + "loss": 0.326, + "step": 13939 + }, + { + "epoch": 37.98365122615804, + "grad_norm": 9.638312339782715, + "learning_rate": 1.4239130804186161e-05, + "loss": 0.2731, + "step": 13940 + }, + { + "epoch": 37.986376021798364, + "grad_norm": 7.051853179931641, + "learning_rate": 1.4238331509750173e-05, + "loss": 0.4256, + "step": 13941 + }, + { + "epoch": 37.98910081743869, + "grad_norm": 7.029924392700195, + "learning_rate": 1.4237532182306198e-05, + "loss": 0.2442, + "step": 13942 + }, + { + "epoch": 37.991825613079016, + "grad_norm": 6.4894633293151855, + "learning_rate": 1.4236732821860456e-05, + "loss": 0.1772, + "step": 13943 + }, + { + "epoch": 37.99455040871935, + "grad_norm": 6.099433898925781, + "learning_rate": 1.4235933428419177e-05, + "loss": 0.2225, + "step": 13944 + }, + { + "epoch": 37.997275204359674, + "grad_norm": 9.0189847946167, + "learning_rate": 1.4235134001988584e-05, + "loss": 0.3329, + "step": 13945 + }, + { + "epoch": 38.0, + "grad_norm": 6.745449066162109, + "learning_rate": 1.4234334542574906e-05, + "loss": 0.3312, + "step": 13946 + }, + { + "epoch": 38.002724795640326, + "grad_norm": 5.828391075134277, + "learning_rate": 1.4233535050184362e-05, + "loss": 0.1915, + "step": 13947 + }, + { + "epoch": 38.00544959128065, + "grad_norm": 6.628112316131592, + "learning_rate": 1.4232735524823187e-05, + "loss": 0.3048, + "step": 13948 + }, + { + "epoch": 38.00817438692098, + "grad_norm": 7.644171714782715, + "learning_rate": 1.4231935966497603e-05, + "loss": 0.211, + "step": 13949 + }, + { + "epoch": 38.01089918256131, + "grad_norm": 7.779391288757324, + "learning_rate": 1.4231136375213837e-05, + "loss": 0.34, + "step": 13950 + }, + { + "epoch": 38.013623978201636, + "grad_norm": 5.219463348388672, + "learning_rate": 1.4230336750978117e-05, + "loss": 0.1672, + "step": 13951 + }, + { + "epoch": 38.01634877384196, + "grad_norm": 6.442633628845215, + "learning_rate": 1.4229537093796672e-05, + "loss": 0.363, + "step": 13952 + }, + { + "epoch": 38.01907356948229, + "grad_norm": 5.483616828918457, + "learning_rate": 1.4228737403675727e-05, + "loss": 0.21, + "step": 13953 + }, + { + "epoch": 38.02179836512261, + "grad_norm": 5.897453784942627, + "learning_rate": 1.4227937680621513e-05, + "loss": 0.3088, + "step": 13954 + }, + { + "epoch": 38.02452316076294, + "grad_norm": 5.241434574127197, + "learning_rate": 1.4227137924640255e-05, + "loss": 0.2805, + "step": 13955 + }, + { + "epoch": 38.02724795640327, + "grad_norm": 4.7049126625061035, + "learning_rate": 1.4226338135738185e-05, + "loss": 0.234, + "step": 13956 + }, + { + "epoch": 38.0299727520436, + "grad_norm": 6.1228413581848145, + "learning_rate": 1.4225538313921527e-05, + "loss": 0.2327, + "step": 13957 + }, + { + "epoch": 38.032697547683924, + "grad_norm": 6.522132873535156, + "learning_rate": 1.4224738459196514e-05, + "loss": 0.2843, + "step": 13958 + }, + { + "epoch": 38.03542234332425, + "grad_norm": 5.426480770111084, + "learning_rate": 1.4223938571569371e-05, + "loss": 0.2536, + "step": 13959 + }, + { + "epoch": 38.038147138964575, + "grad_norm": 7.3476409912109375, + "learning_rate": 1.4223138651046333e-05, + "loss": 0.292, + "step": 13960 + }, + { + "epoch": 38.0408719346049, + "grad_norm": 5.566215515136719, + "learning_rate": 1.4222338697633627e-05, + "loss": 0.2537, + "step": 13961 + }, + { + "epoch": 38.043596730245234, + "grad_norm": 5.8920207023620605, + "learning_rate": 1.4221538711337483e-05, + "loss": 0.1773, + "step": 13962 + }, + { + "epoch": 38.04632152588556, + "grad_norm": 7.461595058441162, + "learning_rate": 1.4220738692164132e-05, + "loss": 0.2825, + "step": 13963 + }, + { + "epoch": 38.049046321525886, + "grad_norm": 5.866862773895264, + "learning_rate": 1.4219938640119803e-05, + "loss": 0.2876, + "step": 13964 + }, + { + "epoch": 38.05177111716621, + "grad_norm": 5.897693157196045, + "learning_rate": 1.4219138555210727e-05, + "loss": 0.4412, + "step": 13965 + }, + { + "epoch": 38.05449591280654, + "grad_norm": 5.753302097320557, + "learning_rate": 1.421833843744314e-05, + "loss": 0.2656, + "step": 13966 + }, + { + "epoch": 38.05722070844686, + "grad_norm": 6.437390327453613, + "learning_rate": 1.4217538286823262e-05, + "loss": 0.1365, + "step": 13967 + }, + { + "epoch": 38.059945504087196, + "grad_norm": 5.829328536987305, + "learning_rate": 1.4216738103357335e-05, + "loss": 0.2829, + "step": 13968 + }, + { + "epoch": 38.06267029972752, + "grad_norm": 9.179716110229492, + "learning_rate": 1.4215937887051588e-05, + "loss": 0.2632, + "step": 13969 + }, + { + "epoch": 38.06539509536785, + "grad_norm": 6.491574287414551, + "learning_rate": 1.4215137637912252e-05, + "loss": 0.3179, + "step": 13970 + }, + { + "epoch": 38.06811989100817, + "grad_norm": 8.215079307556152, + "learning_rate": 1.421433735594556e-05, + "loss": 0.2418, + "step": 13971 + }, + { + "epoch": 38.0708446866485, + "grad_norm": 5.035507678985596, + "learning_rate": 1.4213537041157746e-05, + "loss": 0.1278, + "step": 13972 + }, + { + "epoch": 38.073569482288825, + "grad_norm": 7.004916191101074, + "learning_rate": 1.4212736693555038e-05, + "loss": 0.2279, + "step": 13973 + }, + { + "epoch": 38.07629427792916, + "grad_norm": 5.82853364944458, + "learning_rate": 1.4211936313143673e-05, + "loss": 0.2233, + "step": 13974 + }, + { + "epoch": 38.079019073569484, + "grad_norm": 6.827931880950928, + "learning_rate": 1.4211135899929885e-05, + "loss": 0.2453, + "step": 13975 + }, + { + "epoch": 38.08174386920981, + "grad_norm": 5.678162574768066, + "learning_rate": 1.4210335453919904e-05, + "loss": 0.2307, + "step": 13976 + }, + { + "epoch": 38.084468664850135, + "grad_norm": 6.095455169677734, + "learning_rate": 1.4209534975119965e-05, + "loss": 0.2744, + "step": 13977 + }, + { + "epoch": 38.08719346049046, + "grad_norm": 7.953395366668701, + "learning_rate": 1.4208734463536307e-05, + "loss": 0.215, + "step": 13978 + }, + { + "epoch": 38.08991825613079, + "grad_norm": 6.966280460357666, + "learning_rate": 1.4207933919175157e-05, + "loss": 0.2914, + "step": 13979 + }, + { + "epoch": 38.09264305177112, + "grad_norm": 5.814003944396973, + "learning_rate": 1.4207133342042756e-05, + "loss": 0.3221, + "step": 13980 + }, + { + "epoch": 38.095367847411445, + "grad_norm": 6.032495021820068, + "learning_rate": 1.4206332732145334e-05, + "loss": 0.3495, + "step": 13981 + }, + { + "epoch": 38.09809264305177, + "grad_norm": 7.486771106719971, + "learning_rate": 1.420553208948913e-05, + "loss": 0.2506, + "step": 13982 + }, + { + "epoch": 38.1008174386921, + "grad_norm": 5.105815410614014, + "learning_rate": 1.4204731414080375e-05, + "loss": 0.3923, + "step": 13983 + }, + { + "epoch": 38.10354223433242, + "grad_norm": 5.73434591293335, + "learning_rate": 1.4203930705925308e-05, + "loss": 0.3165, + "step": 13984 + }, + { + "epoch": 38.10626702997275, + "grad_norm": 5.713719367980957, + "learning_rate": 1.4203129965030162e-05, + "loss": 0.1771, + "step": 13985 + }, + { + "epoch": 38.10899182561308, + "grad_norm": 8.072136878967285, + "learning_rate": 1.4202329191401178e-05, + "loss": 0.2828, + "step": 13986 + }, + { + "epoch": 38.11171662125341, + "grad_norm": 6.253368854522705, + "learning_rate": 1.4201528385044589e-05, + "loss": 0.2762, + "step": 13987 + }, + { + "epoch": 38.11444141689373, + "grad_norm": 7.055810451507568, + "learning_rate": 1.4200727545966633e-05, + "loss": 0.3133, + "step": 13988 + }, + { + "epoch": 38.11716621253406, + "grad_norm": 4.999205589294434, + "learning_rate": 1.4199926674173545e-05, + "loss": 0.2086, + "step": 13989 + }, + { + "epoch": 38.119891008174385, + "grad_norm": 5.597371578216553, + "learning_rate": 1.4199125769671564e-05, + "loss": 0.3203, + "step": 13990 + }, + { + "epoch": 38.12261580381471, + "grad_norm": 5.3502373695373535, + "learning_rate": 1.4198324832466925e-05, + "loss": 0.32, + "step": 13991 + }, + { + "epoch": 38.12534059945504, + "grad_norm": 8.164291381835938, + "learning_rate": 1.419752386256587e-05, + "loss": 0.4567, + "step": 13992 + }, + { + "epoch": 38.12806539509537, + "grad_norm": 5.968377590179443, + "learning_rate": 1.4196722859974629e-05, + "loss": 0.2638, + "step": 13993 + }, + { + "epoch": 38.130790190735695, + "grad_norm": 6.087549209594727, + "learning_rate": 1.419592182469945e-05, + "loss": 0.1793, + "step": 13994 + }, + { + "epoch": 38.13351498637602, + "grad_norm": 6.813994884490967, + "learning_rate": 1.4195120756746566e-05, + "loss": 0.3072, + "step": 13995 + }, + { + "epoch": 38.13623978201635, + "grad_norm": 7.23217248916626, + "learning_rate": 1.4194319656122217e-05, + "loss": 0.2021, + "step": 13996 + }, + { + "epoch": 38.13896457765667, + "grad_norm": 4.884246349334717, + "learning_rate": 1.4193518522832642e-05, + "loss": 0.2717, + "step": 13997 + }, + { + "epoch": 38.141689373297005, + "grad_norm": 5.066684722900391, + "learning_rate": 1.4192717356884078e-05, + "loss": 0.2404, + "step": 13998 + }, + { + "epoch": 38.14441416893733, + "grad_norm": 6.179629325866699, + "learning_rate": 1.4191916158282766e-05, + "loss": 0.2885, + "step": 13999 + }, + { + "epoch": 38.14713896457766, + "grad_norm": 5.496793270111084, + "learning_rate": 1.4191114927034949e-05, + "loss": 0.1613, + "step": 14000 + }, + { + "epoch": 38.14986376021798, + "grad_norm": 5.1892290115356445, + "learning_rate": 1.4190313663146859e-05, + "loss": 0.2329, + "step": 14001 + }, + { + "epoch": 38.15258855585831, + "grad_norm": 6.829507827758789, + "learning_rate": 1.4189512366624745e-05, + "loss": 0.3313, + "step": 14002 + }, + { + "epoch": 38.155313351498634, + "grad_norm": 6.3000054359436035, + "learning_rate": 1.418871103747484e-05, + "loss": 0.2714, + "step": 14003 + }, + { + "epoch": 38.15803814713897, + "grad_norm": 7.200273513793945, + "learning_rate": 1.4187909675703391e-05, + "loss": 0.2042, + "step": 14004 + }, + { + "epoch": 38.16076294277929, + "grad_norm": 6.331015586853027, + "learning_rate": 1.4187108281316635e-05, + "loss": 0.3781, + "step": 14005 + }, + { + "epoch": 38.16348773841962, + "grad_norm": 6.415987014770508, + "learning_rate": 1.4186306854320817e-05, + "loss": 0.2836, + "step": 14006 + }, + { + "epoch": 38.166212534059945, + "grad_norm": 7.1509199142456055, + "learning_rate": 1.4185505394722172e-05, + "loss": 0.283, + "step": 14007 + }, + { + "epoch": 38.16893732970027, + "grad_norm": 5.582503795623779, + "learning_rate": 1.418470390252695e-05, + "loss": 0.2593, + "step": 14008 + }, + { + "epoch": 38.171662125340596, + "grad_norm": 7.300879001617432, + "learning_rate": 1.4183902377741385e-05, + "loss": 0.3265, + "step": 14009 + }, + { + "epoch": 38.17438692098093, + "grad_norm": 5.514047145843506, + "learning_rate": 1.4183100820371723e-05, + "loss": 0.2384, + "step": 14010 + }, + { + "epoch": 38.177111716621255, + "grad_norm": 6.768276691436768, + "learning_rate": 1.418229923042421e-05, + "loss": 0.3659, + "step": 14011 + }, + { + "epoch": 38.17983651226158, + "grad_norm": 7.209909439086914, + "learning_rate": 1.4181497607905082e-05, + "loss": 0.3259, + "step": 14012 + }, + { + "epoch": 38.182561307901906, + "grad_norm": 6.693050384521484, + "learning_rate": 1.4180695952820585e-05, + "loss": 0.2859, + "step": 14013 + }, + { + "epoch": 38.18528610354223, + "grad_norm": 5.3056206703186035, + "learning_rate": 1.4179894265176964e-05, + "loss": 0.3568, + "step": 14014 + }, + { + "epoch": 38.18801089918256, + "grad_norm": 6.389018535614014, + "learning_rate": 1.4179092544980459e-05, + "loss": 0.1603, + "step": 14015 + }, + { + "epoch": 38.19073569482289, + "grad_norm": 11.500627517700195, + "learning_rate": 1.4178290792237319e-05, + "loss": 0.2413, + "step": 14016 + }, + { + "epoch": 38.19346049046322, + "grad_norm": 4.9877214431762695, + "learning_rate": 1.4177489006953784e-05, + "loss": 0.2359, + "step": 14017 + }, + { + "epoch": 38.19618528610354, + "grad_norm": 4.357906341552734, + "learning_rate": 1.4176687189136098e-05, + "loss": 0.1855, + "step": 14018 + }, + { + "epoch": 38.19891008174387, + "grad_norm": 6.749527931213379, + "learning_rate": 1.4175885338790507e-05, + "loss": 0.4336, + "step": 14019 + }, + { + "epoch": 38.201634877384194, + "grad_norm": 5.563653945922852, + "learning_rate": 1.4175083455923254e-05, + "loss": 0.2687, + "step": 14020 + }, + { + "epoch": 38.20435967302452, + "grad_norm": 6.073885917663574, + "learning_rate": 1.417428154054059e-05, + "loss": 0.3654, + "step": 14021 + }, + { + "epoch": 38.20708446866485, + "grad_norm": 5.087289810180664, + "learning_rate": 1.417347959264875e-05, + "loss": 0.2058, + "step": 14022 + }, + { + "epoch": 38.20980926430518, + "grad_norm": 6.296276092529297, + "learning_rate": 1.4172677612253987e-05, + "loss": 0.2492, + "step": 14023 + }, + { + "epoch": 38.212534059945504, + "grad_norm": 7.721444606781006, + "learning_rate": 1.4171875599362545e-05, + "loss": 0.3712, + "step": 14024 + }, + { + "epoch": 38.21525885558583, + "grad_norm": 5.24257230758667, + "learning_rate": 1.4171073553980673e-05, + "loss": 0.2746, + "step": 14025 + }, + { + "epoch": 38.217983651226156, + "grad_norm": 7.223959922790527, + "learning_rate": 1.4170271476114612e-05, + "loss": 0.1926, + "step": 14026 + }, + { + "epoch": 38.22070844686648, + "grad_norm": 5.934112071990967, + "learning_rate": 1.416946936577061e-05, + "loss": 0.1913, + "step": 14027 + }, + { + "epoch": 38.223433242506815, + "grad_norm": 5.871982574462891, + "learning_rate": 1.4168667222954915e-05, + "loss": 0.2797, + "step": 14028 + }, + { + "epoch": 38.22615803814714, + "grad_norm": 5.042227745056152, + "learning_rate": 1.4167865047673775e-05, + "loss": 0.283, + "step": 14029 + }, + { + "epoch": 38.228882833787466, + "grad_norm": 5.960148811340332, + "learning_rate": 1.4167062839933437e-05, + "loss": 0.2523, + "step": 14030 + }, + { + "epoch": 38.23160762942779, + "grad_norm": 11.43106746673584, + "learning_rate": 1.4166260599740148e-05, + "loss": 0.2967, + "step": 14031 + }, + { + "epoch": 38.23433242506812, + "grad_norm": 6.651676177978516, + "learning_rate": 1.4165458327100152e-05, + "loss": 0.2797, + "step": 14032 + }, + { + "epoch": 38.237057220708444, + "grad_norm": 5.880712985992432, + "learning_rate": 1.4164656022019702e-05, + "loss": 0.3331, + "step": 14033 + }, + { + "epoch": 38.23978201634878, + "grad_norm": 6.207973957061768, + "learning_rate": 1.4163853684505046e-05, + "loss": 0.3976, + "step": 14034 + }, + { + "epoch": 38.2425068119891, + "grad_norm": 4.574272155761719, + "learning_rate": 1.416305131456243e-05, + "loss": 0.1279, + "step": 14035 + }, + { + "epoch": 38.24523160762943, + "grad_norm": 4.726644992828369, + "learning_rate": 1.4162248912198107e-05, + "loss": 0.256, + "step": 14036 + }, + { + "epoch": 38.247956403269754, + "grad_norm": 5.637514591217041, + "learning_rate": 1.4161446477418322e-05, + "loss": 0.2778, + "step": 14037 + }, + { + "epoch": 38.25068119891008, + "grad_norm": 5.931151390075684, + "learning_rate": 1.4160644010229325e-05, + "loss": 0.2351, + "step": 14038 + }, + { + "epoch": 38.253405994550405, + "grad_norm": 5.666237831115723, + "learning_rate": 1.4159841510637368e-05, + "loss": 0.2453, + "step": 14039 + }, + { + "epoch": 38.25613079019074, + "grad_norm": 5.902411460876465, + "learning_rate": 1.4159038978648698e-05, + "loss": 0.3376, + "step": 14040 + }, + { + "epoch": 38.258855585831064, + "grad_norm": 5.361380100250244, + "learning_rate": 1.4158236414269569e-05, + "loss": 0.2046, + "step": 14041 + }, + { + "epoch": 38.26158038147139, + "grad_norm": 5.141907691955566, + "learning_rate": 1.4157433817506224e-05, + "loss": 0.2404, + "step": 14042 + }, + { + "epoch": 38.264305177111716, + "grad_norm": 5.590311527252197, + "learning_rate": 1.4156631188364922e-05, + "loss": 0.2377, + "step": 14043 + }, + { + "epoch": 38.26702997275204, + "grad_norm": 5.858974933624268, + "learning_rate": 1.4155828526851907e-05, + "loss": 0.1895, + "step": 14044 + }, + { + "epoch": 38.26975476839237, + "grad_norm": 5.813584804534912, + "learning_rate": 1.4155025832973435e-05, + "loss": 0.2008, + "step": 14045 + }, + { + "epoch": 38.2724795640327, + "grad_norm": 5.5272369384765625, + "learning_rate": 1.4154223106735754e-05, + "loss": 0.2745, + "step": 14046 + }, + { + "epoch": 38.275204359673026, + "grad_norm": 5.37410831451416, + "learning_rate": 1.415342034814512e-05, + "loss": 0.4397, + "step": 14047 + }, + { + "epoch": 38.27792915531335, + "grad_norm": 6.916401386260986, + "learning_rate": 1.4152617557207779e-05, + "loss": 0.2548, + "step": 14048 + }, + { + "epoch": 38.28065395095368, + "grad_norm": 5.114424705505371, + "learning_rate": 1.4151814733929989e-05, + "loss": 0.1748, + "step": 14049 + }, + { + "epoch": 38.283378746594, + "grad_norm": 7.644888401031494, + "learning_rate": 1.4151011878317998e-05, + "loss": 0.2413, + "step": 14050 + }, + { + "epoch": 38.28610354223433, + "grad_norm": 5.31462287902832, + "learning_rate": 1.415020899037806e-05, + "loss": 0.27, + "step": 14051 + }, + { + "epoch": 38.28882833787466, + "grad_norm": 11.65475082397461, + "learning_rate": 1.4149406070116429e-05, + "loss": 0.3211, + "step": 14052 + }, + { + "epoch": 38.29155313351499, + "grad_norm": 12.475391387939453, + "learning_rate": 1.4148603117539354e-05, + "loss": 0.1888, + "step": 14053 + }, + { + "epoch": 38.294277929155314, + "grad_norm": 5.723780155181885, + "learning_rate": 1.4147800132653093e-05, + "loss": 0.3493, + "step": 14054 + }, + { + "epoch": 38.29700272479564, + "grad_norm": 5.613542556762695, + "learning_rate": 1.4146997115463901e-05, + "loss": 0.4031, + "step": 14055 + }, + { + "epoch": 38.299727520435965, + "grad_norm": 7.107828617095947, + "learning_rate": 1.4146194065978024e-05, + "loss": 0.4164, + "step": 14056 + }, + { + "epoch": 38.30245231607629, + "grad_norm": 5.172051906585693, + "learning_rate": 1.4145390984201726e-05, + "loss": 0.1524, + "step": 14057 + }, + { + "epoch": 38.305177111716624, + "grad_norm": 5.915720462799072, + "learning_rate": 1.4144587870141252e-05, + "loss": 0.362, + "step": 14058 + }, + { + "epoch": 38.30790190735695, + "grad_norm": 7.770023822784424, + "learning_rate": 1.4143784723802865e-05, + "loss": 0.3484, + "step": 14059 + }, + { + "epoch": 38.310626702997276, + "grad_norm": 5.6410698890686035, + "learning_rate": 1.4142981545192814e-05, + "loss": 0.2348, + "step": 14060 + }, + { + "epoch": 38.3133514986376, + "grad_norm": 5.968530178070068, + "learning_rate": 1.4142178334317356e-05, + "loss": 0.3093, + "step": 14061 + }, + { + "epoch": 38.31607629427793, + "grad_norm": 6.009503364562988, + "learning_rate": 1.4141375091182746e-05, + "loss": 0.274, + "step": 14062 + }, + { + "epoch": 38.31880108991825, + "grad_norm": 5.930474758148193, + "learning_rate": 1.4140571815795242e-05, + "loss": 0.2842, + "step": 14063 + }, + { + "epoch": 38.321525885558586, + "grad_norm": 7.296756744384766, + "learning_rate": 1.4139768508161097e-05, + "loss": 0.413, + "step": 14064 + }, + { + "epoch": 38.32425068119891, + "grad_norm": 6.180625915527344, + "learning_rate": 1.4138965168286567e-05, + "loss": 0.2228, + "step": 14065 + }, + { + "epoch": 38.32697547683924, + "grad_norm": 5.570156574249268, + "learning_rate": 1.4138161796177909e-05, + "loss": 0.3784, + "step": 14066 + }, + { + "epoch": 38.32970027247956, + "grad_norm": 6.180319786071777, + "learning_rate": 1.4137358391841383e-05, + "loss": 0.2585, + "step": 14067 + }, + { + "epoch": 38.33242506811989, + "grad_norm": 13.237462997436523, + "learning_rate": 1.413655495528324e-05, + "loss": 0.2354, + "step": 14068 + }, + { + "epoch": 38.335149863760215, + "grad_norm": 5.750713348388672, + "learning_rate": 1.4135751486509743e-05, + "loss": 0.3899, + "step": 14069 + }, + { + "epoch": 38.33787465940055, + "grad_norm": 5.069406032562256, + "learning_rate": 1.4134947985527143e-05, + "loss": 0.2599, + "step": 14070 + }, + { + "epoch": 38.34059945504087, + "grad_norm": 5.973121643066406, + "learning_rate": 1.4134144452341702e-05, + "loss": 0.3579, + "step": 14071 + }, + { + "epoch": 38.3433242506812, + "grad_norm": 7.9918904304504395, + "learning_rate": 1.4133340886959678e-05, + "loss": 0.2699, + "step": 14072 + }, + { + "epoch": 38.346049046321525, + "grad_norm": 5.275363922119141, + "learning_rate": 1.4132537289387331e-05, + "loss": 0.2417, + "step": 14073 + }, + { + "epoch": 38.34877384196185, + "grad_norm": 10.604673385620117, + "learning_rate": 1.4131733659630913e-05, + "loss": 0.2502, + "step": 14074 + }, + { + "epoch": 38.35149863760218, + "grad_norm": 4.963611602783203, + "learning_rate": 1.4130929997696688e-05, + "loss": 0.3596, + "step": 14075 + }, + { + "epoch": 38.35422343324251, + "grad_norm": 6.919105052947998, + "learning_rate": 1.4130126303590911e-05, + "loss": 0.3586, + "step": 14076 + }, + { + "epoch": 38.356948228882835, + "grad_norm": 7.2395501136779785, + "learning_rate": 1.4129322577319846e-05, + "loss": 0.2636, + "step": 14077 + }, + { + "epoch": 38.35967302452316, + "grad_norm": 6.036019802093506, + "learning_rate": 1.4128518818889747e-05, + "loss": 0.424, + "step": 14078 + }, + { + "epoch": 38.36239782016349, + "grad_norm": 8.016825675964355, + "learning_rate": 1.4127715028306879e-05, + "loss": 0.2052, + "step": 14079 + }, + { + "epoch": 38.36512261580381, + "grad_norm": 7.741454601287842, + "learning_rate": 1.4126911205577495e-05, + "loss": 0.2644, + "step": 14080 + }, + { + "epoch": 38.36784741144414, + "grad_norm": 6.438891887664795, + "learning_rate": 1.4126107350707865e-05, + "loss": 0.3134, + "step": 14081 + }, + { + "epoch": 38.37057220708447, + "grad_norm": 5.113155364990234, + "learning_rate": 1.4125303463704241e-05, + "loss": 0.2095, + "step": 14082 + }, + { + "epoch": 38.3732970027248, + "grad_norm": 5.299055576324463, + "learning_rate": 1.4124499544572887e-05, + "loss": 0.355, + "step": 14083 + }, + { + "epoch": 38.37602179836512, + "grad_norm": 6.142955780029297, + "learning_rate": 1.4123695593320062e-05, + "loss": 0.2477, + "step": 14084 + }, + { + "epoch": 38.37874659400545, + "grad_norm": 6.0444488525390625, + "learning_rate": 1.4122891609952029e-05, + "loss": 0.2831, + "step": 14085 + }, + { + "epoch": 38.381471389645775, + "grad_norm": 8.738221168518066, + "learning_rate": 1.4122087594475049e-05, + "loss": 0.2417, + "step": 14086 + }, + { + "epoch": 38.3841961852861, + "grad_norm": 6.144389629364014, + "learning_rate": 1.4121283546895384e-05, + "loss": 0.2614, + "step": 14087 + }, + { + "epoch": 38.38692098092643, + "grad_norm": 6.7994384765625, + "learning_rate": 1.4120479467219292e-05, + "loss": 0.2132, + "step": 14088 + }, + { + "epoch": 38.38964577656676, + "grad_norm": 5.979526042938232, + "learning_rate": 1.4119675355453044e-05, + "loss": 0.2659, + "step": 14089 + }, + { + "epoch": 38.392370572207085, + "grad_norm": 5.767601490020752, + "learning_rate": 1.4118871211602893e-05, + "loss": 0.2061, + "step": 14090 + }, + { + "epoch": 38.39509536784741, + "grad_norm": 5.567809581756592, + "learning_rate": 1.411806703567511e-05, + "loss": 0.2214, + "step": 14091 + }, + { + "epoch": 38.39782016348774, + "grad_norm": 5.281261444091797, + "learning_rate": 1.4117262827675946e-05, + "loss": 0.1668, + "step": 14092 + }, + { + "epoch": 38.40054495912806, + "grad_norm": 5.884829044342041, + "learning_rate": 1.4116458587611678e-05, + "loss": 0.2425, + "step": 14093 + }, + { + "epoch": 38.403269754768395, + "grad_norm": 5.767762184143066, + "learning_rate": 1.411565431548856e-05, + "loss": 0.285, + "step": 14094 + }, + { + "epoch": 38.40599455040872, + "grad_norm": 5.065497398376465, + "learning_rate": 1.4114850011312861e-05, + "loss": 0.4338, + "step": 14095 + }, + { + "epoch": 38.40871934604905, + "grad_norm": 6.914985656738281, + "learning_rate": 1.411404567509084e-05, + "loss": 0.3231, + "step": 14096 + }, + { + "epoch": 38.41144414168937, + "grad_norm": 4.989675521850586, + "learning_rate": 1.4113241306828764e-05, + "loss": 0.2965, + "step": 14097 + }, + { + "epoch": 38.4141689373297, + "grad_norm": 14.356376647949219, + "learning_rate": 1.4112436906532898e-05, + "loss": 0.2072, + "step": 14098 + }, + { + "epoch": 38.416893732970024, + "grad_norm": 5.906617641448975, + "learning_rate": 1.4111632474209506e-05, + "loss": 0.2074, + "step": 14099 + }, + { + "epoch": 38.41961852861036, + "grad_norm": 5.60844612121582, + "learning_rate": 1.4110828009864853e-05, + "loss": 0.2516, + "step": 14100 + }, + { + "epoch": 38.42234332425068, + "grad_norm": 6.221306324005127, + "learning_rate": 1.4110023513505201e-05, + "loss": 0.2279, + "step": 14101 + }, + { + "epoch": 38.42506811989101, + "grad_norm": 5.365349769592285, + "learning_rate": 1.410921898513682e-05, + "loss": 0.185, + "step": 14102 + }, + { + "epoch": 38.427792915531334, + "grad_norm": 5.050516128540039, + "learning_rate": 1.4108414424765978e-05, + "loss": 0.2157, + "step": 14103 + }, + { + "epoch": 38.43051771117166, + "grad_norm": 5.983419895172119, + "learning_rate": 1.410760983239893e-05, + "loss": 0.3295, + "step": 14104 + }, + { + "epoch": 38.433242506811986, + "grad_norm": 6.8474531173706055, + "learning_rate": 1.4106805208041951e-05, + "loss": 0.2852, + "step": 14105 + }, + { + "epoch": 38.43596730245232, + "grad_norm": 7.26201057434082, + "learning_rate": 1.4106000551701309e-05, + "loss": 0.1926, + "step": 14106 + }, + { + "epoch": 38.438692098092645, + "grad_norm": 5.860100269317627, + "learning_rate": 1.4105195863383261e-05, + "loss": 0.2115, + "step": 14107 + }, + { + "epoch": 38.44141689373297, + "grad_norm": 6.6750688552856445, + "learning_rate": 1.4104391143094086e-05, + "loss": 0.2304, + "step": 14108 + }, + { + "epoch": 38.444141689373296, + "grad_norm": 9.718730926513672, + "learning_rate": 1.4103586390840038e-05, + "loss": 0.3804, + "step": 14109 + }, + { + "epoch": 38.44686648501362, + "grad_norm": 18.901268005371094, + "learning_rate": 1.4102781606627393e-05, + "loss": 0.2413, + "step": 14110 + }, + { + "epoch": 38.44959128065395, + "grad_norm": 5.725854873657227, + "learning_rate": 1.4101976790462421e-05, + "loss": 0.3876, + "step": 14111 + }, + { + "epoch": 38.45231607629428, + "grad_norm": 5.962811470031738, + "learning_rate": 1.4101171942351381e-05, + "loss": 0.3008, + "step": 14112 + }, + { + "epoch": 38.45504087193461, + "grad_norm": 8.318543434143066, + "learning_rate": 1.4100367062300548e-05, + "loss": 0.2971, + "step": 14113 + }, + { + "epoch": 38.45776566757493, + "grad_norm": 10.843289375305176, + "learning_rate": 1.409956215031619e-05, + "loss": 0.2088, + "step": 14114 + }, + { + "epoch": 38.46049046321526, + "grad_norm": 7.146448135375977, + "learning_rate": 1.4098757206404572e-05, + "loss": 0.3005, + "step": 14115 + }, + { + "epoch": 38.463215258855584, + "grad_norm": 5.454993724822998, + "learning_rate": 1.4097952230571965e-05, + "loss": 0.4388, + "step": 14116 + }, + { + "epoch": 38.46594005449591, + "grad_norm": 6.234476089477539, + "learning_rate": 1.4097147222824639e-05, + "loss": 0.2959, + "step": 14117 + }, + { + "epoch": 38.46866485013624, + "grad_norm": 5.893165111541748, + "learning_rate": 1.4096342183168861e-05, + "loss": 0.2718, + "step": 14118 + }, + { + "epoch": 38.47138964577657, + "grad_norm": 6.857761383056641, + "learning_rate": 1.4095537111610903e-05, + "loss": 0.3173, + "step": 14119 + }, + { + "epoch": 38.474114441416894, + "grad_norm": 6.331696033477783, + "learning_rate": 1.4094732008157032e-05, + "loss": 0.2225, + "step": 14120 + }, + { + "epoch": 38.47683923705722, + "grad_norm": 6.403774738311768, + "learning_rate": 1.409392687281352e-05, + "loss": 0.3651, + "step": 14121 + }, + { + "epoch": 38.479564032697546, + "grad_norm": 7.785304546356201, + "learning_rate": 1.4093121705586637e-05, + "loss": 0.2133, + "step": 14122 + }, + { + "epoch": 38.48228882833787, + "grad_norm": 6.4889397621154785, + "learning_rate": 1.4092316506482656e-05, + "loss": 0.3135, + "step": 14123 + }, + { + "epoch": 38.485013623978205, + "grad_norm": 6.590969085693359, + "learning_rate": 1.4091511275507845e-05, + "loss": 0.2579, + "step": 14124 + }, + { + "epoch": 38.48773841961853, + "grad_norm": 5.812717914581299, + "learning_rate": 1.4090706012668474e-05, + "loss": 0.1655, + "step": 14125 + }, + { + "epoch": 38.490463215258856, + "grad_norm": 6.541272163391113, + "learning_rate": 1.4089900717970819e-05, + "loss": 0.3709, + "step": 14126 + }, + { + "epoch": 38.49318801089918, + "grad_norm": 5.469993591308594, + "learning_rate": 1.4089095391421148e-05, + "loss": 0.3217, + "step": 14127 + }, + { + "epoch": 38.49591280653951, + "grad_norm": 5.711572170257568, + "learning_rate": 1.4088290033025736e-05, + "loss": 0.2817, + "step": 14128 + }, + { + "epoch": 38.49863760217983, + "grad_norm": 12.279172897338867, + "learning_rate": 1.4087484642790847e-05, + "loss": 0.1995, + "step": 14129 + }, + { + "epoch": 38.50136239782017, + "grad_norm": 8.407028198242188, + "learning_rate": 1.4086679220722765e-05, + "loss": 0.2884, + "step": 14130 + }, + { + "epoch": 38.50408719346049, + "grad_norm": 7.350332736968994, + "learning_rate": 1.4085873766827751e-05, + "loss": 0.2821, + "step": 14131 + }, + { + "epoch": 38.50681198910082, + "grad_norm": 7.881537914276123, + "learning_rate": 1.408506828111209e-05, + "loss": 0.2552, + "step": 14132 + }, + { + "epoch": 38.509536784741144, + "grad_norm": 21.630401611328125, + "learning_rate": 1.4084262763582044e-05, + "loss": 0.4385, + "step": 14133 + }, + { + "epoch": 38.51226158038147, + "grad_norm": 6.939113140106201, + "learning_rate": 1.4083457214243891e-05, + "loss": 0.3754, + "step": 14134 + }, + { + "epoch": 38.514986376021795, + "grad_norm": 5.386192798614502, + "learning_rate": 1.4082651633103908e-05, + "loss": 0.2091, + "step": 14135 + }, + { + "epoch": 38.51771117166213, + "grad_norm": 7.200022220611572, + "learning_rate": 1.4081846020168363e-05, + "loss": 0.3168, + "step": 14136 + }, + { + "epoch": 38.520435967302454, + "grad_norm": 6.039146423339844, + "learning_rate": 1.4081040375443533e-05, + "loss": 0.2479, + "step": 14137 + }, + { + "epoch": 38.52316076294278, + "grad_norm": 5.907276630401611, + "learning_rate": 1.4080234698935693e-05, + "loss": 0.3587, + "step": 14138 + }, + { + "epoch": 38.525885558583106, + "grad_norm": 7.188309669494629, + "learning_rate": 1.4079428990651113e-05, + "loss": 0.2617, + "step": 14139 + }, + { + "epoch": 38.52861035422343, + "grad_norm": 5.692146301269531, + "learning_rate": 1.4078623250596075e-05, + "loss": 0.3438, + "step": 14140 + }, + { + "epoch": 38.53133514986376, + "grad_norm": 6.520361423492432, + "learning_rate": 1.407781747877685e-05, + "loss": 0.1848, + "step": 14141 + }, + { + "epoch": 38.53405994550409, + "grad_norm": 6.540200710296631, + "learning_rate": 1.4077011675199713e-05, + "loss": 0.2134, + "step": 14142 + }, + { + "epoch": 38.536784741144416, + "grad_norm": 5.5721845626831055, + "learning_rate": 1.407620583987094e-05, + "loss": 0.2358, + "step": 14143 + }, + { + "epoch": 38.53950953678474, + "grad_norm": 6.2767510414123535, + "learning_rate": 1.4075399972796808e-05, + "loss": 0.3628, + "step": 14144 + }, + { + "epoch": 38.54223433242507, + "grad_norm": 6.600429058074951, + "learning_rate": 1.4074594073983592e-05, + "loss": 0.3173, + "step": 14145 + }, + { + "epoch": 38.54495912806539, + "grad_norm": 5.381121635437012, + "learning_rate": 1.4073788143437568e-05, + "loss": 0.2903, + "step": 14146 + }, + { + "epoch": 38.54768392370572, + "grad_norm": 8.758638381958008, + "learning_rate": 1.4072982181165014e-05, + "loss": 0.4308, + "step": 14147 + }, + { + "epoch": 38.55040871934605, + "grad_norm": 6.545938491821289, + "learning_rate": 1.4072176187172204e-05, + "loss": 0.2765, + "step": 14148 + }, + { + "epoch": 38.55313351498638, + "grad_norm": 6.275467872619629, + "learning_rate": 1.4071370161465417e-05, + "loss": 0.3501, + "step": 14149 + }, + { + "epoch": 38.555858310626704, + "grad_norm": 6.002571105957031, + "learning_rate": 1.407056410405093e-05, + "loss": 0.3592, + "step": 14150 + }, + { + "epoch": 38.55858310626703, + "grad_norm": 6.76323127746582, + "learning_rate": 1.4069758014935023e-05, + "loss": 0.2618, + "step": 14151 + }, + { + "epoch": 38.561307901907355, + "grad_norm": 5.465998649597168, + "learning_rate": 1.406895189412397e-05, + "loss": 0.2019, + "step": 14152 + }, + { + "epoch": 38.56403269754768, + "grad_norm": 5.174844741821289, + "learning_rate": 1.406814574162405e-05, + "loss": 0.2363, + "step": 14153 + }, + { + "epoch": 38.566757493188014, + "grad_norm": 5.759891033172607, + "learning_rate": 1.4067339557441546e-05, + "loss": 0.447, + "step": 14154 + }, + { + "epoch": 38.56948228882834, + "grad_norm": 7.666831970214844, + "learning_rate": 1.406653334158273e-05, + "loss": 0.2877, + "step": 14155 + }, + { + "epoch": 38.572207084468666, + "grad_norm": 8.34528923034668, + "learning_rate": 1.406572709405388e-05, + "loss": 0.293, + "step": 14156 + }, + { + "epoch": 38.57493188010899, + "grad_norm": 5.085103988647461, + "learning_rate": 1.406492081486128e-05, + "loss": 0.1782, + "step": 14157 + }, + { + "epoch": 38.57765667574932, + "grad_norm": 6.896602630615234, + "learning_rate": 1.406411450401121e-05, + "loss": 0.3162, + "step": 14158 + }, + { + "epoch": 38.58038147138964, + "grad_norm": 7.838594913482666, + "learning_rate": 1.4063308161509945e-05, + "loss": 0.2968, + "step": 14159 + }, + { + "epoch": 38.583106267029976, + "grad_norm": 6.963497638702393, + "learning_rate": 1.406250178736377e-05, + "loss": 0.1873, + "step": 14160 + }, + { + "epoch": 38.5858310626703, + "grad_norm": 12.829331398010254, + "learning_rate": 1.4061695381578957e-05, + "loss": 0.4227, + "step": 14161 + }, + { + "epoch": 38.58855585831063, + "grad_norm": 6.674540042877197, + "learning_rate": 1.4060888944161795e-05, + "loss": 0.1976, + "step": 14162 + }, + { + "epoch": 38.59128065395095, + "grad_norm": 6.406482696533203, + "learning_rate": 1.4060082475118558e-05, + "loss": 0.3204, + "step": 14163 + }, + { + "epoch": 38.59400544959128, + "grad_norm": 10.174060821533203, + "learning_rate": 1.4059275974455531e-05, + "loss": 0.2983, + "step": 14164 + }, + { + "epoch": 38.596730245231605, + "grad_norm": 5.605705738067627, + "learning_rate": 1.4058469442178987e-05, + "loss": 0.306, + "step": 14165 + }, + { + "epoch": 38.59945504087194, + "grad_norm": 6.45618200302124, + "learning_rate": 1.4057662878295221e-05, + "loss": 0.2862, + "step": 14166 + }, + { + "epoch": 38.60217983651226, + "grad_norm": 8.21015453338623, + "learning_rate": 1.4056856282810505e-05, + "loss": 0.2853, + "step": 14167 + }, + { + "epoch": 38.60490463215259, + "grad_norm": 6.817403316497803, + "learning_rate": 1.4056049655731125e-05, + "loss": 0.3779, + "step": 14168 + }, + { + "epoch": 38.607629427792915, + "grad_norm": 5.516331672668457, + "learning_rate": 1.4055242997063359e-05, + "loss": 0.2109, + "step": 14169 + }, + { + "epoch": 38.61035422343324, + "grad_norm": 6.00640869140625, + "learning_rate": 1.4054436306813491e-05, + "loss": 0.2894, + "step": 14170 + }, + { + "epoch": 38.61307901907357, + "grad_norm": 6.030162811279297, + "learning_rate": 1.4053629584987802e-05, + "loss": 0.212, + "step": 14171 + }, + { + "epoch": 38.6158038147139, + "grad_norm": 5.575711250305176, + "learning_rate": 1.405282283159258e-05, + "loss": 0.228, + "step": 14172 + }, + { + "epoch": 38.618528610354225, + "grad_norm": 5.750463962554932, + "learning_rate": 1.4052016046634101e-05, + "loss": 0.2615, + "step": 14173 + }, + { + "epoch": 38.62125340599455, + "grad_norm": 6.629801273345947, + "learning_rate": 1.4051209230118652e-05, + "loss": 0.3496, + "step": 14174 + }, + { + "epoch": 38.62397820163488, + "grad_norm": 7.826570987701416, + "learning_rate": 1.4050402382052514e-05, + "loss": 0.3402, + "step": 14175 + }, + { + "epoch": 38.6267029972752, + "grad_norm": 4.923995494842529, + "learning_rate": 1.4049595502441977e-05, + "loss": 0.2725, + "step": 14176 + }, + { + "epoch": 38.62942779291553, + "grad_norm": 5.763731956481934, + "learning_rate": 1.4048788591293318e-05, + "loss": 0.2625, + "step": 14177 + }, + { + "epoch": 38.63215258855586, + "grad_norm": 6.039249897003174, + "learning_rate": 1.4047981648612824e-05, + "loss": 0.2596, + "step": 14178 + }, + { + "epoch": 38.63487738419619, + "grad_norm": 7.992038726806641, + "learning_rate": 1.4047174674406781e-05, + "loss": 0.2342, + "step": 14179 + }, + { + "epoch": 38.63760217983651, + "grad_norm": 6.105435848236084, + "learning_rate": 1.4046367668681471e-05, + "loss": 0.2958, + "step": 14180 + }, + { + "epoch": 38.64032697547684, + "grad_norm": 5.173197269439697, + "learning_rate": 1.4045560631443178e-05, + "loss": 0.2477, + "step": 14181 + }, + { + "epoch": 38.643051771117165, + "grad_norm": 7.096261978149414, + "learning_rate": 1.4044753562698188e-05, + "loss": 0.2266, + "step": 14182 + }, + { + "epoch": 38.64577656675749, + "grad_norm": 6.047508239746094, + "learning_rate": 1.4043946462452791e-05, + "loss": 0.3668, + "step": 14183 + }, + { + "epoch": 38.64850136239782, + "grad_norm": 8.10651969909668, + "learning_rate": 1.4043139330713267e-05, + "loss": 0.1872, + "step": 14184 + }, + { + "epoch": 38.65122615803815, + "grad_norm": 7.908143997192383, + "learning_rate": 1.4042332167485904e-05, + "loss": 0.2151, + "step": 14185 + }, + { + "epoch": 38.653950953678475, + "grad_norm": 7.34572696685791, + "learning_rate": 1.4041524972776989e-05, + "loss": 0.3318, + "step": 14186 + }, + { + "epoch": 38.6566757493188, + "grad_norm": 6.163498401641846, + "learning_rate": 1.404071774659281e-05, + "loss": 0.2318, + "step": 14187 + }, + { + "epoch": 38.65940054495913, + "grad_norm": 5.7085652351379395, + "learning_rate": 1.4039910488939648e-05, + "loss": 0.5327, + "step": 14188 + }, + { + "epoch": 38.66212534059945, + "grad_norm": 6.371049880981445, + "learning_rate": 1.4039103199823794e-05, + "loss": 0.3045, + "step": 14189 + }, + { + "epoch": 38.664850136239785, + "grad_norm": 6.019608974456787, + "learning_rate": 1.4038295879251535e-05, + "loss": 0.2065, + "step": 14190 + }, + { + "epoch": 38.66757493188011, + "grad_norm": 6.799952030181885, + "learning_rate": 1.4037488527229156e-05, + "loss": 0.1905, + "step": 14191 + }, + { + "epoch": 38.67029972752044, + "grad_norm": 6.0175018310546875, + "learning_rate": 1.4036681143762945e-05, + "loss": 0.3696, + "step": 14192 + }, + { + "epoch": 38.67302452316076, + "grad_norm": 5.6262922286987305, + "learning_rate": 1.4035873728859195e-05, + "loss": 0.4247, + "step": 14193 + }, + { + "epoch": 38.67574931880109, + "grad_norm": 5.667084693908691, + "learning_rate": 1.4035066282524188e-05, + "loss": 0.1786, + "step": 14194 + }, + { + "epoch": 38.678474114441414, + "grad_norm": 6.430644512176514, + "learning_rate": 1.4034258804764217e-05, + "loss": 0.2489, + "step": 14195 + }, + { + "epoch": 38.68119891008175, + "grad_norm": 6.629088878631592, + "learning_rate": 1.4033451295585565e-05, + "loss": 0.2445, + "step": 14196 + }, + { + "epoch": 38.68392370572207, + "grad_norm": 5.922722816467285, + "learning_rate": 1.4032643754994526e-05, + "loss": 0.26, + "step": 14197 + }, + { + "epoch": 38.6866485013624, + "grad_norm": 6.801407337188721, + "learning_rate": 1.4031836182997387e-05, + "loss": 0.2057, + "step": 14198 + }, + { + "epoch": 38.689373297002724, + "grad_norm": 7.064025402069092, + "learning_rate": 1.4031028579600436e-05, + "loss": 0.2804, + "step": 14199 + }, + { + "epoch": 38.69209809264305, + "grad_norm": 6.30210018157959, + "learning_rate": 1.4030220944809965e-05, + "loss": 0.2088, + "step": 14200 + }, + { + "epoch": 38.694822888283376, + "grad_norm": 5.764710903167725, + "learning_rate": 1.4029413278632266e-05, + "loss": 0.2938, + "step": 14201 + }, + { + "epoch": 38.69754768392371, + "grad_norm": 4.9857096672058105, + "learning_rate": 1.4028605581073623e-05, + "loss": 0.3989, + "step": 14202 + }, + { + "epoch": 38.700272479564035, + "grad_norm": 5.339354038238525, + "learning_rate": 1.402779785214033e-05, + "loss": 0.3175, + "step": 14203 + }, + { + "epoch": 38.70299727520436, + "grad_norm": 7.36276912689209, + "learning_rate": 1.4026990091838677e-05, + "loss": 0.3404, + "step": 14204 + }, + { + "epoch": 38.705722070844686, + "grad_norm": 6.679203510284424, + "learning_rate": 1.4026182300174955e-05, + "loss": 0.2287, + "step": 14205 + }, + { + "epoch": 38.70844686648501, + "grad_norm": 5.4260711669921875, + "learning_rate": 1.4025374477155453e-05, + "loss": 0.2688, + "step": 14206 + }, + { + "epoch": 38.71117166212534, + "grad_norm": 6.5926079750061035, + "learning_rate": 1.4024566622786468e-05, + "loss": 0.2319, + "step": 14207 + }, + { + "epoch": 38.71389645776567, + "grad_norm": 6.10131311416626, + "learning_rate": 1.4023758737074284e-05, + "loss": 0.3527, + "step": 14208 + }, + { + "epoch": 38.716621253406, + "grad_norm": 5.418936252593994, + "learning_rate": 1.4022950820025198e-05, + "loss": 0.2347, + "step": 14209 + }, + { + "epoch": 38.71934604904632, + "grad_norm": 6.062687397003174, + "learning_rate": 1.40221428716455e-05, + "loss": 0.2633, + "step": 14210 + }, + { + "epoch": 38.72207084468665, + "grad_norm": 6.946159839630127, + "learning_rate": 1.4021334891941484e-05, + "loss": 0.2942, + "step": 14211 + }, + { + "epoch": 38.724795640326974, + "grad_norm": 7.638200283050537, + "learning_rate": 1.4020526880919439e-05, + "loss": 0.2323, + "step": 14212 + }, + { + "epoch": 38.7275204359673, + "grad_norm": 6.2911601066589355, + "learning_rate": 1.4019718838585664e-05, + "loss": 0.2085, + "step": 14213 + }, + { + "epoch": 38.73024523160763, + "grad_norm": 5.667962074279785, + "learning_rate": 1.4018910764946445e-05, + "loss": 0.3607, + "step": 14214 + }, + { + "epoch": 38.73297002724796, + "grad_norm": 5.755716800689697, + "learning_rate": 1.4018102660008079e-05, + "loss": 0.2263, + "step": 14215 + }, + { + "epoch": 38.735694822888284, + "grad_norm": 6.369229793548584, + "learning_rate": 1.4017294523776859e-05, + "loss": 0.3123, + "step": 14216 + }, + { + "epoch": 38.73841961852861, + "grad_norm": 6.430229663848877, + "learning_rate": 1.4016486356259076e-05, + "loss": 0.2245, + "step": 14217 + }, + { + "epoch": 38.741144414168936, + "grad_norm": 7.5628252029418945, + "learning_rate": 1.4015678157461028e-05, + "loss": 0.3125, + "step": 14218 + }, + { + "epoch": 38.74386920980926, + "grad_norm": 6.894842624664307, + "learning_rate": 1.401486992738901e-05, + "loss": 0.323, + "step": 14219 + }, + { + "epoch": 38.746594005449595, + "grad_norm": 5.481640338897705, + "learning_rate": 1.4014061666049312e-05, + "loss": 0.2659, + "step": 14220 + }, + { + "epoch": 38.74931880108992, + "grad_norm": 5.837904453277588, + "learning_rate": 1.4013253373448232e-05, + "loss": 0.1764, + "step": 14221 + }, + { + "epoch": 38.752043596730246, + "grad_norm": 6.2947893142700195, + "learning_rate": 1.4012445049592063e-05, + "loss": 0.3758, + "step": 14222 + }, + { + "epoch": 38.75476839237057, + "grad_norm": 6.084985733032227, + "learning_rate": 1.4011636694487103e-05, + "loss": 0.2057, + "step": 14223 + }, + { + "epoch": 38.7574931880109, + "grad_norm": 9.457454681396484, + "learning_rate": 1.4010828308139644e-05, + "loss": 0.2041, + "step": 14224 + }, + { + "epoch": 38.76021798365122, + "grad_norm": 6.452712535858154, + "learning_rate": 1.4010019890555982e-05, + "loss": 0.2663, + "step": 14225 + }, + { + "epoch": 38.762942779291556, + "grad_norm": 5.780202388763428, + "learning_rate": 1.4009211441742413e-05, + "loss": 0.394, + "step": 14226 + }, + { + "epoch": 38.76566757493188, + "grad_norm": 7.74014139175415, + "learning_rate": 1.4008402961705238e-05, + "loss": 0.3185, + "step": 14227 + }, + { + "epoch": 38.76839237057221, + "grad_norm": 6.427647590637207, + "learning_rate": 1.400759445045075e-05, + "loss": 0.2703, + "step": 14228 + }, + { + "epoch": 38.771117166212534, + "grad_norm": 6.909052848815918, + "learning_rate": 1.4006785907985245e-05, + "loss": 0.2979, + "step": 14229 + }, + { + "epoch": 38.77384196185286, + "grad_norm": 5.844265460968018, + "learning_rate": 1.4005977334315017e-05, + "loss": 0.4356, + "step": 14230 + }, + { + "epoch": 38.776566757493185, + "grad_norm": 5.299291133880615, + "learning_rate": 1.4005168729446372e-05, + "loss": 0.1722, + "step": 14231 + }, + { + "epoch": 38.77929155313352, + "grad_norm": 5.50273323059082, + "learning_rate": 1.4004360093385599e-05, + "loss": 0.3339, + "step": 14232 + }, + { + "epoch": 38.782016348773844, + "grad_norm": 6.551215171813965, + "learning_rate": 1.4003551426138998e-05, + "loss": 0.2394, + "step": 14233 + }, + { + "epoch": 38.78474114441417, + "grad_norm": 7.548563480377197, + "learning_rate": 1.4002742727712863e-05, + "loss": 0.3318, + "step": 14234 + }, + { + "epoch": 38.787465940054496, + "grad_norm": 5.244667053222656, + "learning_rate": 1.4001933998113504e-05, + "loss": 0.2234, + "step": 14235 + }, + { + "epoch": 38.79019073569482, + "grad_norm": 6.541910648345947, + "learning_rate": 1.4001125237347206e-05, + "loss": 0.2836, + "step": 14236 + }, + { + "epoch": 38.79291553133515, + "grad_norm": 5.8126091957092285, + "learning_rate": 1.4000316445420279e-05, + "loss": 0.23, + "step": 14237 + }, + { + "epoch": 38.79564032697548, + "grad_norm": 7.460387706756592, + "learning_rate": 1.3999507622339013e-05, + "loss": 0.2507, + "step": 14238 + }, + { + "epoch": 38.798365122615806, + "grad_norm": 6.648134708404541, + "learning_rate": 1.399869876810971e-05, + "loss": 0.3432, + "step": 14239 + }, + { + "epoch": 38.80108991825613, + "grad_norm": 7.125775337219238, + "learning_rate": 1.3997889882738671e-05, + "loss": 0.2813, + "step": 14240 + }, + { + "epoch": 38.80381471389646, + "grad_norm": 5.923659801483154, + "learning_rate": 1.3997080966232195e-05, + "loss": 0.1668, + "step": 14241 + }, + { + "epoch": 38.80653950953678, + "grad_norm": 7.02187442779541, + "learning_rate": 1.399627201859658e-05, + "loss": 0.2254, + "step": 14242 + }, + { + "epoch": 38.80926430517711, + "grad_norm": 8.10549259185791, + "learning_rate": 1.3995463039838123e-05, + "loss": 0.2408, + "step": 14243 + }, + { + "epoch": 38.81198910081744, + "grad_norm": 4.8937883377075195, + "learning_rate": 1.3994654029963132e-05, + "loss": 0.3194, + "step": 14244 + }, + { + "epoch": 38.81471389645777, + "grad_norm": 6.10452127456665, + "learning_rate": 1.3993844988977907e-05, + "loss": 0.2596, + "step": 14245 + }, + { + "epoch": 38.817438692098094, + "grad_norm": 7.868805408477783, + "learning_rate": 1.3993035916888742e-05, + "loss": 0.313, + "step": 14246 + }, + { + "epoch": 38.82016348773842, + "grad_norm": 8.325532913208008, + "learning_rate": 1.3992226813701946e-05, + "loss": 0.2721, + "step": 14247 + }, + { + "epoch": 38.822888283378745, + "grad_norm": 6.1731276512146, + "learning_rate": 1.399141767942381e-05, + "loss": 0.2142, + "step": 14248 + }, + { + "epoch": 38.82561307901907, + "grad_norm": 5.461709022521973, + "learning_rate": 1.3990608514060646e-05, + "loss": 0.3013, + "step": 14249 + }, + { + "epoch": 38.828337874659404, + "grad_norm": 5.8272552490234375, + "learning_rate": 1.3989799317618751e-05, + "loss": 0.2695, + "step": 14250 + }, + { + "epoch": 38.83106267029973, + "grad_norm": 5.033504962921143, + "learning_rate": 1.3988990090104424e-05, + "loss": 0.2505, + "step": 14251 + }, + { + "epoch": 38.833787465940055, + "grad_norm": 6.392061233520508, + "learning_rate": 1.3988180831523972e-05, + "loss": 0.2032, + "step": 14252 + }, + { + "epoch": 38.83651226158038, + "grad_norm": 6.937142372131348, + "learning_rate": 1.3987371541883699e-05, + "loss": 0.2637, + "step": 14253 + }, + { + "epoch": 38.83923705722071, + "grad_norm": 5.689050197601318, + "learning_rate": 1.3986562221189902e-05, + "loss": 0.3088, + "step": 14254 + }, + { + "epoch": 38.84196185286103, + "grad_norm": 5.71989631652832, + "learning_rate": 1.3985752869448888e-05, + "loss": 0.3759, + "step": 14255 + }, + { + "epoch": 38.844686648501366, + "grad_norm": 6.083313941955566, + "learning_rate": 1.3984943486666957e-05, + "loss": 0.2458, + "step": 14256 + }, + { + "epoch": 38.84741144414169, + "grad_norm": 4.9870123863220215, + "learning_rate": 1.3984134072850417e-05, + "loss": 0.2922, + "step": 14257 + }, + { + "epoch": 38.85013623978202, + "grad_norm": 5.492220401763916, + "learning_rate": 1.3983324628005566e-05, + "loss": 0.2931, + "step": 14258 + }, + { + "epoch": 38.85286103542234, + "grad_norm": 5.595819473266602, + "learning_rate": 1.3982515152138713e-05, + "loss": 0.1908, + "step": 14259 + }, + { + "epoch": 38.85558583106267, + "grad_norm": 30.5610408782959, + "learning_rate": 1.3981705645256161e-05, + "loss": 0.3721, + "step": 14260 + }, + { + "epoch": 38.858310626702995, + "grad_norm": 6.095954895019531, + "learning_rate": 1.3980896107364212e-05, + "loss": 0.3642, + "step": 14261 + }, + { + "epoch": 38.86103542234333, + "grad_norm": 7.429832935333252, + "learning_rate": 1.398008653846917e-05, + "loss": 0.3167, + "step": 14262 + }, + { + "epoch": 38.86376021798365, + "grad_norm": 5.93065071105957, + "learning_rate": 1.3979276938577347e-05, + "loss": 0.2809, + "step": 14263 + }, + { + "epoch": 38.86648501362398, + "grad_norm": 9.602701187133789, + "learning_rate": 1.397846730769504e-05, + "loss": 0.3329, + "step": 14264 + }, + { + "epoch": 38.869209809264305, + "grad_norm": 6.699948787689209, + "learning_rate": 1.3977657645828559e-05, + "loss": 0.3971, + "step": 14265 + }, + { + "epoch": 38.87193460490463, + "grad_norm": 7.0116448402404785, + "learning_rate": 1.3976847952984209e-05, + "loss": 0.2015, + "step": 14266 + }, + { + "epoch": 38.87465940054496, + "grad_norm": 5.536526679992676, + "learning_rate": 1.3976038229168296e-05, + "loss": 0.2613, + "step": 14267 + }, + { + "epoch": 38.87738419618529, + "grad_norm": 7.464479446411133, + "learning_rate": 1.3975228474387122e-05, + "loss": 0.26, + "step": 14268 + }, + { + "epoch": 38.880108991825615, + "grad_norm": 7.937355995178223, + "learning_rate": 1.3974418688646997e-05, + "loss": 0.271, + "step": 14269 + }, + { + "epoch": 38.88283378746594, + "grad_norm": 7.095129489898682, + "learning_rate": 1.397360887195423e-05, + "loss": 0.2693, + "step": 14270 + }, + { + "epoch": 38.88555858310627, + "grad_norm": 6.2759928703308105, + "learning_rate": 1.3972799024315123e-05, + "loss": 0.391, + "step": 14271 + }, + { + "epoch": 38.88828337874659, + "grad_norm": 8.566492080688477, + "learning_rate": 1.3971989145735982e-05, + "loss": 0.3997, + "step": 14272 + }, + { + "epoch": 38.89100817438692, + "grad_norm": 7.450653076171875, + "learning_rate": 1.3971179236223122e-05, + "loss": 0.2993, + "step": 14273 + }, + { + "epoch": 38.89373297002725, + "grad_norm": 7.209585189819336, + "learning_rate": 1.3970369295782844e-05, + "loss": 0.2408, + "step": 14274 + }, + { + "epoch": 38.89645776566758, + "grad_norm": 7.133180141448975, + "learning_rate": 1.396955932442146e-05, + "loss": 0.311, + "step": 14275 + }, + { + "epoch": 38.8991825613079, + "grad_norm": 9.923151016235352, + "learning_rate": 1.3968749322145274e-05, + "loss": 0.4052, + "step": 14276 + }, + { + "epoch": 38.90190735694823, + "grad_norm": 6.90376615524292, + "learning_rate": 1.3967939288960595e-05, + "loss": 0.2784, + "step": 14277 + }, + { + "epoch": 38.904632152588555, + "grad_norm": 6.0615458488464355, + "learning_rate": 1.3967129224873734e-05, + "loss": 0.1817, + "step": 14278 + }, + { + "epoch": 38.90735694822888, + "grad_norm": 5.877019882202148, + "learning_rate": 1.3966319129890997e-05, + "loss": 0.205, + "step": 14279 + }, + { + "epoch": 38.91008174386921, + "grad_norm": 6.62255859375, + "learning_rate": 1.3965509004018695e-05, + "loss": 0.2224, + "step": 14280 + }, + { + "epoch": 38.91280653950954, + "grad_norm": 6.7541656494140625, + "learning_rate": 1.3964698847263138e-05, + "loss": 0.4018, + "step": 14281 + }, + { + "epoch": 38.915531335149865, + "grad_norm": 5.898073196411133, + "learning_rate": 1.3963888659630634e-05, + "loss": 0.4525, + "step": 14282 + }, + { + "epoch": 38.91825613079019, + "grad_norm": 6.852269172668457, + "learning_rate": 1.396307844112749e-05, + "loss": 0.287, + "step": 14283 + }, + { + "epoch": 38.920980926430516, + "grad_norm": 7.012596607208252, + "learning_rate": 1.3962268191760019e-05, + "loss": 0.3561, + "step": 14284 + }, + { + "epoch": 38.92370572207084, + "grad_norm": 7.041779041290283, + "learning_rate": 1.3961457911534532e-05, + "loss": 0.2817, + "step": 14285 + }, + { + "epoch": 38.926430517711175, + "grad_norm": 7.059216022491455, + "learning_rate": 1.3960647600457338e-05, + "loss": 0.252, + "step": 14286 + }, + { + "epoch": 38.9291553133515, + "grad_norm": 7.676758766174316, + "learning_rate": 1.3959837258534748e-05, + "loss": 0.3079, + "step": 14287 + }, + { + "epoch": 38.93188010899183, + "grad_norm": 6.447818279266357, + "learning_rate": 1.3959026885773072e-05, + "loss": 0.3198, + "step": 14288 + }, + { + "epoch": 38.93460490463215, + "grad_norm": 6.1130266189575195, + "learning_rate": 1.3958216482178623e-05, + "loss": 0.2326, + "step": 14289 + }, + { + "epoch": 38.93732970027248, + "grad_norm": 6.401403427124023, + "learning_rate": 1.3957406047757714e-05, + "loss": 0.3269, + "step": 14290 + }, + { + "epoch": 38.940054495912804, + "grad_norm": 7.1712541580200195, + "learning_rate": 1.395659558251665e-05, + "loss": 0.2905, + "step": 14291 + }, + { + "epoch": 38.94277929155314, + "grad_norm": 6.875960350036621, + "learning_rate": 1.3955785086461749e-05, + "loss": 0.3475, + "step": 14292 + }, + { + "epoch": 38.94550408719346, + "grad_norm": 6.088695526123047, + "learning_rate": 1.395497455959932e-05, + "loss": 0.3795, + "step": 14293 + }, + { + "epoch": 38.94822888283379, + "grad_norm": 10.818563461303711, + "learning_rate": 1.3954164001935674e-05, + "loss": 0.4487, + "step": 14294 + }, + { + "epoch": 38.950953678474114, + "grad_norm": 5.353722095489502, + "learning_rate": 1.3953353413477132e-05, + "loss": 0.3378, + "step": 14295 + }, + { + "epoch": 38.95367847411444, + "grad_norm": 8.669241905212402, + "learning_rate": 1.3952542794229998e-05, + "loss": 0.2861, + "step": 14296 + }, + { + "epoch": 38.956403269754766, + "grad_norm": 5.692200183868408, + "learning_rate": 1.3951732144200584e-05, + "loss": 0.2019, + "step": 14297 + }, + { + "epoch": 38.95912806539509, + "grad_norm": 10.162614822387695, + "learning_rate": 1.3950921463395213e-05, + "loss": 0.1877, + "step": 14298 + }, + { + "epoch": 38.961852861035425, + "grad_norm": 6.350072383880615, + "learning_rate": 1.3950110751820192e-05, + "loss": 0.2676, + "step": 14299 + }, + { + "epoch": 38.96457765667575, + "grad_norm": 5.5919013023376465, + "learning_rate": 1.3949300009481835e-05, + "loss": 0.2422, + "step": 14300 + }, + { + "epoch": 38.967302452316076, + "grad_norm": 7.189586162567139, + "learning_rate": 1.3948489236386454e-05, + "loss": 0.1902, + "step": 14301 + }, + { + "epoch": 38.9700272479564, + "grad_norm": 7.617172718048096, + "learning_rate": 1.3947678432540368e-05, + "loss": 0.2649, + "step": 14302 + }, + { + "epoch": 38.97275204359673, + "grad_norm": 5.228553771972656, + "learning_rate": 1.3946867597949887e-05, + "loss": 0.2438, + "step": 14303 + }, + { + "epoch": 38.97547683923706, + "grad_norm": 6.238590717315674, + "learning_rate": 1.3946056732621332e-05, + "loss": 0.265, + "step": 14304 + }, + { + "epoch": 38.97820163487739, + "grad_norm": 7.42759895324707, + "learning_rate": 1.3945245836561013e-05, + "loss": 0.6329, + "step": 14305 + }, + { + "epoch": 38.98092643051771, + "grad_norm": 10.85505199432373, + "learning_rate": 1.3944434909775247e-05, + "loss": 0.3737, + "step": 14306 + }, + { + "epoch": 38.98365122615804, + "grad_norm": 6.245872497558594, + "learning_rate": 1.3943623952270346e-05, + "loss": 0.2907, + "step": 14307 + }, + { + "epoch": 38.986376021798364, + "grad_norm": 8.080317497253418, + "learning_rate": 1.3942812964052632e-05, + "loss": 0.2971, + "step": 14308 + }, + { + "epoch": 38.98910081743869, + "grad_norm": 5.9236836433410645, + "learning_rate": 1.3942001945128416e-05, + "loss": 0.2373, + "step": 14309 + }, + { + "epoch": 38.991825613079016, + "grad_norm": 6.837869644165039, + "learning_rate": 1.3941190895504015e-05, + "loss": 0.31, + "step": 14310 + }, + { + "epoch": 38.99455040871935, + "grad_norm": 6.478810787200928, + "learning_rate": 1.3940379815185746e-05, + "loss": 0.3202, + "step": 14311 + }, + { + "epoch": 38.997275204359674, + "grad_norm": 7.109516143798828, + "learning_rate": 1.3939568704179926e-05, + "loss": 0.5093, + "step": 14312 + }, + { + "epoch": 39.0, + "grad_norm": 6.694377422332764, + "learning_rate": 1.3938757562492873e-05, + "loss": 0.1959, + "step": 14313 + }, + { + "epoch": 39.002724795640326, + "grad_norm": 5.328964710235596, + "learning_rate": 1.3937946390130904e-05, + "loss": 0.2201, + "step": 14314 + }, + { + "epoch": 39.00544959128065, + "grad_norm": 5.843469142913818, + "learning_rate": 1.3937135187100332e-05, + "loss": 0.2167, + "step": 14315 + }, + { + "epoch": 39.00817438692098, + "grad_norm": 5.099860668182373, + "learning_rate": 1.393632395340748e-05, + "loss": 0.3085, + "step": 14316 + }, + { + "epoch": 39.01089918256131, + "grad_norm": 6.607177257537842, + "learning_rate": 1.3935512689058663e-05, + "loss": 0.2555, + "step": 14317 + }, + { + "epoch": 39.013623978201636, + "grad_norm": 6.643643856048584, + "learning_rate": 1.3934701394060202e-05, + "loss": 0.2245, + "step": 14318 + }, + { + "epoch": 39.01634877384196, + "grad_norm": 5.466268062591553, + "learning_rate": 1.393389006841841e-05, + "loss": 0.4362, + "step": 14319 + }, + { + "epoch": 39.01907356948229, + "grad_norm": 4.7354021072387695, + "learning_rate": 1.3933078712139607e-05, + "loss": 0.1747, + "step": 14320 + }, + { + "epoch": 39.02179836512261, + "grad_norm": 6.899024963378906, + "learning_rate": 1.3932267325230118e-05, + "loss": 0.2903, + "step": 14321 + }, + { + "epoch": 39.02452316076294, + "grad_norm": 6.467222690582275, + "learning_rate": 1.3931455907696257e-05, + "loss": 0.211, + "step": 14322 + }, + { + "epoch": 39.02724795640327, + "grad_norm": 6.949442386627197, + "learning_rate": 1.3930644459544343e-05, + "loss": 0.3762, + "step": 14323 + }, + { + "epoch": 39.0299727520436, + "grad_norm": 7.553343772888184, + "learning_rate": 1.3929832980780696e-05, + "loss": 0.2569, + "step": 14324 + }, + { + "epoch": 39.032697547683924, + "grad_norm": 5.200009822845459, + "learning_rate": 1.3929021471411637e-05, + "loss": 0.1993, + "step": 14325 + }, + { + "epoch": 39.03542234332425, + "grad_norm": 28.745405197143555, + "learning_rate": 1.3928209931443487e-05, + "loss": 0.2299, + "step": 14326 + }, + { + "epoch": 39.038147138964575, + "grad_norm": 8.111405372619629, + "learning_rate": 1.392739836088256e-05, + "loss": 0.3381, + "step": 14327 + }, + { + "epoch": 39.0408719346049, + "grad_norm": 7.686152935028076, + "learning_rate": 1.3926586759735185e-05, + "loss": 0.2045, + "step": 14328 + }, + { + "epoch": 39.043596730245234, + "grad_norm": 5.327547073364258, + "learning_rate": 1.3925775128007674e-05, + "loss": 0.3247, + "step": 14329 + }, + { + "epoch": 39.04632152588556, + "grad_norm": 5.757328033447266, + "learning_rate": 1.3924963465706358e-05, + "loss": 0.3708, + "step": 14330 + }, + { + "epoch": 39.049046321525886, + "grad_norm": 5.843682289123535, + "learning_rate": 1.3924151772837549e-05, + "loss": 0.2439, + "step": 14331 + }, + { + "epoch": 39.05177111716621, + "grad_norm": 9.030362129211426, + "learning_rate": 1.3923340049407576e-05, + "loss": 0.4127, + "step": 14332 + }, + { + "epoch": 39.05449591280654, + "grad_norm": 7.151304721832275, + "learning_rate": 1.3922528295422755e-05, + "loss": 0.3836, + "step": 14333 + }, + { + "epoch": 39.05722070844686, + "grad_norm": 6.7778096199035645, + "learning_rate": 1.392171651088941e-05, + "loss": 0.2563, + "step": 14334 + }, + { + "epoch": 39.059945504087196, + "grad_norm": 8.462702751159668, + "learning_rate": 1.3920904695813861e-05, + "loss": 0.2613, + "step": 14335 + }, + { + "epoch": 39.06267029972752, + "grad_norm": 6.116037845611572, + "learning_rate": 1.3920092850202435e-05, + "loss": 0.2851, + "step": 14336 + }, + { + "epoch": 39.06539509536785, + "grad_norm": 5.209856033325195, + "learning_rate": 1.391928097406145e-05, + "loss": 0.277, + "step": 14337 + }, + { + "epoch": 39.06811989100817, + "grad_norm": 7.555953502655029, + "learning_rate": 1.3918469067397233e-05, + "loss": 0.2476, + "step": 14338 + }, + { + "epoch": 39.0708446866485, + "grad_norm": 8.173412322998047, + "learning_rate": 1.3917657130216103e-05, + "loss": 0.3123, + "step": 14339 + }, + { + "epoch": 39.073569482288825, + "grad_norm": 6.560594081878662, + "learning_rate": 1.3916845162524388e-05, + "loss": 0.2472, + "step": 14340 + }, + { + "epoch": 39.07629427792916, + "grad_norm": 4.919372081756592, + "learning_rate": 1.3916033164328406e-05, + "loss": 0.1607, + "step": 14341 + }, + { + "epoch": 39.079019073569484, + "grad_norm": 7.3588151931762695, + "learning_rate": 1.3915221135634487e-05, + "loss": 0.2097, + "step": 14342 + }, + { + "epoch": 39.08174386920981, + "grad_norm": 6.464593887329102, + "learning_rate": 1.391440907644895e-05, + "loss": 0.3798, + "step": 14343 + }, + { + "epoch": 39.084468664850135, + "grad_norm": 7.673997402191162, + "learning_rate": 1.3913596986778123e-05, + "loss": 0.2715, + "step": 14344 + }, + { + "epoch": 39.08719346049046, + "grad_norm": 7.415081024169922, + "learning_rate": 1.3912784866628326e-05, + "loss": 0.3838, + "step": 14345 + }, + { + "epoch": 39.08991825613079, + "grad_norm": 4.880640506744385, + "learning_rate": 1.3911972716005887e-05, + "loss": 0.1909, + "step": 14346 + }, + { + "epoch": 39.09264305177112, + "grad_norm": 5.719912052154541, + "learning_rate": 1.391116053491713e-05, + "loss": 0.2416, + "step": 14347 + }, + { + "epoch": 39.095367847411445, + "grad_norm": 5.737791061401367, + "learning_rate": 1.3910348323368381e-05, + "loss": 0.1778, + "step": 14348 + }, + { + "epoch": 39.09809264305177, + "grad_norm": 7.773014545440674, + "learning_rate": 1.3909536081365964e-05, + "loss": 0.2668, + "step": 14349 + }, + { + "epoch": 39.1008174386921, + "grad_norm": 5.769792556762695, + "learning_rate": 1.390872380891621e-05, + "loss": 0.2946, + "step": 14350 + }, + { + "epoch": 39.10354223433242, + "grad_norm": 6.600955963134766, + "learning_rate": 1.3907911506025436e-05, + "loss": 0.2388, + "step": 14351 + }, + { + "epoch": 39.10626702997275, + "grad_norm": 6.24024772644043, + "learning_rate": 1.3907099172699976e-05, + "loss": 0.2556, + "step": 14352 + }, + { + "epoch": 39.10899182561308, + "grad_norm": 7.633904457092285, + "learning_rate": 1.390628680894615e-05, + "loss": 0.2729, + "step": 14353 + }, + { + "epoch": 39.11171662125341, + "grad_norm": 6.381833553314209, + "learning_rate": 1.390547441477029e-05, + "loss": 0.2037, + "step": 14354 + }, + { + "epoch": 39.11444141689373, + "grad_norm": 5.045418739318848, + "learning_rate": 1.3904661990178723e-05, + "loss": 0.187, + "step": 14355 + }, + { + "epoch": 39.11716621253406, + "grad_norm": 5.261258125305176, + "learning_rate": 1.390384953517777e-05, + "loss": 0.1665, + "step": 14356 + }, + { + "epoch": 39.119891008174385, + "grad_norm": 5.163601875305176, + "learning_rate": 1.3903037049773769e-05, + "loss": 0.3376, + "step": 14357 + }, + { + "epoch": 39.12261580381471, + "grad_norm": 6.772798538208008, + "learning_rate": 1.3902224533973034e-05, + "loss": 0.4315, + "step": 14358 + }, + { + "epoch": 39.12534059945504, + "grad_norm": 8.250518798828125, + "learning_rate": 1.3901411987781904e-05, + "loss": 0.437, + "step": 14359 + }, + { + "epoch": 39.12806539509537, + "grad_norm": 5.6278276443481445, + "learning_rate": 1.3900599411206704e-05, + "loss": 0.2517, + "step": 14360 + }, + { + "epoch": 39.130790190735695, + "grad_norm": 6.756508827209473, + "learning_rate": 1.3899786804253757e-05, + "loss": 0.321, + "step": 14361 + }, + { + "epoch": 39.13351498637602, + "grad_norm": 5.385969638824463, + "learning_rate": 1.3898974166929398e-05, + "loss": 0.3564, + "step": 14362 + }, + { + "epoch": 39.13623978201635, + "grad_norm": 5.501603126525879, + "learning_rate": 1.3898161499239952e-05, + "loss": 0.2124, + "step": 14363 + }, + { + "epoch": 39.13896457765667, + "grad_norm": 7.773250579833984, + "learning_rate": 1.3897348801191752e-05, + "loss": 0.3246, + "step": 14364 + }, + { + "epoch": 39.141689373297005, + "grad_norm": 5.84032678604126, + "learning_rate": 1.3896536072791125e-05, + "loss": 0.2693, + "step": 14365 + }, + { + "epoch": 39.14441416893733, + "grad_norm": 6.377506256103516, + "learning_rate": 1.38957233140444e-05, + "loss": 0.2886, + "step": 14366 + }, + { + "epoch": 39.14713896457766, + "grad_norm": 5.796489715576172, + "learning_rate": 1.3894910524957907e-05, + "loss": 0.2948, + "step": 14367 + }, + { + "epoch": 39.14986376021798, + "grad_norm": 11.502608299255371, + "learning_rate": 1.3894097705537977e-05, + "loss": 0.2247, + "step": 14368 + }, + { + "epoch": 39.15258855585831, + "grad_norm": 7.887616157531738, + "learning_rate": 1.389328485579094e-05, + "loss": 0.4033, + "step": 14369 + }, + { + "epoch": 39.155313351498634, + "grad_norm": 5.441971778869629, + "learning_rate": 1.3892471975723122e-05, + "loss": 0.2924, + "step": 14370 + }, + { + "epoch": 39.15803814713897, + "grad_norm": 6.963483810424805, + "learning_rate": 1.3891659065340861e-05, + "loss": 0.2221, + "step": 14371 + }, + { + "epoch": 39.16076294277929, + "grad_norm": 5.960539817810059, + "learning_rate": 1.3890846124650482e-05, + "loss": 0.2971, + "step": 14372 + }, + { + "epoch": 39.16348773841962, + "grad_norm": 5.39940881729126, + "learning_rate": 1.3890033153658322e-05, + "loss": 0.2168, + "step": 14373 + }, + { + "epoch": 39.166212534059945, + "grad_norm": 5.560946941375732, + "learning_rate": 1.3889220152370706e-05, + "loss": 0.2249, + "step": 14374 + }, + { + "epoch": 39.16893732970027, + "grad_norm": 5.56072473526001, + "learning_rate": 1.3888407120793973e-05, + "loss": 0.2118, + "step": 14375 + }, + { + "epoch": 39.171662125340596, + "grad_norm": 6.4710259437561035, + "learning_rate": 1.3887594058934444e-05, + "loss": 0.3568, + "step": 14376 + }, + { + "epoch": 39.17438692098093, + "grad_norm": 7.413678169250488, + "learning_rate": 1.3886780966798464e-05, + "loss": 0.2221, + "step": 14377 + }, + { + "epoch": 39.177111716621255, + "grad_norm": 5.558591842651367, + "learning_rate": 1.3885967844392354e-05, + "loss": 0.2545, + "step": 14378 + }, + { + "epoch": 39.17983651226158, + "grad_norm": 5.393101215362549, + "learning_rate": 1.3885154691722453e-05, + "loss": 0.2334, + "step": 14379 + }, + { + "epoch": 39.182561307901906, + "grad_norm": 6.346226215362549, + "learning_rate": 1.3884341508795092e-05, + "loss": 0.2947, + "step": 14380 + }, + { + "epoch": 39.18528610354223, + "grad_norm": 6.576112270355225, + "learning_rate": 1.3883528295616606e-05, + "loss": 0.2093, + "step": 14381 + }, + { + "epoch": 39.18801089918256, + "grad_norm": 6.0815958976745605, + "learning_rate": 1.3882715052193323e-05, + "loss": 0.273, + "step": 14382 + }, + { + "epoch": 39.19073569482289, + "grad_norm": 5.966588973999023, + "learning_rate": 1.3881901778531583e-05, + "loss": 0.5629, + "step": 14383 + }, + { + "epoch": 39.19346049046322, + "grad_norm": 8.157422065734863, + "learning_rate": 1.3881088474637716e-05, + "loss": 0.2407, + "step": 14384 + }, + { + "epoch": 39.19618528610354, + "grad_norm": 6.78936767578125, + "learning_rate": 1.388027514051806e-05, + "loss": 0.2205, + "step": 14385 + }, + { + "epoch": 39.19891008174387, + "grad_norm": 6.487745761871338, + "learning_rate": 1.3879461776178943e-05, + "loss": 0.3394, + "step": 14386 + }, + { + "epoch": 39.201634877384194, + "grad_norm": 7.317575931549072, + "learning_rate": 1.3878648381626704e-05, + "loss": 0.2415, + "step": 14387 + }, + { + "epoch": 39.20435967302452, + "grad_norm": 5.161836624145508, + "learning_rate": 1.3877834956867675e-05, + "loss": 0.2265, + "step": 14388 + }, + { + "epoch": 39.20708446866485, + "grad_norm": 5.480639457702637, + "learning_rate": 1.387702150190819e-05, + "loss": 0.2178, + "step": 14389 + }, + { + "epoch": 39.20980926430518, + "grad_norm": 8.126582145690918, + "learning_rate": 1.3876208016754589e-05, + "loss": 0.209, + "step": 14390 + }, + { + "epoch": 39.212534059945504, + "grad_norm": 7.839139461517334, + "learning_rate": 1.3875394501413206e-05, + "loss": 0.3221, + "step": 14391 + }, + { + "epoch": 39.21525885558583, + "grad_norm": 8.001127243041992, + "learning_rate": 1.3874580955890374e-05, + "loss": 0.2136, + "step": 14392 + }, + { + "epoch": 39.217983651226156, + "grad_norm": 10.482834815979004, + "learning_rate": 1.3873767380192431e-05, + "loss": 0.1745, + "step": 14393 + }, + { + "epoch": 39.22070844686648, + "grad_norm": 5.722413063049316, + "learning_rate": 1.387295377432571e-05, + "loss": 0.2396, + "step": 14394 + }, + { + "epoch": 39.223433242506815, + "grad_norm": 5.641980171203613, + "learning_rate": 1.3872140138296553e-05, + "loss": 0.2631, + "step": 14395 + }, + { + "epoch": 39.22615803814714, + "grad_norm": 4.87531852722168, + "learning_rate": 1.387132647211129e-05, + "loss": 0.2508, + "step": 14396 + }, + { + "epoch": 39.228882833787466, + "grad_norm": 6.67892599105835, + "learning_rate": 1.3870512775776262e-05, + "loss": 0.2729, + "step": 14397 + }, + { + "epoch": 39.23160762942779, + "grad_norm": 6.84233283996582, + "learning_rate": 1.3869699049297805e-05, + "loss": 0.189, + "step": 14398 + }, + { + "epoch": 39.23433242506812, + "grad_norm": 5.77467679977417, + "learning_rate": 1.3868885292682258e-05, + "loss": 0.2601, + "step": 14399 + }, + { + "epoch": 39.237057220708444, + "grad_norm": 4.727165222167969, + "learning_rate": 1.3868071505935953e-05, + "loss": 0.3941, + "step": 14400 + }, + { + "epoch": 39.23978201634878, + "grad_norm": 5.63623046875, + "learning_rate": 1.3867257689065237e-05, + "loss": 0.2054, + "step": 14401 + }, + { + "epoch": 39.2425068119891, + "grad_norm": 6.149964809417725, + "learning_rate": 1.3866443842076438e-05, + "loss": 0.2709, + "step": 14402 + }, + { + "epoch": 39.24523160762943, + "grad_norm": 7.443466663360596, + "learning_rate": 1.3865629964975901e-05, + "loss": 0.1891, + "step": 14403 + }, + { + "epoch": 39.247956403269754, + "grad_norm": 6.356564044952393, + "learning_rate": 1.3864816057769961e-05, + "loss": 0.2976, + "step": 14404 + }, + { + "epoch": 39.25068119891008, + "grad_norm": 6.187931060791016, + "learning_rate": 1.3864002120464962e-05, + "loss": 0.1702, + "step": 14405 + }, + { + "epoch": 39.253405994550405, + "grad_norm": 5.51117467880249, + "learning_rate": 1.3863188153067233e-05, + "loss": 0.3435, + "step": 14406 + }, + { + "epoch": 39.25613079019074, + "grad_norm": 5.29209041595459, + "learning_rate": 1.3862374155583122e-05, + "loss": 0.2872, + "step": 14407 + }, + { + "epoch": 39.258855585831064, + "grad_norm": 5.761871337890625, + "learning_rate": 1.3861560128018962e-05, + "loss": 0.2604, + "step": 14408 + }, + { + "epoch": 39.26158038147139, + "grad_norm": 6.281421184539795, + "learning_rate": 1.3860746070381101e-05, + "loss": 0.2898, + "step": 14409 + }, + { + "epoch": 39.264305177111716, + "grad_norm": 5.377538681030273, + "learning_rate": 1.3859931982675872e-05, + "loss": 0.2023, + "step": 14410 + }, + { + "epoch": 39.26702997275204, + "grad_norm": 5.567324161529541, + "learning_rate": 1.3859117864909619e-05, + "loss": 0.1759, + "step": 14411 + }, + { + "epoch": 39.26975476839237, + "grad_norm": 6.55522346496582, + "learning_rate": 1.3858303717088676e-05, + "loss": 0.2079, + "step": 14412 + }, + { + "epoch": 39.2724795640327, + "grad_norm": 5.562514781951904, + "learning_rate": 1.3857489539219393e-05, + "loss": 0.2517, + "step": 14413 + }, + { + "epoch": 39.275204359673026, + "grad_norm": 5.650949954986572, + "learning_rate": 1.38566753313081e-05, + "loss": 0.2165, + "step": 14414 + }, + { + "epoch": 39.27792915531335, + "grad_norm": 6.258750915527344, + "learning_rate": 1.3855861093361144e-05, + "loss": 0.3011, + "step": 14415 + }, + { + "epoch": 39.28065395095368, + "grad_norm": 6.140244960784912, + "learning_rate": 1.3855046825384868e-05, + "loss": 0.3481, + "step": 14416 + }, + { + "epoch": 39.283378746594, + "grad_norm": 10.04259967803955, + "learning_rate": 1.3854232527385614e-05, + "loss": 0.2651, + "step": 14417 + }, + { + "epoch": 39.28610354223433, + "grad_norm": 6.4561896324157715, + "learning_rate": 1.3853418199369717e-05, + "loss": 0.2029, + "step": 14418 + }, + { + "epoch": 39.28882833787466, + "grad_norm": 5.495051860809326, + "learning_rate": 1.3852603841343525e-05, + "loss": 0.1995, + "step": 14419 + }, + { + "epoch": 39.29155313351499, + "grad_norm": 5.664775848388672, + "learning_rate": 1.385178945331338e-05, + "loss": 0.2686, + "step": 14420 + }, + { + "epoch": 39.294277929155314, + "grad_norm": 7.046104431152344, + "learning_rate": 1.385097503528562e-05, + "loss": 0.2892, + "step": 14421 + }, + { + "epoch": 39.29700272479564, + "grad_norm": 5.487584114074707, + "learning_rate": 1.385016058726659e-05, + "loss": 0.2466, + "step": 14422 + }, + { + "epoch": 39.299727520435965, + "grad_norm": 6.687308311462402, + "learning_rate": 1.3849346109262634e-05, + "loss": 0.2345, + "step": 14423 + }, + { + "epoch": 39.30245231607629, + "grad_norm": 5.87015438079834, + "learning_rate": 1.3848531601280095e-05, + "loss": 0.2002, + "step": 14424 + }, + { + "epoch": 39.305177111716624, + "grad_norm": 7.049134731292725, + "learning_rate": 1.3847717063325316e-05, + "loss": 0.1947, + "step": 14425 + }, + { + "epoch": 39.30790190735695, + "grad_norm": 5.7420654296875, + "learning_rate": 1.384690249540464e-05, + "loss": 0.2124, + "step": 14426 + }, + { + "epoch": 39.310626702997276, + "grad_norm": 6.156968116760254, + "learning_rate": 1.3846087897524412e-05, + "loss": 0.1808, + "step": 14427 + }, + { + "epoch": 39.3133514986376, + "grad_norm": 6.691866397857666, + "learning_rate": 1.3845273269690973e-05, + "loss": 0.2945, + "step": 14428 + }, + { + "epoch": 39.31607629427793, + "grad_norm": 5.193544864654541, + "learning_rate": 1.3844458611910671e-05, + "loss": 0.2237, + "step": 14429 + }, + { + "epoch": 39.31880108991825, + "grad_norm": 6.388106346130371, + "learning_rate": 1.384364392418985e-05, + "loss": 0.2084, + "step": 14430 + }, + { + "epoch": 39.321525885558586, + "grad_norm": 6.0377583503723145, + "learning_rate": 1.3842829206534854e-05, + "loss": 0.4066, + "step": 14431 + }, + { + "epoch": 39.32425068119891, + "grad_norm": 5.002970218658447, + "learning_rate": 1.3842014458952025e-05, + "loss": 0.1642, + "step": 14432 + }, + { + "epoch": 39.32697547683924, + "grad_norm": 6.982475757598877, + "learning_rate": 1.3841199681447713e-05, + "loss": 0.1986, + "step": 14433 + }, + { + "epoch": 39.32970027247956, + "grad_norm": 5.248578071594238, + "learning_rate": 1.3840384874028262e-05, + "loss": 0.2947, + "step": 14434 + }, + { + "epoch": 39.33242506811989, + "grad_norm": 6.221617221832275, + "learning_rate": 1.3839570036700015e-05, + "loss": 0.3211, + "step": 14435 + }, + { + "epoch": 39.335149863760215, + "grad_norm": 6.641686916351318, + "learning_rate": 1.383875516946932e-05, + "loss": 0.2894, + "step": 14436 + }, + { + "epoch": 39.33787465940055, + "grad_norm": 6.050511360168457, + "learning_rate": 1.3837940272342525e-05, + "loss": 0.3503, + "step": 14437 + }, + { + "epoch": 39.34059945504087, + "grad_norm": 6.534960746765137, + "learning_rate": 1.3837125345325975e-05, + "loss": 0.2766, + "step": 14438 + }, + { + "epoch": 39.3433242506812, + "grad_norm": 5.614215850830078, + "learning_rate": 1.3836310388426015e-05, + "loss": 0.3974, + "step": 14439 + }, + { + "epoch": 39.346049046321525, + "grad_norm": 6.731872081756592, + "learning_rate": 1.3835495401648995e-05, + "loss": 0.3325, + "step": 14440 + }, + { + "epoch": 39.34877384196185, + "grad_norm": 8.455556869506836, + "learning_rate": 1.3834680385001257e-05, + "loss": 0.2448, + "step": 14441 + }, + { + "epoch": 39.35149863760218, + "grad_norm": 8.348003387451172, + "learning_rate": 1.3833865338489156e-05, + "loss": 0.3221, + "step": 14442 + }, + { + "epoch": 39.35422343324251, + "grad_norm": 5.993939399719238, + "learning_rate": 1.383305026211903e-05, + "loss": 0.1674, + "step": 14443 + }, + { + "epoch": 39.356948228882835, + "grad_norm": 5.404088973999023, + "learning_rate": 1.3832235155897237e-05, + "loss": 0.3732, + "step": 14444 + }, + { + "epoch": 39.35967302452316, + "grad_norm": 4.829730987548828, + "learning_rate": 1.3831420019830118e-05, + "loss": 0.2053, + "step": 14445 + }, + { + "epoch": 39.36239782016349, + "grad_norm": 6.515233516693115, + "learning_rate": 1.3830604853924021e-05, + "loss": 0.2587, + "step": 14446 + }, + { + "epoch": 39.36512261580381, + "grad_norm": 6.463160991668701, + "learning_rate": 1.3829789658185299e-05, + "loss": 0.3481, + "step": 14447 + }, + { + "epoch": 39.36784741144414, + "grad_norm": 6.9467997550964355, + "learning_rate": 1.3828974432620297e-05, + "loss": 0.3206, + "step": 14448 + }, + { + "epoch": 39.37057220708447, + "grad_norm": 6.457395553588867, + "learning_rate": 1.3828159177235368e-05, + "loss": 0.2884, + "step": 14449 + }, + { + "epoch": 39.3732970027248, + "grad_norm": 7.020283222198486, + "learning_rate": 1.3827343892036855e-05, + "loss": 0.2181, + "step": 14450 + }, + { + "epoch": 39.37602179836512, + "grad_norm": 6.745564937591553, + "learning_rate": 1.3826528577031113e-05, + "loss": 0.2353, + "step": 14451 + }, + { + "epoch": 39.37874659400545, + "grad_norm": 8.310040473937988, + "learning_rate": 1.3825713232224492e-05, + "loss": 0.2115, + "step": 14452 + }, + { + "epoch": 39.381471389645775, + "grad_norm": 5.74802827835083, + "learning_rate": 1.3824897857623336e-05, + "loss": 0.2852, + "step": 14453 + }, + { + "epoch": 39.3841961852861, + "grad_norm": 6.839849948883057, + "learning_rate": 1.3824082453234e-05, + "loss": 0.2355, + "step": 14454 + }, + { + "epoch": 39.38692098092643, + "grad_norm": 6.283200263977051, + "learning_rate": 1.3823267019062832e-05, + "loss": 0.2132, + "step": 14455 + }, + { + "epoch": 39.38964577656676, + "grad_norm": 5.922610759735107, + "learning_rate": 1.3822451555116186e-05, + "loss": 0.2582, + "step": 14456 + }, + { + "epoch": 39.392370572207085, + "grad_norm": 5.901951313018799, + "learning_rate": 1.3821636061400407e-05, + "loss": 0.3616, + "step": 14457 + }, + { + "epoch": 39.39509536784741, + "grad_norm": 5.894443988800049, + "learning_rate": 1.3820820537921849e-05, + "loss": 0.3356, + "step": 14458 + }, + { + "epoch": 39.39782016348774, + "grad_norm": 4.748549461364746, + "learning_rate": 1.3820004984686866e-05, + "loss": 0.2984, + "step": 14459 + }, + { + "epoch": 39.40054495912806, + "grad_norm": 7.824007987976074, + "learning_rate": 1.3819189401701807e-05, + "loss": 0.3224, + "step": 14460 + }, + { + "epoch": 39.403269754768395, + "grad_norm": 5.506160736083984, + "learning_rate": 1.381837378897302e-05, + "loss": 0.3262, + "step": 14461 + }, + { + "epoch": 39.40599455040872, + "grad_norm": 6.4132304191589355, + "learning_rate": 1.3817558146506867e-05, + "loss": 0.4223, + "step": 14462 + }, + { + "epoch": 39.40871934604905, + "grad_norm": 6.343233108520508, + "learning_rate": 1.381674247430969e-05, + "loss": 0.216, + "step": 14463 + }, + { + "epoch": 39.41144414168937, + "grad_norm": 7.911228656768799, + "learning_rate": 1.3815926772387847e-05, + "loss": 0.1699, + "step": 14464 + }, + { + "epoch": 39.4141689373297, + "grad_norm": 6.358527660369873, + "learning_rate": 1.3815111040747688e-05, + "loss": 0.1799, + "step": 14465 + }, + { + "epoch": 39.416893732970024, + "grad_norm": 7.4972357749938965, + "learning_rate": 1.3814295279395566e-05, + "loss": 0.2331, + "step": 14466 + }, + { + "epoch": 39.41961852861036, + "grad_norm": 10.910237312316895, + "learning_rate": 1.3813479488337838e-05, + "loss": 0.265, + "step": 14467 + }, + { + "epoch": 39.42234332425068, + "grad_norm": 7.198177337646484, + "learning_rate": 1.3812663667580855e-05, + "loss": 0.3017, + "step": 14468 + }, + { + "epoch": 39.42506811989101, + "grad_norm": 5.954398155212402, + "learning_rate": 1.3811847817130965e-05, + "loss": 0.3837, + "step": 14469 + }, + { + "epoch": 39.427792915531334, + "grad_norm": 6.609823226928711, + "learning_rate": 1.3811031936994533e-05, + "loss": 0.3177, + "step": 14470 + }, + { + "epoch": 39.43051771117166, + "grad_norm": 6.191345691680908, + "learning_rate": 1.3810216027177903e-05, + "loss": 0.2287, + "step": 14471 + }, + { + "epoch": 39.433242506811986, + "grad_norm": 5.148782730102539, + "learning_rate": 1.3809400087687434e-05, + "loss": 0.4851, + "step": 14472 + }, + { + "epoch": 39.43596730245232, + "grad_norm": 6.095325469970703, + "learning_rate": 1.380858411852948e-05, + "loss": 0.2578, + "step": 14473 + }, + { + "epoch": 39.438692098092645, + "grad_norm": 4.201200008392334, + "learning_rate": 1.3807768119710397e-05, + "loss": 0.1481, + "step": 14474 + }, + { + "epoch": 39.44141689373297, + "grad_norm": 6.30897331237793, + "learning_rate": 1.3806952091236533e-05, + "loss": 0.4306, + "step": 14475 + }, + { + "epoch": 39.444141689373296, + "grad_norm": 5.3930511474609375, + "learning_rate": 1.3806136033114255e-05, + "loss": 0.3352, + "step": 14476 + }, + { + "epoch": 39.44686648501362, + "grad_norm": 6.518143177032471, + "learning_rate": 1.3805319945349908e-05, + "loss": 0.3578, + "step": 14477 + }, + { + "epoch": 39.44959128065395, + "grad_norm": 5.120165824890137, + "learning_rate": 1.3804503827949855e-05, + "loss": 0.2277, + "step": 14478 + }, + { + "epoch": 39.45231607629428, + "grad_norm": 5.436894416809082, + "learning_rate": 1.3803687680920446e-05, + "loss": 0.2536, + "step": 14479 + }, + { + "epoch": 39.45504087193461, + "grad_norm": 6.164616584777832, + "learning_rate": 1.3802871504268043e-05, + "loss": 0.1834, + "step": 14480 + }, + { + "epoch": 39.45776566757493, + "grad_norm": 7.045543670654297, + "learning_rate": 1.3802055297998996e-05, + "loss": 0.3184, + "step": 14481 + }, + { + "epoch": 39.46049046321526, + "grad_norm": 6.383248329162598, + "learning_rate": 1.3801239062119666e-05, + "loss": 0.3735, + "step": 14482 + }, + { + "epoch": 39.463215258855584, + "grad_norm": 6.647173881530762, + "learning_rate": 1.3800422796636406e-05, + "loss": 0.2435, + "step": 14483 + }, + { + "epoch": 39.46594005449591, + "grad_norm": 5.340779781341553, + "learning_rate": 1.3799606501555578e-05, + "loss": 0.1776, + "step": 14484 + }, + { + "epoch": 39.46866485013624, + "grad_norm": 6.516035556793213, + "learning_rate": 1.3798790176883536e-05, + "loss": 0.1985, + "step": 14485 + }, + { + "epoch": 39.47138964577657, + "grad_norm": 5.881908893585205, + "learning_rate": 1.379797382262664e-05, + "loss": 0.4826, + "step": 14486 + }, + { + "epoch": 39.474114441416894, + "grad_norm": 4.972786903381348, + "learning_rate": 1.3797157438791244e-05, + "loss": 0.2321, + "step": 14487 + }, + { + "epoch": 39.47683923705722, + "grad_norm": 15.548818588256836, + "learning_rate": 1.379634102538371e-05, + "loss": 0.2608, + "step": 14488 + }, + { + "epoch": 39.479564032697546, + "grad_norm": 6.68283224105835, + "learning_rate": 1.3795524582410394e-05, + "loss": 0.2219, + "step": 14489 + }, + { + "epoch": 39.48228882833787, + "grad_norm": 5.611134052276611, + "learning_rate": 1.3794708109877655e-05, + "loss": 0.1968, + "step": 14490 + }, + { + "epoch": 39.485013623978205, + "grad_norm": 4.328458309173584, + "learning_rate": 1.379389160779185e-05, + "loss": 0.1002, + "step": 14491 + }, + { + "epoch": 39.48773841961853, + "grad_norm": 5.882762908935547, + "learning_rate": 1.379307507615934e-05, + "loss": 0.2224, + "step": 14492 + }, + { + "epoch": 39.490463215258856, + "grad_norm": 8.353507995605469, + "learning_rate": 1.3792258514986481e-05, + "loss": 0.3127, + "step": 14493 + }, + { + "epoch": 39.49318801089918, + "grad_norm": 6.130002021789551, + "learning_rate": 1.3791441924279638e-05, + "loss": 0.2527, + "step": 14494 + }, + { + "epoch": 39.49591280653951, + "grad_norm": 5.884676933288574, + "learning_rate": 1.3790625304045165e-05, + "loss": 0.2389, + "step": 14495 + }, + { + "epoch": 39.49863760217983, + "grad_norm": 7.270334243774414, + "learning_rate": 1.3789808654289428e-05, + "loss": 0.2778, + "step": 14496 + }, + { + "epoch": 39.50136239782017, + "grad_norm": 6.881333827972412, + "learning_rate": 1.3788991975018777e-05, + "loss": 0.2471, + "step": 14497 + }, + { + "epoch": 39.50408719346049, + "grad_norm": 6.791107654571533, + "learning_rate": 1.3788175266239585e-05, + "loss": 0.3028, + "step": 14498 + }, + { + "epoch": 39.50681198910082, + "grad_norm": 7.451920986175537, + "learning_rate": 1.37873585279582e-05, + "loss": 0.2419, + "step": 14499 + }, + { + "epoch": 39.509536784741144, + "grad_norm": 5.3681721687316895, + "learning_rate": 1.3786541760180994e-05, + "loss": 0.1921, + "step": 14500 + }, + { + "epoch": 39.51226158038147, + "grad_norm": 7.38743257522583, + "learning_rate": 1.3785724962914317e-05, + "loss": 0.3115, + "step": 14501 + }, + { + "epoch": 39.514986376021795, + "grad_norm": 5.627354621887207, + "learning_rate": 1.378490813616454e-05, + "loss": 0.3022, + "step": 14502 + }, + { + "epoch": 39.51771117166213, + "grad_norm": 6.181478500366211, + "learning_rate": 1.3784091279938019e-05, + "loss": 0.2282, + "step": 14503 + }, + { + "epoch": 39.520435967302454, + "grad_norm": 6.117964267730713, + "learning_rate": 1.3783274394241119e-05, + "loss": 0.3128, + "step": 14504 + }, + { + "epoch": 39.52316076294278, + "grad_norm": 5.2905964851379395, + "learning_rate": 1.3782457479080198e-05, + "loss": 0.4057, + "step": 14505 + }, + { + "epoch": 39.525885558583106, + "grad_norm": 4.802488803863525, + "learning_rate": 1.378164053446162e-05, + "loss": 0.2117, + "step": 14506 + }, + { + "epoch": 39.52861035422343, + "grad_norm": 6.579444408416748, + "learning_rate": 1.3780823560391748e-05, + "loss": 0.1497, + "step": 14507 + }, + { + "epoch": 39.53133514986376, + "grad_norm": 5.356363296508789, + "learning_rate": 1.378000655687694e-05, + "loss": 0.3481, + "step": 14508 + }, + { + "epoch": 39.53405994550409, + "grad_norm": 7.40226411819458, + "learning_rate": 1.3779189523923568e-05, + "loss": 0.2441, + "step": 14509 + }, + { + "epoch": 39.536784741144416, + "grad_norm": 6.068542003631592, + "learning_rate": 1.3778372461537985e-05, + "loss": 0.2196, + "step": 14510 + }, + { + "epoch": 39.53950953678474, + "grad_norm": 6.02263069152832, + "learning_rate": 1.3777555369726561e-05, + "loss": 0.2503, + "step": 14511 + }, + { + "epoch": 39.54223433242507, + "grad_norm": 7.612646579742432, + "learning_rate": 1.3776738248495659e-05, + "loss": 0.2763, + "step": 14512 + }, + { + "epoch": 39.54495912806539, + "grad_norm": 4.873693466186523, + "learning_rate": 1.3775921097851637e-05, + "loss": 0.2158, + "step": 14513 + }, + { + "epoch": 39.54768392370572, + "grad_norm": 5.309380054473877, + "learning_rate": 1.3775103917800867e-05, + "loss": 0.2633, + "step": 14514 + }, + { + "epoch": 39.55040871934605, + "grad_norm": 5.206650733947754, + "learning_rate": 1.3774286708349706e-05, + "loss": 0.206, + "step": 14515 + }, + { + "epoch": 39.55313351498638, + "grad_norm": 5.255007743835449, + "learning_rate": 1.3773469469504526e-05, + "loss": 0.2872, + "step": 14516 + }, + { + "epoch": 39.555858310626704, + "grad_norm": 6.5827717781066895, + "learning_rate": 1.3772652201271684e-05, + "loss": 0.265, + "step": 14517 + }, + { + "epoch": 39.55858310626703, + "grad_norm": 6.465464115142822, + "learning_rate": 1.3771834903657548e-05, + "loss": 0.2229, + "step": 14518 + }, + { + "epoch": 39.561307901907355, + "grad_norm": 5.544752597808838, + "learning_rate": 1.3771017576668485e-05, + "loss": 0.2967, + "step": 14519 + }, + { + "epoch": 39.56403269754768, + "grad_norm": 6.1680989265441895, + "learning_rate": 1.3770200220310855e-05, + "loss": 0.2068, + "step": 14520 + }, + { + "epoch": 39.566757493188014, + "grad_norm": 6.143753528594971, + "learning_rate": 1.3769382834591029e-05, + "loss": 0.2755, + "step": 14521 + }, + { + "epoch": 39.56948228882834, + "grad_norm": 4.713968753814697, + "learning_rate": 1.3768565419515371e-05, + "loss": 0.3034, + "step": 14522 + }, + { + "epoch": 39.572207084468666, + "grad_norm": 5.635724067687988, + "learning_rate": 1.3767747975090247e-05, + "loss": 0.4184, + "step": 14523 + }, + { + "epoch": 39.57493188010899, + "grad_norm": 12.68502426147461, + "learning_rate": 1.3766930501322024e-05, + "loss": 0.2532, + "step": 14524 + }, + { + "epoch": 39.57765667574932, + "grad_norm": 6.0208611488342285, + "learning_rate": 1.3766112998217064e-05, + "loss": 0.1414, + "step": 14525 + }, + { + "epoch": 39.58038147138964, + "grad_norm": 8.426074028015137, + "learning_rate": 1.376529546578174e-05, + "loss": 0.2204, + "step": 14526 + }, + { + "epoch": 39.583106267029976, + "grad_norm": 5.933780193328857, + "learning_rate": 1.3764477904022417e-05, + "loss": 0.2143, + "step": 14527 + }, + { + "epoch": 39.5858310626703, + "grad_norm": 9.801464080810547, + "learning_rate": 1.3763660312945459e-05, + "loss": 0.2581, + "step": 14528 + }, + { + "epoch": 39.58855585831063, + "grad_norm": 5.783325672149658, + "learning_rate": 1.3762842692557236e-05, + "loss": 0.2134, + "step": 14529 + }, + { + "epoch": 39.59128065395095, + "grad_norm": 7.276175498962402, + "learning_rate": 1.3762025042864116e-05, + "loss": 0.2136, + "step": 14530 + }, + { + "epoch": 39.59400544959128, + "grad_norm": 5.434111595153809, + "learning_rate": 1.3761207363872466e-05, + "loss": 0.3399, + "step": 14531 + }, + { + "epoch": 39.596730245231605, + "grad_norm": 5.848511219024658, + "learning_rate": 1.3760389655588656e-05, + "loss": 0.178, + "step": 14532 + }, + { + "epoch": 39.59945504087194, + "grad_norm": 5.863616943359375, + "learning_rate": 1.3759571918019048e-05, + "loss": 0.2931, + "step": 14533 + }, + { + "epoch": 39.60217983651226, + "grad_norm": 6.135962009429932, + "learning_rate": 1.375875415117002e-05, + "loss": 0.2129, + "step": 14534 + }, + { + "epoch": 39.60490463215259, + "grad_norm": 7.874301910400391, + "learning_rate": 1.375793635504793e-05, + "loss": 0.2667, + "step": 14535 + }, + { + "epoch": 39.607629427792915, + "grad_norm": 12.337894439697266, + "learning_rate": 1.3757118529659155e-05, + "loss": 0.3004, + "step": 14536 + }, + { + "epoch": 39.61035422343324, + "grad_norm": 5.171806812286377, + "learning_rate": 1.3756300675010064e-05, + "loss": 0.2465, + "step": 14537 + }, + { + "epoch": 39.61307901907357, + "grad_norm": 4.8838934898376465, + "learning_rate": 1.375548279110702e-05, + "loss": 0.243, + "step": 14538 + }, + { + "epoch": 39.6158038147139, + "grad_norm": 6.0601654052734375, + "learning_rate": 1.3754664877956401e-05, + "loss": 0.2417, + "step": 14539 + }, + { + "epoch": 39.618528610354225, + "grad_norm": 6.87872838973999, + "learning_rate": 1.375384693556457e-05, + "loss": 0.2371, + "step": 14540 + }, + { + "epoch": 39.62125340599455, + "grad_norm": 7.159520149230957, + "learning_rate": 1.3753028963937902e-05, + "loss": 0.2317, + "step": 14541 + }, + { + "epoch": 39.62397820163488, + "grad_norm": 6.424330711364746, + "learning_rate": 1.3752210963082764e-05, + "loss": 0.2436, + "step": 14542 + }, + { + "epoch": 39.6267029972752, + "grad_norm": 6.434669494628906, + "learning_rate": 1.375139293300553e-05, + "loss": 0.2291, + "step": 14543 + }, + { + "epoch": 39.62942779291553, + "grad_norm": 5.746603488922119, + "learning_rate": 1.3750574873712563e-05, + "loss": 0.2731, + "step": 14544 + }, + { + "epoch": 39.63215258855586, + "grad_norm": 6.475936412811279, + "learning_rate": 1.3749756785210245e-05, + "loss": 0.275, + "step": 14545 + }, + { + "epoch": 39.63487738419619, + "grad_norm": 6.085830211639404, + "learning_rate": 1.3748938667504938e-05, + "loss": 0.224, + "step": 14546 + }, + { + "epoch": 39.63760217983651, + "grad_norm": 9.126067161560059, + "learning_rate": 1.3748120520603022e-05, + "loss": 0.4167, + "step": 14547 + }, + { + "epoch": 39.64032697547684, + "grad_norm": 7.992452621459961, + "learning_rate": 1.374730234451086e-05, + "loss": 0.2461, + "step": 14548 + }, + { + "epoch": 39.643051771117165, + "grad_norm": 5.556773662567139, + "learning_rate": 1.374648413923483e-05, + "loss": 0.3287, + "step": 14549 + }, + { + "epoch": 39.64577656675749, + "grad_norm": 5.716811656951904, + "learning_rate": 1.37456659047813e-05, + "loss": 0.2177, + "step": 14550 + }, + { + "epoch": 39.64850136239782, + "grad_norm": 5.8144989013671875, + "learning_rate": 1.3744847641156649e-05, + "loss": 0.2023, + "step": 14551 + }, + { + "epoch": 39.65122615803815, + "grad_norm": 10.226764678955078, + "learning_rate": 1.3744029348367238e-05, + "loss": 0.2317, + "step": 14552 + }, + { + "epoch": 39.653950953678475, + "grad_norm": 5.7301859855651855, + "learning_rate": 1.3743211026419452e-05, + "loss": 0.2363, + "step": 14553 + }, + { + "epoch": 39.6566757493188, + "grad_norm": 8.517986297607422, + "learning_rate": 1.3742392675319657e-05, + "loss": 0.3702, + "step": 14554 + }, + { + "epoch": 39.65940054495913, + "grad_norm": 5.571247577667236, + "learning_rate": 1.3741574295074232e-05, + "loss": 0.4313, + "step": 14555 + }, + { + "epoch": 39.66212534059945, + "grad_norm": 5.858706474304199, + "learning_rate": 1.3740755885689541e-05, + "loss": 0.3682, + "step": 14556 + }, + { + "epoch": 39.664850136239785, + "grad_norm": 4.895678520202637, + "learning_rate": 1.373993744717197e-05, + "loss": 0.4425, + "step": 14557 + }, + { + "epoch": 39.66757493188011, + "grad_norm": 5.619413375854492, + "learning_rate": 1.3739118979527882e-05, + "loss": 0.2836, + "step": 14558 + }, + { + "epoch": 39.67029972752044, + "grad_norm": 5.4406046867370605, + "learning_rate": 1.3738300482763655e-05, + "loss": 0.2448, + "step": 14559 + }, + { + "epoch": 39.67302452316076, + "grad_norm": 4.460606575012207, + "learning_rate": 1.3737481956885668e-05, + "loss": 0.1949, + "step": 14560 + }, + { + "epoch": 39.67574931880109, + "grad_norm": 6.217899322509766, + "learning_rate": 1.3736663401900288e-05, + "loss": 0.2768, + "step": 14561 + }, + { + "epoch": 39.678474114441414, + "grad_norm": 5.351813793182373, + "learning_rate": 1.3735844817813895e-05, + "loss": 0.2784, + "step": 14562 + }, + { + "epoch": 39.68119891008175, + "grad_norm": 5.458523273468018, + "learning_rate": 1.3735026204632864e-05, + "loss": 0.2043, + "step": 14563 + }, + { + "epoch": 39.68392370572207, + "grad_norm": 5.464929103851318, + "learning_rate": 1.3734207562363568e-05, + "loss": 0.2792, + "step": 14564 + }, + { + "epoch": 39.6866485013624, + "grad_norm": 6.421558380126953, + "learning_rate": 1.3733388891012385e-05, + "loss": 0.2537, + "step": 14565 + }, + { + "epoch": 39.689373297002724, + "grad_norm": 6.545646667480469, + "learning_rate": 1.3732570190585689e-05, + "loss": 0.239, + "step": 14566 + }, + { + "epoch": 39.69209809264305, + "grad_norm": 6.9950432777404785, + "learning_rate": 1.3731751461089858e-05, + "loss": 0.2151, + "step": 14567 + }, + { + "epoch": 39.694822888283376, + "grad_norm": 6.908062934875488, + "learning_rate": 1.3730932702531261e-05, + "loss": 0.3112, + "step": 14568 + }, + { + "epoch": 39.69754768392371, + "grad_norm": 6.2741899490356445, + "learning_rate": 1.3730113914916285e-05, + "loss": 0.2596, + "step": 14569 + }, + { + "epoch": 39.700272479564035, + "grad_norm": 6.59345817565918, + "learning_rate": 1.37292950982513e-05, + "loss": 0.2039, + "step": 14570 + }, + { + "epoch": 39.70299727520436, + "grad_norm": 11.277990341186523, + "learning_rate": 1.3728476252542687e-05, + "loss": 0.2684, + "step": 14571 + }, + { + "epoch": 39.705722070844686, + "grad_norm": 8.434755325317383, + "learning_rate": 1.3727657377796816e-05, + "loss": 0.2751, + "step": 14572 + }, + { + "epoch": 39.70844686648501, + "grad_norm": 6.903609752655029, + "learning_rate": 1.3726838474020077e-05, + "loss": 0.238, + "step": 14573 + }, + { + "epoch": 39.71117166212534, + "grad_norm": 5.95989990234375, + "learning_rate": 1.3726019541218833e-05, + "loss": 0.2779, + "step": 14574 + }, + { + "epoch": 39.71389645776567, + "grad_norm": 6.068815231323242, + "learning_rate": 1.3725200579399474e-05, + "loss": 0.184, + "step": 14575 + }, + { + "epoch": 39.716621253406, + "grad_norm": 8.695172309875488, + "learning_rate": 1.372438158856837e-05, + "loss": 0.2631, + "step": 14576 + }, + { + "epoch": 39.71934604904632, + "grad_norm": 14.273383140563965, + "learning_rate": 1.3723562568731903e-05, + "loss": 0.2376, + "step": 14577 + }, + { + "epoch": 39.72207084468665, + "grad_norm": 7.18869686126709, + "learning_rate": 1.3722743519896447e-05, + "loss": 0.2187, + "step": 14578 + }, + { + "epoch": 39.724795640326974, + "grad_norm": 6.22044563293457, + "learning_rate": 1.3721924442068388e-05, + "loss": 0.1456, + "step": 14579 + }, + { + "epoch": 39.7275204359673, + "grad_norm": 6.530173301696777, + "learning_rate": 1.37211053352541e-05, + "loss": 0.2498, + "step": 14580 + }, + { + "epoch": 39.73024523160763, + "grad_norm": 6.607137680053711, + "learning_rate": 1.3720286199459967e-05, + "loss": 0.2833, + "step": 14581 + }, + { + "epoch": 39.73297002724796, + "grad_norm": 7.22041130065918, + "learning_rate": 1.371946703469236e-05, + "loss": 0.2257, + "step": 14582 + }, + { + "epoch": 39.735694822888284, + "grad_norm": 5.8552565574646, + "learning_rate": 1.3718647840957666e-05, + "loss": 0.2111, + "step": 14583 + }, + { + "epoch": 39.73841961852861, + "grad_norm": 6.913836479187012, + "learning_rate": 1.3717828618262261e-05, + "loss": 0.1929, + "step": 14584 + }, + { + "epoch": 39.741144414168936, + "grad_norm": 5.870815277099609, + "learning_rate": 1.3717009366612528e-05, + "loss": 0.1751, + "step": 14585 + }, + { + "epoch": 39.74386920980926, + "grad_norm": 6.600525379180908, + "learning_rate": 1.3716190086014844e-05, + "loss": 0.1993, + "step": 14586 + }, + { + "epoch": 39.746594005449595, + "grad_norm": 7.7413740158081055, + "learning_rate": 1.3715370776475591e-05, + "loss": 0.3372, + "step": 14587 + }, + { + "epoch": 39.74931880108992, + "grad_norm": 7.063012599945068, + "learning_rate": 1.3714551438001149e-05, + "loss": 0.2917, + "step": 14588 + }, + { + "epoch": 39.752043596730246, + "grad_norm": 8.96944522857666, + "learning_rate": 1.3713732070597902e-05, + "loss": 0.3526, + "step": 14589 + }, + { + "epoch": 39.75476839237057, + "grad_norm": 6.1891560554504395, + "learning_rate": 1.371291267427223e-05, + "loss": 0.2988, + "step": 14590 + }, + { + "epoch": 39.7574931880109, + "grad_norm": 10.691773414611816, + "learning_rate": 1.3712093249030513e-05, + "loss": 0.2568, + "step": 14591 + }, + { + "epoch": 39.76021798365122, + "grad_norm": 6.2613935470581055, + "learning_rate": 1.3711273794879131e-05, + "loss": 0.2761, + "step": 14592 + }, + { + "epoch": 39.762942779291556, + "grad_norm": 6.848296165466309, + "learning_rate": 1.3710454311824472e-05, + "loss": 0.2192, + "step": 14593 + }, + { + "epoch": 39.76566757493188, + "grad_norm": 8.631440162658691, + "learning_rate": 1.370963479987291e-05, + "loss": 0.278, + "step": 14594 + }, + { + "epoch": 39.76839237057221, + "grad_norm": 8.44626235961914, + "learning_rate": 1.3708815259030835e-05, + "loss": 0.2311, + "step": 14595 + }, + { + "epoch": 39.771117166212534, + "grad_norm": 5.785213470458984, + "learning_rate": 1.3707995689304626e-05, + "loss": 0.3227, + "step": 14596 + }, + { + "epoch": 39.77384196185286, + "grad_norm": 7.679196357727051, + "learning_rate": 1.3707176090700662e-05, + "loss": 0.3581, + "step": 14597 + }, + { + "epoch": 39.776566757493185, + "grad_norm": 7.344898223876953, + "learning_rate": 1.3706356463225332e-05, + "loss": 0.4623, + "step": 14598 + }, + { + "epoch": 39.77929155313352, + "grad_norm": 6.047147274017334, + "learning_rate": 1.3705536806885018e-05, + "loss": 0.2981, + "step": 14599 + }, + { + "epoch": 39.782016348773844, + "grad_norm": 4.970607280731201, + "learning_rate": 1.3704717121686103e-05, + "loss": 0.1991, + "step": 14600 + }, + { + "epoch": 39.78474114441417, + "grad_norm": 6.093405246734619, + "learning_rate": 1.3703897407634971e-05, + "loss": 0.5023, + "step": 14601 + }, + { + "epoch": 39.787465940054496, + "grad_norm": 6.924727916717529, + "learning_rate": 1.3703077664738002e-05, + "loss": 0.273, + "step": 14602 + }, + { + "epoch": 39.79019073569482, + "grad_norm": 5.4926228523254395, + "learning_rate": 1.3702257893001588e-05, + "loss": 0.2254, + "step": 14603 + }, + { + "epoch": 39.79291553133515, + "grad_norm": 6.771979331970215, + "learning_rate": 1.3701438092432104e-05, + "loss": 0.1754, + "step": 14604 + }, + { + "epoch": 39.79564032697548, + "grad_norm": 6.45460319519043, + "learning_rate": 1.3700618263035941e-05, + "loss": 0.2474, + "step": 14605 + }, + { + "epoch": 39.798365122615806, + "grad_norm": 7.092337608337402, + "learning_rate": 1.3699798404819485e-05, + "loss": 0.3309, + "step": 14606 + }, + { + "epoch": 39.80108991825613, + "grad_norm": 5.740354537963867, + "learning_rate": 1.3698978517789112e-05, + "loss": 0.1925, + "step": 14607 + }, + { + "epoch": 39.80381471389646, + "grad_norm": 5.312353610992432, + "learning_rate": 1.3698158601951217e-05, + "loss": 0.3696, + "step": 14608 + }, + { + "epoch": 39.80653950953678, + "grad_norm": 6.3158063888549805, + "learning_rate": 1.3697338657312183e-05, + "loss": 0.3152, + "step": 14609 + }, + { + "epoch": 39.80926430517711, + "grad_norm": 5.625290870666504, + "learning_rate": 1.3696518683878392e-05, + "loss": 0.1586, + "step": 14610 + }, + { + "epoch": 39.81198910081744, + "grad_norm": 10.652303695678711, + "learning_rate": 1.3695698681656233e-05, + "loss": 0.2413, + "step": 14611 + }, + { + "epoch": 39.81471389645777, + "grad_norm": 6.256007194519043, + "learning_rate": 1.3694878650652092e-05, + "loss": 0.2786, + "step": 14612 + }, + { + "epoch": 39.817438692098094, + "grad_norm": 4.749094486236572, + "learning_rate": 1.3694058590872354e-05, + "loss": 0.185, + "step": 14613 + }, + { + "epoch": 39.82016348773842, + "grad_norm": 6.310389518737793, + "learning_rate": 1.369323850232341e-05, + "loss": 0.4304, + "step": 14614 + }, + { + "epoch": 39.822888283378745, + "grad_norm": 6.497410297393799, + "learning_rate": 1.3692418385011639e-05, + "loss": 0.2418, + "step": 14615 + }, + { + "epoch": 39.82561307901907, + "grad_norm": 7.917486667633057, + "learning_rate": 1.3691598238943438e-05, + "loss": 0.3297, + "step": 14616 + }, + { + "epoch": 39.828337874659404, + "grad_norm": 6.416966438293457, + "learning_rate": 1.3690778064125182e-05, + "loss": 0.2968, + "step": 14617 + }, + { + "epoch": 39.83106267029973, + "grad_norm": 5.088503837585449, + "learning_rate": 1.368995786056327e-05, + "loss": 0.5073, + "step": 14618 + }, + { + "epoch": 39.833787465940055, + "grad_norm": 6.163337707519531, + "learning_rate": 1.3689137628264085e-05, + "loss": 0.2898, + "step": 14619 + }, + { + "epoch": 39.83651226158038, + "grad_norm": 4.374394416809082, + "learning_rate": 1.368831736723401e-05, + "loss": 0.2234, + "step": 14620 + }, + { + "epoch": 39.83923705722071, + "grad_norm": 6.270904064178467, + "learning_rate": 1.3687497077479441e-05, + "loss": 0.1773, + "step": 14621 + }, + { + "epoch": 39.84196185286103, + "grad_norm": 5.866994857788086, + "learning_rate": 1.3686676759006764e-05, + "loss": 0.3527, + "step": 14622 + }, + { + "epoch": 39.844686648501366, + "grad_norm": 5.5044426918029785, + "learning_rate": 1.3685856411822367e-05, + "loss": 0.3417, + "step": 14623 + }, + { + "epoch": 39.84741144414169, + "grad_norm": 5.12974214553833, + "learning_rate": 1.3685036035932639e-05, + "loss": 0.165, + "step": 14624 + }, + { + "epoch": 39.85013623978202, + "grad_norm": 6.531769752502441, + "learning_rate": 1.3684215631343969e-05, + "loss": 0.2958, + "step": 14625 + }, + { + "epoch": 39.85286103542234, + "grad_norm": 18.12469482421875, + "learning_rate": 1.3683395198062747e-05, + "loss": 0.4338, + "step": 14626 + }, + { + "epoch": 39.85558583106267, + "grad_norm": 5.587963581085205, + "learning_rate": 1.368257473609536e-05, + "loss": 0.3274, + "step": 14627 + }, + { + "epoch": 39.858310626702995, + "grad_norm": 6.947348117828369, + "learning_rate": 1.3681754245448202e-05, + "loss": 0.2568, + "step": 14628 + }, + { + "epoch": 39.86103542234333, + "grad_norm": 6.23321008682251, + "learning_rate": 1.3680933726127656e-05, + "loss": 0.286, + "step": 14629 + }, + { + "epoch": 39.86376021798365, + "grad_norm": 4.902149200439453, + "learning_rate": 1.368011317814012e-05, + "loss": 0.2003, + "step": 14630 + }, + { + "epoch": 39.86648501362398, + "grad_norm": 7.079772472381592, + "learning_rate": 1.367929260149198e-05, + "loss": 0.3779, + "step": 14631 + }, + { + "epoch": 39.869209809264305, + "grad_norm": 5.892935276031494, + "learning_rate": 1.3678471996189629e-05, + "loss": 0.2592, + "step": 14632 + }, + { + "epoch": 39.87193460490463, + "grad_norm": 5.965717315673828, + "learning_rate": 1.3677651362239454e-05, + "loss": 0.2357, + "step": 14633 + }, + { + "epoch": 39.87465940054496, + "grad_norm": 6.772895336151123, + "learning_rate": 1.3676830699647852e-05, + "loss": 0.1866, + "step": 14634 + }, + { + "epoch": 39.87738419618529, + "grad_norm": 6.63701057434082, + "learning_rate": 1.3676010008421208e-05, + "loss": 0.2314, + "step": 14635 + }, + { + "epoch": 39.880108991825615, + "grad_norm": 4.581226825714111, + "learning_rate": 1.3675189288565918e-05, + "loss": 0.2225, + "step": 14636 + }, + { + "epoch": 39.88283378746594, + "grad_norm": 4.762144088745117, + "learning_rate": 1.367436854008837e-05, + "loss": 0.322, + "step": 14637 + }, + { + "epoch": 39.88555858310627, + "grad_norm": 5.054895401000977, + "learning_rate": 1.3673547762994959e-05, + "loss": 0.2633, + "step": 14638 + }, + { + "epoch": 39.88828337874659, + "grad_norm": 4.342443466186523, + "learning_rate": 1.3672726957292075e-05, + "loss": 0.306, + "step": 14639 + }, + { + "epoch": 39.89100817438692, + "grad_norm": 4.6823272705078125, + "learning_rate": 1.3671906122986114e-05, + "loss": 0.4968, + "step": 14640 + }, + { + "epoch": 39.89373297002725, + "grad_norm": 6.215219974517822, + "learning_rate": 1.3671085260083465e-05, + "loss": 0.1587, + "step": 14641 + }, + { + "epoch": 39.89645776566758, + "grad_norm": 6.84375524520874, + "learning_rate": 1.3670264368590524e-05, + "loss": 0.2072, + "step": 14642 + }, + { + "epoch": 39.8991825613079, + "grad_norm": 5.9075727462768555, + "learning_rate": 1.3669443448513679e-05, + "loss": 0.316, + "step": 14643 + }, + { + "epoch": 39.90190735694823, + "grad_norm": 7.016509532928467, + "learning_rate": 1.366862249985933e-05, + "loss": 0.3074, + "step": 14644 + }, + { + "epoch": 39.904632152588555, + "grad_norm": 5.5128254890441895, + "learning_rate": 1.3667801522633866e-05, + "loss": 0.1993, + "step": 14645 + }, + { + "epoch": 39.90735694822888, + "grad_norm": 6.173662185668945, + "learning_rate": 1.3666980516843682e-05, + "loss": 0.2124, + "step": 14646 + }, + { + "epoch": 39.91008174386921, + "grad_norm": 5.529973983764648, + "learning_rate": 1.3666159482495167e-05, + "loss": 0.2811, + "step": 14647 + }, + { + "epoch": 39.91280653950954, + "grad_norm": 5.944946765899658, + "learning_rate": 1.3665338419594725e-05, + "loss": 0.1991, + "step": 14648 + }, + { + "epoch": 39.915531335149865, + "grad_norm": 4.5183820724487305, + "learning_rate": 1.3664517328148744e-05, + "loss": 0.2014, + "step": 14649 + }, + { + "epoch": 39.91825613079019, + "grad_norm": 6.031014919281006, + "learning_rate": 1.3663696208163622e-05, + "loss": 0.2306, + "step": 14650 + }, + { + "epoch": 39.920980926430516, + "grad_norm": 5.391735076904297, + "learning_rate": 1.366287505964575e-05, + "loss": 0.4026, + "step": 14651 + }, + { + "epoch": 39.92370572207084, + "grad_norm": 5.912613391876221, + "learning_rate": 1.3662053882601525e-05, + "loss": 0.2459, + "step": 14652 + }, + { + "epoch": 39.926430517711175, + "grad_norm": 6.257481098175049, + "learning_rate": 1.3661232677037341e-05, + "loss": 0.3528, + "step": 14653 + }, + { + "epoch": 39.9291553133515, + "grad_norm": 5.020956993103027, + "learning_rate": 1.3660411442959597e-05, + "loss": 0.2401, + "step": 14654 + }, + { + "epoch": 39.93188010899183, + "grad_norm": 5.578127384185791, + "learning_rate": 1.3659590180374685e-05, + "loss": 0.1824, + "step": 14655 + }, + { + "epoch": 39.93460490463215, + "grad_norm": 7.9125494956970215, + "learning_rate": 1.3658768889289003e-05, + "loss": 0.2713, + "step": 14656 + }, + { + "epoch": 39.93732970027248, + "grad_norm": 4.773212432861328, + "learning_rate": 1.3657947569708946e-05, + "loss": 0.2169, + "step": 14657 + }, + { + "epoch": 39.940054495912804, + "grad_norm": 5.907552719116211, + "learning_rate": 1.3657126221640914e-05, + "loss": 0.2264, + "step": 14658 + }, + { + "epoch": 39.94277929155314, + "grad_norm": 5.584198474884033, + "learning_rate": 1.3656304845091298e-05, + "loss": 0.3464, + "step": 14659 + }, + { + "epoch": 39.94550408719346, + "grad_norm": 6.994326591491699, + "learning_rate": 1.3655483440066496e-05, + "loss": 0.3241, + "step": 14660 + }, + { + "epoch": 39.94822888283379, + "grad_norm": 5.74834680557251, + "learning_rate": 1.3654662006572909e-05, + "loss": 0.3925, + "step": 14661 + }, + { + "epoch": 39.950953678474114, + "grad_norm": 5.148861885070801, + "learning_rate": 1.3653840544616932e-05, + "loss": 0.2659, + "step": 14662 + }, + { + "epoch": 39.95367847411444, + "grad_norm": 8.553078651428223, + "learning_rate": 1.3653019054204962e-05, + "loss": 0.2401, + "step": 14663 + }, + { + "epoch": 39.956403269754766, + "grad_norm": 5.828797817230225, + "learning_rate": 1.3652197535343396e-05, + "loss": 0.2697, + "step": 14664 + }, + { + "epoch": 39.95912806539509, + "grad_norm": 4.388965606689453, + "learning_rate": 1.3651375988038633e-05, + "loss": 0.1892, + "step": 14665 + }, + { + "epoch": 39.961852861035425, + "grad_norm": 7.490252494812012, + "learning_rate": 1.3650554412297075e-05, + "loss": 0.193, + "step": 14666 + }, + { + "epoch": 39.96457765667575, + "grad_norm": 6.492657661437988, + "learning_rate": 1.3649732808125114e-05, + "loss": 0.3375, + "step": 14667 + }, + { + "epoch": 39.967302452316076, + "grad_norm": 9.734619140625, + "learning_rate": 1.3648911175529151e-05, + "loss": 0.3243, + "step": 14668 + }, + { + "epoch": 39.9700272479564, + "grad_norm": 6.138456344604492, + "learning_rate": 1.3648089514515585e-05, + "loss": 0.2633, + "step": 14669 + }, + { + "epoch": 39.97275204359673, + "grad_norm": 6.453230381011963, + "learning_rate": 1.3647267825090818e-05, + "loss": 0.2957, + "step": 14670 + }, + { + "epoch": 39.97547683923706, + "grad_norm": 6.128805637359619, + "learning_rate": 1.3646446107261244e-05, + "loss": 0.2565, + "step": 14671 + }, + { + "epoch": 39.97820163487739, + "grad_norm": 5.4172139167785645, + "learning_rate": 1.3645624361033268e-05, + "loss": 0.1973, + "step": 14672 + }, + { + "epoch": 39.98092643051771, + "grad_norm": 5.549086093902588, + "learning_rate": 1.364480258641328e-05, + "loss": 0.2594, + "step": 14673 + }, + { + "epoch": 39.98365122615804, + "grad_norm": 5.352941989898682, + "learning_rate": 1.3643980783407693e-05, + "loss": 0.3738, + "step": 14674 + }, + { + "epoch": 39.986376021798364, + "grad_norm": 8.064535140991211, + "learning_rate": 1.36431589520229e-05, + "loss": 0.2649, + "step": 14675 + }, + { + "epoch": 39.98910081743869, + "grad_norm": 5.839471340179443, + "learning_rate": 1.3642337092265301e-05, + "loss": 0.2395, + "step": 14676 + }, + { + "epoch": 39.991825613079016, + "grad_norm": 5.32957124710083, + "learning_rate": 1.3641515204141297e-05, + "loss": 0.1831, + "step": 14677 + }, + { + "epoch": 39.99455040871935, + "grad_norm": 6.660703182220459, + "learning_rate": 1.3640693287657294e-05, + "loss": 0.2849, + "step": 14678 + }, + { + "epoch": 39.997275204359674, + "grad_norm": 5.129420757293701, + "learning_rate": 1.3639871342819686e-05, + "loss": 0.3918, + "step": 14679 + }, + { + "epoch": 40.0, + "grad_norm": 5.764123439788818, + "learning_rate": 1.3639049369634878e-05, + "loss": 0.2851, + "step": 14680 + }, + { + "epoch": 40.002724795640326, + "grad_norm": 4.670469760894775, + "learning_rate": 1.3638227368109268e-05, + "loss": 0.2391, + "step": 14681 + }, + { + "epoch": 40.00544959128065, + "grad_norm": 4.787637233734131, + "learning_rate": 1.3637405338249261e-05, + "loss": 0.1769, + "step": 14682 + }, + { + "epoch": 40.00817438692098, + "grad_norm": 4.994102478027344, + "learning_rate": 1.3636583280061262e-05, + "loss": 0.353, + "step": 14683 + }, + { + "epoch": 40.01089918256131, + "grad_norm": 5.163061618804932, + "learning_rate": 1.3635761193551666e-05, + "loss": 0.2016, + "step": 14684 + }, + { + "epoch": 40.013623978201636, + "grad_norm": 5.797138214111328, + "learning_rate": 1.3634939078726878e-05, + "loss": 0.3666, + "step": 14685 + }, + { + "epoch": 40.01634877384196, + "grad_norm": 5.63509464263916, + "learning_rate": 1.3634116935593307e-05, + "loss": 0.4189, + "step": 14686 + }, + { + "epoch": 40.01907356948229, + "grad_norm": 7.220623970031738, + "learning_rate": 1.3633294764157344e-05, + "loss": 0.3734, + "step": 14687 + }, + { + "epoch": 40.02179836512261, + "grad_norm": 20.821069717407227, + "learning_rate": 1.3632472564425402e-05, + "loss": 0.2023, + "step": 14688 + }, + { + "epoch": 40.02452316076294, + "grad_norm": 6.66929292678833, + "learning_rate": 1.3631650336403879e-05, + "loss": 0.2946, + "step": 14689 + }, + { + "epoch": 40.02724795640327, + "grad_norm": 5.437743663787842, + "learning_rate": 1.3630828080099181e-05, + "loss": 0.1693, + "step": 14690 + }, + { + "epoch": 40.0299727520436, + "grad_norm": 4.195618152618408, + "learning_rate": 1.3630005795517712e-05, + "loss": 0.1515, + "step": 14691 + }, + { + "epoch": 40.032697547683924, + "grad_norm": 6.934732913970947, + "learning_rate": 1.362918348266587e-05, + "loss": 0.2677, + "step": 14692 + }, + { + "epoch": 40.03542234332425, + "grad_norm": 5.9340996742248535, + "learning_rate": 1.3628361141550068e-05, + "loss": 0.2761, + "step": 14693 + }, + { + "epoch": 40.038147138964575, + "grad_norm": 9.502779960632324, + "learning_rate": 1.3627538772176705e-05, + "loss": 0.3185, + "step": 14694 + }, + { + "epoch": 40.0408719346049, + "grad_norm": 5.000411510467529, + "learning_rate": 1.3626716374552187e-05, + "loss": 0.1497, + "step": 14695 + }, + { + "epoch": 40.043596730245234, + "grad_norm": 5.282544136047363, + "learning_rate": 1.3625893948682919e-05, + "loss": 0.266, + "step": 14696 + }, + { + "epoch": 40.04632152588556, + "grad_norm": 5.492834091186523, + "learning_rate": 1.3625071494575304e-05, + "loss": 0.1529, + "step": 14697 + }, + { + "epoch": 40.049046321525886, + "grad_norm": 4.832657337188721, + "learning_rate": 1.3624249012235748e-05, + "loss": 0.1769, + "step": 14698 + }, + { + "epoch": 40.05177111716621, + "grad_norm": 5.096675872802734, + "learning_rate": 1.3623426501670662e-05, + "loss": 0.2924, + "step": 14699 + }, + { + "epoch": 40.05449591280654, + "grad_norm": 5.773919582366943, + "learning_rate": 1.3622603962886443e-05, + "loss": 0.2339, + "step": 14700 + }, + { + "epoch": 40.05722070844686, + "grad_norm": 8.40015697479248, + "learning_rate": 1.3621781395889503e-05, + "loss": 0.3245, + "step": 14701 + }, + { + "epoch": 40.059945504087196, + "grad_norm": 6.444672107696533, + "learning_rate": 1.3620958800686246e-05, + "loss": 0.3568, + "step": 14702 + }, + { + "epoch": 40.06267029972752, + "grad_norm": 5.762142181396484, + "learning_rate": 1.3620136177283078e-05, + "loss": 0.1714, + "step": 14703 + }, + { + "epoch": 40.06539509536785, + "grad_norm": 11.245086669921875, + "learning_rate": 1.3619313525686407e-05, + "loss": 0.2463, + "step": 14704 + }, + { + "epoch": 40.06811989100817, + "grad_norm": 4.8663411140441895, + "learning_rate": 1.3618490845902637e-05, + "loss": 0.1648, + "step": 14705 + }, + { + "epoch": 40.0708446866485, + "grad_norm": 4.974968433380127, + "learning_rate": 1.3617668137938176e-05, + "loss": 0.3024, + "step": 14706 + }, + { + "epoch": 40.073569482288825, + "grad_norm": 4.860438346862793, + "learning_rate": 1.3616845401799433e-05, + "loss": 0.2716, + "step": 14707 + }, + { + "epoch": 40.07629427792916, + "grad_norm": 5.657793998718262, + "learning_rate": 1.3616022637492814e-05, + "loss": 0.2576, + "step": 14708 + }, + { + "epoch": 40.079019073569484, + "grad_norm": 17.060792922973633, + "learning_rate": 1.3615199845024729e-05, + "loss": 0.2642, + "step": 14709 + }, + { + "epoch": 40.08174386920981, + "grad_norm": 4.534100532531738, + "learning_rate": 1.3614377024401581e-05, + "loss": 0.3705, + "step": 14710 + }, + { + "epoch": 40.084468664850135, + "grad_norm": 5.813042640686035, + "learning_rate": 1.3613554175629783e-05, + "loss": 0.2808, + "step": 14711 + }, + { + "epoch": 40.08719346049046, + "grad_norm": 5.779947280883789, + "learning_rate": 1.3612731298715743e-05, + "loss": 0.2162, + "step": 14712 + }, + { + "epoch": 40.08991825613079, + "grad_norm": 5.839858055114746, + "learning_rate": 1.3611908393665866e-05, + "loss": 0.3207, + "step": 14713 + }, + { + "epoch": 40.09264305177112, + "grad_norm": 7.131965637207031, + "learning_rate": 1.3611085460486561e-05, + "loss": 0.1586, + "step": 14714 + }, + { + "epoch": 40.095367847411445, + "grad_norm": 5.477025032043457, + "learning_rate": 1.3610262499184241e-05, + "loss": 0.2087, + "step": 14715 + }, + { + "epoch": 40.09809264305177, + "grad_norm": 8.843849182128906, + "learning_rate": 1.360943950976531e-05, + "loss": 0.2567, + "step": 14716 + }, + { + "epoch": 40.1008174386921, + "grad_norm": 5.079222679138184, + "learning_rate": 1.3608616492236185e-05, + "loss": 0.2525, + "step": 14717 + }, + { + "epoch": 40.10354223433242, + "grad_norm": 5.357724666595459, + "learning_rate": 1.3607793446603266e-05, + "loss": 0.3328, + "step": 14718 + }, + { + "epoch": 40.10626702997275, + "grad_norm": 5.058252334594727, + "learning_rate": 1.3606970372872972e-05, + "loss": 0.2778, + "step": 14719 + }, + { + "epoch": 40.10899182561308, + "grad_norm": 6.287322044372559, + "learning_rate": 1.3606147271051706e-05, + "loss": 0.1813, + "step": 14720 + }, + { + "epoch": 40.11171662125341, + "grad_norm": 5.835550308227539, + "learning_rate": 1.3605324141145883e-05, + "loss": 0.2213, + "step": 14721 + }, + { + "epoch": 40.11444141689373, + "grad_norm": 6.14241886138916, + "learning_rate": 1.3604500983161911e-05, + "loss": 0.2883, + "step": 14722 + }, + { + "epoch": 40.11716621253406, + "grad_norm": 5.560632228851318, + "learning_rate": 1.36036777971062e-05, + "loss": 0.2858, + "step": 14723 + }, + { + "epoch": 40.119891008174385, + "grad_norm": 5.573838233947754, + "learning_rate": 1.3602854582985163e-05, + "loss": 0.3586, + "step": 14724 + }, + { + "epoch": 40.12261580381471, + "grad_norm": 6.711114406585693, + "learning_rate": 1.360203134080521e-05, + "loss": 0.2218, + "step": 14725 + }, + { + "epoch": 40.12534059945504, + "grad_norm": 7.186511993408203, + "learning_rate": 1.3601208070572754e-05, + "loss": 0.2581, + "step": 14726 + }, + { + "epoch": 40.12806539509537, + "grad_norm": 9.657685279846191, + "learning_rate": 1.3600384772294206e-05, + "loss": 0.3543, + "step": 14727 + }, + { + "epoch": 40.130790190735695, + "grad_norm": 4.581483840942383, + "learning_rate": 1.3599561445975975e-05, + "loss": 0.347, + "step": 14728 + }, + { + "epoch": 40.13351498637602, + "grad_norm": 6.904247283935547, + "learning_rate": 1.3598738091624477e-05, + "loss": 0.2191, + "step": 14729 + }, + { + "epoch": 40.13623978201635, + "grad_norm": 5.889281749725342, + "learning_rate": 1.3597914709246122e-05, + "loss": 0.2881, + "step": 14730 + }, + { + "epoch": 40.13896457765667, + "grad_norm": 5.417539596557617, + "learning_rate": 1.3597091298847325e-05, + "loss": 0.2457, + "step": 14731 + }, + { + "epoch": 40.141689373297005, + "grad_norm": 6.106906414031982, + "learning_rate": 1.3596267860434496e-05, + "loss": 0.281, + "step": 14732 + }, + { + "epoch": 40.14441416893733, + "grad_norm": 5.275127410888672, + "learning_rate": 1.3595444394014046e-05, + "loss": 0.2599, + "step": 14733 + }, + { + "epoch": 40.14713896457766, + "grad_norm": 7.4308319091796875, + "learning_rate": 1.359462089959239e-05, + "loss": 0.216, + "step": 14734 + }, + { + "epoch": 40.14986376021798, + "grad_norm": 4.960119247436523, + "learning_rate": 1.3593797377175949e-05, + "loss": 0.3427, + "step": 14735 + }, + { + "epoch": 40.15258855585831, + "grad_norm": 5.1894636154174805, + "learning_rate": 1.3592973826771123e-05, + "loss": 0.2075, + "step": 14736 + }, + { + "epoch": 40.155313351498634, + "grad_norm": 6.531680583953857, + "learning_rate": 1.3592150248384334e-05, + "loss": 0.4168, + "step": 14737 + }, + { + "epoch": 40.15803814713897, + "grad_norm": 4.947193145751953, + "learning_rate": 1.3591326642021996e-05, + "loss": 0.229, + "step": 14738 + }, + { + "epoch": 40.16076294277929, + "grad_norm": 7.752299785614014, + "learning_rate": 1.3590503007690523e-05, + "loss": 0.333, + "step": 14739 + }, + { + "epoch": 40.16348773841962, + "grad_norm": 5.813737869262695, + "learning_rate": 1.3589679345396323e-05, + "loss": 0.1799, + "step": 14740 + }, + { + "epoch": 40.166212534059945, + "grad_norm": 4.673559188842773, + "learning_rate": 1.3588855655145819e-05, + "loss": 0.2692, + "step": 14741 + }, + { + "epoch": 40.16893732970027, + "grad_norm": 5.340415000915527, + "learning_rate": 1.3588031936945423e-05, + "loss": 0.3775, + "step": 14742 + }, + { + "epoch": 40.171662125340596, + "grad_norm": 5.528367519378662, + "learning_rate": 1.3587208190801549e-05, + "loss": 0.2867, + "step": 14743 + }, + { + "epoch": 40.17438692098093, + "grad_norm": 5.196868896484375, + "learning_rate": 1.3586384416720612e-05, + "loss": 0.167, + "step": 14744 + }, + { + "epoch": 40.177111716621255, + "grad_norm": 5.872586250305176, + "learning_rate": 1.3585560614709033e-05, + "loss": 0.1531, + "step": 14745 + }, + { + "epoch": 40.17983651226158, + "grad_norm": 7.798600196838379, + "learning_rate": 1.3584736784773218e-05, + "loss": 0.2896, + "step": 14746 + }, + { + "epoch": 40.182561307901906, + "grad_norm": 6.427639007568359, + "learning_rate": 1.3583912926919594e-05, + "loss": 0.1616, + "step": 14747 + }, + { + "epoch": 40.18528610354223, + "grad_norm": 5.750645637512207, + "learning_rate": 1.3583089041154565e-05, + "loss": 0.3266, + "step": 14748 + }, + { + "epoch": 40.18801089918256, + "grad_norm": 5.34175968170166, + "learning_rate": 1.358226512748456e-05, + "loss": 0.1887, + "step": 14749 + }, + { + "epoch": 40.19073569482289, + "grad_norm": 6.367232322692871, + "learning_rate": 1.3581441185915982e-05, + "loss": 0.1972, + "step": 14750 + }, + { + "epoch": 40.19346049046322, + "grad_norm": 5.012624263763428, + "learning_rate": 1.3580617216455261e-05, + "loss": 0.1836, + "step": 14751 + }, + { + "epoch": 40.19618528610354, + "grad_norm": 5.424821376800537, + "learning_rate": 1.3579793219108805e-05, + "loss": 0.2442, + "step": 14752 + }, + { + "epoch": 40.19891008174387, + "grad_norm": 5.797748565673828, + "learning_rate": 1.3578969193883038e-05, + "loss": 0.3721, + "step": 14753 + }, + { + "epoch": 40.201634877384194, + "grad_norm": 7.14633321762085, + "learning_rate": 1.3578145140784373e-05, + "loss": 0.3064, + "step": 14754 + }, + { + "epoch": 40.20435967302452, + "grad_norm": 5.756343364715576, + "learning_rate": 1.3577321059819229e-05, + "loss": 0.2394, + "step": 14755 + }, + { + "epoch": 40.20708446866485, + "grad_norm": 6.218676567077637, + "learning_rate": 1.3576496950994022e-05, + "loss": 0.1745, + "step": 14756 + }, + { + "epoch": 40.20980926430518, + "grad_norm": 7.166897296905518, + "learning_rate": 1.3575672814315174e-05, + "loss": 0.2559, + "step": 14757 + }, + { + "epoch": 40.212534059945504, + "grad_norm": 6.445605754852295, + "learning_rate": 1.3574848649789102e-05, + "loss": 0.1658, + "step": 14758 + }, + { + "epoch": 40.21525885558583, + "grad_norm": 5.106618881225586, + "learning_rate": 1.357402445742222e-05, + "loss": 0.3415, + "step": 14759 + }, + { + "epoch": 40.217983651226156, + "grad_norm": 5.6757965087890625, + "learning_rate": 1.3573200237220951e-05, + "loss": 0.2629, + "step": 14760 + }, + { + "epoch": 40.22070844686648, + "grad_norm": 6.836151599884033, + "learning_rate": 1.3572375989191717e-05, + "loss": 0.2822, + "step": 14761 + }, + { + "epoch": 40.223433242506815, + "grad_norm": 4.928470134735107, + "learning_rate": 1.3571551713340931e-05, + "loss": 0.3333, + "step": 14762 + }, + { + "epoch": 40.22615803814714, + "grad_norm": 4.809662818908691, + "learning_rate": 1.3570727409675018e-05, + "loss": 0.1796, + "step": 14763 + }, + { + "epoch": 40.228882833787466, + "grad_norm": 6.912206172943115, + "learning_rate": 1.3569903078200393e-05, + "loss": 0.1788, + "step": 14764 + }, + { + "epoch": 40.23160762942779, + "grad_norm": 5.686048984527588, + "learning_rate": 1.3569078718923478e-05, + "loss": 0.1935, + "step": 14765 + }, + { + "epoch": 40.23433242506812, + "grad_norm": 6.835017681121826, + "learning_rate": 1.3568254331850693e-05, + "loss": 0.1676, + "step": 14766 + }, + { + "epoch": 40.237057220708444, + "grad_norm": 6.015300750732422, + "learning_rate": 1.3567429916988457e-05, + "loss": 0.2258, + "step": 14767 + }, + { + "epoch": 40.23978201634878, + "grad_norm": 26.15471076965332, + "learning_rate": 1.3566605474343192e-05, + "loss": 0.2457, + "step": 14768 + }, + { + "epoch": 40.2425068119891, + "grad_norm": 5.850229740142822, + "learning_rate": 1.3565781003921318e-05, + "loss": 0.2355, + "step": 14769 + }, + { + "epoch": 40.24523160762943, + "grad_norm": 4.393250942230225, + "learning_rate": 1.3564956505729259e-05, + "loss": 0.3133, + "step": 14770 + }, + { + "epoch": 40.247956403269754, + "grad_norm": 5.310056686401367, + "learning_rate": 1.356413197977343e-05, + "loss": 0.1958, + "step": 14771 + }, + { + "epoch": 40.25068119891008, + "grad_norm": 6.719603538513184, + "learning_rate": 1.3563307426060258e-05, + "loss": 0.2014, + "step": 14772 + }, + { + "epoch": 40.253405994550405, + "grad_norm": 6.757342338562012, + "learning_rate": 1.3562482844596164e-05, + "loss": 0.2555, + "step": 14773 + }, + { + "epoch": 40.25613079019074, + "grad_norm": 4.700272560119629, + "learning_rate": 1.3561658235387562e-05, + "loss": 0.3251, + "step": 14774 + }, + { + "epoch": 40.258855585831064, + "grad_norm": 5.600427150726318, + "learning_rate": 1.3560833598440887e-05, + "loss": 0.1668, + "step": 14775 + }, + { + "epoch": 40.26158038147139, + "grad_norm": 7.44266939163208, + "learning_rate": 1.3560008933762552e-05, + "loss": 0.2774, + "step": 14776 + }, + { + "epoch": 40.264305177111716, + "grad_norm": 4.850956916809082, + "learning_rate": 1.355918424135898e-05, + "loss": 0.2892, + "step": 14777 + }, + { + "epoch": 40.26702997275204, + "grad_norm": 4.869438648223877, + "learning_rate": 1.35583595212366e-05, + "loss": 0.5064, + "step": 14778 + }, + { + "epoch": 40.26975476839237, + "grad_norm": 6.677958011627197, + "learning_rate": 1.3557534773401827e-05, + "loss": 0.3253, + "step": 14779 + }, + { + "epoch": 40.2724795640327, + "grad_norm": 6.601706504821777, + "learning_rate": 1.355670999786109e-05, + "loss": 0.2698, + "step": 14780 + }, + { + "epoch": 40.275204359673026, + "grad_norm": 4.455941677093506, + "learning_rate": 1.3555885194620806e-05, + "loss": 0.2024, + "step": 14781 + }, + { + "epoch": 40.27792915531335, + "grad_norm": 4.924816131591797, + "learning_rate": 1.3555060363687407e-05, + "loss": 0.1795, + "step": 14782 + }, + { + "epoch": 40.28065395095368, + "grad_norm": 6.3266119956970215, + "learning_rate": 1.355423550506731e-05, + "loss": 0.2472, + "step": 14783 + }, + { + "epoch": 40.283378746594, + "grad_norm": 6.0468549728393555, + "learning_rate": 1.3553410618766942e-05, + "loss": 0.2499, + "step": 14784 + }, + { + "epoch": 40.28610354223433, + "grad_norm": 4.959547519683838, + "learning_rate": 1.3552585704792724e-05, + "loss": 0.1743, + "step": 14785 + }, + { + "epoch": 40.28882833787466, + "grad_norm": 5.919888496398926, + "learning_rate": 1.3551760763151087e-05, + "loss": 0.2734, + "step": 14786 + }, + { + "epoch": 40.29155313351499, + "grad_norm": 6.15693998336792, + "learning_rate": 1.355093579384845e-05, + "loss": 0.2804, + "step": 14787 + }, + { + "epoch": 40.294277929155314, + "grad_norm": 6.691210746765137, + "learning_rate": 1.3550110796891241e-05, + "loss": 0.2145, + "step": 14788 + }, + { + "epoch": 40.29700272479564, + "grad_norm": 5.143745422363281, + "learning_rate": 1.3549285772285881e-05, + "loss": 0.2393, + "step": 14789 + }, + { + "epoch": 40.299727520435965, + "grad_norm": 7.448602199554443, + "learning_rate": 1.3548460720038798e-05, + "loss": 0.3274, + "step": 14790 + }, + { + "epoch": 40.30245231607629, + "grad_norm": 5.299944877624512, + "learning_rate": 1.3547635640156415e-05, + "loss": 0.1837, + "step": 14791 + }, + { + "epoch": 40.305177111716624, + "grad_norm": 6.9879679679870605, + "learning_rate": 1.3546810532645166e-05, + "loss": 0.2359, + "step": 14792 + }, + { + "epoch": 40.30790190735695, + "grad_norm": 5.754627227783203, + "learning_rate": 1.3545985397511464e-05, + "loss": 0.1475, + "step": 14793 + }, + { + "epoch": 40.310626702997276, + "grad_norm": 5.53333854675293, + "learning_rate": 1.3545160234761745e-05, + "loss": 0.1715, + "step": 14794 + }, + { + "epoch": 40.3133514986376, + "grad_norm": 7.198060989379883, + "learning_rate": 1.354433504440243e-05, + "loss": 0.2008, + "step": 14795 + }, + { + "epoch": 40.31607629427793, + "grad_norm": 6.643033027648926, + "learning_rate": 1.3543509826439951e-05, + "loss": 0.2318, + "step": 14796 + }, + { + "epoch": 40.31880108991825, + "grad_norm": 6.457057476043701, + "learning_rate": 1.3542684580880729e-05, + "loss": 0.3141, + "step": 14797 + }, + { + "epoch": 40.321525885558586, + "grad_norm": 5.512293815612793, + "learning_rate": 1.3541859307731198e-05, + "loss": 0.3023, + "step": 14798 + }, + { + "epoch": 40.32425068119891, + "grad_norm": 5.504129886627197, + "learning_rate": 1.3541034006997776e-05, + "loss": 0.1915, + "step": 14799 + }, + { + "epoch": 40.32697547683924, + "grad_norm": 6.146503925323486, + "learning_rate": 1.3540208678686897e-05, + "loss": 0.2172, + "step": 14800 + }, + { + "epoch": 40.32970027247956, + "grad_norm": 5.390168190002441, + "learning_rate": 1.3539383322804986e-05, + "loss": 0.1998, + "step": 14801 + }, + { + "epoch": 40.33242506811989, + "grad_norm": 5.944275379180908, + "learning_rate": 1.353855793935847e-05, + "loss": 0.3185, + "step": 14802 + }, + { + "epoch": 40.335149863760215, + "grad_norm": 6.440017223358154, + "learning_rate": 1.353773252835378e-05, + "loss": 0.245, + "step": 14803 + }, + { + "epoch": 40.33787465940055, + "grad_norm": 5.658210277557373, + "learning_rate": 1.3536907089797344e-05, + "loss": 0.1766, + "step": 14804 + }, + { + "epoch": 40.34059945504087, + "grad_norm": 6.608595371246338, + "learning_rate": 1.3536081623695588e-05, + "loss": 0.2682, + "step": 14805 + }, + { + "epoch": 40.3433242506812, + "grad_norm": 7.2391510009765625, + "learning_rate": 1.3535256130054943e-05, + "loss": 0.3797, + "step": 14806 + }, + { + "epoch": 40.346049046321525, + "grad_norm": 8.538012504577637, + "learning_rate": 1.3534430608881837e-05, + "loss": 0.229, + "step": 14807 + }, + { + "epoch": 40.34877384196185, + "grad_norm": 5.476230621337891, + "learning_rate": 1.35336050601827e-05, + "loss": 0.2702, + "step": 14808 + }, + { + "epoch": 40.35149863760218, + "grad_norm": 4.536299228668213, + "learning_rate": 1.353277948396396e-05, + "loss": 0.1606, + "step": 14809 + }, + { + "epoch": 40.35422343324251, + "grad_norm": 5.5461320877075195, + "learning_rate": 1.3531953880232044e-05, + "loss": 0.375, + "step": 14810 + }, + { + "epoch": 40.356948228882835, + "grad_norm": 5.543405532836914, + "learning_rate": 1.3531128248993388e-05, + "loss": 0.1926, + "step": 14811 + }, + { + "epoch": 40.35967302452316, + "grad_norm": 4.79237174987793, + "learning_rate": 1.353030259025442e-05, + "loss": 0.232, + "step": 14812 + }, + { + "epoch": 40.36239782016349, + "grad_norm": 4.4786200523376465, + "learning_rate": 1.3529476904021565e-05, + "loss": 0.1896, + "step": 14813 + }, + { + "epoch": 40.36512261580381, + "grad_norm": 5.660500526428223, + "learning_rate": 1.3528651190301263e-05, + "loss": 0.1839, + "step": 14814 + }, + { + "epoch": 40.36784741144414, + "grad_norm": 6.6640520095825195, + "learning_rate": 1.3527825449099936e-05, + "loss": 0.3246, + "step": 14815 + }, + { + "epoch": 40.37057220708447, + "grad_norm": 4.925924777984619, + "learning_rate": 1.3526999680424018e-05, + "loss": 0.2152, + "step": 14816 + }, + { + "epoch": 40.3732970027248, + "grad_norm": 6.950525283813477, + "learning_rate": 1.352617388427994e-05, + "loss": 0.188, + "step": 14817 + }, + { + "epoch": 40.37602179836512, + "grad_norm": 6.052989482879639, + "learning_rate": 1.3525348060674133e-05, + "loss": 0.2143, + "step": 14818 + }, + { + "epoch": 40.37874659400545, + "grad_norm": 5.452238082885742, + "learning_rate": 1.3524522209613027e-05, + "loss": 0.3057, + "step": 14819 + }, + { + "epoch": 40.381471389645775, + "grad_norm": 6.343240737915039, + "learning_rate": 1.3523696331103058e-05, + "loss": 0.2796, + "step": 14820 + }, + { + "epoch": 40.3841961852861, + "grad_norm": 4.896117687225342, + "learning_rate": 1.3522870425150654e-05, + "loss": 0.3237, + "step": 14821 + }, + { + "epoch": 40.38692098092643, + "grad_norm": 6.452795505523682, + "learning_rate": 1.3522044491762253e-05, + "loss": 0.2743, + "step": 14822 + }, + { + "epoch": 40.38964577656676, + "grad_norm": 8.737284660339355, + "learning_rate": 1.3521218530944276e-05, + "loss": 0.3762, + "step": 14823 + }, + { + "epoch": 40.392370572207085, + "grad_norm": 7.082198143005371, + "learning_rate": 1.3520392542703167e-05, + "loss": 0.3012, + "step": 14824 + }, + { + "epoch": 40.39509536784741, + "grad_norm": 6.1143879890441895, + "learning_rate": 1.3519566527045354e-05, + "loss": 0.1956, + "step": 14825 + }, + { + "epoch": 40.39782016348774, + "grad_norm": 8.48856258392334, + "learning_rate": 1.3518740483977268e-05, + "loss": 0.2278, + "step": 14826 + }, + { + "epoch": 40.40054495912806, + "grad_norm": 4.892963886260986, + "learning_rate": 1.3517914413505344e-05, + "loss": 0.2896, + "step": 14827 + }, + { + "epoch": 40.403269754768395, + "grad_norm": 5.718017101287842, + "learning_rate": 1.3517088315636018e-05, + "loss": 0.1962, + "step": 14828 + }, + { + "epoch": 40.40599455040872, + "grad_norm": 6.417229652404785, + "learning_rate": 1.351626219037572e-05, + "loss": 0.4118, + "step": 14829 + }, + { + "epoch": 40.40871934604905, + "grad_norm": 7.505584716796875, + "learning_rate": 1.3515436037730887e-05, + "loss": 0.2588, + "step": 14830 + }, + { + "epoch": 40.41144414168937, + "grad_norm": 5.5002264976501465, + "learning_rate": 1.3514609857707948e-05, + "loss": 0.1766, + "step": 14831 + }, + { + "epoch": 40.4141689373297, + "grad_norm": 5.516236305236816, + "learning_rate": 1.3513783650313346e-05, + "loss": 0.1651, + "step": 14832 + }, + { + "epoch": 40.416893732970024, + "grad_norm": 6.154860496520996, + "learning_rate": 1.3512957415553505e-05, + "loss": 0.2749, + "step": 14833 + }, + { + "epoch": 40.41961852861036, + "grad_norm": 6.072230339050293, + "learning_rate": 1.3512131153434867e-05, + "loss": 0.2501, + "step": 14834 + }, + { + "epoch": 40.42234332425068, + "grad_norm": 5.330625534057617, + "learning_rate": 1.3511304863963863e-05, + "loss": 0.2563, + "step": 14835 + }, + { + "epoch": 40.42506811989101, + "grad_norm": 4.895598888397217, + "learning_rate": 1.351047854714693e-05, + "loss": 0.1862, + "step": 14836 + }, + { + "epoch": 40.427792915531334, + "grad_norm": 5.669843673706055, + "learning_rate": 1.3509652202990501e-05, + "loss": 0.1945, + "step": 14837 + }, + { + "epoch": 40.43051771117166, + "grad_norm": 7.436789512634277, + "learning_rate": 1.350882583150102e-05, + "loss": 0.3026, + "step": 14838 + }, + { + "epoch": 40.433242506811986, + "grad_norm": 5.909114360809326, + "learning_rate": 1.3507999432684911e-05, + "loss": 0.2505, + "step": 14839 + }, + { + "epoch": 40.43596730245232, + "grad_norm": 5.152442455291748, + "learning_rate": 1.350717300654862e-05, + "loss": 0.2828, + "step": 14840 + }, + { + "epoch": 40.438692098092645, + "grad_norm": 5.967596530914307, + "learning_rate": 1.3506346553098573e-05, + "loss": 0.2723, + "step": 14841 + }, + { + "epoch": 40.44141689373297, + "grad_norm": 5.889393329620361, + "learning_rate": 1.3505520072341216e-05, + "loss": 0.1981, + "step": 14842 + }, + { + "epoch": 40.444141689373296, + "grad_norm": 5.980917930603027, + "learning_rate": 1.3504693564282977e-05, + "loss": 0.3313, + "step": 14843 + }, + { + "epoch": 40.44686648501362, + "grad_norm": 5.2491559982299805, + "learning_rate": 1.3503867028930305e-05, + "loss": 0.1679, + "step": 14844 + }, + { + "epoch": 40.44959128065395, + "grad_norm": 5.511984825134277, + "learning_rate": 1.350304046628962e-05, + "loss": 0.1712, + "step": 14845 + }, + { + "epoch": 40.45231607629428, + "grad_norm": 5.705016136169434, + "learning_rate": 1.3502213876367373e-05, + "loss": 0.2663, + "step": 14846 + }, + { + "epoch": 40.45504087193461, + "grad_norm": 5.521117687225342, + "learning_rate": 1.3501387259169998e-05, + "loss": 0.2274, + "step": 14847 + }, + { + "epoch": 40.45776566757493, + "grad_norm": 5.227612495422363, + "learning_rate": 1.3500560614703932e-05, + "loss": 0.2319, + "step": 14848 + }, + { + "epoch": 40.46049046321526, + "grad_norm": 5.669434547424316, + "learning_rate": 1.3499733942975611e-05, + "loss": 0.2661, + "step": 14849 + }, + { + "epoch": 40.463215258855584, + "grad_norm": 5.9248175621032715, + "learning_rate": 1.3498907243991477e-05, + "loss": 0.1756, + "step": 14850 + }, + { + "epoch": 40.46594005449591, + "grad_norm": 5.283051490783691, + "learning_rate": 1.3498080517757961e-05, + "loss": 0.3733, + "step": 14851 + }, + { + "epoch": 40.46866485013624, + "grad_norm": 4.850691795349121, + "learning_rate": 1.3497253764281513e-05, + "loss": 0.166, + "step": 14852 + }, + { + "epoch": 40.47138964577657, + "grad_norm": 5.2142791748046875, + "learning_rate": 1.3496426983568561e-05, + "loss": 0.1824, + "step": 14853 + }, + { + "epoch": 40.474114441416894, + "grad_norm": 4.949707508087158, + "learning_rate": 1.3495600175625548e-05, + "loss": 0.2636, + "step": 14854 + }, + { + "epoch": 40.47683923705722, + "grad_norm": 6.136460304260254, + "learning_rate": 1.3494773340458916e-05, + "loss": 0.2619, + "step": 14855 + }, + { + "epoch": 40.479564032697546, + "grad_norm": 5.417229175567627, + "learning_rate": 1.34939464780751e-05, + "loss": 0.2144, + "step": 14856 + }, + { + "epoch": 40.48228882833787, + "grad_norm": 6.840548992156982, + "learning_rate": 1.3493119588480541e-05, + "loss": 0.4061, + "step": 14857 + }, + { + "epoch": 40.485013623978205, + "grad_norm": 7.138721942901611, + "learning_rate": 1.349229267168168e-05, + "loss": 0.2626, + "step": 14858 + }, + { + "epoch": 40.48773841961853, + "grad_norm": 7.157942295074463, + "learning_rate": 1.3491465727684953e-05, + "loss": 0.3388, + "step": 14859 + }, + { + "epoch": 40.490463215258856, + "grad_norm": 6.756263732910156, + "learning_rate": 1.3490638756496807e-05, + "loss": 0.2513, + "step": 14860 + }, + { + "epoch": 40.49318801089918, + "grad_norm": 7.291346073150635, + "learning_rate": 1.348981175812368e-05, + "loss": 0.2314, + "step": 14861 + }, + { + "epoch": 40.49591280653951, + "grad_norm": 5.688564300537109, + "learning_rate": 1.3488984732572006e-05, + "loss": 0.1974, + "step": 14862 + }, + { + "epoch": 40.49863760217983, + "grad_norm": 6.727434158325195, + "learning_rate": 1.3488157679848235e-05, + "loss": 0.2977, + "step": 14863 + }, + { + "epoch": 40.50136239782017, + "grad_norm": 4.9347968101501465, + "learning_rate": 1.3487330599958802e-05, + "loss": 0.2374, + "step": 14864 + }, + { + "epoch": 40.50408719346049, + "grad_norm": 5.227428436279297, + "learning_rate": 1.3486503492910155e-05, + "loss": 0.2063, + "step": 14865 + }, + { + "epoch": 40.50681198910082, + "grad_norm": 7.073912143707275, + "learning_rate": 1.3485676358708725e-05, + "loss": 0.2745, + "step": 14866 + }, + { + "epoch": 40.509536784741144, + "grad_norm": 8.08021068572998, + "learning_rate": 1.3484849197360964e-05, + "loss": 0.1532, + "step": 14867 + }, + { + "epoch": 40.51226158038147, + "grad_norm": 5.847911834716797, + "learning_rate": 1.348402200887331e-05, + "loss": 0.3067, + "step": 14868 + }, + { + "epoch": 40.514986376021795, + "grad_norm": 5.258172035217285, + "learning_rate": 1.3483194793252202e-05, + "loss": 0.3422, + "step": 14869 + }, + { + "epoch": 40.51771117166213, + "grad_norm": 5.617648124694824, + "learning_rate": 1.3482367550504085e-05, + "loss": 0.1506, + "step": 14870 + }, + { + "epoch": 40.520435967302454, + "grad_norm": 5.911000728607178, + "learning_rate": 1.3481540280635403e-05, + "loss": 0.3285, + "step": 14871 + }, + { + "epoch": 40.52316076294278, + "grad_norm": 7.393513202667236, + "learning_rate": 1.3480712983652598e-05, + "loss": 0.2773, + "step": 14872 + }, + { + "epoch": 40.525885558583106, + "grad_norm": 5.925257682800293, + "learning_rate": 1.3479885659562111e-05, + "loss": 0.2323, + "step": 14873 + }, + { + "epoch": 40.52861035422343, + "grad_norm": 5.522267818450928, + "learning_rate": 1.3479058308370386e-05, + "loss": 0.33, + "step": 14874 + }, + { + "epoch": 40.53133514986376, + "grad_norm": 5.7643256187438965, + "learning_rate": 1.3478230930083868e-05, + "loss": 0.2511, + "step": 14875 + }, + { + "epoch": 40.53405994550409, + "grad_norm": 6.358617782592773, + "learning_rate": 1.3477403524708998e-05, + "loss": 0.229, + "step": 14876 + }, + { + "epoch": 40.536784741144416, + "grad_norm": 5.766740798950195, + "learning_rate": 1.3476576092252225e-05, + "loss": 0.2071, + "step": 14877 + }, + { + "epoch": 40.53950953678474, + "grad_norm": 4.795498847961426, + "learning_rate": 1.3475748632719985e-05, + "loss": 0.2402, + "step": 14878 + }, + { + "epoch": 40.54223433242507, + "grad_norm": 6.2379350662231445, + "learning_rate": 1.3474921146118728e-05, + "loss": 0.2724, + "step": 14879 + }, + { + "epoch": 40.54495912806539, + "grad_norm": 4.677596092224121, + "learning_rate": 1.3474093632454897e-05, + "loss": 0.2636, + "step": 14880 + }, + { + "epoch": 40.54768392370572, + "grad_norm": 5.005476951599121, + "learning_rate": 1.3473266091734938e-05, + "loss": 0.3155, + "step": 14881 + }, + { + "epoch": 40.55040871934605, + "grad_norm": 6.714357376098633, + "learning_rate": 1.3472438523965292e-05, + "loss": 0.2178, + "step": 14882 + }, + { + "epoch": 40.55313351498638, + "grad_norm": 10.46469497680664, + "learning_rate": 1.3471610929152408e-05, + "loss": 0.4024, + "step": 14883 + }, + { + "epoch": 40.555858310626704, + "grad_norm": 7.666954517364502, + "learning_rate": 1.3470783307302728e-05, + "loss": 0.2054, + "step": 14884 + }, + { + "epoch": 40.55858310626703, + "grad_norm": 6.6751179695129395, + "learning_rate": 1.3469955658422701e-05, + "loss": 0.3029, + "step": 14885 + }, + { + "epoch": 40.561307901907355, + "grad_norm": 5.923067092895508, + "learning_rate": 1.3469127982518773e-05, + "loss": 0.2173, + "step": 14886 + }, + { + "epoch": 40.56403269754768, + "grad_norm": 7.947319507598877, + "learning_rate": 1.3468300279597386e-05, + "loss": 0.2964, + "step": 14887 + }, + { + "epoch": 40.566757493188014, + "grad_norm": 5.859461307525635, + "learning_rate": 1.3467472549664983e-05, + "loss": 0.2649, + "step": 14888 + }, + { + "epoch": 40.56948228882834, + "grad_norm": 6.946326732635498, + "learning_rate": 1.3466644792728023e-05, + "loss": 0.2178, + "step": 14889 + }, + { + "epoch": 40.572207084468666, + "grad_norm": 5.288938999176025, + "learning_rate": 1.3465817008792943e-05, + "loss": 0.1667, + "step": 14890 + }, + { + "epoch": 40.57493188010899, + "grad_norm": 10.767555236816406, + "learning_rate": 1.3464989197866192e-05, + "loss": 0.3047, + "step": 14891 + }, + { + "epoch": 40.57765667574932, + "grad_norm": 5.773517608642578, + "learning_rate": 1.3464161359954214e-05, + "loss": 0.2887, + "step": 14892 + }, + { + "epoch": 40.58038147138964, + "grad_norm": 8.373126029968262, + "learning_rate": 1.3463333495063462e-05, + "loss": 0.2623, + "step": 14893 + }, + { + "epoch": 40.583106267029976, + "grad_norm": 6.424461841583252, + "learning_rate": 1.3462505603200377e-05, + "loss": 0.2723, + "step": 14894 + }, + { + "epoch": 40.5858310626703, + "grad_norm": 7.6376118659973145, + "learning_rate": 1.3461677684371412e-05, + "loss": 0.3219, + "step": 14895 + }, + { + "epoch": 40.58855585831063, + "grad_norm": 5.907564640045166, + "learning_rate": 1.346084973858301e-05, + "loss": 0.2069, + "step": 14896 + }, + { + "epoch": 40.59128065395095, + "grad_norm": 5.691221714019775, + "learning_rate": 1.3460021765841625e-05, + "loss": 0.198, + "step": 14897 + }, + { + "epoch": 40.59400544959128, + "grad_norm": 5.604295253753662, + "learning_rate": 1.34591937661537e-05, + "loss": 0.2034, + "step": 14898 + }, + { + "epoch": 40.596730245231605, + "grad_norm": 4.799344062805176, + "learning_rate": 1.3458365739525685e-05, + "loss": 0.203, + "step": 14899 + }, + { + "epoch": 40.59945504087194, + "grad_norm": 5.533874988555908, + "learning_rate": 1.3457537685964029e-05, + "loss": 0.3049, + "step": 14900 + }, + { + "epoch": 40.60217983651226, + "grad_norm": 6.924694061279297, + "learning_rate": 1.3456709605475182e-05, + "loss": 0.2093, + "step": 14901 + }, + { + "epoch": 40.60490463215259, + "grad_norm": 5.239685535430908, + "learning_rate": 1.345588149806559e-05, + "loss": 0.2447, + "step": 14902 + }, + { + "epoch": 40.607629427792915, + "grad_norm": 5.3831095695495605, + "learning_rate": 1.3455053363741708e-05, + "loss": 0.1792, + "step": 14903 + }, + { + "epoch": 40.61035422343324, + "grad_norm": 6.45353889465332, + "learning_rate": 1.3454225202509978e-05, + "loss": 0.3018, + "step": 14904 + }, + { + "epoch": 40.61307901907357, + "grad_norm": 5.3861212730407715, + "learning_rate": 1.3453397014376854e-05, + "loss": 0.2651, + "step": 14905 + }, + { + "epoch": 40.6158038147139, + "grad_norm": 5.265120983123779, + "learning_rate": 1.3452568799348783e-05, + "loss": 0.2325, + "step": 14906 + }, + { + "epoch": 40.618528610354225, + "grad_norm": 8.889595985412598, + "learning_rate": 1.3451740557432223e-05, + "loss": 0.2323, + "step": 14907 + }, + { + "epoch": 40.62125340599455, + "grad_norm": 5.120465278625488, + "learning_rate": 1.3450912288633614e-05, + "loss": 0.2641, + "step": 14908 + }, + { + "epoch": 40.62397820163488, + "grad_norm": 6.105363368988037, + "learning_rate": 1.3450083992959413e-05, + "loss": 0.1906, + "step": 14909 + }, + { + "epoch": 40.6267029972752, + "grad_norm": 9.551621437072754, + "learning_rate": 1.3449255670416068e-05, + "loss": 0.3251, + "step": 14910 + }, + { + "epoch": 40.62942779291553, + "grad_norm": 6.234216690063477, + "learning_rate": 1.3448427321010034e-05, + "loss": 0.2052, + "step": 14911 + }, + { + "epoch": 40.63215258855586, + "grad_norm": 5.134133815765381, + "learning_rate": 1.3447598944747755e-05, + "loss": 0.1361, + "step": 14912 + }, + { + "epoch": 40.63487738419619, + "grad_norm": 6.906923770904541, + "learning_rate": 1.3446770541635687e-05, + "loss": 0.2399, + "step": 14913 + }, + { + "epoch": 40.63760217983651, + "grad_norm": 5.535183429718018, + "learning_rate": 1.3445942111680279e-05, + "loss": 0.2268, + "step": 14914 + }, + { + "epoch": 40.64032697547684, + "grad_norm": 6.394478797912598, + "learning_rate": 1.3445113654887992e-05, + "loss": 0.2457, + "step": 14915 + }, + { + "epoch": 40.643051771117165, + "grad_norm": 4.879506587982178, + "learning_rate": 1.3444285171265263e-05, + "loss": 0.1335, + "step": 14916 + }, + { + "epoch": 40.64577656675749, + "grad_norm": 5.884253978729248, + "learning_rate": 1.3443456660818557e-05, + "loss": 0.2834, + "step": 14917 + }, + { + "epoch": 40.64850136239782, + "grad_norm": 4.804670333862305, + "learning_rate": 1.3442628123554318e-05, + "loss": 0.2397, + "step": 14918 + }, + { + "epoch": 40.65122615803815, + "grad_norm": 5.187518119812012, + "learning_rate": 1.3441799559479005e-05, + "loss": 0.2859, + "step": 14919 + }, + { + "epoch": 40.653950953678475, + "grad_norm": 4.903922080993652, + "learning_rate": 1.3440970968599065e-05, + "loss": 0.1925, + "step": 14920 + }, + { + "epoch": 40.6566757493188, + "grad_norm": 5.095132350921631, + "learning_rate": 1.3440142350920958e-05, + "loss": 0.2361, + "step": 14921 + }, + { + "epoch": 40.65940054495913, + "grad_norm": 5.3817901611328125, + "learning_rate": 1.3439313706451125e-05, + "loss": 0.226, + "step": 14922 + }, + { + "epoch": 40.66212534059945, + "grad_norm": 5.576498508453369, + "learning_rate": 1.3438485035196034e-05, + "loss": 0.2948, + "step": 14923 + }, + { + "epoch": 40.664850136239785, + "grad_norm": 5.794294357299805, + "learning_rate": 1.343765633716213e-05, + "loss": 0.1942, + "step": 14924 + }, + { + "epoch": 40.66757493188011, + "grad_norm": 4.943784713745117, + "learning_rate": 1.3436827612355871e-05, + "loss": 0.2043, + "step": 14925 + }, + { + "epoch": 40.67029972752044, + "grad_norm": 5.971388816833496, + "learning_rate": 1.3435998860783708e-05, + "loss": 0.2005, + "step": 14926 + }, + { + "epoch": 40.67302452316076, + "grad_norm": 5.976658821105957, + "learning_rate": 1.3435170082452097e-05, + "loss": 0.2635, + "step": 14927 + }, + { + "epoch": 40.67574931880109, + "grad_norm": 5.012649059295654, + "learning_rate": 1.3434341277367491e-05, + "loss": 0.3775, + "step": 14928 + }, + { + "epoch": 40.678474114441414, + "grad_norm": 4.810773849487305, + "learning_rate": 1.343351244553635e-05, + "loss": 0.2225, + "step": 14929 + }, + { + "epoch": 40.68119891008175, + "grad_norm": 5.172163963317871, + "learning_rate": 1.343268358696512e-05, + "loss": 0.2724, + "step": 14930 + }, + { + "epoch": 40.68392370572207, + "grad_norm": 5.959063529968262, + "learning_rate": 1.3431854701660259e-05, + "loss": 0.2525, + "step": 14931 + }, + { + "epoch": 40.6866485013624, + "grad_norm": 5.518011569976807, + "learning_rate": 1.3431025789628227e-05, + "loss": 0.2462, + "step": 14932 + }, + { + "epoch": 40.689373297002724, + "grad_norm": 5.654611110687256, + "learning_rate": 1.3430196850875476e-05, + "loss": 0.2591, + "step": 14933 + }, + { + "epoch": 40.69209809264305, + "grad_norm": 5.825628280639648, + "learning_rate": 1.3429367885408461e-05, + "loss": 0.216, + "step": 14934 + }, + { + "epoch": 40.694822888283376, + "grad_norm": 5.7777886390686035, + "learning_rate": 1.3428538893233642e-05, + "loss": 0.3862, + "step": 14935 + }, + { + "epoch": 40.69754768392371, + "grad_norm": 5.627559661865234, + "learning_rate": 1.3427709874357471e-05, + "loss": 0.2041, + "step": 14936 + }, + { + "epoch": 40.700272479564035, + "grad_norm": 5.278099060058594, + "learning_rate": 1.3426880828786408e-05, + "loss": 0.2989, + "step": 14937 + }, + { + "epoch": 40.70299727520436, + "grad_norm": 4.595234394073486, + "learning_rate": 1.3426051756526905e-05, + "loss": 0.3122, + "step": 14938 + }, + { + "epoch": 40.705722070844686, + "grad_norm": 5.167964935302734, + "learning_rate": 1.342522265758542e-05, + "loss": 0.278, + "step": 14939 + }, + { + "epoch": 40.70844686648501, + "grad_norm": 6.490757465362549, + "learning_rate": 1.3424393531968415e-05, + "loss": 0.3191, + "step": 14940 + }, + { + "epoch": 40.71117166212534, + "grad_norm": 5.710482120513916, + "learning_rate": 1.3423564379682339e-05, + "loss": 0.4288, + "step": 14941 + }, + { + "epoch": 40.71389645776567, + "grad_norm": 5.107451438903809, + "learning_rate": 1.342273520073366e-05, + "loss": 0.3045, + "step": 14942 + }, + { + "epoch": 40.716621253406, + "grad_norm": 6.680281639099121, + "learning_rate": 1.3421905995128821e-05, + "loss": 0.1385, + "step": 14943 + }, + { + "epoch": 40.71934604904632, + "grad_norm": 6.430998802185059, + "learning_rate": 1.3421076762874295e-05, + "loss": 0.2798, + "step": 14944 + }, + { + "epoch": 40.72207084468665, + "grad_norm": 5.79957389831543, + "learning_rate": 1.3420247503976529e-05, + "loss": 0.3243, + "step": 14945 + }, + { + "epoch": 40.724795640326974, + "grad_norm": 5.468590259552002, + "learning_rate": 1.3419418218441989e-05, + "loss": 0.3202, + "step": 14946 + }, + { + "epoch": 40.7275204359673, + "grad_norm": 4.622290134429932, + "learning_rate": 1.3418588906277128e-05, + "loss": 0.1476, + "step": 14947 + }, + { + "epoch": 40.73024523160763, + "grad_norm": 4.551146030426025, + "learning_rate": 1.3417759567488407e-05, + "loss": 0.2247, + "step": 14948 + }, + { + "epoch": 40.73297002724796, + "grad_norm": 5.9461774826049805, + "learning_rate": 1.3416930202082284e-05, + "loss": 0.3004, + "step": 14949 + }, + { + "epoch": 40.735694822888284, + "grad_norm": 5.845150470733643, + "learning_rate": 1.341610081006522e-05, + "loss": 0.2999, + "step": 14950 + }, + { + "epoch": 40.73841961852861, + "grad_norm": 4.415715217590332, + "learning_rate": 1.341527139144367e-05, + "loss": 0.1576, + "step": 14951 + }, + { + "epoch": 40.741144414168936, + "grad_norm": 5.789761066436768, + "learning_rate": 1.3414441946224099e-05, + "loss": 0.286, + "step": 14952 + }, + { + "epoch": 40.74386920980926, + "grad_norm": 5.601269721984863, + "learning_rate": 1.3413612474412965e-05, + "loss": 0.1891, + "step": 14953 + }, + { + "epoch": 40.746594005449595, + "grad_norm": 6.888553142547607, + "learning_rate": 1.3412782976016724e-05, + "loss": 0.2617, + "step": 14954 + }, + { + "epoch": 40.74931880108992, + "grad_norm": 5.94119119644165, + "learning_rate": 1.3411953451041839e-05, + "loss": 0.2158, + "step": 14955 + }, + { + "epoch": 40.752043596730246, + "grad_norm": 9.400856971740723, + "learning_rate": 1.3411123899494772e-05, + "loss": 0.229, + "step": 14956 + }, + { + "epoch": 40.75476839237057, + "grad_norm": 8.853175163269043, + "learning_rate": 1.341029432138198e-05, + "loss": 0.4265, + "step": 14957 + }, + { + "epoch": 40.7574931880109, + "grad_norm": 6.882060527801514, + "learning_rate": 1.3409464716709928e-05, + "loss": 0.2463, + "step": 14958 + }, + { + "epoch": 40.76021798365122, + "grad_norm": 5.097872257232666, + "learning_rate": 1.3408635085485074e-05, + "loss": 0.1524, + "step": 14959 + }, + { + "epoch": 40.762942779291556, + "grad_norm": 5.943040370941162, + "learning_rate": 1.340780542771388e-05, + "loss": 0.4234, + "step": 14960 + }, + { + "epoch": 40.76566757493188, + "grad_norm": 7.117913246154785, + "learning_rate": 1.3406975743402805e-05, + "loss": 0.2, + "step": 14961 + }, + { + "epoch": 40.76839237057221, + "grad_norm": 7.399886131286621, + "learning_rate": 1.3406146032558316e-05, + "loss": 0.3461, + "step": 14962 + }, + { + "epoch": 40.771117166212534, + "grad_norm": 5.474939823150635, + "learning_rate": 1.3405316295186868e-05, + "loss": 0.218, + "step": 14963 + }, + { + "epoch": 40.77384196185286, + "grad_norm": 4.896245956420898, + "learning_rate": 1.3404486531294926e-05, + "loss": 0.168, + "step": 14964 + }, + { + "epoch": 40.776566757493185, + "grad_norm": 6.233972549438477, + "learning_rate": 1.3403656740888953e-05, + "loss": 0.252, + "step": 14965 + }, + { + "epoch": 40.77929155313352, + "grad_norm": 5.181840419769287, + "learning_rate": 1.3402826923975414e-05, + "loss": 0.1587, + "step": 14966 + }, + { + "epoch": 40.782016348773844, + "grad_norm": 6.172066688537598, + "learning_rate": 1.3401997080560765e-05, + "loss": 0.1852, + "step": 14967 + }, + { + "epoch": 40.78474114441417, + "grad_norm": 5.824451446533203, + "learning_rate": 1.3401167210651474e-05, + "loss": 0.2186, + "step": 14968 + }, + { + "epoch": 40.787465940054496, + "grad_norm": 5.7823591232299805, + "learning_rate": 1.3400337314254e-05, + "loss": 0.2286, + "step": 14969 + }, + { + "epoch": 40.79019073569482, + "grad_norm": 5.527565002441406, + "learning_rate": 1.339950739137481e-05, + "loss": 0.2641, + "step": 14970 + }, + { + "epoch": 40.79291553133515, + "grad_norm": 6.882816791534424, + "learning_rate": 1.3398677442020367e-05, + "loss": 0.2936, + "step": 14971 + }, + { + "epoch": 40.79564032697548, + "grad_norm": 5.974388122558594, + "learning_rate": 1.3397847466197133e-05, + "loss": 0.422, + "step": 14972 + }, + { + "epoch": 40.798365122615806, + "grad_norm": 5.234097957611084, + "learning_rate": 1.339701746391157e-05, + "loss": 0.2596, + "step": 14973 + }, + { + "epoch": 40.80108991825613, + "grad_norm": 9.07652759552002, + "learning_rate": 1.3396187435170144e-05, + "loss": 0.2723, + "step": 14974 + }, + { + "epoch": 40.80381471389646, + "grad_norm": 5.8103437423706055, + "learning_rate": 1.3395357379979324e-05, + "loss": 0.1719, + "step": 14975 + }, + { + "epoch": 40.80653950953678, + "grad_norm": 5.6345534324646, + "learning_rate": 1.3394527298345567e-05, + "loss": 0.193, + "step": 14976 + }, + { + "epoch": 40.80926430517711, + "grad_norm": 5.143917083740234, + "learning_rate": 1.339369719027534e-05, + "loss": 0.1949, + "step": 14977 + }, + { + "epoch": 40.81198910081744, + "grad_norm": 5.574187278747559, + "learning_rate": 1.3392867055775112e-05, + "loss": 0.1412, + "step": 14978 + }, + { + "epoch": 40.81471389645777, + "grad_norm": 6.678638458251953, + "learning_rate": 1.3392036894851342e-05, + "loss": 0.2533, + "step": 14979 + }, + { + "epoch": 40.817438692098094, + "grad_norm": 6.180417537689209, + "learning_rate": 1.3391206707510498e-05, + "loss": 0.166, + "step": 14980 + }, + { + "epoch": 40.82016348773842, + "grad_norm": 6.180706024169922, + "learning_rate": 1.3390376493759045e-05, + "loss": 0.231, + "step": 14981 + }, + { + "epoch": 40.822888283378745, + "grad_norm": 5.376947402954102, + "learning_rate": 1.3389546253603447e-05, + "loss": 0.2622, + "step": 14982 + }, + { + "epoch": 40.82561307901907, + "grad_norm": 4.870726585388184, + "learning_rate": 1.3388715987050174e-05, + "loss": 0.2365, + "step": 14983 + }, + { + "epoch": 40.828337874659404, + "grad_norm": 6.5397138595581055, + "learning_rate": 1.338788569410569e-05, + "loss": 0.2467, + "step": 14984 + }, + { + "epoch": 40.83106267029973, + "grad_norm": 5.011137962341309, + "learning_rate": 1.3387055374776463e-05, + "loss": 0.279, + "step": 14985 + }, + { + "epoch": 40.833787465940055, + "grad_norm": 4.846118450164795, + "learning_rate": 1.3386225029068959e-05, + "loss": 0.1282, + "step": 14986 + }, + { + "epoch": 40.83651226158038, + "grad_norm": 6.057253360748291, + "learning_rate": 1.338539465698964e-05, + "loss": 0.2232, + "step": 14987 + }, + { + "epoch": 40.83923705722071, + "grad_norm": 6.4753031730651855, + "learning_rate": 1.3384564258544976e-05, + "loss": 0.2677, + "step": 14988 + }, + { + "epoch": 40.84196185286103, + "grad_norm": 7.979143142700195, + "learning_rate": 1.3383733833741434e-05, + "loss": 0.2295, + "step": 14989 + }, + { + "epoch": 40.844686648501366, + "grad_norm": 6.787848949432373, + "learning_rate": 1.3382903382585485e-05, + "loss": 0.214, + "step": 14990 + }, + { + "epoch": 40.84741144414169, + "grad_norm": 5.826859474182129, + "learning_rate": 1.338207290508359e-05, + "loss": 0.1957, + "step": 14991 + }, + { + "epoch": 40.85013623978202, + "grad_norm": 5.740458011627197, + "learning_rate": 1.3381242401242222e-05, + "loss": 0.229, + "step": 14992 + }, + { + "epoch": 40.85286103542234, + "grad_norm": 5.911404609680176, + "learning_rate": 1.3380411871067846e-05, + "loss": 0.4161, + "step": 14993 + }, + { + "epoch": 40.85558583106267, + "grad_norm": 6.816946506500244, + "learning_rate": 1.3379581314566931e-05, + "loss": 0.2727, + "step": 14994 + }, + { + "epoch": 40.858310626702995, + "grad_norm": 6.2688069343566895, + "learning_rate": 1.3378750731745949e-05, + "loss": 0.2802, + "step": 14995 + }, + { + "epoch": 40.86103542234333, + "grad_norm": 4.649788856506348, + "learning_rate": 1.337792012261136e-05, + "loss": 0.3784, + "step": 14996 + }, + { + "epoch": 40.86376021798365, + "grad_norm": 5.236213684082031, + "learning_rate": 1.337708948716964e-05, + "loss": 0.2497, + "step": 14997 + }, + { + "epoch": 40.86648501362398, + "grad_norm": 4.856684684753418, + "learning_rate": 1.3376258825427259e-05, + "loss": 0.2789, + "step": 14998 + }, + { + "epoch": 40.869209809264305, + "grad_norm": 6.627138137817383, + "learning_rate": 1.3375428137390678e-05, + "loss": 0.2303, + "step": 14999 + }, + { + "epoch": 40.87193460490463, + "grad_norm": 5.439791202545166, + "learning_rate": 1.3374597423066373e-05, + "loss": 0.3366, + "step": 15000 + }, + { + "epoch": 40.87465940054496, + "grad_norm": 5.366386413574219, + "learning_rate": 1.3373766682460811e-05, + "loss": 0.1568, + "step": 15001 + }, + { + "epoch": 40.87738419618529, + "grad_norm": 6.989178657531738, + "learning_rate": 1.3372935915580465e-05, + "loss": 0.2469, + "step": 15002 + }, + { + "epoch": 40.880108991825615, + "grad_norm": 6.559767723083496, + "learning_rate": 1.3372105122431801e-05, + "loss": 0.2893, + "step": 15003 + }, + { + "epoch": 40.88283378746594, + "grad_norm": 5.447100639343262, + "learning_rate": 1.3371274303021293e-05, + "loss": 0.1565, + "step": 15004 + }, + { + "epoch": 40.88555858310627, + "grad_norm": 6.380908012390137, + "learning_rate": 1.3370443457355407e-05, + "loss": 0.1827, + "step": 15005 + }, + { + "epoch": 40.88828337874659, + "grad_norm": 4.741380214691162, + "learning_rate": 1.3369612585440617e-05, + "loss": 0.2058, + "step": 15006 + }, + { + "epoch": 40.89100817438692, + "grad_norm": 5.247865200042725, + "learning_rate": 1.336878168728339e-05, + "loss": 0.1651, + "step": 15007 + }, + { + "epoch": 40.89373297002725, + "grad_norm": 5.421178817749023, + "learning_rate": 1.33679507628902e-05, + "loss": 0.1881, + "step": 15008 + }, + { + "epoch": 40.89645776566758, + "grad_norm": 7.068850517272949, + "learning_rate": 1.336711981226752e-05, + "loss": 0.2087, + "step": 15009 + }, + { + "epoch": 40.8991825613079, + "grad_norm": 6.348726272583008, + "learning_rate": 1.336628883542182e-05, + "loss": 0.265, + "step": 15010 + }, + { + "epoch": 40.90190735694823, + "grad_norm": 5.680532932281494, + "learning_rate": 1.3365457832359567e-05, + "loss": 0.1723, + "step": 15011 + }, + { + "epoch": 40.904632152588555, + "grad_norm": 7.25140380859375, + "learning_rate": 1.3364626803087242e-05, + "loss": 0.3176, + "step": 15012 + }, + { + "epoch": 40.90735694822888, + "grad_norm": 6.55526065826416, + "learning_rate": 1.3363795747611309e-05, + "loss": 0.3861, + "step": 15013 + }, + { + "epoch": 40.91008174386921, + "grad_norm": 5.4566473960876465, + "learning_rate": 1.3362964665938246e-05, + "loss": 0.2871, + "step": 15014 + }, + { + "epoch": 40.91280653950954, + "grad_norm": 5.61224889755249, + "learning_rate": 1.3362133558074517e-05, + "loss": 0.164, + "step": 15015 + }, + { + "epoch": 40.915531335149865, + "grad_norm": 6.36538553237915, + "learning_rate": 1.3361302424026603e-05, + "loss": 0.2852, + "step": 15016 + }, + { + "epoch": 40.91825613079019, + "grad_norm": 5.29815149307251, + "learning_rate": 1.3360471263800974e-05, + "loss": 0.2155, + "step": 15017 + }, + { + "epoch": 40.920980926430516, + "grad_norm": 5.939804553985596, + "learning_rate": 1.33596400774041e-05, + "loss": 0.3171, + "step": 15018 + }, + { + "epoch": 40.92370572207084, + "grad_norm": 4.8379693031311035, + "learning_rate": 1.335880886484246e-05, + "loss": 0.2887, + "step": 15019 + }, + { + "epoch": 40.926430517711175, + "grad_norm": 4.905444145202637, + "learning_rate": 1.3357977626122525e-05, + "loss": 0.2915, + "step": 15020 + }, + { + "epoch": 40.9291553133515, + "grad_norm": 5.513583660125732, + "learning_rate": 1.3357146361250765e-05, + "loss": 0.2451, + "step": 15021 + }, + { + "epoch": 40.93188010899183, + "grad_norm": 6.400475978851318, + "learning_rate": 1.3356315070233664e-05, + "loss": 0.247, + "step": 15022 + }, + { + "epoch": 40.93460490463215, + "grad_norm": 7.196538925170898, + "learning_rate": 1.3355483753077682e-05, + "loss": 0.2287, + "step": 15023 + }, + { + "epoch": 40.93732970027248, + "grad_norm": 5.121399402618408, + "learning_rate": 1.3354652409789303e-05, + "loss": 0.1901, + "step": 15024 + }, + { + "epoch": 40.940054495912804, + "grad_norm": 5.523329257965088, + "learning_rate": 1.3353821040375001e-05, + "loss": 0.3396, + "step": 15025 + }, + { + "epoch": 40.94277929155314, + "grad_norm": 6.12915563583374, + "learning_rate": 1.3352989644841245e-05, + "loss": 0.2905, + "step": 15026 + }, + { + "epoch": 40.94550408719346, + "grad_norm": 5.719439506530762, + "learning_rate": 1.3352158223194517e-05, + "loss": 0.3653, + "step": 15027 + }, + { + "epoch": 40.94822888283379, + "grad_norm": 5.728538990020752, + "learning_rate": 1.3351326775441287e-05, + "loss": 0.2712, + "step": 15028 + }, + { + "epoch": 40.950953678474114, + "grad_norm": 5.390470027923584, + "learning_rate": 1.3350495301588034e-05, + "loss": 0.2523, + "step": 15029 + }, + { + "epoch": 40.95367847411444, + "grad_norm": 4.868643283843994, + "learning_rate": 1.334966380164123e-05, + "loss": 0.2482, + "step": 15030 + }, + { + "epoch": 40.956403269754766, + "grad_norm": 5.358735084533691, + "learning_rate": 1.3348832275607351e-05, + "loss": 0.3782, + "step": 15031 + }, + { + "epoch": 40.95912806539509, + "grad_norm": 6.365812301635742, + "learning_rate": 1.3348000723492875e-05, + "loss": 0.2387, + "step": 15032 + }, + { + "epoch": 40.961852861035425, + "grad_norm": 6.051462173461914, + "learning_rate": 1.3347169145304277e-05, + "loss": 0.1827, + "step": 15033 + }, + { + "epoch": 40.96457765667575, + "grad_norm": 4.960656642913818, + "learning_rate": 1.3346337541048034e-05, + "loss": 0.257, + "step": 15034 + }, + { + "epoch": 40.967302452316076, + "grad_norm": 5.8224873542785645, + "learning_rate": 1.3345505910730621e-05, + "loss": 0.3081, + "step": 15035 + }, + { + "epoch": 40.9700272479564, + "grad_norm": 7.290229797363281, + "learning_rate": 1.3344674254358515e-05, + "loss": 0.2471, + "step": 15036 + }, + { + "epoch": 40.97275204359673, + "grad_norm": 8.550009727478027, + "learning_rate": 1.3343842571938197e-05, + "loss": 0.2004, + "step": 15037 + }, + { + "epoch": 40.97547683923706, + "grad_norm": 5.098455429077148, + "learning_rate": 1.3343010863476135e-05, + "loss": 0.4074, + "step": 15038 + }, + { + "epoch": 40.97820163487739, + "grad_norm": 5.775397777557373, + "learning_rate": 1.3342179128978818e-05, + "loss": 0.2965, + "step": 15039 + }, + { + "epoch": 40.98092643051771, + "grad_norm": 7.7027106285095215, + "learning_rate": 1.3341347368452712e-05, + "loss": 0.259, + "step": 15040 + }, + { + "epoch": 40.98365122615804, + "grad_norm": 6.634826183319092, + "learning_rate": 1.3340515581904306e-05, + "loss": 0.1937, + "step": 15041 + }, + { + "epoch": 40.986376021798364, + "grad_norm": 4.4922614097595215, + "learning_rate": 1.3339683769340069e-05, + "loss": 0.1159, + "step": 15042 + }, + { + "epoch": 40.98910081743869, + "grad_norm": 5.7162275314331055, + "learning_rate": 1.333885193076648e-05, + "loss": 0.2325, + "step": 15043 + }, + { + "epoch": 40.991825613079016, + "grad_norm": 5.713405609130859, + "learning_rate": 1.3338020066190022e-05, + "loss": 0.382, + "step": 15044 + }, + { + "epoch": 40.99455040871935, + "grad_norm": 5.215897560119629, + "learning_rate": 1.3337188175617173e-05, + "loss": 0.3264, + "step": 15045 + }, + { + "epoch": 40.997275204359674, + "grad_norm": 6.1874165534973145, + "learning_rate": 1.3336356259054406e-05, + "loss": 0.4108, + "step": 15046 + }, + { + "epoch": 41.0, + "grad_norm": 6.213327884674072, + "learning_rate": 1.3335524316508208e-05, + "loss": 0.2671, + "step": 15047 + }, + { + "epoch": 41.002724795640326, + "grad_norm": 5.763308048248291, + "learning_rate": 1.3334692347985053e-05, + "loss": 0.1794, + "step": 15048 + }, + { + "epoch": 41.00544959128065, + "grad_norm": 4.891640663146973, + "learning_rate": 1.333386035349142e-05, + "loss": 0.2744, + "step": 15049 + }, + { + "epoch": 41.00817438692098, + "grad_norm": 5.161420822143555, + "learning_rate": 1.3333028333033791e-05, + "loss": 0.2648, + "step": 15050 + }, + { + "epoch": 41.01089918256131, + "grad_norm": 5.25761079788208, + "learning_rate": 1.3332196286618641e-05, + "loss": 0.1408, + "step": 15051 + }, + { + "epoch": 41.013623978201636, + "grad_norm": 5.3399481773376465, + "learning_rate": 1.3331364214252456e-05, + "loss": 0.1608, + "step": 15052 + }, + { + "epoch": 41.01634877384196, + "grad_norm": 4.414523601531982, + "learning_rate": 1.3330532115941714e-05, + "loss": 0.1297, + "step": 15053 + }, + { + "epoch": 41.01907356948229, + "grad_norm": 4.573468208312988, + "learning_rate": 1.3329699991692894e-05, + "loss": 0.2599, + "step": 15054 + }, + { + "epoch": 41.02179836512261, + "grad_norm": 5.290121555328369, + "learning_rate": 1.3328867841512481e-05, + "loss": 0.1638, + "step": 15055 + }, + { + "epoch": 41.02452316076294, + "grad_norm": 5.881246089935303, + "learning_rate": 1.3328035665406948e-05, + "loss": 0.157, + "step": 15056 + }, + { + "epoch": 41.02724795640327, + "grad_norm": 5.0966033935546875, + "learning_rate": 1.3327203463382786e-05, + "loss": 0.2493, + "step": 15057 + }, + { + "epoch": 41.0299727520436, + "grad_norm": 5.441526412963867, + "learning_rate": 1.3326371235446464e-05, + "loss": 0.2309, + "step": 15058 + }, + { + "epoch": 41.032697547683924, + "grad_norm": 7.732897758483887, + "learning_rate": 1.3325538981604475e-05, + "loss": 0.1622, + "step": 15059 + }, + { + "epoch": 41.03542234332425, + "grad_norm": 5.739369869232178, + "learning_rate": 1.332470670186329e-05, + "loss": 0.2691, + "step": 15060 + }, + { + "epoch": 41.038147138964575, + "grad_norm": 6.659055709838867, + "learning_rate": 1.3323874396229402e-05, + "loss": 0.1583, + "step": 15061 + }, + { + "epoch": 41.0408719346049, + "grad_norm": 11.251084327697754, + "learning_rate": 1.3323042064709285e-05, + "loss": 0.2757, + "step": 15062 + }, + { + "epoch": 41.043596730245234, + "grad_norm": 7.61301326751709, + "learning_rate": 1.3322209707309424e-05, + "loss": 0.3217, + "step": 15063 + }, + { + "epoch": 41.04632152588556, + "grad_norm": 5.039181709289551, + "learning_rate": 1.3321377324036297e-05, + "loss": 0.251, + "step": 15064 + }, + { + "epoch": 41.049046321525886, + "grad_norm": 6.336490631103516, + "learning_rate": 1.3320544914896396e-05, + "loss": 0.1705, + "step": 15065 + }, + { + "epoch": 41.05177111716621, + "grad_norm": 4.297523021697998, + "learning_rate": 1.3319712479896195e-05, + "loss": 0.1433, + "step": 15066 + }, + { + "epoch": 41.05449591280654, + "grad_norm": 5.132529258728027, + "learning_rate": 1.3318880019042179e-05, + "loss": 0.1973, + "step": 15067 + }, + { + "epoch": 41.05722070844686, + "grad_norm": 5.375813007354736, + "learning_rate": 1.3318047532340833e-05, + "loss": 0.18, + "step": 15068 + }, + { + "epoch": 41.059945504087196, + "grad_norm": 27.851383209228516, + "learning_rate": 1.3317215019798639e-05, + "loss": 0.2283, + "step": 15069 + }, + { + "epoch": 41.06267029972752, + "grad_norm": 5.794404029846191, + "learning_rate": 1.3316382481422081e-05, + "loss": 0.3191, + "step": 15070 + }, + { + "epoch": 41.06539509536785, + "grad_norm": 5.4679670333862305, + "learning_rate": 1.3315549917217647e-05, + "loss": 0.1392, + "step": 15071 + }, + { + "epoch": 41.06811989100817, + "grad_norm": 6.183343410491943, + "learning_rate": 1.3314717327191814e-05, + "loss": 0.2343, + "step": 15072 + }, + { + "epoch": 41.0708446866485, + "grad_norm": 5.130636215209961, + "learning_rate": 1.331388471135107e-05, + "loss": 0.3179, + "step": 15073 + }, + { + "epoch": 41.073569482288825, + "grad_norm": 4.36638879776001, + "learning_rate": 1.3313052069701896e-05, + "loss": 0.1996, + "step": 15074 + }, + { + "epoch": 41.07629427792916, + "grad_norm": 5.1475629806518555, + "learning_rate": 1.3312219402250781e-05, + "loss": 0.1936, + "step": 15075 + }, + { + "epoch": 41.079019073569484, + "grad_norm": 6.122947692871094, + "learning_rate": 1.3311386709004208e-05, + "loss": 0.2562, + "step": 15076 + }, + { + "epoch": 41.08174386920981, + "grad_norm": 7.6103386878967285, + "learning_rate": 1.3310553989968662e-05, + "loss": 0.2668, + "step": 15077 + }, + { + "epoch": 41.084468664850135, + "grad_norm": 5.603167533874512, + "learning_rate": 1.3309721245150627e-05, + "loss": 0.221, + "step": 15078 + }, + { + "epoch": 41.08719346049046, + "grad_norm": 6.73805046081543, + "learning_rate": 1.3308888474556591e-05, + "loss": 0.1863, + "step": 15079 + }, + { + "epoch": 41.08991825613079, + "grad_norm": 5.044631004333496, + "learning_rate": 1.3308055678193037e-05, + "loss": 0.2452, + "step": 15080 + }, + { + "epoch": 41.09264305177112, + "grad_norm": 5.798475742340088, + "learning_rate": 1.3307222856066452e-05, + "loss": 0.1698, + "step": 15081 + }, + { + "epoch": 41.095367847411445, + "grad_norm": 5.877731800079346, + "learning_rate": 1.3306390008183324e-05, + "loss": 0.2777, + "step": 15082 + }, + { + "epoch": 41.09809264305177, + "grad_norm": 7.005524635314941, + "learning_rate": 1.3305557134550133e-05, + "loss": 0.2625, + "step": 15083 + }, + { + "epoch": 41.1008174386921, + "grad_norm": 5.313305377960205, + "learning_rate": 1.3304724235173372e-05, + "loss": 0.2115, + "step": 15084 + }, + { + "epoch": 41.10354223433242, + "grad_norm": 5.591778755187988, + "learning_rate": 1.3303891310059528e-05, + "loss": 0.2092, + "step": 15085 + }, + { + "epoch": 41.10626702997275, + "grad_norm": 6.332198143005371, + "learning_rate": 1.3303058359215075e-05, + "loss": 0.2679, + "step": 15086 + }, + { + "epoch": 41.10899182561308, + "grad_norm": 5.046824932098389, + "learning_rate": 1.3302225382646518e-05, + "loss": 0.1625, + "step": 15087 + }, + { + "epoch": 41.11171662125341, + "grad_norm": 9.898218154907227, + "learning_rate": 1.3301392380360334e-05, + "loss": 0.2491, + "step": 15088 + }, + { + "epoch": 41.11444141689373, + "grad_norm": 6.03626012802124, + "learning_rate": 1.3300559352363015e-05, + "loss": 0.2215, + "step": 15089 + }, + { + "epoch": 41.11716621253406, + "grad_norm": 5.38420295715332, + "learning_rate": 1.3299726298661039e-05, + "loss": 0.1795, + "step": 15090 + }, + { + "epoch": 41.119891008174385, + "grad_norm": 6.802674293518066, + "learning_rate": 1.3298893219260909e-05, + "loss": 0.2123, + "step": 15091 + }, + { + "epoch": 41.12261580381471, + "grad_norm": 4.805606365203857, + "learning_rate": 1.32980601141691e-05, + "loss": 0.1599, + "step": 15092 + }, + { + "epoch": 41.12534059945504, + "grad_norm": 18.50775718688965, + "learning_rate": 1.3297226983392106e-05, + "loss": 0.1739, + "step": 15093 + }, + { + "epoch": 41.12806539509537, + "grad_norm": 4.983346939086914, + "learning_rate": 1.3296393826936416e-05, + "loss": 0.2814, + "step": 15094 + }, + { + "epoch": 41.130790190735695, + "grad_norm": 6.066840171813965, + "learning_rate": 1.3295560644808511e-05, + "loss": 0.2472, + "step": 15095 + }, + { + "epoch": 41.13351498637602, + "grad_norm": 5.6400017738342285, + "learning_rate": 1.3294727437014891e-05, + "loss": 0.2128, + "step": 15096 + }, + { + "epoch": 41.13623978201635, + "grad_norm": 6.294003486633301, + "learning_rate": 1.3293894203562041e-05, + "loss": 0.4346, + "step": 15097 + }, + { + "epoch": 41.13896457765667, + "grad_norm": 5.857290267944336, + "learning_rate": 1.3293060944456446e-05, + "loss": 0.3423, + "step": 15098 + }, + { + "epoch": 41.141689373297005, + "grad_norm": 5.681890487670898, + "learning_rate": 1.32922276597046e-05, + "loss": 0.2084, + "step": 15099 + }, + { + "epoch": 41.14441416893733, + "grad_norm": 7.933870315551758, + "learning_rate": 1.3291394349312989e-05, + "loss": 0.1554, + "step": 15100 + }, + { + "epoch": 41.14713896457766, + "grad_norm": 5.457008361816406, + "learning_rate": 1.3290561013288108e-05, + "loss": 0.2418, + "step": 15101 + }, + { + "epoch": 41.14986376021798, + "grad_norm": 6.152347564697266, + "learning_rate": 1.3289727651636439e-05, + "loss": 0.162, + "step": 15102 + }, + { + "epoch": 41.15258855585831, + "grad_norm": 6.3874664306640625, + "learning_rate": 1.328889426436448e-05, + "loss": 0.3618, + "step": 15103 + }, + { + "epoch": 41.155313351498634, + "grad_norm": 7.355878829956055, + "learning_rate": 1.328806085147872e-05, + "loss": 0.2442, + "step": 15104 + }, + { + "epoch": 41.15803814713897, + "grad_norm": 5.6302876472473145, + "learning_rate": 1.3287227412985644e-05, + "loss": 0.1831, + "step": 15105 + }, + { + "epoch": 41.16076294277929, + "grad_norm": 5.576440334320068, + "learning_rate": 1.3286393948891749e-05, + "loss": 0.3528, + "step": 15106 + }, + { + "epoch": 41.16348773841962, + "grad_norm": 9.891507148742676, + "learning_rate": 1.3285560459203524e-05, + "loss": 0.1704, + "step": 15107 + }, + { + "epoch": 41.166212534059945, + "grad_norm": 14.930198669433594, + "learning_rate": 1.3284726943927458e-05, + "loss": 0.2097, + "step": 15108 + }, + { + "epoch": 41.16893732970027, + "grad_norm": 7.592243671417236, + "learning_rate": 1.3283893403070044e-05, + "loss": 0.2157, + "step": 15109 + }, + { + "epoch": 41.171662125340596, + "grad_norm": 5.6844000816345215, + "learning_rate": 1.3283059836637775e-05, + "loss": 0.2903, + "step": 15110 + }, + { + "epoch": 41.17438692098093, + "grad_norm": 5.559866905212402, + "learning_rate": 1.3282226244637141e-05, + "loss": 0.2717, + "step": 15111 + }, + { + "epoch": 41.177111716621255, + "grad_norm": 5.3150434494018555, + "learning_rate": 1.3281392627074638e-05, + "loss": 0.1836, + "step": 15112 + }, + { + "epoch": 41.17983651226158, + "grad_norm": 4.613548755645752, + "learning_rate": 1.3280558983956753e-05, + "loss": 0.2416, + "step": 15113 + }, + { + "epoch": 41.182561307901906, + "grad_norm": 5.153605937957764, + "learning_rate": 1.3279725315289979e-05, + "loss": 0.1446, + "step": 15114 + }, + { + "epoch": 41.18528610354223, + "grad_norm": 5.514246940612793, + "learning_rate": 1.327889162108081e-05, + "loss": 0.3107, + "step": 15115 + }, + { + "epoch": 41.18801089918256, + "grad_norm": 7.106926441192627, + "learning_rate": 1.327805790133574e-05, + "loss": 0.2872, + "step": 15116 + }, + { + "epoch": 41.19073569482289, + "grad_norm": 6.395162582397461, + "learning_rate": 1.327722415606126e-05, + "loss": 0.1159, + "step": 15117 + }, + { + "epoch": 41.19346049046322, + "grad_norm": 7.043217658996582, + "learning_rate": 1.3276390385263862e-05, + "loss": 0.1785, + "step": 15118 + }, + { + "epoch": 41.19618528610354, + "grad_norm": 6.702186107635498, + "learning_rate": 1.3275556588950043e-05, + "loss": 0.2931, + "step": 15119 + }, + { + "epoch": 41.19891008174387, + "grad_norm": 5.641571998596191, + "learning_rate": 1.3274722767126294e-05, + "loss": 0.1619, + "step": 15120 + }, + { + "epoch": 41.201634877384194, + "grad_norm": 5.504769325256348, + "learning_rate": 1.3273888919799109e-05, + "loss": 0.2541, + "step": 15121 + }, + { + "epoch": 41.20435967302452, + "grad_norm": 6.530135631561279, + "learning_rate": 1.3273055046974984e-05, + "loss": 0.2569, + "step": 15122 + }, + { + "epoch": 41.20708446866485, + "grad_norm": 6.953867435455322, + "learning_rate": 1.3272221148660409e-05, + "loss": 0.1993, + "step": 15123 + }, + { + "epoch": 41.20980926430518, + "grad_norm": 5.282675266265869, + "learning_rate": 1.3271387224861885e-05, + "loss": 0.3132, + "step": 15124 + }, + { + "epoch": 41.212534059945504, + "grad_norm": 6.146264553070068, + "learning_rate": 1.3270553275585897e-05, + "loss": 0.1945, + "step": 15125 + }, + { + "epoch": 41.21525885558583, + "grad_norm": 6.121618270874023, + "learning_rate": 1.3269719300838952e-05, + "loss": 0.2037, + "step": 15126 + }, + { + "epoch": 41.217983651226156, + "grad_norm": 6.169727802276611, + "learning_rate": 1.3268885300627534e-05, + "loss": 0.1898, + "step": 15127 + }, + { + "epoch": 41.22070844686648, + "grad_norm": 7.4113383293151855, + "learning_rate": 1.3268051274958145e-05, + "loss": 0.2764, + "step": 15128 + }, + { + "epoch": 41.223433242506815, + "grad_norm": 7.6999688148498535, + "learning_rate": 1.3267217223837273e-05, + "loss": 0.2147, + "step": 15129 + }, + { + "epoch": 41.22615803814714, + "grad_norm": 24.69585418701172, + "learning_rate": 1.3266383147271422e-05, + "loss": 0.178, + "step": 15130 + }, + { + "epoch": 41.228882833787466, + "grad_norm": 5.99130392074585, + "learning_rate": 1.3265549045267085e-05, + "loss": 0.1981, + "step": 15131 + }, + { + "epoch": 41.23160762942779, + "grad_norm": 7.409508228302002, + "learning_rate": 1.3264714917830756e-05, + "loss": 0.2539, + "step": 15132 + }, + { + "epoch": 41.23433242506812, + "grad_norm": 5.927445411682129, + "learning_rate": 1.3263880764968933e-05, + "loss": 0.1674, + "step": 15133 + }, + { + "epoch": 41.237057220708444, + "grad_norm": 6.339357376098633, + "learning_rate": 1.326304658668811e-05, + "loss": 0.2224, + "step": 15134 + }, + { + "epoch": 41.23978201634878, + "grad_norm": 4.94216251373291, + "learning_rate": 1.3262212382994786e-05, + "loss": 0.1854, + "step": 15135 + }, + { + "epoch": 41.2425068119891, + "grad_norm": 5.53244161605835, + "learning_rate": 1.3261378153895459e-05, + "loss": 0.2227, + "step": 15136 + }, + { + "epoch": 41.24523160762943, + "grad_norm": 4.807004928588867, + "learning_rate": 1.3260543899396618e-05, + "loss": 0.1899, + "step": 15137 + }, + { + "epoch": 41.247956403269754, + "grad_norm": 5.70207405090332, + "learning_rate": 1.3259709619504772e-05, + "loss": 0.2131, + "step": 15138 + }, + { + "epoch": 41.25068119891008, + "grad_norm": 5.638994216918945, + "learning_rate": 1.3258875314226409e-05, + "loss": 0.2647, + "step": 15139 + }, + { + "epoch": 41.253405994550405, + "grad_norm": 5.902090549468994, + "learning_rate": 1.3258040983568035e-05, + "loss": 0.3854, + "step": 15140 + }, + { + "epoch": 41.25613079019074, + "grad_norm": 5.736852169036865, + "learning_rate": 1.3257206627536137e-05, + "loss": 0.3005, + "step": 15141 + }, + { + "epoch": 41.258855585831064, + "grad_norm": 5.480114936828613, + "learning_rate": 1.3256372246137223e-05, + "loss": 0.1725, + "step": 15142 + }, + { + "epoch": 41.26158038147139, + "grad_norm": 4.521186351776123, + "learning_rate": 1.3255537839377784e-05, + "loss": 0.1908, + "step": 15143 + }, + { + "epoch": 41.264305177111716, + "grad_norm": 5.752655506134033, + "learning_rate": 1.3254703407264322e-05, + "loss": 0.2556, + "step": 15144 + }, + { + "epoch": 41.26702997275204, + "grad_norm": 5.045345306396484, + "learning_rate": 1.3253868949803332e-05, + "loss": 0.1471, + "step": 15145 + }, + { + "epoch": 41.26975476839237, + "grad_norm": 4.824075222015381, + "learning_rate": 1.3253034467001319e-05, + "loss": 0.2457, + "step": 15146 + }, + { + "epoch": 41.2724795640327, + "grad_norm": 6.3114495277404785, + "learning_rate": 1.3252199958864775e-05, + "loss": 0.263, + "step": 15147 + }, + { + "epoch": 41.275204359673026, + "grad_norm": 6.216378211975098, + "learning_rate": 1.3251365425400205e-05, + "loss": 0.2134, + "step": 15148 + }, + { + "epoch": 41.27792915531335, + "grad_norm": 5.833584308624268, + "learning_rate": 1.3250530866614104e-05, + "loss": 0.2827, + "step": 15149 + }, + { + "epoch": 41.28065395095368, + "grad_norm": 5.205456256866455, + "learning_rate": 1.3249696282512976e-05, + "loss": 0.2104, + "step": 15150 + }, + { + "epoch": 41.283378746594, + "grad_norm": 5.878049850463867, + "learning_rate": 1.3248861673103315e-05, + "loss": 0.2962, + "step": 15151 + }, + { + "epoch": 41.28610354223433, + "grad_norm": 4.970963954925537, + "learning_rate": 1.3248027038391626e-05, + "loss": 0.1247, + "step": 15152 + }, + { + "epoch": 41.28882833787466, + "grad_norm": 7.160046100616455, + "learning_rate": 1.3247192378384406e-05, + "loss": 0.1987, + "step": 15153 + }, + { + "epoch": 41.29155313351499, + "grad_norm": 5.031962871551514, + "learning_rate": 1.3246357693088155e-05, + "loss": 0.3038, + "step": 15154 + }, + { + "epoch": 41.294277929155314, + "grad_norm": 6.0762104988098145, + "learning_rate": 1.3245522982509376e-05, + "loss": 0.226, + "step": 15155 + }, + { + "epoch": 41.29700272479564, + "grad_norm": 3.9628217220306396, + "learning_rate": 1.3244688246654569e-05, + "loss": 0.1666, + "step": 15156 + }, + { + "epoch": 41.299727520435965, + "grad_norm": 4.434725284576416, + "learning_rate": 1.3243853485530231e-05, + "loss": 0.4491, + "step": 15157 + }, + { + "epoch": 41.30245231607629, + "grad_norm": 6.514955997467041, + "learning_rate": 1.3243018699142871e-05, + "loss": 0.251, + "step": 15158 + }, + { + "epoch": 41.305177111716624, + "grad_norm": 5.702577590942383, + "learning_rate": 1.3242183887498983e-05, + "loss": 0.2284, + "step": 15159 + }, + { + "epoch": 41.30790190735695, + "grad_norm": 5.384641647338867, + "learning_rate": 1.3241349050605074e-05, + "loss": 0.1658, + "step": 15160 + }, + { + "epoch": 41.310626702997276, + "grad_norm": 4.907167911529541, + "learning_rate": 1.324051418846764e-05, + "loss": 0.2739, + "step": 15161 + }, + { + "epoch": 41.3133514986376, + "grad_norm": 5.377655506134033, + "learning_rate": 1.323967930109319e-05, + "loss": 0.1862, + "step": 15162 + }, + { + "epoch": 41.31607629427793, + "grad_norm": 5.394341945648193, + "learning_rate": 1.3238844388488215e-05, + "loss": 0.2562, + "step": 15163 + }, + { + "epoch": 41.31880108991825, + "grad_norm": 4.6092424392700195, + "learning_rate": 1.3238009450659228e-05, + "loss": 0.2982, + "step": 15164 + }, + { + "epoch": 41.321525885558586, + "grad_norm": 4.88956880569458, + "learning_rate": 1.3237174487612727e-05, + "loss": 0.1864, + "step": 15165 + }, + { + "epoch": 41.32425068119891, + "grad_norm": 5.869426727294922, + "learning_rate": 1.3236339499355217e-05, + "loss": 0.1928, + "step": 15166 + }, + { + "epoch": 41.32697547683924, + "grad_norm": 6.263637065887451, + "learning_rate": 1.3235504485893198e-05, + "loss": 0.1864, + "step": 15167 + }, + { + "epoch": 41.32970027247956, + "grad_norm": 4.82780122756958, + "learning_rate": 1.3234669447233175e-05, + "loss": 0.2086, + "step": 15168 + }, + { + "epoch": 41.33242506811989, + "grad_norm": 4.812079906463623, + "learning_rate": 1.323383438338165e-05, + "loss": 0.2209, + "step": 15169 + }, + { + "epoch": 41.335149863760215, + "grad_norm": 5.495488166809082, + "learning_rate": 1.3232999294345126e-05, + "loss": 0.2713, + "step": 15170 + }, + { + "epoch": 41.33787465940055, + "grad_norm": 6.937367916107178, + "learning_rate": 1.3232164180130108e-05, + "loss": 0.3763, + "step": 15171 + }, + { + "epoch": 41.34059945504087, + "grad_norm": 7.551480293273926, + "learning_rate": 1.3231329040743099e-05, + "loss": 0.275, + "step": 15172 + }, + { + "epoch": 41.3433242506812, + "grad_norm": 5.157136917114258, + "learning_rate": 1.3230493876190602e-05, + "loss": 0.1614, + "step": 15173 + }, + { + "epoch": 41.346049046321525, + "grad_norm": 9.280787467956543, + "learning_rate": 1.3229658686479128e-05, + "loss": 0.1954, + "step": 15174 + }, + { + "epoch": 41.34877384196185, + "grad_norm": 11.969324111938477, + "learning_rate": 1.322882347161517e-05, + "loss": 0.1795, + "step": 15175 + }, + { + "epoch": 41.35149863760218, + "grad_norm": 6.5450968742370605, + "learning_rate": 1.3227988231605242e-05, + "loss": 0.337, + "step": 15176 + }, + { + "epoch": 41.35422343324251, + "grad_norm": 4.671832084655762, + "learning_rate": 1.3227152966455844e-05, + "loss": 0.3085, + "step": 15177 + }, + { + "epoch": 41.356948228882835, + "grad_norm": 5.481117248535156, + "learning_rate": 1.3226317676173485e-05, + "loss": 0.2548, + "step": 15178 + }, + { + "epoch": 41.35967302452316, + "grad_norm": 6.210432529449463, + "learning_rate": 1.3225482360764666e-05, + "loss": 0.2514, + "step": 15179 + }, + { + "epoch": 41.36239782016349, + "grad_norm": 3.732023239135742, + "learning_rate": 1.3224647020235894e-05, + "loss": 0.2427, + "step": 15180 + }, + { + "epoch": 41.36512261580381, + "grad_norm": 4.857550144195557, + "learning_rate": 1.3223811654593677e-05, + "loss": 0.199, + "step": 15181 + }, + { + "epoch": 41.36784741144414, + "grad_norm": 7.312856674194336, + "learning_rate": 1.3222976263844517e-05, + "loss": 0.2503, + "step": 15182 + }, + { + "epoch": 41.37057220708447, + "grad_norm": 5.666393756866455, + "learning_rate": 1.3222140847994917e-05, + "loss": 0.2112, + "step": 15183 + }, + { + "epoch": 41.3732970027248, + "grad_norm": 7.047507286071777, + "learning_rate": 1.3221305407051395e-05, + "loss": 0.3018, + "step": 15184 + }, + { + "epoch": 41.37602179836512, + "grad_norm": 6.197628021240234, + "learning_rate": 1.3220469941020447e-05, + "loss": 0.2899, + "step": 15185 + }, + { + "epoch": 41.37874659400545, + "grad_norm": 5.384599685668945, + "learning_rate": 1.3219634449908585e-05, + "loss": 0.3897, + "step": 15186 + }, + { + "epoch": 41.381471389645775, + "grad_norm": 5.311314582824707, + "learning_rate": 1.321879893372231e-05, + "loss": 0.2588, + "step": 15187 + }, + { + "epoch": 41.3841961852861, + "grad_norm": 5.707054138183594, + "learning_rate": 1.3217963392468135e-05, + "loss": 0.2493, + "step": 15188 + }, + { + "epoch": 41.38692098092643, + "grad_norm": 8.608099937438965, + "learning_rate": 1.3217127826152563e-05, + "loss": 0.2018, + "step": 15189 + }, + { + "epoch": 41.38964577656676, + "grad_norm": 5.823888778686523, + "learning_rate": 1.3216292234782104e-05, + "loss": 0.202, + "step": 15190 + }, + { + "epoch": 41.392370572207085, + "grad_norm": 5.694127082824707, + "learning_rate": 1.3215456618363264e-05, + "loss": 0.3065, + "step": 15191 + }, + { + "epoch": 41.39509536784741, + "grad_norm": 4.225665092468262, + "learning_rate": 1.3214620976902553e-05, + "loss": 0.1481, + "step": 15192 + }, + { + "epoch": 41.39782016348774, + "grad_norm": 7.366786003112793, + "learning_rate": 1.3213785310406477e-05, + "loss": 0.2728, + "step": 15193 + }, + { + "epoch": 41.40054495912806, + "grad_norm": 5.030938148498535, + "learning_rate": 1.321294961888154e-05, + "loss": 0.217, + "step": 15194 + }, + { + "epoch": 41.403269754768395, + "grad_norm": 4.735142230987549, + "learning_rate": 1.321211390233426e-05, + "loss": 0.1598, + "step": 15195 + }, + { + "epoch": 41.40599455040872, + "grad_norm": 4.333200931549072, + "learning_rate": 1.321127816077114e-05, + "loss": 0.2, + "step": 15196 + }, + { + "epoch": 41.40871934604905, + "grad_norm": 5.632680892944336, + "learning_rate": 1.3210442394198686e-05, + "loss": 0.1638, + "step": 15197 + }, + { + "epoch": 41.41144414168937, + "grad_norm": 6.012128829956055, + "learning_rate": 1.3209606602623411e-05, + "loss": 0.1948, + "step": 15198 + }, + { + "epoch": 41.4141689373297, + "grad_norm": 4.546900272369385, + "learning_rate": 1.3208770786051826e-05, + "loss": 0.1966, + "step": 15199 + }, + { + "epoch": 41.416893732970024, + "grad_norm": 4.972142219543457, + "learning_rate": 1.3207934944490433e-05, + "loss": 0.1824, + "step": 15200 + }, + { + "epoch": 41.41961852861036, + "grad_norm": 6.288185119628906, + "learning_rate": 1.3207099077945749e-05, + "loss": 0.2804, + "step": 15201 + }, + { + "epoch": 41.42234332425068, + "grad_norm": 5.620209217071533, + "learning_rate": 1.3206263186424279e-05, + "loss": 0.2924, + "step": 15202 + }, + { + "epoch": 41.42506811989101, + "grad_norm": 4.958395481109619, + "learning_rate": 1.3205427269932535e-05, + "loss": 0.2925, + "step": 15203 + }, + { + "epoch": 41.427792915531334, + "grad_norm": 4.600726127624512, + "learning_rate": 1.3204591328477028e-05, + "loss": 0.3718, + "step": 15204 + }, + { + "epoch": 41.43051771117166, + "grad_norm": 4.540500640869141, + "learning_rate": 1.3203755362064263e-05, + "loss": 0.17, + "step": 15205 + }, + { + "epoch": 41.433242506811986, + "grad_norm": 8.953529357910156, + "learning_rate": 1.3202919370700758e-05, + "loss": 0.2036, + "step": 15206 + }, + { + "epoch": 41.43596730245232, + "grad_norm": 3.953489065170288, + "learning_rate": 1.3202083354393019e-05, + "loss": 0.1904, + "step": 15207 + }, + { + "epoch": 41.438692098092645, + "grad_norm": 5.842988967895508, + "learning_rate": 1.3201247313147559e-05, + "loss": 0.2263, + "step": 15208 + }, + { + "epoch": 41.44141689373297, + "grad_norm": 5.583596706390381, + "learning_rate": 1.3200411246970885e-05, + "loss": 0.208, + "step": 15209 + }, + { + "epoch": 41.444141689373296, + "grad_norm": 4.909837245941162, + "learning_rate": 1.3199575155869514e-05, + "loss": 0.1663, + "step": 15210 + }, + { + "epoch": 41.44686648501362, + "grad_norm": 5.328984260559082, + "learning_rate": 1.3198739039849955e-05, + "loss": 0.3241, + "step": 15211 + }, + { + "epoch": 41.44959128065395, + "grad_norm": 6.674950122833252, + "learning_rate": 1.3197902898918718e-05, + "loss": 0.4411, + "step": 15212 + }, + { + "epoch": 41.45231607629428, + "grad_norm": 5.948317050933838, + "learning_rate": 1.3197066733082316e-05, + "loss": 0.1893, + "step": 15213 + }, + { + "epoch": 41.45504087193461, + "grad_norm": 4.927055835723877, + "learning_rate": 1.3196230542347259e-05, + "loss": 0.1572, + "step": 15214 + }, + { + "epoch": 41.45776566757493, + "grad_norm": 4.261422157287598, + "learning_rate": 1.3195394326720063e-05, + "loss": 0.2113, + "step": 15215 + }, + { + "epoch": 41.46049046321526, + "grad_norm": 5.302755355834961, + "learning_rate": 1.3194558086207238e-05, + "loss": 0.3796, + "step": 15216 + }, + { + "epoch": 41.463215258855584, + "grad_norm": 5.816093921661377, + "learning_rate": 1.3193721820815302e-05, + "loss": 0.2574, + "step": 15217 + }, + { + "epoch": 41.46594005449591, + "grad_norm": 4.7682600021362305, + "learning_rate": 1.3192885530550758e-05, + "loss": 0.5291, + "step": 15218 + }, + { + "epoch": 41.46866485013624, + "grad_norm": 7.575376987457275, + "learning_rate": 1.3192049215420129e-05, + "loss": 0.3073, + "step": 15219 + }, + { + "epoch": 41.47138964577657, + "grad_norm": 5.825736999511719, + "learning_rate": 1.319121287542992e-05, + "loss": 0.228, + "step": 15220 + }, + { + "epoch": 41.474114441416894, + "grad_norm": 5.374505519866943, + "learning_rate": 1.319037651058665e-05, + "loss": 0.3985, + "step": 15221 + }, + { + "epoch": 41.47683923705722, + "grad_norm": 5.100955009460449, + "learning_rate": 1.3189540120896829e-05, + "loss": 0.2792, + "step": 15222 + }, + { + "epoch": 41.479564032697546, + "grad_norm": 5.804059982299805, + "learning_rate": 1.318870370636697e-05, + "loss": 0.0899, + "step": 15223 + }, + { + "epoch": 41.48228882833787, + "grad_norm": 5.3307061195373535, + "learning_rate": 1.3187867267003592e-05, + "loss": 0.3647, + "step": 15224 + }, + { + "epoch": 41.485013623978205, + "grad_norm": 6.556344985961914, + "learning_rate": 1.3187030802813206e-05, + "loss": 0.3535, + "step": 15225 + }, + { + "epoch": 41.48773841961853, + "grad_norm": 5.337364673614502, + "learning_rate": 1.3186194313802325e-05, + "loss": 0.1569, + "step": 15226 + }, + { + "epoch": 41.490463215258856, + "grad_norm": 4.980561256408691, + "learning_rate": 1.318535779997747e-05, + "loss": 0.2563, + "step": 15227 + }, + { + "epoch": 41.49318801089918, + "grad_norm": 6.962838649749756, + "learning_rate": 1.3184521261345146e-05, + "loss": 0.3742, + "step": 15228 + }, + { + "epoch": 41.49591280653951, + "grad_norm": 5.183857440948486, + "learning_rate": 1.3183684697911875e-05, + "loss": 0.2242, + "step": 15229 + }, + { + "epoch": 41.49863760217983, + "grad_norm": 7.675213813781738, + "learning_rate": 1.318284810968417e-05, + "loss": 0.3745, + "step": 15230 + }, + { + "epoch": 41.50136239782017, + "grad_norm": 5.953858852386475, + "learning_rate": 1.3182011496668548e-05, + "loss": 0.2852, + "step": 15231 + }, + { + "epoch": 41.50408719346049, + "grad_norm": 6.068861484527588, + "learning_rate": 1.3181174858871517e-05, + "loss": 0.2057, + "step": 15232 + }, + { + "epoch": 41.50681198910082, + "grad_norm": 7.253425121307373, + "learning_rate": 1.3180338196299603e-05, + "loss": 0.1679, + "step": 15233 + }, + { + "epoch": 41.509536784741144, + "grad_norm": 4.526234149932861, + "learning_rate": 1.3179501508959315e-05, + "loss": 0.2014, + "step": 15234 + }, + { + "epoch": 41.51226158038147, + "grad_norm": 5.607563495635986, + "learning_rate": 1.3178664796857176e-05, + "loss": 0.2669, + "step": 15235 + }, + { + "epoch": 41.514986376021795, + "grad_norm": 6.936614990234375, + "learning_rate": 1.3177828059999695e-05, + "loss": 0.2768, + "step": 15236 + }, + { + "epoch": 41.51771117166213, + "grad_norm": 5.585014820098877, + "learning_rate": 1.3176991298393393e-05, + "loss": 0.3114, + "step": 15237 + }, + { + "epoch": 41.520435967302454, + "grad_norm": 5.922313213348389, + "learning_rate": 1.3176154512044783e-05, + "loss": 0.237, + "step": 15238 + }, + { + "epoch": 41.52316076294278, + "grad_norm": 4.764875411987305, + "learning_rate": 1.3175317700960386e-05, + "loss": 0.3261, + "step": 15239 + }, + { + "epoch": 41.525885558583106, + "grad_norm": 5.3954758644104, + "learning_rate": 1.3174480865146712e-05, + "loss": 0.3271, + "step": 15240 + }, + { + "epoch": 41.52861035422343, + "grad_norm": 4.896951198577881, + "learning_rate": 1.317364400461029e-05, + "loss": 0.4214, + "step": 15241 + }, + { + "epoch": 41.53133514986376, + "grad_norm": 9.775511741638184, + "learning_rate": 1.3172807119357625e-05, + "loss": 0.2403, + "step": 15242 + }, + { + "epoch": 41.53405994550409, + "grad_norm": 4.736580848693848, + "learning_rate": 1.3171970209395243e-05, + "loss": 0.247, + "step": 15243 + }, + { + "epoch": 41.536784741144416, + "grad_norm": 5.65787410736084, + "learning_rate": 1.317113327472966e-05, + "loss": 0.3753, + "step": 15244 + }, + { + "epoch": 41.53950953678474, + "grad_norm": 5.568493366241455, + "learning_rate": 1.3170296315367392e-05, + "loss": 0.1749, + "step": 15245 + }, + { + "epoch": 41.54223433242507, + "grad_norm": 4.574891090393066, + "learning_rate": 1.3169459331314958e-05, + "loss": 0.2714, + "step": 15246 + }, + { + "epoch": 41.54495912806539, + "grad_norm": 5.970724582672119, + "learning_rate": 1.3168622322578879e-05, + "loss": 0.1911, + "step": 15247 + }, + { + "epoch": 41.54768392370572, + "grad_norm": 4.580286026000977, + "learning_rate": 1.316778528916567e-05, + "loss": 0.1701, + "step": 15248 + }, + { + "epoch": 41.55040871934605, + "grad_norm": 6.1775336265563965, + "learning_rate": 1.3166948231081849e-05, + "loss": 0.2282, + "step": 15249 + }, + { + "epoch": 41.55313351498638, + "grad_norm": 4.816786289215088, + "learning_rate": 1.3166111148333935e-05, + "loss": 0.1585, + "step": 15250 + }, + { + "epoch": 41.555858310626704, + "grad_norm": 4.877140998840332, + "learning_rate": 1.3165274040928456e-05, + "loss": 0.2069, + "step": 15251 + }, + { + "epoch": 41.55858310626703, + "grad_norm": 5.608216762542725, + "learning_rate": 1.316443690887192e-05, + "loss": 0.2691, + "step": 15252 + }, + { + "epoch": 41.561307901907355, + "grad_norm": 5.537759780883789, + "learning_rate": 1.3163599752170852e-05, + "loss": 0.2128, + "step": 15253 + }, + { + "epoch": 41.56403269754768, + "grad_norm": 8.375011444091797, + "learning_rate": 1.3162762570831773e-05, + "loss": 0.1543, + "step": 15254 + }, + { + "epoch": 41.566757493188014, + "grad_norm": 5.1054816246032715, + "learning_rate": 1.31619253648612e-05, + "loss": 0.173, + "step": 15255 + }, + { + "epoch": 41.56948228882834, + "grad_norm": 4.622839450836182, + "learning_rate": 1.3161088134265651e-05, + "loss": 0.2326, + "step": 15256 + }, + { + "epoch": 41.572207084468666, + "grad_norm": 5.541858673095703, + "learning_rate": 1.3160250879051655e-05, + "loss": 0.2054, + "step": 15257 + }, + { + "epoch": 41.57493188010899, + "grad_norm": 5.578751087188721, + "learning_rate": 1.315941359922572e-05, + "loss": 0.2286, + "step": 15258 + }, + { + "epoch": 41.57765667574932, + "grad_norm": 5.844489574432373, + "learning_rate": 1.3158576294794378e-05, + "loss": 0.2263, + "step": 15259 + }, + { + "epoch": 41.58038147138964, + "grad_norm": 6.654881477355957, + "learning_rate": 1.3157738965764146e-05, + "loss": 0.501, + "step": 15260 + }, + { + "epoch": 41.583106267029976, + "grad_norm": 5.959126949310303, + "learning_rate": 1.3156901612141543e-05, + "loss": 0.2935, + "step": 15261 + }, + { + "epoch": 41.5858310626703, + "grad_norm": 5.3083415031433105, + "learning_rate": 1.3156064233933093e-05, + "loss": 0.1636, + "step": 15262 + }, + { + "epoch": 41.58855585831063, + "grad_norm": 7.250215530395508, + "learning_rate": 1.3155226831145316e-05, + "loss": 0.2337, + "step": 15263 + }, + { + "epoch": 41.59128065395095, + "grad_norm": 5.6582417488098145, + "learning_rate": 1.3154389403784733e-05, + "loss": 0.1862, + "step": 15264 + }, + { + "epoch": 41.59400544959128, + "grad_norm": 4.778441905975342, + "learning_rate": 1.3153551951857869e-05, + "loss": 0.298, + "step": 15265 + }, + { + "epoch": 41.596730245231605, + "grad_norm": 5.2142839431762695, + "learning_rate": 1.315271447537124e-05, + "loss": 0.2852, + "step": 15266 + }, + { + "epoch": 41.59945504087194, + "grad_norm": 4.115604877471924, + "learning_rate": 1.3151876974331375e-05, + "loss": 0.1143, + "step": 15267 + }, + { + "epoch": 41.60217983651226, + "grad_norm": 7.301044464111328, + "learning_rate": 1.3151039448744794e-05, + "loss": 0.2248, + "step": 15268 + }, + { + "epoch": 41.60490463215259, + "grad_norm": 4.621791839599609, + "learning_rate": 1.3150201898618019e-05, + "loss": 0.32, + "step": 15269 + }, + { + "epoch": 41.607629427792915, + "grad_norm": 6.88387393951416, + "learning_rate": 1.314936432395757e-05, + "loss": 0.2261, + "step": 15270 + }, + { + "epoch": 41.61035422343324, + "grad_norm": 4.959455490112305, + "learning_rate": 1.3148526724769976e-05, + "loss": 0.1509, + "step": 15271 + }, + { + "epoch": 41.61307901907357, + "grad_norm": 6.008310317993164, + "learning_rate": 1.3147689101061755e-05, + "loss": 0.4298, + "step": 15272 + }, + { + "epoch": 41.6158038147139, + "grad_norm": 5.80253267288208, + "learning_rate": 1.3146851452839435e-05, + "loss": 0.1591, + "step": 15273 + }, + { + "epoch": 41.618528610354225, + "grad_norm": 5.511794567108154, + "learning_rate": 1.3146013780109536e-05, + "loss": 0.244, + "step": 15274 + }, + { + "epoch": 41.62125340599455, + "grad_norm": 4.241323947906494, + "learning_rate": 1.3145176082878584e-05, + "loss": 0.1746, + "step": 15275 + }, + { + "epoch": 41.62397820163488, + "grad_norm": 5.244009494781494, + "learning_rate": 1.3144338361153101e-05, + "loss": 0.2232, + "step": 15276 + }, + { + "epoch": 41.6267029972752, + "grad_norm": 5.850700378417969, + "learning_rate": 1.314350061493961e-05, + "loss": 0.316, + "step": 15277 + }, + { + "epoch": 41.62942779291553, + "grad_norm": 5.898186683654785, + "learning_rate": 1.314266284424464e-05, + "loss": 0.3151, + "step": 15278 + }, + { + "epoch": 41.63215258855586, + "grad_norm": 7.902008533477783, + "learning_rate": 1.3141825049074712e-05, + "loss": 0.2866, + "step": 15279 + }, + { + "epoch": 41.63487738419619, + "grad_norm": 4.587899208068848, + "learning_rate": 1.3140987229436353e-05, + "loss": 0.2135, + "step": 15280 + }, + { + "epoch": 41.63760217983651, + "grad_norm": 4.991730213165283, + "learning_rate": 1.3140149385336085e-05, + "loss": 0.2355, + "step": 15281 + }, + { + "epoch": 41.64032697547684, + "grad_norm": 5.29056978225708, + "learning_rate": 1.3139311516780435e-05, + "loss": 0.3366, + "step": 15282 + }, + { + "epoch": 41.643051771117165, + "grad_norm": 4.8959269523620605, + "learning_rate": 1.3138473623775927e-05, + "loss": 0.242, + "step": 15283 + }, + { + "epoch": 41.64577656675749, + "grad_norm": 4.812049865722656, + "learning_rate": 1.3137635706329091e-05, + "loss": 0.2605, + "step": 15284 + }, + { + "epoch": 41.64850136239782, + "grad_norm": 5.69114875793457, + "learning_rate": 1.3136797764446445e-05, + "loss": 0.2483, + "step": 15285 + }, + { + "epoch": 41.65122615803815, + "grad_norm": 4.23663330078125, + "learning_rate": 1.3135959798134522e-05, + "loss": 0.1755, + "step": 15286 + }, + { + "epoch": 41.653950953678475, + "grad_norm": 5.8705153465271, + "learning_rate": 1.3135121807399842e-05, + "loss": 0.2071, + "step": 15287 + }, + { + "epoch": 41.6566757493188, + "grad_norm": 4.611892223358154, + "learning_rate": 1.3134283792248939e-05, + "loss": 0.1189, + "step": 15288 + }, + { + "epoch": 41.65940054495913, + "grad_norm": 6.163382530212402, + "learning_rate": 1.3133445752688329e-05, + "loss": 0.2847, + "step": 15289 + }, + { + "epoch": 41.66212534059945, + "grad_norm": 4.534838676452637, + "learning_rate": 1.3132607688724547e-05, + "loss": 0.1187, + "step": 15290 + }, + { + "epoch": 41.664850136239785, + "grad_norm": 5.232635498046875, + "learning_rate": 1.3131769600364117e-05, + "loss": 0.2185, + "step": 15291 + }, + { + "epoch": 41.66757493188011, + "grad_norm": 4.810821056365967, + "learning_rate": 1.3130931487613566e-05, + "loss": 0.1955, + "step": 15292 + }, + { + "epoch": 41.67029972752044, + "grad_norm": 5.155076026916504, + "learning_rate": 1.313009335047942e-05, + "loss": 0.2985, + "step": 15293 + }, + { + "epoch": 41.67302452316076, + "grad_norm": 5.9662604331970215, + "learning_rate": 1.312925518896821e-05, + "loss": 0.1742, + "step": 15294 + }, + { + "epoch": 41.67574931880109, + "grad_norm": 6.306094646453857, + "learning_rate": 1.312841700308646e-05, + "loss": 0.2366, + "step": 15295 + }, + { + "epoch": 41.678474114441414, + "grad_norm": 9.599309921264648, + "learning_rate": 1.31275787928407e-05, + "loss": 0.285, + "step": 15296 + }, + { + "epoch": 41.68119891008175, + "grad_norm": 7.673811435699463, + "learning_rate": 1.3126740558237459e-05, + "loss": 0.3566, + "step": 15297 + }, + { + "epoch": 41.68392370572207, + "grad_norm": 5.701015949249268, + "learning_rate": 1.312590229928326e-05, + "loss": 0.2245, + "step": 15298 + }, + { + "epoch": 41.6866485013624, + "grad_norm": 5.403347015380859, + "learning_rate": 1.3125064015984634e-05, + "loss": 0.288, + "step": 15299 + }, + { + "epoch": 41.689373297002724, + "grad_norm": 5.293545722961426, + "learning_rate": 1.3124225708348113e-05, + "loss": 0.2547, + "step": 15300 + }, + { + "epoch": 41.69209809264305, + "grad_norm": 5.065179347991943, + "learning_rate": 1.3123387376380218e-05, + "loss": 0.3229, + "step": 15301 + }, + { + "epoch": 41.694822888283376, + "grad_norm": 4.2079644203186035, + "learning_rate": 1.3122549020087487e-05, + "loss": 0.185, + "step": 15302 + }, + { + "epoch": 41.69754768392371, + "grad_norm": 5.518126964569092, + "learning_rate": 1.3121710639476444e-05, + "loss": 0.1744, + "step": 15303 + }, + { + "epoch": 41.700272479564035, + "grad_norm": 7.460519313812256, + "learning_rate": 1.3120872234553618e-05, + "loss": 0.306, + "step": 15304 + }, + { + "epoch": 41.70299727520436, + "grad_norm": 67.50646209716797, + "learning_rate": 1.3120033805325541e-05, + "loss": 0.2707, + "step": 15305 + }, + { + "epoch": 41.705722070844686, + "grad_norm": 5.967147350311279, + "learning_rate": 1.3119195351798742e-05, + "loss": 0.2522, + "step": 15306 + }, + { + "epoch": 41.70844686648501, + "grad_norm": 6.045979976654053, + "learning_rate": 1.3118356873979745e-05, + "loss": 0.2151, + "step": 15307 + }, + { + "epoch": 41.71117166212534, + "grad_norm": 10.25633716583252, + "learning_rate": 1.3117518371875091e-05, + "loss": 0.3222, + "step": 15308 + }, + { + "epoch": 41.71389645776567, + "grad_norm": 9.394362449645996, + "learning_rate": 1.3116679845491298e-05, + "loss": 0.2045, + "step": 15309 + }, + { + "epoch": 41.716621253406, + "grad_norm": 12.04206371307373, + "learning_rate": 1.3115841294834908e-05, + "loss": 0.2087, + "step": 15310 + }, + { + "epoch": 41.71934604904632, + "grad_norm": 6.293303966522217, + "learning_rate": 1.3115002719912443e-05, + "loss": 0.1517, + "step": 15311 + }, + { + "epoch": 41.72207084468665, + "grad_norm": 5.3646087646484375, + "learning_rate": 1.3114164120730439e-05, + "loss": 0.371, + "step": 15312 + }, + { + "epoch": 41.724795640326974, + "grad_norm": 8.045680046081543, + "learning_rate": 1.3113325497295424e-05, + "loss": 0.34, + "step": 15313 + }, + { + "epoch": 41.7275204359673, + "grad_norm": 6.927548885345459, + "learning_rate": 1.3112486849613933e-05, + "loss": 0.14, + "step": 15314 + }, + { + "epoch": 41.73024523160763, + "grad_norm": 6.970993518829346, + "learning_rate": 1.311164817769249e-05, + "loss": 0.1973, + "step": 15315 + }, + { + "epoch": 41.73297002724796, + "grad_norm": 5.929052352905273, + "learning_rate": 1.3110809481537637e-05, + "loss": 0.3159, + "step": 15316 + }, + { + "epoch": 41.735694822888284, + "grad_norm": 6.026272296905518, + "learning_rate": 1.3109970761155895e-05, + "loss": 0.3716, + "step": 15317 + }, + { + "epoch": 41.73841961852861, + "grad_norm": 5.031559944152832, + "learning_rate": 1.31091320165538e-05, + "loss": 0.2368, + "step": 15318 + }, + { + "epoch": 41.741144414168936, + "grad_norm": 5.375189304351807, + "learning_rate": 1.3108293247737886e-05, + "loss": 0.2339, + "step": 15319 + }, + { + "epoch": 41.74386920980926, + "grad_norm": 10.033079147338867, + "learning_rate": 1.3107454454714686e-05, + "loss": 0.1756, + "step": 15320 + }, + { + "epoch": 41.746594005449595, + "grad_norm": 7.099547863006592, + "learning_rate": 1.310661563749073e-05, + "loss": 0.2812, + "step": 15321 + }, + { + "epoch": 41.74931880108992, + "grad_norm": 6.8617048263549805, + "learning_rate": 1.3105776796072554e-05, + "loss": 0.3354, + "step": 15322 + }, + { + "epoch": 41.752043596730246, + "grad_norm": 6.954360485076904, + "learning_rate": 1.3104937930466684e-05, + "loss": 0.1971, + "step": 15323 + }, + { + "epoch": 41.75476839237057, + "grad_norm": 5.201631546020508, + "learning_rate": 1.3104099040679658e-05, + "loss": 0.2502, + "step": 15324 + }, + { + "epoch": 41.7574931880109, + "grad_norm": 6.470422267913818, + "learning_rate": 1.3103260126718009e-05, + "loss": 0.3214, + "step": 15325 + }, + { + "epoch": 41.76021798365122, + "grad_norm": 5.426015853881836, + "learning_rate": 1.310242118858827e-05, + "loss": 0.1899, + "step": 15326 + }, + { + "epoch": 41.762942779291556, + "grad_norm": 6.195144176483154, + "learning_rate": 1.3101582226296974e-05, + "loss": 0.2476, + "step": 15327 + }, + { + "epoch": 41.76566757493188, + "grad_norm": 5.391987323760986, + "learning_rate": 1.310074323985066e-05, + "loss": 0.2142, + "step": 15328 + }, + { + "epoch": 41.76839237057221, + "grad_norm": 7.920438766479492, + "learning_rate": 1.3099904229255853e-05, + "loss": 0.194, + "step": 15329 + }, + { + "epoch": 41.771117166212534, + "grad_norm": 5.797364711761475, + "learning_rate": 1.3099065194519094e-05, + "loss": 0.202, + "step": 15330 + }, + { + "epoch": 41.77384196185286, + "grad_norm": 6.113834381103516, + "learning_rate": 1.3098226135646913e-05, + "loss": 0.3482, + "step": 15331 + }, + { + "epoch": 41.776566757493185, + "grad_norm": 5.577930927276611, + "learning_rate": 1.3097387052645848e-05, + "loss": 0.3937, + "step": 15332 + }, + { + "epoch": 41.77929155313352, + "grad_norm": 5.87706184387207, + "learning_rate": 1.3096547945522431e-05, + "loss": 0.226, + "step": 15333 + }, + { + "epoch": 41.782016348773844, + "grad_norm": 8.071033477783203, + "learning_rate": 1.3095708814283199e-05, + "loss": 0.1975, + "step": 15334 + }, + { + "epoch": 41.78474114441417, + "grad_norm": 14.369377136230469, + "learning_rate": 1.3094869658934684e-05, + "loss": 0.2438, + "step": 15335 + }, + { + "epoch": 41.787465940054496, + "grad_norm": 7.034031391143799, + "learning_rate": 1.3094030479483428e-05, + "loss": 0.1746, + "step": 15336 + }, + { + "epoch": 41.79019073569482, + "grad_norm": 6.4937920570373535, + "learning_rate": 1.3093191275935957e-05, + "loss": 0.1385, + "step": 15337 + }, + { + "epoch": 41.79291553133515, + "grad_norm": 6.9117207527160645, + "learning_rate": 1.3092352048298817e-05, + "loss": 0.2037, + "step": 15338 + }, + { + "epoch": 41.79564032697548, + "grad_norm": 4.784533977508545, + "learning_rate": 1.3091512796578536e-05, + "loss": 0.1467, + "step": 15339 + }, + { + "epoch": 41.798365122615806, + "grad_norm": 7.152564525604248, + "learning_rate": 1.3090673520781656e-05, + "loss": 0.1942, + "step": 15340 + }, + { + "epoch": 41.80108991825613, + "grad_norm": 6.839911937713623, + "learning_rate": 1.3089834220914708e-05, + "loss": 0.1905, + "step": 15341 + }, + { + "epoch": 41.80381471389646, + "grad_norm": 7.334344387054443, + "learning_rate": 1.308899489698423e-05, + "loss": 0.1861, + "step": 15342 + }, + { + "epoch": 41.80653950953678, + "grad_norm": 6.282195568084717, + "learning_rate": 1.308815554899676e-05, + "loss": 0.2075, + "step": 15343 + }, + { + "epoch": 41.80926430517711, + "grad_norm": 5.372369289398193, + "learning_rate": 1.3087316176958831e-05, + "loss": 0.3172, + "step": 15344 + }, + { + "epoch": 41.81198910081744, + "grad_norm": 4.968111038208008, + "learning_rate": 1.3086476780876984e-05, + "loss": 0.2896, + "step": 15345 + }, + { + "epoch": 41.81471389645777, + "grad_norm": 5.8525776863098145, + "learning_rate": 1.308563736075776e-05, + "loss": 0.2248, + "step": 15346 + }, + { + "epoch": 41.817438692098094, + "grad_norm": 5.676025390625, + "learning_rate": 1.3084797916607685e-05, + "loss": 0.2509, + "step": 15347 + }, + { + "epoch": 41.82016348773842, + "grad_norm": 4.851386070251465, + "learning_rate": 1.3083958448433309e-05, + "loss": 0.2982, + "step": 15348 + }, + { + "epoch": 41.822888283378745, + "grad_norm": 6.4344916343688965, + "learning_rate": 1.308311895624116e-05, + "loss": 0.2299, + "step": 15349 + }, + { + "epoch": 41.82561307901907, + "grad_norm": 6.615203380584717, + "learning_rate": 1.3082279440037781e-05, + "loss": 0.2948, + "step": 15350 + }, + { + "epoch": 41.828337874659404, + "grad_norm": 5.562697887420654, + "learning_rate": 1.3081439899829708e-05, + "loss": 0.1624, + "step": 15351 + }, + { + "epoch": 41.83106267029973, + "grad_norm": 12.665985107421875, + "learning_rate": 1.3080600335623481e-05, + "loss": 0.3642, + "step": 15352 + }, + { + "epoch": 41.833787465940055, + "grad_norm": 6.387678146362305, + "learning_rate": 1.3079760747425639e-05, + "loss": 0.2876, + "step": 15353 + }, + { + "epoch": 41.83651226158038, + "grad_norm": 6.966700553894043, + "learning_rate": 1.3078921135242717e-05, + "loss": 0.3378, + "step": 15354 + }, + { + "epoch": 41.83923705722071, + "grad_norm": 6.500558376312256, + "learning_rate": 1.307808149908126e-05, + "loss": 0.2065, + "step": 15355 + }, + { + "epoch": 41.84196185286103, + "grad_norm": 5.680296897888184, + "learning_rate": 1.3077241838947799e-05, + "loss": 0.1368, + "step": 15356 + }, + { + "epoch": 41.844686648501366, + "grad_norm": 6.377245903015137, + "learning_rate": 1.307640215484888e-05, + "loss": 0.203, + "step": 15357 + }, + { + "epoch": 41.84741144414169, + "grad_norm": 22.68838119506836, + "learning_rate": 1.3075562446791042e-05, + "loss": 0.1714, + "step": 15358 + }, + { + "epoch": 41.85013623978202, + "grad_norm": 8.626298904418945, + "learning_rate": 1.3074722714780817e-05, + "loss": 0.2568, + "step": 15359 + }, + { + "epoch": 41.85286103542234, + "grad_norm": 6.1405534744262695, + "learning_rate": 1.3073882958824755e-05, + "loss": 0.1826, + "step": 15360 + }, + { + "epoch": 41.85558583106267, + "grad_norm": 7.051835060119629, + "learning_rate": 1.307304317892939e-05, + "loss": 0.2987, + "step": 15361 + }, + { + "epoch": 41.858310626702995, + "grad_norm": 6.392403602600098, + "learning_rate": 1.3072203375101263e-05, + "loss": 0.2063, + "step": 15362 + }, + { + "epoch": 41.86103542234333, + "grad_norm": 6.399654388427734, + "learning_rate": 1.3071363547346916e-05, + "loss": 0.3133, + "step": 15363 + }, + { + "epoch": 41.86376021798365, + "grad_norm": 6.283120155334473, + "learning_rate": 1.3070523695672887e-05, + "loss": 0.2275, + "step": 15364 + }, + { + "epoch": 41.86648501362398, + "grad_norm": 6.596218585968018, + "learning_rate": 1.3069683820085722e-05, + "loss": 0.3038, + "step": 15365 + }, + { + "epoch": 41.869209809264305, + "grad_norm": 7.6157097816467285, + "learning_rate": 1.3068843920591953e-05, + "loss": 0.2207, + "step": 15366 + }, + { + "epoch": 41.87193460490463, + "grad_norm": 5.655492305755615, + "learning_rate": 1.306800399719813e-05, + "loss": 0.2601, + "step": 15367 + }, + { + "epoch": 41.87465940054496, + "grad_norm": 6.912761688232422, + "learning_rate": 1.306716404991079e-05, + "loss": 0.2409, + "step": 15368 + }, + { + "epoch": 41.87738419618529, + "grad_norm": 6.548763275146484, + "learning_rate": 1.3066324078736474e-05, + "loss": 0.212, + "step": 15369 + }, + { + "epoch": 41.880108991825615, + "grad_norm": 5.032128810882568, + "learning_rate": 1.3065484083681726e-05, + "loss": 0.2292, + "step": 15370 + }, + { + "epoch": 41.88283378746594, + "grad_norm": 6.4837870597839355, + "learning_rate": 1.3064644064753088e-05, + "loss": 0.3713, + "step": 15371 + }, + { + "epoch": 41.88555858310627, + "grad_norm": 5.282232284545898, + "learning_rate": 1.3063804021957096e-05, + "loss": 0.1822, + "step": 15372 + }, + { + "epoch": 41.88828337874659, + "grad_norm": 7.438727378845215, + "learning_rate": 1.3062963955300301e-05, + "loss": 0.191, + "step": 15373 + }, + { + "epoch": 41.89100817438692, + "grad_norm": 5.965965747833252, + "learning_rate": 1.306212386478924e-05, + "loss": 0.297, + "step": 15374 + }, + { + "epoch": 41.89373297002725, + "grad_norm": 7.361672878265381, + "learning_rate": 1.3061283750430457e-05, + "loss": 0.1581, + "step": 15375 + }, + { + "epoch": 41.89645776566758, + "grad_norm": 5.851138114929199, + "learning_rate": 1.3060443612230493e-05, + "loss": 0.1822, + "step": 15376 + }, + { + "epoch": 41.8991825613079, + "grad_norm": 5.922891139984131, + "learning_rate": 1.3059603450195897e-05, + "loss": 0.2337, + "step": 15377 + }, + { + "epoch": 41.90190735694823, + "grad_norm": 5.012266635894775, + "learning_rate": 1.30587632643332e-05, + "loss": 0.2147, + "step": 15378 + }, + { + "epoch": 41.904632152588555, + "grad_norm": 5.913313388824463, + "learning_rate": 1.305792305464896e-05, + "loss": 0.2551, + "step": 15379 + }, + { + "epoch": 41.90735694822888, + "grad_norm": 6.6129608154296875, + "learning_rate": 1.305708282114971e-05, + "loss": 0.3024, + "step": 15380 + }, + { + "epoch": 41.91008174386921, + "grad_norm": 6.702880382537842, + "learning_rate": 1.3056242563842003e-05, + "loss": 0.4563, + "step": 15381 + }, + { + "epoch": 41.91280653950954, + "grad_norm": 7.25404691696167, + "learning_rate": 1.3055402282732372e-05, + "loss": 0.2057, + "step": 15382 + }, + { + "epoch": 41.915531335149865, + "grad_norm": 6.396892547607422, + "learning_rate": 1.3054561977827369e-05, + "loss": 0.2443, + "step": 15383 + }, + { + "epoch": 41.91825613079019, + "grad_norm": 6.1185479164123535, + "learning_rate": 1.3053721649133536e-05, + "loss": 0.1937, + "step": 15384 + }, + { + "epoch": 41.920980926430516, + "grad_norm": 6.4015631675720215, + "learning_rate": 1.3052881296657414e-05, + "loss": 0.1727, + "step": 15385 + }, + { + "epoch": 41.92370572207084, + "grad_norm": 6.655409336090088, + "learning_rate": 1.305204092040555e-05, + "loss": 0.1824, + "step": 15386 + }, + { + "epoch": 41.926430517711175, + "grad_norm": 5.204779148101807, + "learning_rate": 1.3051200520384493e-05, + "loss": 0.2001, + "step": 15387 + }, + { + "epoch": 41.9291553133515, + "grad_norm": 5.45819616317749, + "learning_rate": 1.3050360096600782e-05, + "loss": 0.1931, + "step": 15388 + }, + { + "epoch": 41.93188010899183, + "grad_norm": 5.179225444793701, + "learning_rate": 1.304951964906097e-05, + "loss": 0.2817, + "step": 15389 + }, + { + "epoch": 41.93460490463215, + "grad_norm": 5.597849369049072, + "learning_rate": 1.304867917777159e-05, + "loss": 0.29, + "step": 15390 + }, + { + "epoch": 41.93732970027248, + "grad_norm": 8.691641807556152, + "learning_rate": 1.30478386827392e-05, + "loss": 0.3512, + "step": 15391 + }, + { + "epoch": 41.940054495912804, + "grad_norm": 5.923669815063477, + "learning_rate": 1.3046998163970337e-05, + "loss": 0.2259, + "step": 15392 + }, + { + "epoch": 41.94277929155314, + "grad_norm": 6.423624515533447, + "learning_rate": 1.3046157621471554e-05, + "loss": 0.2494, + "step": 15393 + }, + { + "epoch": 41.94550408719346, + "grad_norm": 6.862639427185059, + "learning_rate": 1.304531705524939e-05, + "loss": 0.2584, + "step": 15394 + }, + { + "epoch": 41.94822888283379, + "grad_norm": 6.9730730056762695, + "learning_rate": 1.3044476465310393e-05, + "loss": 0.3208, + "step": 15395 + }, + { + "epoch": 41.950953678474114, + "grad_norm": 4.9324631690979, + "learning_rate": 1.3043635851661114e-05, + "loss": 0.279, + "step": 15396 + }, + { + "epoch": 41.95367847411444, + "grad_norm": 5.757242202758789, + "learning_rate": 1.3042795214308099e-05, + "loss": 0.3135, + "step": 15397 + }, + { + "epoch": 41.956403269754766, + "grad_norm": 6.020074367523193, + "learning_rate": 1.304195455325789e-05, + "loss": 0.258, + "step": 15398 + }, + { + "epoch": 41.95912806539509, + "grad_norm": 5.665360927581787, + "learning_rate": 1.3041113868517039e-05, + "loss": 0.3511, + "step": 15399 + }, + { + "epoch": 41.961852861035425, + "grad_norm": 6.090458393096924, + "learning_rate": 1.3040273160092089e-05, + "loss": 0.2254, + "step": 15400 + }, + { + "epoch": 41.96457765667575, + "grad_norm": 7.211927890777588, + "learning_rate": 1.3039432427989592e-05, + "loss": 0.1688, + "step": 15401 + }, + { + "epoch": 41.967302452316076, + "grad_norm": 6.268174648284912, + "learning_rate": 1.303859167221609e-05, + "loss": 0.3152, + "step": 15402 + }, + { + "epoch": 41.9700272479564, + "grad_norm": 4.178107261657715, + "learning_rate": 1.3037750892778136e-05, + "loss": 0.3118, + "step": 15403 + }, + { + "epoch": 41.97275204359673, + "grad_norm": 5.503861427307129, + "learning_rate": 1.3036910089682272e-05, + "loss": 0.2277, + "step": 15404 + }, + { + "epoch": 41.97547683923706, + "grad_norm": 5.349115371704102, + "learning_rate": 1.3036069262935057e-05, + "loss": 0.2132, + "step": 15405 + }, + { + "epoch": 41.97820163487739, + "grad_norm": 5.785735607147217, + "learning_rate": 1.3035228412543026e-05, + "loss": 0.2861, + "step": 15406 + }, + { + "epoch": 41.98092643051771, + "grad_norm": 6.72636604309082, + "learning_rate": 1.3034387538512739e-05, + "loss": 0.3956, + "step": 15407 + }, + { + "epoch": 41.98365122615804, + "grad_norm": 6.461788177490234, + "learning_rate": 1.3033546640850734e-05, + "loss": 0.2765, + "step": 15408 + }, + { + "epoch": 41.986376021798364, + "grad_norm": 6.205533504486084, + "learning_rate": 1.3032705719563569e-05, + "loss": 0.3482, + "step": 15409 + }, + { + "epoch": 41.98910081743869, + "grad_norm": 6.210002899169922, + "learning_rate": 1.3031864774657788e-05, + "loss": 0.1491, + "step": 15410 + }, + { + "epoch": 41.991825613079016, + "grad_norm": 6.160497665405273, + "learning_rate": 1.3031023806139944e-05, + "loss": 0.3325, + "step": 15411 + }, + { + "epoch": 41.99455040871935, + "grad_norm": 5.840280055999756, + "learning_rate": 1.303018281401658e-05, + "loss": 0.1688, + "step": 15412 + }, + { + "epoch": 41.997275204359674, + "grad_norm": 6.895257472991943, + "learning_rate": 1.3029341798294253e-05, + "loss": 0.1855, + "step": 15413 + }, + { + "epoch": 42.0, + "grad_norm": 5.932795524597168, + "learning_rate": 1.3028500758979507e-05, + "loss": 0.1838, + "step": 15414 + }, + { + "epoch": 42.002724795640326, + "grad_norm": 5.44658899307251, + "learning_rate": 1.3027659696078898e-05, + "loss": 0.2222, + "step": 15415 + }, + { + "epoch": 42.00544959128065, + "grad_norm": 5.552676677703857, + "learning_rate": 1.302681860959897e-05, + "loss": 0.2783, + "step": 15416 + }, + { + "epoch": 42.00817438692098, + "grad_norm": 4.85700798034668, + "learning_rate": 1.3025977499546279e-05, + "loss": 0.1188, + "step": 15417 + }, + { + "epoch": 42.01089918256131, + "grad_norm": 6.233191967010498, + "learning_rate": 1.3025136365927371e-05, + "loss": 0.1516, + "step": 15418 + }, + { + "epoch": 42.013623978201636, + "grad_norm": 4.825685501098633, + "learning_rate": 1.3024295208748798e-05, + "loss": 0.2505, + "step": 15419 + }, + { + "epoch": 42.01634877384196, + "grad_norm": 5.147552490234375, + "learning_rate": 1.3023454028017111e-05, + "loss": 0.1792, + "step": 15420 + }, + { + "epoch": 42.01907356948229, + "grad_norm": 4.855800628662109, + "learning_rate": 1.3022612823738861e-05, + "loss": 0.26, + "step": 15421 + }, + { + "epoch": 42.02179836512261, + "grad_norm": 5.426023960113525, + "learning_rate": 1.3021771595920601e-05, + "loss": 0.2316, + "step": 15422 + }, + { + "epoch": 42.02452316076294, + "grad_norm": 6.038941860198975, + "learning_rate": 1.3020930344568881e-05, + "loss": 0.27, + "step": 15423 + }, + { + "epoch": 42.02724795640327, + "grad_norm": 6.548643589019775, + "learning_rate": 1.3020089069690252e-05, + "loss": 0.2178, + "step": 15424 + }, + { + "epoch": 42.0299727520436, + "grad_norm": 6.110074043273926, + "learning_rate": 1.3019247771291265e-05, + "loss": 0.2289, + "step": 15425 + }, + { + "epoch": 42.032697547683924, + "grad_norm": 5.3518195152282715, + "learning_rate": 1.3018406449378475e-05, + "loss": 0.2506, + "step": 15426 + }, + { + "epoch": 42.03542234332425, + "grad_norm": 5.930940628051758, + "learning_rate": 1.3017565103958434e-05, + "loss": 0.1571, + "step": 15427 + }, + { + "epoch": 42.038147138964575, + "grad_norm": 4.607296943664551, + "learning_rate": 1.3016723735037693e-05, + "loss": 0.1317, + "step": 15428 + }, + { + "epoch": 42.0408719346049, + "grad_norm": 5.928393840789795, + "learning_rate": 1.3015882342622804e-05, + "loss": 0.3472, + "step": 15429 + }, + { + "epoch": 42.043596730245234, + "grad_norm": 6.279974937438965, + "learning_rate": 1.3015040926720319e-05, + "loss": 0.1874, + "step": 15430 + }, + { + "epoch": 42.04632152588556, + "grad_norm": 4.728000164031982, + "learning_rate": 1.3014199487336792e-05, + "loss": 0.1772, + "step": 15431 + }, + { + "epoch": 42.049046321525886, + "grad_norm": 8.560091972351074, + "learning_rate": 1.3013358024478778e-05, + "loss": 0.1634, + "step": 15432 + }, + { + "epoch": 42.05177111716621, + "grad_norm": 6.110546112060547, + "learning_rate": 1.3012516538152828e-05, + "loss": 0.1488, + "step": 15433 + }, + { + "epoch": 42.05449591280654, + "grad_norm": 5.91204309463501, + "learning_rate": 1.3011675028365496e-05, + "loss": 0.1645, + "step": 15434 + }, + { + "epoch": 42.05722070844686, + "grad_norm": 6.979456901550293, + "learning_rate": 1.3010833495123339e-05, + "loss": 0.18, + "step": 15435 + }, + { + "epoch": 42.059945504087196, + "grad_norm": 4.777736186981201, + "learning_rate": 1.3009991938432904e-05, + "loss": 0.2222, + "step": 15436 + }, + { + "epoch": 42.06267029972752, + "grad_norm": 4.932180881500244, + "learning_rate": 1.3009150358300751e-05, + "loss": 0.1425, + "step": 15437 + }, + { + "epoch": 42.06539509536785, + "grad_norm": 5.368439197540283, + "learning_rate": 1.3008308754733428e-05, + "loss": 0.1572, + "step": 15438 + }, + { + "epoch": 42.06811989100817, + "grad_norm": 6.10922908782959, + "learning_rate": 1.3007467127737497e-05, + "loss": 0.368, + "step": 15439 + }, + { + "epoch": 42.0708446866485, + "grad_norm": 10.76334285736084, + "learning_rate": 1.3006625477319509e-05, + "loss": 0.2007, + "step": 15440 + }, + { + "epoch": 42.073569482288825, + "grad_norm": 8.216444969177246, + "learning_rate": 1.3005783803486015e-05, + "loss": 0.1735, + "step": 15441 + }, + { + "epoch": 42.07629427792916, + "grad_norm": 5.379700183868408, + "learning_rate": 1.3004942106243576e-05, + "loss": 0.1608, + "step": 15442 + }, + { + "epoch": 42.079019073569484, + "grad_norm": 4.8208818435668945, + "learning_rate": 1.3004100385598744e-05, + "loss": 0.2262, + "step": 15443 + }, + { + "epoch": 42.08174386920981, + "grad_norm": 5.083765983581543, + "learning_rate": 1.3003258641558073e-05, + "loss": 0.3147, + "step": 15444 + }, + { + "epoch": 42.084468664850135, + "grad_norm": 11.18905258178711, + "learning_rate": 1.3002416874128125e-05, + "loss": 0.243, + "step": 15445 + }, + { + "epoch": 42.08719346049046, + "grad_norm": 10.343413352966309, + "learning_rate": 1.3001575083315447e-05, + "loss": 0.3232, + "step": 15446 + }, + { + "epoch": 42.08991825613079, + "grad_norm": 6.096678256988525, + "learning_rate": 1.30007332691266e-05, + "loss": 0.1783, + "step": 15447 + }, + { + "epoch": 42.09264305177112, + "grad_norm": 4.937675952911377, + "learning_rate": 1.2999891431568141e-05, + "loss": 0.1357, + "step": 15448 + }, + { + "epoch": 42.095367847411445, + "grad_norm": 5.313512802124023, + "learning_rate": 1.299904957064662e-05, + "loss": 0.1648, + "step": 15449 + }, + { + "epoch": 42.09809264305177, + "grad_norm": 6.183883190155029, + "learning_rate": 1.29982076863686e-05, + "loss": 0.1842, + "step": 15450 + }, + { + "epoch": 42.1008174386921, + "grad_norm": 6.514837265014648, + "learning_rate": 1.2997365778740636e-05, + "loss": 0.245, + "step": 15451 + }, + { + "epoch": 42.10354223433242, + "grad_norm": 5.0147504806518555, + "learning_rate": 1.2996523847769283e-05, + "loss": 0.1951, + "step": 15452 + }, + { + "epoch": 42.10626702997275, + "grad_norm": 5.101580619812012, + "learning_rate": 1.2995681893461098e-05, + "loss": 0.1931, + "step": 15453 + }, + { + "epoch": 42.10899182561308, + "grad_norm": 5.041823387145996, + "learning_rate": 1.2994839915822639e-05, + "loss": 0.1534, + "step": 15454 + }, + { + "epoch": 42.11171662125341, + "grad_norm": 5.5947585105896, + "learning_rate": 1.2993997914860464e-05, + "loss": 0.1637, + "step": 15455 + }, + { + "epoch": 42.11444141689373, + "grad_norm": 5.6965837478637695, + "learning_rate": 1.2993155890581127e-05, + "loss": 0.1769, + "step": 15456 + }, + { + "epoch": 42.11716621253406, + "grad_norm": 5.925455570220947, + "learning_rate": 1.2992313842991189e-05, + "loss": 0.2349, + "step": 15457 + }, + { + "epoch": 42.119891008174385, + "grad_norm": 10.506064414978027, + "learning_rate": 1.2991471772097211e-05, + "loss": 0.1553, + "step": 15458 + }, + { + "epoch": 42.12261580381471, + "grad_norm": 4.932344436645508, + "learning_rate": 1.2990629677905741e-05, + "loss": 0.1751, + "step": 15459 + }, + { + "epoch": 42.12534059945504, + "grad_norm": 5.502622127532959, + "learning_rate": 1.298978756042335e-05, + "loss": 0.1926, + "step": 15460 + }, + { + "epoch": 42.12806539509537, + "grad_norm": 5.065340042114258, + "learning_rate": 1.2988945419656585e-05, + "loss": 0.1705, + "step": 15461 + }, + { + "epoch": 42.130790190735695, + "grad_norm": 7.667355537414551, + "learning_rate": 1.2988103255612012e-05, + "loss": 0.2387, + "step": 15462 + }, + { + "epoch": 42.13351498637602, + "grad_norm": 12.919604301452637, + "learning_rate": 1.2987261068296184e-05, + "loss": 0.2179, + "step": 15463 + }, + { + "epoch": 42.13623978201635, + "grad_norm": 5.050688743591309, + "learning_rate": 1.2986418857715663e-05, + "loss": 0.1942, + "step": 15464 + }, + { + "epoch": 42.13896457765667, + "grad_norm": 6.5861053466796875, + "learning_rate": 1.298557662387701e-05, + "loss": 0.1959, + "step": 15465 + }, + { + "epoch": 42.141689373297005, + "grad_norm": 9.029101371765137, + "learning_rate": 1.2984734366786782e-05, + "loss": 0.2185, + "step": 15466 + }, + { + "epoch": 42.14441416893733, + "grad_norm": 6.017579078674316, + "learning_rate": 1.298389208645154e-05, + "loss": 0.2112, + "step": 15467 + }, + { + "epoch": 42.14713896457766, + "grad_norm": 5.677315711975098, + "learning_rate": 1.2983049782877842e-05, + "loss": 0.3474, + "step": 15468 + }, + { + "epoch": 42.14986376021798, + "grad_norm": 6.018444538116455, + "learning_rate": 1.2982207456072246e-05, + "loss": 0.1863, + "step": 15469 + }, + { + "epoch": 42.15258855585831, + "grad_norm": 5.981948375701904, + "learning_rate": 1.2981365106041317e-05, + "loss": 0.2695, + "step": 15470 + }, + { + "epoch": 42.155313351498634, + "grad_norm": 6.641706466674805, + "learning_rate": 1.298052273279161e-05, + "loss": 0.2976, + "step": 15471 + }, + { + "epoch": 42.15803814713897, + "grad_norm": 6.385588645935059, + "learning_rate": 1.297968033632969e-05, + "loss": 0.2371, + "step": 15472 + }, + { + "epoch": 42.16076294277929, + "grad_norm": 7.496885776519775, + "learning_rate": 1.2978837916662113e-05, + "loss": 0.392, + "step": 15473 + }, + { + "epoch": 42.16348773841962, + "grad_norm": 5.354748249053955, + "learning_rate": 1.2977995473795444e-05, + "loss": 0.2055, + "step": 15474 + }, + { + "epoch": 42.166212534059945, + "grad_norm": 9.016228675842285, + "learning_rate": 1.2977153007736241e-05, + "loss": 0.2193, + "step": 15475 + }, + { + "epoch": 42.16893732970027, + "grad_norm": 5.192065715789795, + "learning_rate": 1.2976310518491068e-05, + "loss": 0.4163, + "step": 15476 + }, + { + "epoch": 42.171662125340596, + "grad_norm": 5.013331890106201, + "learning_rate": 1.2975468006066483e-05, + "loss": 0.2784, + "step": 15477 + }, + { + "epoch": 42.17438692098093, + "grad_norm": 5.486303806304932, + "learning_rate": 1.2974625470469051e-05, + "loss": 0.4019, + "step": 15478 + }, + { + "epoch": 42.177111716621255, + "grad_norm": 10.600406646728516, + "learning_rate": 1.297378291170533e-05, + "loss": 0.2654, + "step": 15479 + }, + { + "epoch": 42.17983651226158, + "grad_norm": 22.355682373046875, + "learning_rate": 1.2972940329781885e-05, + "loss": 0.2869, + "step": 15480 + }, + { + "epoch": 42.182561307901906, + "grad_norm": 7.4673357009887695, + "learning_rate": 1.2972097724705273e-05, + "loss": 0.1731, + "step": 15481 + }, + { + "epoch": 42.18528610354223, + "grad_norm": 7.031222343444824, + "learning_rate": 1.2971255096482063e-05, + "loss": 0.2067, + "step": 15482 + }, + { + "epoch": 42.18801089918256, + "grad_norm": 7.047456741333008, + "learning_rate": 1.297041244511881e-05, + "loss": 0.1381, + "step": 15483 + }, + { + "epoch": 42.19073569482289, + "grad_norm": 5.458183288574219, + "learning_rate": 1.2969569770622084e-05, + "loss": 0.2736, + "step": 15484 + }, + { + "epoch": 42.19346049046322, + "grad_norm": 5.774094581604004, + "learning_rate": 1.2968727072998442e-05, + "loss": 0.2545, + "step": 15485 + }, + { + "epoch": 42.19618528610354, + "grad_norm": 8.14728832244873, + "learning_rate": 1.2967884352254451e-05, + "loss": 0.2662, + "step": 15486 + }, + { + "epoch": 42.19891008174387, + "grad_norm": 5.487812519073486, + "learning_rate": 1.2967041608396671e-05, + "loss": 0.2005, + "step": 15487 + }, + { + "epoch": 42.201634877384194, + "grad_norm": 5.376804351806641, + "learning_rate": 1.296619884143167e-05, + "loss": 0.3924, + "step": 15488 + }, + { + "epoch": 42.20435967302452, + "grad_norm": 7.430761337280273, + "learning_rate": 1.2965356051366003e-05, + "loss": 0.3456, + "step": 15489 + }, + { + "epoch": 42.20708446866485, + "grad_norm": 6.076028347015381, + "learning_rate": 1.296451323820624e-05, + "loss": 0.2327, + "step": 15490 + }, + { + "epoch": 42.20980926430518, + "grad_norm": 5.0028395652771, + "learning_rate": 1.2963670401958944e-05, + "loss": 0.13, + "step": 15491 + }, + { + "epoch": 42.212534059945504, + "grad_norm": 5.353379726409912, + "learning_rate": 1.2962827542630678e-05, + "loss": 0.2015, + "step": 15492 + }, + { + "epoch": 42.21525885558583, + "grad_norm": 7.217342853546143, + "learning_rate": 1.2961984660228005e-05, + "loss": 0.1236, + "step": 15493 + }, + { + "epoch": 42.217983651226156, + "grad_norm": 6.616295337677002, + "learning_rate": 1.2961141754757494e-05, + "loss": 0.2788, + "step": 15494 + }, + { + "epoch": 42.22070844686648, + "grad_norm": 5.089466094970703, + "learning_rate": 1.2960298826225701e-05, + "loss": 0.2865, + "step": 15495 + }, + { + "epoch": 42.223433242506815, + "grad_norm": 5.868330478668213, + "learning_rate": 1.2959455874639202e-05, + "loss": 0.2689, + "step": 15496 + }, + { + "epoch": 42.22615803814714, + "grad_norm": 5.696859836578369, + "learning_rate": 1.2958612900004552e-05, + "loss": 0.2144, + "step": 15497 + }, + { + "epoch": 42.228882833787466, + "grad_norm": 6.412961959838867, + "learning_rate": 1.2957769902328324e-05, + "loss": 0.2056, + "step": 15498 + }, + { + "epoch": 42.23160762942779, + "grad_norm": 6.366140842437744, + "learning_rate": 1.2956926881617073e-05, + "loss": 0.1171, + "step": 15499 + }, + { + "epoch": 42.23433242506812, + "grad_norm": 4.624966621398926, + "learning_rate": 1.2956083837877376e-05, + "loss": 0.1428, + "step": 15500 + }, + { + "epoch": 42.237057220708444, + "grad_norm": 8.231295585632324, + "learning_rate": 1.2955240771115788e-05, + "loss": 0.3253, + "step": 15501 + }, + { + "epoch": 42.23978201634878, + "grad_norm": 5.296624183654785, + "learning_rate": 1.2954397681338886e-05, + "loss": 0.1492, + "step": 15502 + }, + { + "epoch": 42.2425068119891, + "grad_norm": 5.643084526062012, + "learning_rate": 1.2953554568553225e-05, + "loss": 0.2552, + "step": 15503 + }, + { + "epoch": 42.24523160762943, + "grad_norm": 5.668529987335205, + "learning_rate": 1.2952711432765381e-05, + "loss": 0.2309, + "step": 15504 + }, + { + "epoch": 42.247956403269754, + "grad_norm": 5.27156925201416, + "learning_rate": 1.2951868273981912e-05, + "loss": 0.1807, + "step": 15505 + }, + { + "epoch": 42.25068119891008, + "grad_norm": 5.571093559265137, + "learning_rate": 1.2951025092209391e-05, + "loss": 0.2919, + "step": 15506 + }, + { + "epoch": 42.253405994550405, + "grad_norm": 13.448417663574219, + "learning_rate": 1.2950181887454374e-05, + "loss": 0.1656, + "step": 15507 + }, + { + "epoch": 42.25613079019074, + "grad_norm": 5.163852214813232, + "learning_rate": 1.2949338659723443e-05, + "loss": 0.2104, + "step": 15508 + }, + { + "epoch": 42.258855585831064, + "grad_norm": 6.779701232910156, + "learning_rate": 1.2948495409023155e-05, + "loss": 0.4256, + "step": 15509 + }, + { + "epoch": 42.26158038147139, + "grad_norm": 11.53541374206543, + "learning_rate": 1.294765213536008e-05, + "loss": 0.149, + "step": 15510 + }, + { + "epoch": 42.264305177111716, + "grad_norm": 5.645216941833496, + "learning_rate": 1.2946808838740786e-05, + "loss": 0.2024, + "step": 15511 + }, + { + "epoch": 42.26702997275204, + "grad_norm": 6.562511444091797, + "learning_rate": 1.2945965519171837e-05, + "loss": 0.2311, + "step": 15512 + }, + { + "epoch": 42.26975476839237, + "grad_norm": 5.998152732849121, + "learning_rate": 1.2945122176659806e-05, + "loss": 0.135, + "step": 15513 + }, + { + "epoch": 42.2724795640327, + "grad_norm": 7.895827770233154, + "learning_rate": 1.2944278811211257e-05, + "loss": 0.3027, + "step": 15514 + }, + { + "epoch": 42.275204359673026, + "grad_norm": 5.272707939147949, + "learning_rate": 1.2943435422832757e-05, + "loss": 0.2454, + "step": 15515 + }, + { + "epoch": 42.27792915531335, + "grad_norm": 7.751999855041504, + "learning_rate": 1.2942592011530878e-05, + "loss": 0.3795, + "step": 15516 + }, + { + "epoch": 42.28065395095368, + "grad_norm": 5.843137264251709, + "learning_rate": 1.294174857731219e-05, + "loss": 0.1421, + "step": 15517 + }, + { + "epoch": 42.283378746594, + "grad_norm": 6.004982948303223, + "learning_rate": 1.2940905120183256e-05, + "loss": 0.1472, + "step": 15518 + }, + { + "epoch": 42.28610354223433, + "grad_norm": 5.694803237915039, + "learning_rate": 1.2940061640150647e-05, + "loss": 0.2206, + "step": 15519 + }, + { + "epoch": 42.28882833787466, + "grad_norm": 6.18784236907959, + "learning_rate": 1.2939218137220937e-05, + "loss": 0.142, + "step": 15520 + }, + { + "epoch": 42.29155313351499, + "grad_norm": 6.286417484283447, + "learning_rate": 1.2938374611400686e-05, + "loss": 0.1637, + "step": 15521 + }, + { + "epoch": 42.294277929155314, + "grad_norm": 12.573493957519531, + "learning_rate": 1.2937531062696472e-05, + "loss": 0.2488, + "step": 15522 + }, + { + "epoch": 42.29700272479564, + "grad_norm": 5.91987419128418, + "learning_rate": 1.2936687491114857e-05, + "loss": 0.2027, + "step": 15523 + }, + { + "epoch": 42.299727520435965, + "grad_norm": 5.3064866065979, + "learning_rate": 1.2935843896662415e-05, + "loss": 0.2772, + "step": 15524 + }, + { + "epoch": 42.30245231607629, + "grad_norm": 7.935819149017334, + "learning_rate": 1.2935000279345717e-05, + "loss": 0.2905, + "step": 15525 + }, + { + "epoch": 42.305177111716624, + "grad_norm": 10.462241172790527, + "learning_rate": 1.293415663917133e-05, + "loss": 0.2463, + "step": 15526 + }, + { + "epoch": 42.30790190735695, + "grad_norm": 5.2981367111206055, + "learning_rate": 1.2933312976145827e-05, + "loss": 0.2498, + "step": 15527 + }, + { + "epoch": 42.310626702997276, + "grad_norm": 5.681687355041504, + "learning_rate": 1.2932469290275776e-05, + "loss": 0.2193, + "step": 15528 + }, + { + "epoch": 42.3133514986376, + "grad_norm": 4.980800151824951, + "learning_rate": 1.2931625581567748e-05, + "loss": 0.2744, + "step": 15529 + }, + { + "epoch": 42.31607629427793, + "grad_norm": 4.790737628936768, + "learning_rate": 1.2930781850028313e-05, + "loss": 0.1973, + "step": 15530 + }, + { + "epoch": 42.31880108991825, + "grad_norm": 5.458620548248291, + "learning_rate": 1.2929938095664045e-05, + "loss": 0.2656, + "step": 15531 + }, + { + "epoch": 42.321525885558586, + "grad_norm": 8.451607704162598, + "learning_rate": 1.2929094318481515e-05, + "loss": 0.3004, + "step": 15532 + }, + { + "epoch": 42.32425068119891, + "grad_norm": 5.715627193450928, + "learning_rate": 1.2928250518487291e-05, + "loss": 0.2858, + "step": 15533 + }, + { + "epoch": 42.32697547683924, + "grad_norm": 5.105525493621826, + "learning_rate": 1.2927406695687945e-05, + "loss": 0.1778, + "step": 15534 + }, + { + "epoch": 42.32970027247956, + "grad_norm": 6.924923896789551, + "learning_rate": 1.2926562850090052e-05, + "loss": 0.1534, + "step": 15535 + }, + { + "epoch": 42.33242506811989, + "grad_norm": 5.473208904266357, + "learning_rate": 1.2925718981700181e-05, + "loss": 0.1992, + "step": 15536 + }, + { + "epoch": 42.335149863760215, + "grad_norm": 5.2932610511779785, + "learning_rate": 1.2924875090524904e-05, + "loss": 0.1865, + "step": 15537 + }, + { + "epoch": 42.33787465940055, + "grad_norm": 7.486854076385498, + "learning_rate": 1.2924031176570794e-05, + "loss": 0.2947, + "step": 15538 + }, + { + "epoch": 42.34059945504087, + "grad_norm": 5.6262359619140625, + "learning_rate": 1.2923187239844426e-05, + "loss": 0.2825, + "step": 15539 + }, + { + "epoch": 42.3433242506812, + "grad_norm": 7.020451068878174, + "learning_rate": 1.2922343280352367e-05, + "loss": 0.2192, + "step": 15540 + }, + { + "epoch": 42.346049046321525, + "grad_norm": 5.153855800628662, + "learning_rate": 1.2921499298101193e-05, + "loss": 0.1758, + "step": 15541 + }, + { + "epoch": 42.34877384196185, + "grad_norm": 5.127655506134033, + "learning_rate": 1.2920655293097474e-05, + "loss": 0.2618, + "step": 15542 + }, + { + "epoch": 42.35149863760218, + "grad_norm": 10.108250617980957, + "learning_rate": 1.291981126534779e-05, + "loss": 0.2181, + "step": 15543 + }, + { + "epoch": 42.35422343324251, + "grad_norm": 6.072994709014893, + "learning_rate": 1.2918967214858709e-05, + "loss": 0.1606, + "step": 15544 + }, + { + "epoch": 42.356948228882835, + "grad_norm": 6.636490345001221, + "learning_rate": 1.2918123141636804e-05, + "loss": 0.2944, + "step": 15545 + }, + { + "epoch": 42.35967302452316, + "grad_norm": 7.909504413604736, + "learning_rate": 1.291727904568865e-05, + "loss": 0.256, + "step": 15546 + }, + { + "epoch": 42.36239782016349, + "grad_norm": 5.1938090324401855, + "learning_rate": 1.2916434927020825e-05, + "loss": 0.1128, + "step": 15547 + }, + { + "epoch": 42.36512261580381, + "grad_norm": 5.129669666290283, + "learning_rate": 1.291559078563989e-05, + "loss": 0.2096, + "step": 15548 + }, + { + "epoch": 42.36784741144414, + "grad_norm": 5.939659118652344, + "learning_rate": 1.2914746621552437e-05, + "loss": 0.173, + "step": 15549 + }, + { + "epoch": 42.37057220708447, + "grad_norm": 7.425166130065918, + "learning_rate": 1.2913902434765023e-05, + "loss": 0.2892, + "step": 15550 + }, + { + "epoch": 42.3732970027248, + "grad_norm": 6.21837043762207, + "learning_rate": 1.2913058225284237e-05, + "loss": 0.2662, + "step": 15551 + }, + { + "epoch": 42.37602179836512, + "grad_norm": 7.428950309753418, + "learning_rate": 1.2912213993116642e-05, + "loss": 0.1748, + "step": 15552 + }, + { + "epoch": 42.37874659400545, + "grad_norm": 4.864560604095459, + "learning_rate": 1.2911369738268823e-05, + "loss": 0.3374, + "step": 15553 + }, + { + "epoch": 42.381471389645775, + "grad_norm": 6.655929088592529, + "learning_rate": 1.2910525460747346e-05, + "loss": 0.3018, + "step": 15554 + }, + { + "epoch": 42.3841961852861, + "grad_norm": 4.93895959854126, + "learning_rate": 1.2909681160558794e-05, + "loss": 0.4243, + "step": 15555 + }, + { + "epoch": 42.38692098092643, + "grad_norm": 6.0697922706604, + "learning_rate": 1.2908836837709734e-05, + "loss": 0.147, + "step": 15556 + }, + { + "epoch": 42.38964577656676, + "grad_norm": 4.908973217010498, + "learning_rate": 1.2907992492206752e-05, + "loss": 0.2268, + "step": 15557 + }, + { + "epoch": 42.392370572207085, + "grad_norm": 6.194726467132568, + "learning_rate": 1.2907148124056415e-05, + "loss": 0.1345, + "step": 15558 + }, + { + "epoch": 42.39509536784741, + "grad_norm": 4.846452713012695, + "learning_rate": 1.2906303733265301e-05, + "loss": 0.1757, + "step": 15559 + }, + { + "epoch": 42.39782016348774, + "grad_norm": 4.52724552154541, + "learning_rate": 1.2905459319839988e-05, + "loss": 0.1843, + "step": 15560 + }, + { + "epoch": 42.40054495912806, + "grad_norm": 5.058575630187988, + "learning_rate": 1.2904614883787052e-05, + "loss": 0.2414, + "step": 15561 + }, + { + "epoch": 42.403269754768395, + "grad_norm": 5.1417341232299805, + "learning_rate": 1.290377042511307e-05, + "loss": 0.2135, + "step": 15562 + }, + { + "epoch": 42.40599455040872, + "grad_norm": 5.533407211303711, + "learning_rate": 1.2902925943824615e-05, + "loss": 0.2542, + "step": 15563 + }, + { + "epoch": 42.40871934604905, + "grad_norm": 5.8959503173828125, + "learning_rate": 1.2902081439928268e-05, + "loss": 0.31, + "step": 15564 + }, + { + "epoch": 42.41144414168937, + "grad_norm": 5.670324802398682, + "learning_rate": 1.2901236913430604e-05, + "loss": 0.3066, + "step": 15565 + }, + { + "epoch": 42.4141689373297, + "grad_norm": 6.487437725067139, + "learning_rate": 1.2900392364338199e-05, + "loss": 0.1703, + "step": 15566 + }, + { + "epoch": 42.416893732970024, + "grad_norm": 9.519947052001953, + "learning_rate": 1.2899547792657633e-05, + "loss": 0.2129, + "step": 15567 + }, + { + "epoch": 42.41961852861036, + "grad_norm": 6.691407203674316, + "learning_rate": 1.289870319839548e-05, + "loss": 0.1647, + "step": 15568 + }, + { + "epoch": 42.42234332425068, + "grad_norm": 5.998138904571533, + "learning_rate": 1.289785858155832e-05, + "loss": 0.2248, + "step": 15569 + }, + { + "epoch": 42.42506811989101, + "grad_norm": 5.7534685134887695, + "learning_rate": 1.2897013942152732e-05, + "loss": 0.2413, + "step": 15570 + }, + { + "epoch": 42.427792915531334, + "grad_norm": 5.390469074249268, + "learning_rate": 1.2896169280185293e-05, + "loss": 0.3113, + "step": 15571 + }, + { + "epoch": 42.43051771117166, + "grad_norm": 5.165089130401611, + "learning_rate": 1.289532459566258e-05, + "loss": 0.1694, + "step": 15572 + }, + { + "epoch": 42.433242506811986, + "grad_norm": 19.199241638183594, + "learning_rate": 1.2894479888591173e-05, + "loss": 0.2332, + "step": 15573 + }, + { + "epoch": 42.43596730245232, + "grad_norm": 5.859897136688232, + "learning_rate": 1.289363515897765e-05, + "loss": 0.2173, + "step": 15574 + }, + { + "epoch": 42.438692098092645, + "grad_norm": 5.306302547454834, + "learning_rate": 1.289279040682859e-05, + "loss": 0.2181, + "step": 15575 + }, + { + "epoch": 42.44141689373297, + "grad_norm": 5.701376438140869, + "learning_rate": 1.2891945632150566e-05, + "loss": 0.1909, + "step": 15576 + }, + { + "epoch": 42.444141689373296, + "grad_norm": 5.970940113067627, + "learning_rate": 1.2891100834950167e-05, + "loss": 0.2238, + "step": 15577 + }, + { + "epoch": 42.44686648501362, + "grad_norm": 6.2598557472229, + "learning_rate": 1.2890256015233968e-05, + "loss": 0.3004, + "step": 15578 + }, + { + "epoch": 42.44959128065395, + "grad_norm": 5.792520523071289, + "learning_rate": 1.2889411173008549e-05, + "loss": 0.2131, + "step": 15579 + }, + { + "epoch": 42.45231607629428, + "grad_norm": 4.6232805252075195, + "learning_rate": 1.2888566308280486e-05, + "loss": 0.2638, + "step": 15580 + }, + { + "epoch": 42.45504087193461, + "grad_norm": 5.799549102783203, + "learning_rate": 1.2887721421056366e-05, + "loss": 0.1464, + "step": 15581 + }, + { + "epoch": 42.45776566757493, + "grad_norm": 9.060937881469727, + "learning_rate": 1.2886876511342758e-05, + "loss": 0.3488, + "step": 15582 + }, + { + "epoch": 42.46049046321526, + "grad_norm": 5.300330638885498, + "learning_rate": 1.2886031579146257e-05, + "loss": 0.2588, + "step": 15583 + }, + { + "epoch": 42.463215258855584, + "grad_norm": 5.925723552703857, + "learning_rate": 1.2885186624473428e-05, + "loss": 0.2493, + "step": 15584 + }, + { + "epoch": 42.46594005449591, + "grad_norm": 4.02168083190918, + "learning_rate": 1.288434164733086e-05, + "loss": 0.3596, + "step": 15585 + }, + { + "epoch": 42.46866485013624, + "grad_norm": 6.255588531494141, + "learning_rate": 1.2883496647725131e-05, + "loss": 0.1687, + "step": 15586 + }, + { + "epoch": 42.47138964577657, + "grad_norm": 5.425561428070068, + "learning_rate": 1.2882651625662825e-05, + "loss": 0.1327, + "step": 15587 + }, + { + "epoch": 42.474114441416894, + "grad_norm": 6.124661922454834, + "learning_rate": 1.288180658115052e-05, + "loss": 0.1344, + "step": 15588 + }, + { + "epoch": 42.47683923705722, + "grad_norm": 6.7752366065979, + "learning_rate": 1.28809615141948e-05, + "loss": 0.297, + "step": 15589 + }, + { + "epoch": 42.479564032697546, + "grad_norm": 6.834358215332031, + "learning_rate": 1.2880116424802242e-05, + "loss": 0.3883, + "step": 15590 + }, + { + "epoch": 42.48228882833787, + "grad_norm": 5.602798938751221, + "learning_rate": 1.287927131297943e-05, + "loss": 0.3643, + "step": 15591 + }, + { + "epoch": 42.485013623978205, + "grad_norm": 6.323520183563232, + "learning_rate": 1.2878426178732947e-05, + "loss": 0.2445, + "step": 15592 + }, + { + "epoch": 42.48773841961853, + "grad_norm": 4.985516548156738, + "learning_rate": 1.2877581022069374e-05, + "loss": 0.1582, + "step": 15593 + }, + { + "epoch": 42.490463215258856, + "grad_norm": 5.517819404602051, + "learning_rate": 1.2876735842995291e-05, + "loss": 0.1748, + "step": 15594 + }, + { + "epoch": 42.49318801089918, + "grad_norm": 6.430752277374268, + "learning_rate": 1.2875890641517283e-05, + "loss": 0.1986, + "step": 15595 + }, + { + "epoch": 42.49591280653951, + "grad_norm": 8.593796730041504, + "learning_rate": 1.2875045417641928e-05, + "loss": 0.1428, + "step": 15596 + }, + { + "epoch": 42.49863760217983, + "grad_norm": 5.309615612030029, + "learning_rate": 1.2874200171375817e-05, + "loss": 0.2898, + "step": 15597 + }, + { + "epoch": 42.50136239782017, + "grad_norm": 6.958247661590576, + "learning_rate": 1.2873354902725525e-05, + "loss": 0.2751, + "step": 15598 + }, + { + "epoch": 42.50408719346049, + "grad_norm": 5.246025085449219, + "learning_rate": 1.2872509611697639e-05, + "loss": 0.1521, + "step": 15599 + }, + { + "epoch": 42.50681198910082, + "grad_norm": 5.215633869171143, + "learning_rate": 1.287166429829874e-05, + "loss": 0.1823, + "step": 15600 + }, + { + "epoch": 42.509536784741144, + "grad_norm": 7.842749118804932, + "learning_rate": 1.2870818962535412e-05, + "loss": 0.1688, + "step": 15601 + }, + { + "epoch": 42.51226158038147, + "grad_norm": 5.858428001403809, + "learning_rate": 1.2869973604414237e-05, + "loss": 0.2268, + "step": 15602 + }, + { + "epoch": 42.514986376021795, + "grad_norm": 5.467252731323242, + "learning_rate": 1.28691282239418e-05, + "loss": 0.1691, + "step": 15603 + }, + { + "epoch": 42.51771117166213, + "grad_norm": 4.986133098602295, + "learning_rate": 1.2868282821124685e-05, + "loss": 0.3136, + "step": 15604 + }, + { + "epoch": 42.520435967302454, + "grad_norm": 5.284420967102051, + "learning_rate": 1.2867437395969476e-05, + "loss": 0.1013, + "step": 15605 + }, + { + "epoch": 42.52316076294278, + "grad_norm": 5.0402607917785645, + "learning_rate": 1.2866591948482756e-05, + "loss": 0.2024, + "step": 15606 + }, + { + "epoch": 42.525885558583106, + "grad_norm": 5.158346652984619, + "learning_rate": 1.286574647867111e-05, + "loss": 0.1467, + "step": 15607 + }, + { + "epoch": 42.52861035422343, + "grad_norm": 5.764071464538574, + "learning_rate": 1.2864900986541125e-05, + "loss": 0.1802, + "step": 15608 + }, + { + "epoch": 42.53133514986376, + "grad_norm": 6.164839744567871, + "learning_rate": 1.2864055472099381e-05, + "loss": 0.2463, + "step": 15609 + }, + { + "epoch": 42.53405994550409, + "grad_norm": 7.74569845199585, + "learning_rate": 1.2863209935352468e-05, + "loss": 0.23, + "step": 15610 + }, + { + "epoch": 42.536784741144416, + "grad_norm": 5.935806751251221, + "learning_rate": 1.2862364376306964e-05, + "loss": 0.1226, + "step": 15611 + }, + { + "epoch": 42.53950953678474, + "grad_norm": 5.458498954772949, + "learning_rate": 1.2861518794969464e-05, + "loss": 0.3806, + "step": 15612 + }, + { + "epoch": 42.54223433242507, + "grad_norm": 6.322701454162598, + "learning_rate": 1.2860673191346542e-05, + "loss": 0.3062, + "step": 15613 + }, + { + "epoch": 42.54495912806539, + "grad_norm": 7.980700969696045, + "learning_rate": 1.2859827565444793e-05, + "loss": 0.1646, + "step": 15614 + }, + { + "epoch": 42.54768392370572, + "grad_norm": 6.683459758758545, + "learning_rate": 1.2858981917270796e-05, + "loss": 0.2345, + "step": 15615 + }, + { + "epoch": 42.55040871934605, + "grad_norm": 7.966632843017578, + "learning_rate": 1.2858136246831144e-05, + "loss": 0.3876, + "step": 15616 + }, + { + "epoch": 42.55313351498638, + "grad_norm": 5.730477809906006, + "learning_rate": 1.2857290554132416e-05, + "loss": 0.2682, + "step": 15617 + }, + { + "epoch": 42.555858310626704, + "grad_norm": 5.792958736419678, + "learning_rate": 1.2856444839181199e-05, + "loss": 0.1936, + "step": 15618 + }, + { + "epoch": 42.55858310626703, + "grad_norm": 8.202452659606934, + "learning_rate": 1.2855599101984085e-05, + "loss": 0.159, + "step": 15619 + }, + { + "epoch": 42.561307901907355, + "grad_norm": 5.304412364959717, + "learning_rate": 1.2854753342547656e-05, + "loss": 0.2151, + "step": 15620 + }, + { + "epoch": 42.56403269754768, + "grad_norm": 4.5617594718933105, + "learning_rate": 1.2853907560878499e-05, + "loss": 0.1409, + "step": 15621 + }, + { + "epoch": 42.566757493188014, + "grad_norm": 7.792327880859375, + "learning_rate": 1.2853061756983203e-05, + "loss": 0.3014, + "step": 15622 + }, + { + "epoch": 42.56948228882834, + "grad_norm": 10.473942756652832, + "learning_rate": 1.2852215930868353e-05, + "loss": 0.2424, + "step": 15623 + }, + { + "epoch": 42.572207084468666, + "grad_norm": 6.214908599853516, + "learning_rate": 1.285137008254054e-05, + "loss": 0.1883, + "step": 15624 + }, + { + "epoch": 42.57493188010899, + "grad_norm": 8.285236358642578, + "learning_rate": 1.2850524212006344e-05, + "loss": 0.34, + "step": 15625 + }, + { + "epoch": 42.57765667574932, + "grad_norm": 5.568668365478516, + "learning_rate": 1.284967831927236e-05, + "loss": 0.2885, + "step": 15626 + }, + { + "epoch": 42.58038147138964, + "grad_norm": 4.822712421417236, + "learning_rate": 1.2848832404345173e-05, + "loss": 0.1432, + "step": 15627 + }, + { + "epoch": 42.583106267029976, + "grad_norm": 7.120174407958984, + "learning_rate": 1.2847986467231368e-05, + "loss": 0.2746, + "step": 15628 + }, + { + "epoch": 42.5858310626703, + "grad_norm": 5.246706962585449, + "learning_rate": 1.2847140507937539e-05, + "loss": 0.3759, + "step": 15629 + }, + { + "epoch": 42.58855585831063, + "grad_norm": 6.120863437652588, + "learning_rate": 1.2846294526470274e-05, + "loss": 0.3094, + "step": 15630 + }, + { + "epoch": 42.59128065395095, + "grad_norm": 9.145034790039062, + "learning_rate": 1.2845448522836152e-05, + "loss": 0.1625, + "step": 15631 + }, + { + "epoch": 42.59400544959128, + "grad_norm": 7.596875190734863, + "learning_rate": 1.2844602497041774e-05, + "loss": 0.1904, + "step": 15632 + }, + { + "epoch": 42.596730245231605, + "grad_norm": 7.045854568481445, + "learning_rate": 1.2843756449093721e-05, + "loss": 0.2578, + "step": 15633 + }, + { + "epoch": 42.59945504087194, + "grad_norm": 5.64263916015625, + "learning_rate": 1.2842910378998585e-05, + "loss": 0.3601, + "step": 15634 + }, + { + "epoch": 42.60217983651226, + "grad_norm": 6.453949451446533, + "learning_rate": 1.2842064286762954e-05, + "loss": 0.2219, + "step": 15635 + }, + { + "epoch": 42.60490463215259, + "grad_norm": 5.985903263092041, + "learning_rate": 1.2841218172393417e-05, + "loss": 0.1634, + "step": 15636 + }, + { + "epoch": 42.607629427792915, + "grad_norm": 6.2830810546875, + "learning_rate": 1.2840372035896565e-05, + "loss": 0.3231, + "step": 15637 + }, + { + "epoch": 42.61035422343324, + "grad_norm": 5.878849983215332, + "learning_rate": 1.2839525877278986e-05, + "loss": 0.3066, + "step": 15638 + }, + { + "epoch": 42.61307901907357, + "grad_norm": 9.201489448547363, + "learning_rate": 1.2838679696547272e-05, + "loss": 0.2384, + "step": 15639 + }, + { + "epoch": 42.6158038147139, + "grad_norm": 4.6086626052856445, + "learning_rate": 1.2837833493708013e-05, + "loss": 0.2048, + "step": 15640 + }, + { + "epoch": 42.618528610354225, + "grad_norm": 7.550244331359863, + "learning_rate": 1.2836987268767798e-05, + "loss": 0.3065, + "step": 15641 + }, + { + "epoch": 42.62125340599455, + "grad_norm": 6.34338903427124, + "learning_rate": 1.2836141021733217e-05, + "loss": 0.2497, + "step": 15642 + }, + { + "epoch": 42.62397820163488, + "grad_norm": 9.32612419128418, + "learning_rate": 1.283529475261086e-05, + "loss": 0.2767, + "step": 15643 + }, + { + "epoch": 42.6267029972752, + "grad_norm": 5.956027507781982, + "learning_rate": 1.283444846140732e-05, + "loss": 0.2447, + "step": 15644 + }, + { + "epoch": 42.62942779291553, + "grad_norm": 5.47667932510376, + "learning_rate": 1.2833602148129184e-05, + "loss": 0.1846, + "step": 15645 + }, + { + "epoch": 42.63215258855586, + "grad_norm": 6.449533462524414, + "learning_rate": 1.2832755812783048e-05, + "loss": 0.3097, + "step": 15646 + }, + { + "epoch": 42.63487738419619, + "grad_norm": 5.0832905769348145, + "learning_rate": 1.28319094553755e-05, + "loss": 0.1385, + "step": 15647 + }, + { + "epoch": 42.63760217983651, + "grad_norm": 5.39228630065918, + "learning_rate": 1.2831063075913134e-05, + "loss": 0.2786, + "step": 15648 + }, + { + "epoch": 42.64032697547684, + "grad_norm": 5.079096794128418, + "learning_rate": 1.2830216674402539e-05, + "loss": 0.2716, + "step": 15649 + }, + { + "epoch": 42.643051771117165, + "grad_norm": 7.23034143447876, + "learning_rate": 1.2829370250850306e-05, + "loss": 0.4366, + "step": 15650 + }, + { + "epoch": 42.64577656675749, + "grad_norm": 6.6343560218811035, + "learning_rate": 1.282852380526303e-05, + "loss": 0.2604, + "step": 15651 + }, + { + "epoch": 42.64850136239782, + "grad_norm": 7.3391194343566895, + "learning_rate": 1.2827677337647302e-05, + "loss": 0.1819, + "step": 15652 + }, + { + "epoch": 42.65122615803815, + "grad_norm": 11.406492233276367, + "learning_rate": 1.2826830848009711e-05, + "loss": 0.1838, + "step": 15653 + }, + { + "epoch": 42.653950953678475, + "grad_norm": 7.062712669372559, + "learning_rate": 1.2825984336356856e-05, + "loss": 0.2989, + "step": 15654 + }, + { + "epoch": 42.6566757493188, + "grad_norm": 10.87055778503418, + "learning_rate": 1.2825137802695324e-05, + "loss": 0.1964, + "step": 15655 + }, + { + "epoch": 42.65940054495913, + "grad_norm": 7.037644863128662, + "learning_rate": 1.282429124703171e-05, + "loss": 0.1846, + "step": 15656 + }, + { + "epoch": 42.66212534059945, + "grad_norm": 5.161700248718262, + "learning_rate": 1.2823444669372606e-05, + "loss": 0.1318, + "step": 15657 + }, + { + "epoch": 42.664850136239785, + "grad_norm": 6.45982551574707, + "learning_rate": 1.282259806972461e-05, + "loss": 0.2821, + "step": 15658 + }, + { + "epoch": 42.66757493188011, + "grad_norm": 6.253321647644043, + "learning_rate": 1.2821751448094306e-05, + "loss": 0.3189, + "step": 15659 + }, + { + "epoch": 42.67029972752044, + "grad_norm": 5.008757591247559, + "learning_rate": 1.2820904804488297e-05, + "loss": 0.2248, + "step": 15660 + }, + { + "epoch": 42.67302452316076, + "grad_norm": 5.852625370025635, + "learning_rate": 1.2820058138913169e-05, + "loss": 0.2124, + "step": 15661 + }, + { + "epoch": 42.67574931880109, + "grad_norm": 6.222420692443848, + "learning_rate": 1.2819211451375517e-05, + "loss": 0.3006, + "step": 15662 + }, + { + "epoch": 42.678474114441414, + "grad_norm": 6.5769195556640625, + "learning_rate": 1.2818364741881939e-05, + "loss": 0.2786, + "step": 15663 + }, + { + "epoch": 42.68119891008175, + "grad_norm": 15.356090545654297, + "learning_rate": 1.281751801043903e-05, + "loss": 0.3032, + "step": 15664 + }, + { + "epoch": 42.68392370572207, + "grad_norm": 5.917220592498779, + "learning_rate": 1.2816671257053377e-05, + "loss": 0.1984, + "step": 15665 + }, + { + "epoch": 42.6866485013624, + "grad_norm": 5.45731258392334, + "learning_rate": 1.2815824481731582e-05, + "loss": 0.1677, + "step": 15666 + }, + { + "epoch": 42.689373297002724, + "grad_norm": 5.89810037612915, + "learning_rate": 1.2814977684480234e-05, + "loss": 0.262, + "step": 15667 + }, + { + "epoch": 42.69209809264305, + "grad_norm": 6.147561550140381, + "learning_rate": 1.2814130865305937e-05, + "loss": 0.2132, + "step": 15668 + }, + { + "epoch": 42.694822888283376, + "grad_norm": 5.025945663452148, + "learning_rate": 1.2813284024215272e-05, + "loss": 0.1731, + "step": 15669 + }, + { + "epoch": 42.69754768392371, + "grad_norm": 6.564162254333496, + "learning_rate": 1.2812437161214843e-05, + "loss": 0.3235, + "step": 15670 + }, + { + "epoch": 42.700272479564035, + "grad_norm": 5.934960842132568, + "learning_rate": 1.2811590276311243e-05, + "loss": 0.3416, + "step": 15671 + }, + { + "epoch": 42.70299727520436, + "grad_norm": 7.1388726234436035, + "learning_rate": 1.2810743369511071e-05, + "loss": 0.1969, + "step": 15672 + }, + { + "epoch": 42.705722070844686, + "grad_norm": 5.952902793884277, + "learning_rate": 1.280989644082092e-05, + "loss": 0.1279, + "step": 15673 + }, + { + "epoch": 42.70844686648501, + "grad_norm": 5.618162631988525, + "learning_rate": 1.2809049490247386e-05, + "loss": 0.227, + "step": 15674 + }, + { + "epoch": 42.71117166212534, + "grad_norm": 5.18951416015625, + "learning_rate": 1.2808202517797064e-05, + "loss": 0.3255, + "step": 15675 + }, + { + "epoch": 42.71389645776567, + "grad_norm": 5.392221450805664, + "learning_rate": 1.2807355523476552e-05, + "loss": 0.2909, + "step": 15676 + }, + { + "epoch": 42.716621253406, + "grad_norm": 5.3777618408203125, + "learning_rate": 1.2806508507292444e-05, + "loss": 0.1854, + "step": 15677 + }, + { + "epoch": 42.71934604904632, + "grad_norm": 6.626627445220947, + "learning_rate": 1.280566146925134e-05, + "loss": 0.1884, + "step": 15678 + }, + { + "epoch": 42.72207084468665, + "grad_norm": 5.3079681396484375, + "learning_rate": 1.2804814409359834e-05, + "loss": 0.164, + "step": 15679 + }, + { + "epoch": 42.724795640326974, + "grad_norm": 5.620943069458008, + "learning_rate": 1.2803967327624522e-05, + "loss": 0.1486, + "step": 15680 + }, + { + "epoch": 42.7275204359673, + "grad_norm": 7.279932975769043, + "learning_rate": 1.2803120224052004e-05, + "loss": 0.185, + "step": 15681 + }, + { + "epoch": 42.73024523160763, + "grad_norm": 5.815249443054199, + "learning_rate": 1.2802273098648876e-05, + "loss": 0.1892, + "step": 15682 + }, + { + "epoch": 42.73297002724796, + "grad_norm": 5.860848426818848, + "learning_rate": 1.2801425951421736e-05, + "loss": 0.1905, + "step": 15683 + }, + { + "epoch": 42.735694822888284, + "grad_norm": 7.554252624511719, + "learning_rate": 1.280057878237718e-05, + "loss": 0.2471, + "step": 15684 + }, + { + "epoch": 42.73841961852861, + "grad_norm": 6.2970356941223145, + "learning_rate": 1.2799731591521805e-05, + "loss": 0.3025, + "step": 15685 + }, + { + "epoch": 42.741144414168936, + "grad_norm": 4.874846458435059, + "learning_rate": 1.2798884378862213e-05, + "loss": 0.2105, + "step": 15686 + }, + { + "epoch": 42.74386920980926, + "grad_norm": 8.647810935974121, + "learning_rate": 1.2798037144405e-05, + "loss": 0.2013, + "step": 15687 + }, + { + "epoch": 42.746594005449595, + "grad_norm": 5.494062423706055, + "learning_rate": 1.2797189888156761e-05, + "loss": 0.1594, + "step": 15688 + }, + { + "epoch": 42.74931880108992, + "grad_norm": 4.149773597717285, + "learning_rate": 1.27963426101241e-05, + "loss": 0.1171, + "step": 15689 + }, + { + "epoch": 42.752043596730246, + "grad_norm": 5.264461994171143, + "learning_rate": 1.279549531031361e-05, + "loss": 0.1744, + "step": 15690 + }, + { + "epoch": 42.75476839237057, + "grad_norm": 8.829997062683105, + "learning_rate": 1.2794647988731896e-05, + "loss": 0.2036, + "step": 15691 + }, + { + "epoch": 42.7574931880109, + "grad_norm": 5.838218688964844, + "learning_rate": 1.279380064538555e-05, + "loss": 0.2639, + "step": 15692 + }, + { + "epoch": 42.76021798365122, + "grad_norm": 4.818917751312256, + "learning_rate": 1.2792953280281175e-05, + "loss": 0.1606, + "step": 15693 + }, + { + "epoch": 42.762942779291556, + "grad_norm": 5.961804389953613, + "learning_rate": 1.2792105893425373e-05, + "loss": 0.1779, + "step": 15694 + }, + { + "epoch": 42.76566757493188, + "grad_norm": 6.108853340148926, + "learning_rate": 1.2791258484824736e-05, + "loss": 0.1674, + "step": 15695 + }, + { + "epoch": 42.76839237057221, + "grad_norm": 5.334097385406494, + "learning_rate": 1.279041105448587e-05, + "loss": 0.3838, + "step": 15696 + }, + { + "epoch": 42.771117166212534, + "grad_norm": 6.470245838165283, + "learning_rate": 1.278956360241537e-05, + "loss": 0.2318, + "step": 15697 + }, + { + "epoch": 42.77384196185286, + "grad_norm": 4.926463603973389, + "learning_rate": 1.2788716128619843e-05, + "loss": 0.1291, + "step": 15698 + }, + { + "epoch": 42.776566757493185, + "grad_norm": 5.360116004943848, + "learning_rate": 1.2787868633105882e-05, + "loss": 0.3191, + "step": 15699 + }, + { + "epoch": 42.77929155313352, + "grad_norm": 6.295806407928467, + "learning_rate": 1.278702111588009e-05, + "loss": 0.3707, + "step": 15700 + }, + { + "epoch": 42.782016348773844, + "grad_norm": 7.457422256469727, + "learning_rate": 1.2786173576949068e-05, + "loss": 0.1382, + "step": 15701 + }, + { + "epoch": 42.78474114441417, + "grad_norm": 5.710942268371582, + "learning_rate": 1.2785326016319415e-05, + "loss": 0.1496, + "step": 15702 + }, + { + "epoch": 42.787465940054496, + "grad_norm": 6.969316005706787, + "learning_rate": 1.2784478433997733e-05, + "loss": 0.1845, + "step": 15703 + }, + { + "epoch": 42.79019073569482, + "grad_norm": 5.756155490875244, + "learning_rate": 1.278363082999062e-05, + "loss": 0.3519, + "step": 15704 + }, + { + "epoch": 42.79291553133515, + "grad_norm": 4.032855033874512, + "learning_rate": 1.2782783204304683e-05, + "loss": 0.2219, + "step": 15705 + }, + { + "epoch": 42.79564032697548, + "grad_norm": 5.56076717376709, + "learning_rate": 1.2781935556946517e-05, + "loss": 0.2272, + "step": 15706 + }, + { + "epoch": 42.798365122615806, + "grad_norm": 6.550904273986816, + "learning_rate": 1.2781087887922729e-05, + "loss": 0.1784, + "step": 15707 + }, + { + "epoch": 42.80108991825613, + "grad_norm": 5.889643669128418, + "learning_rate": 1.2780240197239917e-05, + "loss": 0.1644, + "step": 15708 + }, + { + "epoch": 42.80381471389646, + "grad_norm": 5.0112810134887695, + "learning_rate": 1.2779392484904685e-05, + "loss": 0.1532, + "step": 15709 + }, + { + "epoch": 42.80653950953678, + "grad_norm": 5.021573543548584, + "learning_rate": 1.2778544750923634e-05, + "loss": 0.1197, + "step": 15710 + }, + { + "epoch": 42.80926430517711, + "grad_norm": 7.210042953491211, + "learning_rate": 1.2777696995303366e-05, + "loss": 0.2753, + "step": 15711 + }, + { + "epoch": 42.81198910081744, + "grad_norm": 5.5177812576293945, + "learning_rate": 1.277684921805048e-05, + "loss": 0.2453, + "step": 15712 + }, + { + "epoch": 42.81471389645777, + "grad_norm": 5.005462169647217, + "learning_rate": 1.2776001419171585e-05, + "loss": 0.3069, + "step": 15713 + }, + { + "epoch": 42.817438692098094, + "grad_norm": 9.254091262817383, + "learning_rate": 1.2775153598673276e-05, + "loss": 0.3414, + "step": 15714 + }, + { + "epoch": 42.82016348773842, + "grad_norm": 4.597906112670898, + "learning_rate": 1.2774305756562164e-05, + "loss": 0.2491, + "step": 15715 + }, + { + "epoch": 42.822888283378745, + "grad_norm": 4.350356101989746, + "learning_rate": 1.2773457892844844e-05, + "loss": 0.1406, + "step": 15716 + }, + { + "epoch": 42.82561307901907, + "grad_norm": 6.244409561157227, + "learning_rate": 1.277261000752793e-05, + "loss": 0.3517, + "step": 15717 + }, + { + "epoch": 42.828337874659404, + "grad_norm": 5.680519104003906, + "learning_rate": 1.2771762100618012e-05, + "loss": 0.2949, + "step": 15718 + }, + { + "epoch": 42.83106267029973, + "grad_norm": 6.875699520111084, + "learning_rate": 1.2770914172121706e-05, + "loss": 0.2951, + "step": 15719 + }, + { + "epoch": 42.833787465940055, + "grad_norm": 6.159343242645264, + "learning_rate": 1.2770066222045605e-05, + "loss": 0.1965, + "step": 15720 + }, + { + "epoch": 42.83651226158038, + "grad_norm": 7.010004043579102, + "learning_rate": 1.276921825039632e-05, + "loss": 0.2616, + "step": 15721 + }, + { + "epoch": 42.83923705722071, + "grad_norm": 5.467535495758057, + "learning_rate": 1.2768370257180449e-05, + "loss": 0.3691, + "step": 15722 + }, + { + "epoch": 42.84196185286103, + "grad_norm": 8.308337211608887, + "learning_rate": 1.2767522242404602e-05, + "loss": 0.1829, + "step": 15723 + }, + { + "epoch": 42.844686648501366, + "grad_norm": 5.9903178215026855, + "learning_rate": 1.276667420607538e-05, + "loss": 0.3084, + "step": 15724 + }, + { + "epoch": 42.84741144414169, + "grad_norm": 6.222293376922607, + "learning_rate": 1.276582614819939e-05, + "loss": 0.3444, + "step": 15725 + }, + { + "epoch": 42.85013623978202, + "grad_norm": 4.581437587738037, + "learning_rate": 1.2764978068783233e-05, + "loss": 0.2841, + "step": 15726 + }, + { + "epoch": 42.85286103542234, + "grad_norm": 7.398552894592285, + "learning_rate": 1.2764129967833518e-05, + "loss": 0.2128, + "step": 15727 + }, + { + "epoch": 42.85558583106267, + "grad_norm": 5.676241397857666, + "learning_rate": 1.2763281845356845e-05, + "loss": 0.1577, + "step": 15728 + }, + { + "epoch": 42.858310626702995, + "grad_norm": 5.449347972869873, + "learning_rate": 1.2762433701359827e-05, + "loss": 0.2946, + "step": 15729 + }, + { + "epoch": 42.86103542234333, + "grad_norm": 5.118447780609131, + "learning_rate": 1.2761585535849059e-05, + "loss": 0.2588, + "step": 15730 + }, + { + "epoch": 42.86376021798365, + "grad_norm": 5.3504252433776855, + "learning_rate": 1.2760737348831152e-05, + "loss": 0.2406, + "step": 15731 + }, + { + "epoch": 42.86648501362398, + "grad_norm": 5.175047874450684, + "learning_rate": 1.2759889140312711e-05, + "loss": 0.2955, + "step": 15732 + }, + { + "epoch": 42.869209809264305, + "grad_norm": 5.723325252532959, + "learning_rate": 1.2759040910300346e-05, + "loss": 0.1567, + "step": 15733 + }, + { + "epoch": 42.87193460490463, + "grad_norm": 5.2911224365234375, + "learning_rate": 1.2758192658800657e-05, + "loss": 0.3188, + "step": 15734 + }, + { + "epoch": 42.87465940054496, + "grad_norm": 4.562192440032959, + "learning_rate": 1.2757344385820254e-05, + "loss": 0.2519, + "step": 15735 + }, + { + "epoch": 42.87738419618529, + "grad_norm": 5.385756969451904, + "learning_rate": 1.2756496091365737e-05, + "loss": 0.2218, + "step": 15736 + }, + { + "epoch": 42.880108991825615, + "grad_norm": 5.6548752784729, + "learning_rate": 1.2755647775443722e-05, + "loss": 0.2245, + "step": 15737 + }, + { + "epoch": 42.88283378746594, + "grad_norm": 5.487072467803955, + "learning_rate": 1.275479943806081e-05, + "loss": 0.193, + "step": 15738 + }, + { + "epoch": 42.88555858310627, + "grad_norm": 6.113552093505859, + "learning_rate": 1.2753951079223606e-05, + "loss": 0.2282, + "step": 15739 + }, + { + "epoch": 42.88828337874659, + "grad_norm": 6.495295524597168, + "learning_rate": 1.275310269893872e-05, + "loss": 0.1993, + "step": 15740 + }, + { + "epoch": 42.89100817438692, + "grad_norm": 7.8980512619018555, + "learning_rate": 1.2752254297212762e-05, + "loss": 0.204, + "step": 15741 + }, + { + "epoch": 42.89373297002725, + "grad_norm": 6.508900165557861, + "learning_rate": 1.2751405874052334e-05, + "loss": 0.3016, + "step": 15742 + }, + { + "epoch": 42.89645776566758, + "grad_norm": 5.994144439697266, + "learning_rate": 1.2750557429464046e-05, + "loss": 0.2495, + "step": 15743 + }, + { + "epoch": 42.8991825613079, + "grad_norm": 5.538070201873779, + "learning_rate": 1.2749708963454507e-05, + "loss": 0.2072, + "step": 15744 + }, + { + "epoch": 42.90190735694823, + "grad_norm": 4.820894718170166, + "learning_rate": 1.274886047603032e-05, + "loss": 0.2049, + "step": 15745 + }, + { + "epoch": 42.904632152588555, + "grad_norm": 5.188495635986328, + "learning_rate": 1.2748011967198097e-05, + "loss": 0.1993, + "step": 15746 + }, + { + "epoch": 42.90735694822888, + "grad_norm": 5.004482269287109, + "learning_rate": 1.2747163436964447e-05, + "loss": 0.2109, + "step": 15747 + }, + { + "epoch": 42.91008174386921, + "grad_norm": 4.467107772827148, + "learning_rate": 1.274631488533597e-05, + "loss": 0.1824, + "step": 15748 + }, + { + "epoch": 42.91280653950954, + "grad_norm": 7.456881046295166, + "learning_rate": 1.274546631231929e-05, + "loss": 0.3516, + "step": 15749 + }, + { + "epoch": 42.915531335149865, + "grad_norm": 5.800576686859131, + "learning_rate": 1.2744617717921002e-05, + "loss": 0.3031, + "step": 15750 + }, + { + "epoch": 42.91825613079019, + "grad_norm": 4.827005863189697, + "learning_rate": 1.274376910214772e-05, + "loss": 0.1644, + "step": 15751 + }, + { + "epoch": 42.920980926430516, + "grad_norm": 6.49036169052124, + "learning_rate": 1.2742920465006052e-05, + "loss": 0.2566, + "step": 15752 + }, + { + "epoch": 42.92370572207084, + "grad_norm": 4.562337398529053, + "learning_rate": 1.2742071806502612e-05, + "loss": 0.1349, + "step": 15753 + }, + { + "epoch": 42.926430517711175, + "grad_norm": 5.6639509201049805, + "learning_rate": 1.2741223126644e-05, + "loss": 0.1537, + "step": 15754 + }, + { + "epoch": 42.9291553133515, + "grad_norm": 5.751596927642822, + "learning_rate": 1.2740374425436834e-05, + "loss": 0.1934, + "step": 15755 + }, + { + "epoch": 42.93188010899183, + "grad_norm": 5.298120021820068, + "learning_rate": 1.2739525702887718e-05, + "loss": 0.1716, + "step": 15756 + }, + { + "epoch": 42.93460490463215, + "grad_norm": 6.753478050231934, + "learning_rate": 1.2738676959003262e-05, + "loss": 0.2581, + "step": 15757 + }, + { + "epoch": 42.93732970027248, + "grad_norm": 7.195338249206543, + "learning_rate": 1.2737828193790081e-05, + "loss": 0.3621, + "step": 15758 + }, + { + "epoch": 42.940054495912804, + "grad_norm": 6.741783142089844, + "learning_rate": 1.2736979407254782e-05, + "loss": 0.2503, + "step": 15759 + }, + { + "epoch": 42.94277929155314, + "grad_norm": 15.566309928894043, + "learning_rate": 1.2736130599403973e-05, + "loss": 0.2491, + "step": 15760 + }, + { + "epoch": 42.94550408719346, + "grad_norm": 5.59145450592041, + "learning_rate": 1.2735281770244272e-05, + "loss": 0.1539, + "step": 15761 + }, + { + "epoch": 42.94822888283379, + "grad_norm": 6.900923728942871, + "learning_rate": 1.273443291978228e-05, + "loss": 0.1658, + "step": 15762 + }, + { + "epoch": 42.950953678474114, + "grad_norm": 6.400233268737793, + "learning_rate": 1.2733584048024614e-05, + "loss": 0.153, + "step": 15763 + }, + { + "epoch": 42.95367847411444, + "grad_norm": 7.227105617523193, + "learning_rate": 1.2732735154977885e-05, + "loss": 0.3138, + "step": 15764 + }, + { + "epoch": 42.956403269754766, + "grad_norm": 6.766824722290039, + "learning_rate": 1.2731886240648699e-05, + "loss": 0.2832, + "step": 15765 + }, + { + "epoch": 42.95912806539509, + "grad_norm": 7.418117523193359, + "learning_rate": 1.2731037305043675e-05, + "loss": 0.215, + "step": 15766 + }, + { + "epoch": 42.961852861035425, + "grad_norm": 6.897304534912109, + "learning_rate": 1.2730188348169416e-05, + "loss": 0.1917, + "step": 15767 + }, + { + "epoch": 42.96457765667575, + "grad_norm": 6.344455718994141, + "learning_rate": 1.272933937003254e-05, + "loss": 0.2007, + "step": 15768 + }, + { + "epoch": 42.967302452316076, + "grad_norm": 6.0487189292907715, + "learning_rate": 1.2728490370639659e-05, + "loss": 0.2554, + "step": 15769 + }, + { + "epoch": 42.9700272479564, + "grad_norm": 4.928340911865234, + "learning_rate": 1.2727641349997379e-05, + "loss": 0.2699, + "step": 15770 + }, + { + "epoch": 42.97275204359673, + "grad_norm": 5.338281154632568, + "learning_rate": 1.2726792308112319e-05, + "loss": 0.2481, + "step": 15771 + }, + { + "epoch": 42.97547683923706, + "grad_norm": 4.367077350616455, + "learning_rate": 1.2725943244991089e-05, + "loss": 0.1288, + "step": 15772 + }, + { + "epoch": 42.97820163487739, + "grad_norm": 4.917163372039795, + "learning_rate": 1.27250941606403e-05, + "loss": 0.1928, + "step": 15773 + }, + { + "epoch": 42.98092643051771, + "grad_norm": 6.855035305023193, + "learning_rate": 1.2724245055066561e-05, + "loss": 0.1877, + "step": 15774 + }, + { + "epoch": 42.98365122615804, + "grad_norm": 5.984237194061279, + "learning_rate": 1.2723395928276492e-05, + "loss": 0.2683, + "step": 15775 + }, + { + "epoch": 42.986376021798364, + "grad_norm": 5.014121055603027, + "learning_rate": 1.2722546780276705e-05, + "loss": 0.1354, + "step": 15776 + }, + { + "epoch": 42.98910081743869, + "grad_norm": 10.273235321044922, + "learning_rate": 1.272169761107381e-05, + "loss": 0.2324, + "step": 15777 + }, + { + "epoch": 42.991825613079016, + "grad_norm": 9.372404098510742, + "learning_rate": 1.272084842067442e-05, + "loss": 0.2366, + "step": 15778 + }, + { + "epoch": 42.99455040871935, + "grad_norm": 5.833219528198242, + "learning_rate": 1.2719999209085152e-05, + "loss": 0.4153, + "step": 15779 + }, + { + "epoch": 42.997275204359674, + "grad_norm": 7.8355913162231445, + "learning_rate": 1.2719149976312617e-05, + "loss": 0.4989, + "step": 15780 + }, + { + "epoch": 43.0, + "grad_norm": 4.25089693069458, + "learning_rate": 1.2718300722363431e-05, + "loss": 0.1144, + "step": 15781 + }, + { + "epoch": 43.002724795640326, + "grad_norm": 8.438754081726074, + "learning_rate": 1.2717451447244205e-05, + "loss": 0.1911, + "step": 15782 + }, + { + "epoch": 43.00544959128065, + "grad_norm": 5.1629252433776855, + "learning_rate": 1.2716602150961553e-05, + "loss": 0.2953, + "step": 15783 + }, + { + "epoch": 43.00817438692098, + "grad_norm": 4.964519500732422, + "learning_rate": 1.2715752833522094e-05, + "loss": 0.1674, + "step": 15784 + }, + { + "epoch": 43.01089918256131, + "grad_norm": 5.678306579589844, + "learning_rate": 1.2714903494932438e-05, + "loss": 0.179, + "step": 15785 + }, + { + "epoch": 43.013623978201636, + "grad_norm": 6.6454620361328125, + "learning_rate": 1.2714054135199201e-05, + "loss": 0.1723, + "step": 15786 + }, + { + "epoch": 43.01634877384196, + "grad_norm": 6.484141826629639, + "learning_rate": 1.2713204754328996e-05, + "loss": 0.1289, + "step": 15787 + }, + { + "epoch": 43.01907356948229, + "grad_norm": 4.936593532562256, + "learning_rate": 1.2712355352328442e-05, + "loss": 0.356, + "step": 15788 + }, + { + "epoch": 43.02179836512261, + "grad_norm": 5.204105377197266, + "learning_rate": 1.2711505929204153e-05, + "loss": 0.134, + "step": 15789 + }, + { + "epoch": 43.02452316076294, + "grad_norm": 5.359770774841309, + "learning_rate": 1.2710656484962742e-05, + "loss": 0.2325, + "step": 15790 + }, + { + "epoch": 43.02724795640327, + "grad_norm": 5.6926751136779785, + "learning_rate": 1.2709807019610823e-05, + "loss": 0.1692, + "step": 15791 + }, + { + "epoch": 43.0299727520436, + "grad_norm": 5.559471130371094, + "learning_rate": 1.2708957533155014e-05, + "loss": 0.2531, + "step": 15792 + }, + { + "epoch": 43.032697547683924, + "grad_norm": 4.012047290802002, + "learning_rate": 1.2708108025601935e-05, + "loss": 0.1518, + "step": 15793 + }, + { + "epoch": 43.03542234332425, + "grad_norm": 6.4738311767578125, + "learning_rate": 1.2707258496958197e-05, + "loss": 0.2364, + "step": 15794 + }, + { + "epoch": 43.038147138964575, + "grad_norm": 4.456639289855957, + "learning_rate": 1.2706408947230414e-05, + "loss": 0.1331, + "step": 15795 + }, + { + "epoch": 43.0408719346049, + "grad_norm": 6.203889846801758, + "learning_rate": 1.270555937642521e-05, + "loss": 0.2468, + "step": 15796 + }, + { + "epoch": 43.043596730245234, + "grad_norm": 4.330617427825928, + "learning_rate": 1.2704709784549192e-05, + "loss": 0.3094, + "step": 15797 + }, + { + "epoch": 43.04632152588556, + "grad_norm": 6.280506134033203, + "learning_rate": 1.2703860171608985e-05, + "loss": 0.2799, + "step": 15798 + }, + { + "epoch": 43.049046321525886, + "grad_norm": 6.598577976226807, + "learning_rate": 1.2703010537611198e-05, + "loss": 0.1708, + "step": 15799 + }, + { + "epoch": 43.05177111716621, + "grad_norm": 5.593931198120117, + "learning_rate": 1.2702160882562453e-05, + "loss": 0.188, + "step": 15800 + }, + { + "epoch": 43.05449591280654, + "grad_norm": 4.6534199714660645, + "learning_rate": 1.2701311206469366e-05, + "loss": 0.2912, + "step": 15801 + }, + { + "epoch": 43.05722070844686, + "grad_norm": 5.074550151824951, + "learning_rate": 1.2700461509338555e-05, + "loss": 0.1516, + "step": 15802 + }, + { + "epoch": 43.059945504087196, + "grad_norm": 6.933719635009766, + "learning_rate": 1.2699611791176638e-05, + "loss": 0.2509, + "step": 15803 + }, + { + "epoch": 43.06267029972752, + "grad_norm": 5.630640983581543, + "learning_rate": 1.269876205199023e-05, + "loss": 0.132, + "step": 15804 + }, + { + "epoch": 43.06539509536785, + "grad_norm": 6.669646739959717, + "learning_rate": 1.269791229178595e-05, + "loss": 0.2525, + "step": 15805 + }, + { + "epoch": 43.06811989100817, + "grad_norm": 6.0606584548950195, + "learning_rate": 1.2697062510570417e-05, + "loss": 0.2483, + "step": 15806 + }, + { + "epoch": 43.0708446866485, + "grad_norm": 5.033213138580322, + "learning_rate": 1.2696212708350247e-05, + "loss": 0.2202, + "step": 15807 + }, + { + "epoch": 43.073569482288825, + "grad_norm": 5.555293083190918, + "learning_rate": 1.2695362885132057e-05, + "loss": 0.2937, + "step": 15808 + }, + { + "epoch": 43.07629427792916, + "grad_norm": 5.399478435516357, + "learning_rate": 1.269451304092247e-05, + "loss": 0.1889, + "step": 15809 + }, + { + "epoch": 43.079019073569484, + "grad_norm": 6.696550369262695, + "learning_rate": 1.2693663175728102e-05, + "loss": 0.3098, + "step": 15810 + }, + { + "epoch": 43.08174386920981, + "grad_norm": 5.641627788543701, + "learning_rate": 1.269281328955557e-05, + "loss": 0.2914, + "step": 15811 + }, + { + "epoch": 43.084468664850135, + "grad_norm": 5.6052680015563965, + "learning_rate": 1.2691963382411498e-05, + "loss": 0.1666, + "step": 15812 + }, + { + "epoch": 43.08719346049046, + "grad_norm": 5.3014373779296875, + "learning_rate": 1.26911134543025e-05, + "loss": 0.2783, + "step": 15813 + }, + { + "epoch": 43.08991825613079, + "grad_norm": 4.597877502441406, + "learning_rate": 1.2690263505235199e-05, + "loss": 0.286, + "step": 15814 + }, + { + "epoch": 43.09264305177112, + "grad_norm": 4.8344645500183105, + "learning_rate": 1.2689413535216209e-05, + "loss": 0.2461, + "step": 15815 + }, + { + "epoch": 43.095367847411445, + "grad_norm": 4.9873046875, + "learning_rate": 1.2688563544252156e-05, + "loss": 0.1694, + "step": 15816 + }, + { + "epoch": 43.09809264305177, + "grad_norm": 5.87472677230835, + "learning_rate": 1.2687713532349653e-05, + "loss": 0.346, + "step": 15817 + }, + { + "epoch": 43.1008174386921, + "grad_norm": 5.895587921142578, + "learning_rate": 1.2686863499515327e-05, + "loss": 0.1604, + "step": 15818 + }, + { + "epoch": 43.10354223433242, + "grad_norm": 5.016204357147217, + "learning_rate": 1.2686013445755792e-05, + "loss": 0.2268, + "step": 15819 + }, + { + "epoch": 43.10626702997275, + "grad_norm": 4.473295211791992, + "learning_rate": 1.2685163371077676e-05, + "loss": 0.1698, + "step": 15820 + }, + { + "epoch": 43.10899182561308, + "grad_norm": 5.678323745727539, + "learning_rate": 1.2684313275487587e-05, + "loss": 0.2753, + "step": 15821 + }, + { + "epoch": 43.11171662125341, + "grad_norm": 5.489089012145996, + "learning_rate": 1.2683463158992157e-05, + "loss": 0.2203, + "step": 15822 + }, + { + "epoch": 43.11444141689373, + "grad_norm": 4.795029163360596, + "learning_rate": 1.2682613021598e-05, + "loss": 0.2138, + "step": 15823 + }, + { + "epoch": 43.11716621253406, + "grad_norm": 4.624063968658447, + "learning_rate": 1.2681762863311744e-05, + "loss": 0.2654, + "step": 15824 + }, + { + "epoch": 43.119891008174385, + "grad_norm": 5.710758209228516, + "learning_rate": 1.2680912684139996e-05, + "loss": 0.2917, + "step": 15825 + }, + { + "epoch": 43.12261580381471, + "grad_norm": 6.505515098571777, + "learning_rate": 1.2680062484089396e-05, + "loss": 0.2112, + "step": 15826 + }, + { + "epoch": 43.12534059945504, + "grad_norm": 5.088910102844238, + "learning_rate": 1.2679212263166548e-05, + "loss": 0.1748, + "step": 15827 + }, + { + "epoch": 43.12806539509537, + "grad_norm": 7.963064193725586, + "learning_rate": 1.2678362021378085e-05, + "loss": 0.2247, + "step": 15828 + }, + { + "epoch": 43.130790190735695, + "grad_norm": 5.173469543457031, + "learning_rate": 1.2677511758730625e-05, + "loss": 0.3488, + "step": 15829 + }, + { + "epoch": 43.13351498637602, + "grad_norm": 5.114818572998047, + "learning_rate": 1.267666147523079e-05, + "loss": 0.2002, + "step": 15830 + }, + { + "epoch": 43.13623978201635, + "grad_norm": 5.150710582733154, + "learning_rate": 1.2675811170885199e-05, + "loss": 0.2605, + "step": 15831 + }, + { + "epoch": 43.13896457765667, + "grad_norm": 4.721823215484619, + "learning_rate": 1.2674960845700478e-05, + "loss": 0.167, + "step": 15832 + }, + { + "epoch": 43.141689373297005, + "grad_norm": 7.443442344665527, + "learning_rate": 1.267411049968325e-05, + "loss": 0.1951, + "step": 15833 + }, + { + "epoch": 43.14441416893733, + "grad_norm": 6.747244834899902, + "learning_rate": 1.2673260132840133e-05, + "loss": 0.2664, + "step": 15834 + }, + { + "epoch": 43.14713896457766, + "grad_norm": 8.787422180175781, + "learning_rate": 1.2672409745177752e-05, + "loss": 0.1762, + "step": 15835 + }, + { + "epoch": 43.14986376021798, + "grad_norm": 7.668347358703613, + "learning_rate": 1.267155933670273e-05, + "loss": 0.1555, + "step": 15836 + }, + { + "epoch": 43.15258855585831, + "grad_norm": 23.420007705688477, + "learning_rate": 1.267070890742169e-05, + "loss": 0.1536, + "step": 15837 + }, + { + "epoch": 43.155313351498634, + "grad_norm": 5.895536422729492, + "learning_rate": 1.2669858457341258e-05, + "loss": 0.2571, + "step": 15838 + }, + { + "epoch": 43.15803814713897, + "grad_norm": 4.71837043762207, + "learning_rate": 1.266900798646805e-05, + "loss": 0.161, + "step": 15839 + }, + { + "epoch": 43.16076294277929, + "grad_norm": 5.424498558044434, + "learning_rate": 1.2668157494808697e-05, + "loss": 0.1275, + "step": 15840 + }, + { + "epoch": 43.16348773841962, + "grad_norm": 5.675332069396973, + "learning_rate": 1.2667306982369816e-05, + "loss": 0.1802, + "step": 15841 + }, + { + "epoch": 43.166212534059945, + "grad_norm": 3.783858060836792, + "learning_rate": 1.2666456449158037e-05, + "loss": 0.2775, + "step": 15842 + }, + { + "epoch": 43.16893732970027, + "grad_norm": 5.900336742401123, + "learning_rate": 1.2665605895179977e-05, + "loss": 0.3205, + "step": 15843 + }, + { + "epoch": 43.171662125340596, + "grad_norm": 4.113350868225098, + "learning_rate": 1.266475532044227e-05, + "loss": 0.148, + "step": 15844 + }, + { + "epoch": 43.17438692098093, + "grad_norm": 6.5994672775268555, + "learning_rate": 1.266390472495153e-05, + "loss": 0.2427, + "step": 15845 + }, + { + "epoch": 43.177111716621255, + "grad_norm": 5.132373809814453, + "learning_rate": 1.2663054108714388e-05, + "loss": 0.2726, + "step": 15846 + }, + { + "epoch": 43.17983651226158, + "grad_norm": 6.610569477081299, + "learning_rate": 1.2662203471737465e-05, + "loss": 0.3831, + "step": 15847 + }, + { + "epoch": 43.182561307901906, + "grad_norm": 5.182617664337158, + "learning_rate": 1.2661352814027388e-05, + "loss": 0.2854, + "step": 15848 + }, + { + "epoch": 43.18528610354223, + "grad_norm": 4.746345520019531, + "learning_rate": 1.266050213559078e-05, + "loss": 0.199, + "step": 15849 + }, + { + "epoch": 43.18801089918256, + "grad_norm": 6.213058948516846, + "learning_rate": 1.2659651436434268e-05, + "loss": 0.2269, + "step": 15850 + }, + { + "epoch": 43.19073569482289, + "grad_norm": 4.184413909912109, + "learning_rate": 1.2658800716564474e-05, + "loss": 0.1484, + "step": 15851 + }, + { + "epoch": 43.19346049046322, + "grad_norm": 6.441722869873047, + "learning_rate": 1.2657949975988028e-05, + "loss": 0.3351, + "step": 15852 + }, + { + "epoch": 43.19618528610354, + "grad_norm": 4.789957523345947, + "learning_rate": 1.2657099214711553e-05, + "loss": 0.1619, + "step": 15853 + }, + { + "epoch": 43.19891008174387, + "grad_norm": 4.777517795562744, + "learning_rate": 1.2656248432741674e-05, + "loss": 0.1425, + "step": 15854 + }, + { + "epoch": 43.201634877384194, + "grad_norm": 5.650998592376709, + "learning_rate": 1.2655397630085015e-05, + "loss": 0.1421, + "step": 15855 + }, + { + "epoch": 43.20435967302452, + "grad_norm": 6.645985126495361, + "learning_rate": 1.2654546806748209e-05, + "loss": 0.1788, + "step": 15856 + }, + { + "epoch": 43.20708446866485, + "grad_norm": 6.334911346435547, + "learning_rate": 1.2653695962737875e-05, + "loss": 0.2482, + "step": 15857 + }, + { + "epoch": 43.20980926430518, + "grad_norm": 5.914535999298096, + "learning_rate": 1.2652845098060647e-05, + "loss": 0.1692, + "step": 15858 + }, + { + "epoch": 43.212534059945504, + "grad_norm": 5.427907466888428, + "learning_rate": 1.2651994212723142e-05, + "loss": 0.2051, + "step": 15859 + }, + { + "epoch": 43.21525885558583, + "grad_norm": 5.219813346862793, + "learning_rate": 1.2651143306731992e-05, + "loss": 0.2219, + "step": 15860 + }, + { + "epoch": 43.217983651226156, + "grad_norm": 4.969454765319824, + "learning_rate": 1.2650292380093826e-05, + "loss": 0.2183, + "step": 15861 + }, + { + "epoch": 43.22070844686648, + "grad_norm": 5.98974084854126, + "learning_rate": 1.2649441432815266e-05, + "loss": 0.1773, + "step": 15862 + }, + { + "epoch": 43.223433242506815, + "grad_norm": 5.0268168449401855, + "learning_rate": 1.2648590464902941e-05, + "loss": 0.2191, + "step": 15863 + }, + { + "epoch": 43.22615803814714, + "grad_norm": 6.868879318237305, + "learning_rate": 1.264773947636348e-05, + "loss": 0.3091, + "step": 15864 + }, + { + "epoch": 43.228882833787466, + "grad_norm": 5.643497943878174, + "learning_rate": 1.2646888467203509e-05, + "loss": 0.1794, + "step": 15865 + }, + { + "epoch": 43.23160762942779, + "grad_norm": 8.155420303344727, + "learning_rate": 1.2646037437429654e-05, + "loss": 0.2581, + "step": 15866 + }, + { + "epoch": 43.23433242506812, + "grad_norm": 6.457836151123047, + "learning_rate": 1.2645186387048546e-05, + "loss": 0.173, + "step": 15867 + }, + { + "epoch": 43.237057220708444, + "grad_norm": 5.538093566894531, + "learning_rate": 1.2644335316066811e-05, + "loss": 0.2043, + "step": 15868 + }, + { + "epoch": 43.23978201634878, + "grad_norm": 4.105807781219482, + "learning_rate": 1.2643484224491078e-05, + "loss": 0.2702, + "step": 15869 + }, + { + "epoch": 43.2425068119891, + "grad_norm": 5.2638726234436035, + "learning_rate": 1.2642633112327975e-05, + "loss": 0.246, + "step": 15870 + }, + { + "epoch": 43.24523160762943, + "grad_norm": 6.423031330108643, + "learning_rate": 1.2641781979584133e-05, + "loss": 0.1329, + "step": 15871 + }, + { + "epoch": 43.247956403269754, + "grad_norm": 4.938924312591553, + "learning_rate": 1.2640930826266176e-05, + "loss": 0.221, + "step": 15872 + }, + { + "epoch": 43.25068119891008, + "grad_norm": 5.241696357727051, + "learning_rate": 1.2640079652380734e-05, + "loss": 0.1771, + "step": 15873 + }, + { + "epoch": 43.253405994550405, + "grad_norm": 5.034905433654785, + "learning_rate": 1.2639228457934435e-05, + "loss": 0.1534, + "step": 15874 + }, + { + "epoch": 43.25613079019074, + "grad_norm": 8.160731315612793, + "learning_rate": 1.2638377242933912e-05, + "loss": 0.3567, + "step": 15875 + }, + { + "epoch": 43.258855585831064, + "grad_norm": 6.0418877601623535, + "learning_rate": 1.2637526007385792e-05, + "loss": 0.2643, + "step": 15876 + }, + { + "epoch": 43.26158038147139, + "grad_norm": 4.733092308044434, + "learning_rate": 1.2636674751296702e-05, + "loss": 0.276, + "step": 15877 + }, + { + "epoch": 43.264305177111716, + "grad_norm": 4.871381759643555, + "learning_rate": 1.2635823474673277e-05, + "loss": 0.163, + "step": 15878 + }, + { + "epoch": 43.26702997275204, + "grad_norm": 4.54433536529541, + "learning_rate": 1.2634972177522143e-05, + "loss": 0.3121, + "step": 15879 + }, + { + "epoch": 43.26975476839237, + "grad_norm": 4.6075758934021, + "learning_rate": 1.263412085984993e-05, + "loss": 0.2503, + "step": 15880 + }, + { + "epoch": 43.2724795640327, + "grad_norm": 6.629269123077393, + "learning_rate": 1.2633269521663269e-05, + "loss": 0.2072, + "step": 15881 + }, + { + "epoch": 43.275204359673026, + "grad_norm": 8.31963062286377, + "learning_rate": 1.2632418162968789e-05, + "loss": 0.2411, + "step": 15882 + }, + { + "epoch": 43.27792915531335, + "grad_norm": 19.239208221435547, + "learning_rate": 1.2631566783773121e-05, + "loss": 0.2096, + "step": 15883 + }, + { + "epoch": 43.28065395095368, + "grad_norm": 4.6367716789245605, + "learning_rate": 1.2630715384082897e-05, + "loss": 0.2933, + "step": 15884 + }, + { + "epoch": 43.283378746594, + "grad_norm": 5.596940517425537, + "learning_rate": 1.2629863963904745e-05, + "loss": 0.1837, + "step": 15885 + }, + { + "epoch": 43.28610354223433, + "grad_norm": 5.270818710327148, + "learning_rate": 1.2629012523245294e-05, + "loss": 0.4278, + "step": 15886 + }, + { + "epoch": 43.28882833787466, + "grad_norm": 5.236704349517822, + "learning_rate": 1.2628161062111182e-05, + "loss": 0.2124, + "step": 15887 + }, + { + "epoch": 43.29155313351499, + "grad_norm": 6.127437591552734, + "learning_rate": 1.2627309580509034e-05, + "loss": 0.2041, + "step": 15888 + }, + { + "epoch": 43.294277929155314, + "grad_norm": 4.5770673751831055, + "learning_rate": 1.2626458078445487e-05, + "loss": 0.1639, + "step": 15889 + }, + { + "epoch": 43.29700272479564, + "grad_norm": 5.236861705780029, + "learning_rate": 1.2625606555927167e-05, + "loss": 0.1547, + "step": 15890 + }, + { + "epoch": 43.299727520435965, + "grad_norm": 5.086138725280762, + "learning_rate": 1.2624755012960707e-05, + "loss": 0.2465, + "step": 15891 + }, + { + "epoch": 43.30245231607629, + "grad_norm": 4.756349086761475, + "learning_rate": 1.2623903449552741e-05, + "loss": 0.1608, + "step": 15892 + }, + { + "epoch": 43.305177111716624, + "grad_norm": 5.747576713562012, + "learning_rate": 1.2623051865709899e-05, + "loss": 0.3202, + "step": 15893 + }, + { + "epoch": 43.30790190735695, + "grad_norm": 7.722446918487549, + "learning_rate": 1.262220026143881e-05, + "loss": 0.1602, + "step": 15894 + }, + { + "epoch": 43.310626702997276, + "grad_norm": 13.73774528503418, + "learning_rate": 1.2621348636746115e-05, + "loss": 0.2676, + "step": 15895 + }, + { + "epoch": 43.3133514986376, + "grad_norm": 4.293647766113281, + "learning_rate": 1.2620496991638439e-05, + "loss": 0.1291, + "step": 15896 + }, + { + "epoch": 43.31607629427793, + "grad_norm": 11.641107559204102, + "learning_rate": 1.2619645326122416e-05, + "loss": 0.2622, + "step": 15897 + }, + { + "epoch": 43.31880108991825, + "grad_norm": 5.130149841308594, + "learning_rate": 1.261879364020468e-05, + "loss": 0.1486, + "step": 15898 + }, + { + "epoch": 43.321525885558586, + "grad_norm": 4.847710132598877, + "learning_rate": 1.2617941933891867e-05, + "loss": 0.3147, + "step": 15899 + }, + { + "epoch": 43.32425068119891, + "grad_norm": 4.9436116218566895, + "learning_rate": 1.26170902071906e-05, + "loss": 0.2143, + "step": 15900 + }, + { + "epoch": 43.32697547683924, + "grad_norm": 5.533937931060791, + "learning_rate": 1.2616238460107525e-05, + "loss": 0.2049, + "step": 15901 + }, + { + "epoch": 43.32970027247956, + "grad_norm": 6.411024570465088, + "learning_rate": 1.2615386692649263e-05, + "loss": 0.1421, + "step": 15902 + }, + { + "epoch": 43.33242506811989, + "grad_norm": 4.478221893310547, + "learning_rate": 1.2614534904822455e-05, + "loss": 0.2364, + "step": 15903 + }, + { + "epoch": 43.335149863760215, + "grad_norm": 6.68491268157959, + "learning_rate": 1.2613683096633736e-05, + "loss": 0.3194, + "step": 15904 + }, + { + "epoch": 43.33787465940055, + "grad_norm": 5.500149726867676, + "learning_rate": 1.2612831268089736e-05, + "loss": 0.1888, + "step": 15905 + }, + { + "epoch": 43.34059945504087, + "grad_norm": 5.258341312408447, + "learning_rate": 1.261197941919709e-05, + "loss": 0.2387, + "step": 15906 + }, + { + "epoch": 43.3433242506812, + "grad_norm": 4.661367893218994, + "learning_rate": 1.2611127549962432e-05, + "loss": 0.1575, + "step": 15907 + }, + { + "epoch": 43.346049046321525, + "grad_norm": 4.837214946746826, + "learning_rate": 1.2610275660392397e-05, + "loss": 0.2816, + "step": 15908 + }, + { + "epoch": 43.34877384196185, + "grad_norm": 5.191956520080566, + "learning_rate": 1.2609423750493622e-05, + "loss": 0.2298, + "step": 15909 + }, + { + "epoch": 43.35149863760218, + "grad_norm": 4.816946983337402, + "learning_rate": 1.2608571820272734e-05, + "loss": 0.2029, + "step": 15910 + }, + { + "epoch": 43.35422343324251, + "grad_norm": 5.787227630615234, + "learning_rate": 1.2607719869736374e-05, + "loss": 0.1945, + "step": 15911 + }, + { + "epoch": 43.356948228882835, + "grad_norm": 5.747407913208008, + "learning_rate": 1.2606867898891175e-05, + "loss": 0.1796, + "step": 15912 + }, + { + "epoch": 43.35967302452316, + "grad_norm": 5.252607345581055, + "learning_rate": 1.2606015907743777e-05, + "loss": 0.1556, + "step": 15913 + }, + { + "epoch": 43.36239782016349, + "grad_norm": 5.972566604614258, + "learning_rate": 1.2605163896300808e-05, + "loss": 0.2113, + "step": 15914 + }, + { + "epoch": 43.36512261580381, + "grad_norm": 5.59675407409668, + "learning_rate": 1.2604311864568905e-05, + "loss": 0.2823, + "step": 15915 + }, + { + "epoch": 43.36784741144414, + "grad_norm": 5.3479905128479, + "learning_rate": 1.2603459812554708e-05, + "loss": 0.1877, + "step": 15916 + }, + { + "epoch": 43.37057220708447, + "grad_norm": 5.108469486236572, + "learning_rate": 1.260260774026485e-05, + "loss": 0.1691, + "step": 15917 + }, + { + "epoch": 43.3732970027248, + "grad_norm": 7.5149736404418945, + "learning_rate": 1.2601755647705963e-05, + "loss": 0.184, + "step": 15918 + }, + { + "epoch": 43.37602179836512, + "grad_norm": 4.790966033935547, + "learning_rate": 1.260090353488469e-05, + "loss": 0.277, + "step": 15919 + }, + { + "epoch": 43.37874659400545, + "grad_norm": 5.162489414215088, + "learning_rate": 1.2600051401807659e-05, + "loss": 0.3124, + "step": 15920 + }, + { + "epoch": 43.381471389645775, + "grad_norm": 4.985558032989502, + "learning_rate": 1.2599199248481515e-05, + "loss": 0.2502, + "step": 15921 + }, + { + "epoch": 43.3841961852861, + "grad_norm": 5.302313327789307, + "learning_rate": 1.2598347074912891e-05, + "loss": 0.2769, + "step": 15922 + }, + { + "epoch": 43.38692098092643, + "grad_norm": 4.48428201675415, + "learning_rate": 1.2597494881108425e-05, + "loss": 0.2012, + "step": 15923 + }, + { + "epoch": 43.38964577656676, + "grad_norm": 5.0740132331848145, + "learning_rate": 1.259664266707475e-05, + "loss": 0.3165, + "step": 15924 + }, + { + "epoch": 43.392370572207085, + "grad_norm": 6.1025390625, + "learning_rate": 1.2595790432818508e-05, + "loss": 0.3137, + "step": 15925 + }, + { + "epoch": 43.39509536784741, + "grad_norm": 6.309225082397461, + "learning_rate": 1.2594938178346332e-05, + "loss": 0.2605, + "step": 15926 + }, + { + "epoch": 43.39782016348774, + "grad_norm": 4.591233730316162, + "learning_rate": 1.2594085903664861e-05, + "loss": 0.2574, + "step": 15927 + }, + { + "epoch": 43.40054495912806, + "grad_norm": 5.807793617248535, + "learning_rate": 1.2593233608780733e-05, + "loss": 0.1706, + "step": 15928 + }, + { + "epoch": 43.403269754768395, + "grad_norm": 4.671628475189209, + "learning_rate": 1.2592381293700583e-05, + "loss": 0.1156, + "step": 15929 + }, + { + "epoch": 43.40599455040872, + "grad_norm": 5.2835307121276855, + "learning_rate": 1.2591528958431052e-05, + "loss": 0.2042, + "step": 15930 + }, + { + "epoch": 43.40871934604905, + "grad_norm": 4.173274517059326, + "learning_rate": 1.259067660297878e-05, + "loss": 0.1545, + "step": 15931 + }, + { + "epoch": 43.41144414168937, + "grad_norm": 4.61704683303833, + "learning_rate": 1.2589824227350397e-05, + "loss": 0.2786, + "step": 15932 + }, + { + "epoch": 43.4141689373297, + "grad_norm": 4.443673133850098, + "learning_rate": 1.2588971831552553e-05, + "loss": 0.2406, + "step": 15933 + }, + { + "epoch": 43.416893732970024, + "grad_norm": 5.341704368591309, + "learning_rate": 1.2588119415591873e-05, + "loss": 0.2189, + "step": 15934 + }, + { + "epoch": 43.41961852861036, + "grad_norm": 4.745103359222412, + "learning_rate": 1.2587266979475006e-05, + "loss": 0.2466, + "step": 15935 + }, + { + "epoch": 43.42234332425068, + "grad_norm": 5.30593729019165, + "learning_rate": 1.2586414523208586e-05, + "loss": 0.2246, + "step": 15936 + }, + { + "epoch": 43.42506811989101, + "grad_norm": 4.774023532867432, + "learning_rate": 1.2585562046799251e-05, + "loss": 0.1179, + "step": 15937 + }, + { + "epoch": 43.427792915531334, + "grad_norm": 4.554322719573975, + "learning_rate": 1.2584709550253644e-05, + "loss": 0.2502, + "step": 15938 + }, + { + "epoch": 43.43051771117166, + "grad_norm": 5.701827049255371, + "learning_rate": 1.2583857033578401e-05, + "loss": 0.3235, + "step": 15939 + }, + { + "epoch": 43.433242506811986, + "grad_norm": 6.528021812438965, + "learning_rate": 1.2583004496780164e-05, + "loss": 0.3034, + "step": 15940 + }, + { + "epoch": 43.43596730245232, + "grad_norm": 6.078108310699463, + "learning_rate": 1.258215193986557e-05, + "loss": 0.1343, + "step": 15941 + }, + { + "epoch": 43.438692098092645, + "grad_norm": 5.999648094177246, + "learning_rate": 1.2581299362841262e-05, + "loss": 0.1692, + "step": 15942 + }, + { + "epoch": 43.44141689373297, + "grad_norm": 6.091801166534424, + "learning_rate": 1.2580446765713876e-05, + "loss": 0.3725, + "step": 15943 + }, + { + "epoch": 43.444141689373296, + "grad_norm": 5.250519275665283, + "learning_rate": 1.2579594148490054e-05, + "loss": 0.1306, + "step": 15944 + }, + { + "epoch": 43.44686648501362, + "grad_norm": 4.235337257385254, + "learning_rate": 1.2578741511176436e-05, + "loss": 0.1967, + "step": 15945 + }, + { + "epoch": 43.44959128065395, + "grad_norm": 4.8902435302734375, + "learning_rate": 1.257788885377966e-05, + "loss": 0.1744, + "step": 15946 + }, + { + "epoch": 43.45231607629428, + "grad_norm": 6.23908805847168, + "learning_rate": 1.257703617630637e-05, + "loss": 0.1973, + "step": 15947 + }, + { + "epoch": 43.45504087193461, + "grad_norm": 5.5344648361206055, + "learning_rate": 1.2576183478763207e-05, + "loss": 0.1486, + "step": 15948 + }, + { + "epoch": 43.45776566757493, + "grad_norm": 4.776824474334717, + "learning_rate": 1.2575330761156808e-05, + "loss": 0.4061, + "step": 15949 + }, + { + "epoch": 43.46049046321526, + "grad_norm": 4.633957386016846, + "learning_rate": 1.2574478023493817e-05, + "loss": 0.2403, + "step": 15950 + }, + { + "epoch": 43.463215258855584, + "grad_norm": 3.901925563812256, + "learning_rate": 1.2573625265780873e-05, + "loss": 0.21, + "step": 15951 + }, + { + "epoch": 43.46594005449591, + "grad_norm": 5.508082389831543, + "learning_rate": 1.257277248802462e-05, + "loss": 0.3442, + "step": 15952 + }, + { + "epoch": 43.46866485013624, + "grad_norm": 6.7831926345825195, + "learning_rate": 1.2571919690231695e-05, + "loss": 0.3998, + "step": 15953 + }, + { + "epoch": 43.47138964577657, + "grad_norm": 4.064985275268555, + "learning_rate": 1.2571066872408744e-05, + "loss": 0.1023, + "step": 15954 + }, + { + "epoch": 43.474114441416894, + "grad_norm": 7.114734649658203, + "learning_rate": 1.2570214034562404e-05, + "loss": 0.245, + "step": 15955 + }, + { + "epoch": 43.47683923705722, + "grad_norm": 5.0616278648376465, + "learning_rate": 1.2569361176699323e-05, + "loss": 0.22, + "step": 15956 + }, + { + "epoch": 43.479564032697546, + "grad_norm": 7.711175441741943, + "learning_rate": 1.256850829882614e-05, + "loss": 0.2321, + "step": 15957 + }, + { + "epoch": 43.48228882833787, + "grad_norm": 11.367053031921387, + "learning_rate": 1.2567655400949497e-05, + "loss": 0.3439, + "step": 15958 + }, + { + "epoch": 43.485013623978205, + "grad_norm": 6.908168315887451, + "learning_rate": 1.2566802483076033e-05, + "loss": 0.198, + "step": 15959 + }, + { + "epoch": 43.48773841961853, + "grad_norm": 5.678273677825928, + "learning_rate": 1.25659495452124e-05, + "loss": 0.3083, + "step": 15960 + }, + { + "epoch": 43.490463215258856, + "grad_norm": 4.642317295074463, + "learning_rate": 1.256509658736523e-05, + "loss": 0.1347, + "step": 15961 + }, + { + "epoch": 43.49318801089918, + "grad_norm": 5.812233924865723, + "learning_rate": 1.2564243609541172e-05, + "loss": 0.1897, + "step": 15962 + }, + { + "epoch": 43.49591280653951, + "grad_norm": 5.294683456420898, + "learning_rate": 1.2563390611746864e-05, + "loss": 0.1106, + "step": 15963 + }, + { + "epoch": 43.49863760217983, + "grad_norm": 5.511291027069092, + "learning_rate": 1.2562537593988954e-05, + "loss": 0.2228, + "step": 15964 + }, + { + "epoch": 43.50136239782017, + "grad_norm": 5.468712329864502, + "learning_rate": 1.2561684556274085e-05, + "loss": 0.2565, + "step": 15965 + }, + { + "epoch": 43.50408719346049, + "grad_norm": 6.432379245758057, + "learning_rate": 1.25608314986089e-05, + "loss": 0.1214, + "step": 15966 + }, + { + "epoch": 43.50681198910082, + "grad_norm": 6.043390274047852, + "learning_rate": 1.2559978421000039e-05, + "loss": 0.1766, + "step": 15967 + }, + { + "epoch": 43.509536784741144, + "grad_norm": 4.677197456359863, + "learning_rate": 1.2559125323454154e-05, + "loss": 0.2536, + "step": 15968 + }, + { + "epoch": 43.51226158038147, + "grad_norm": 4.803244113922119, + "learning_rate": 1.2558272205977877e-05, + "loss": 0.2002, + "step": 15969 + }, + { + "epoch": 43.514986376021795, + "grad_norm": 4.047486782073975, + "learning_rate": 1.255741906857786e-05, + "loss": 0.1019, + "step": 15970 + }, + { + "epoch": 43.51771117166213, + "grad_norm": 8.100784301757812, + "learning_rate": 1.2556565911260747e-05, + "loss": 0.2284, + "step": 15971 + }, + { + "epoch": 43.520435967302454, + "grad_norm": 5.012939453125, + "learning_rate": 1.2555712734033179e-05, + "loss": 0.1698, + "step": 15972 + }, + { + "epoch": 43.52316076294278, + "grad_norm": 6.9246931076049805, + "learning_rate": 1.2554859536901805e-05, + "loss": 0.303, + "step": 15973 + }, + { + "epoch": 43.525885558583106, + "grad_norm": 6.250595569610596, + "learning_rate": 1.2554006319873265e-05, + "loss": 0.1173, + "step": 15974 + }, + { + "epoch": 43.52861035422343, + "grad_norm": 4.4001898765563965, + "learning_rate": 1.2553153082954206e-05, + "loss": 0.265, + "step": 15975 + }, + { + "epoch": 43.53133514986376, + "grad_norm": 5.430992603302002, + "learning_rate": 1.2552299826151275e-05, + "loss": 0.2309, + "step": 15976 + }, + { + "epoch": 43.53405994550409, + "grad_norm": 4.987862586975098, + "learning_rate": 1.2551446549471114e-05, + "loss": 0.3293, + "step": 15977 + }, + { + "epoch": 43.536784741144416, + "grad_norm": 6.801769256591797, + "learning_rate": 1.2550593252920371e-05, + "loss": 0.2247, + "step": 15978 + }, + { + "epoch": 43.53950953678474, + "grad_norm": 4.975493907928467, + "learning_rate": 1.2549739936505687e-05, + "loss": 0.1541, + "step": 15979 + }, + { + "epoch": 43.54223433242507, + "grad_norm": 5.002984523773193, + "learning_rate": 1.2548886600233709e-05, + "loss": 0.1904, + "step": 15980 + }, + { + "epoch": 43.54495912806539, + "grad_norm": 4.474903106689453, + "learning_rate": 1.2548033244111087e-05, + "loss": 0.1213, + "step": 15981 + }, + { + "epoch": 43.54768392370572, + "grad_norm": 5.30739164352417, + "learning_rate": 1.2547179868144466e-05, + "loss": 0.1704, + "step": 15982 + }, + { + "epoch": 43.55040871934605, + "grad_norm": 6.663933277130127, + "learning_rate": 1.2546326472340486e-05, + "loss": 0.1754, + "step": 15983 + }, + { + "epoch": 43.55313351498638, + "grad_norm": 4.3429131507873535, + "learning_rate": 1.2545473056705801e-05, + "loss": 0.133, + "step": 15984 + }, + { + "epoch": 43.555858310626704, + "grad_norm": 5.424915313720703, + "learning_rate": 1.2544619621247052e-05, + "loss": 0.1214, + "step": 15985 + }, + { + "epoch": 43.55858310626703, + "grad_norm": 5.305258274078369, + "learning_rate": 1.2543766165970887e-05, + "loss": 0.1232, + "step": 15986 + }, + { + "epoch": 43.561307901907355, + "grad_norm": 4.916006565093994, + "learning_rate": 1.2542912690883954e-05, + "loss": 0.2455, + "step": 15987 + }, + { + "epoch": 43.56403269754768, + "grad_norm": 5.430879592895508, + "learning_rate": 1.25420591959929e-05, + "loss": 0.2218, + "step": 15988 + }, + { + "epoch": 43.566757493188014, + "grad_norm": 4.888143539428711, + "learning_rate": 1.2541205681304364e-05, + "loss": 0.1677, + "step": 15989 + }, + { + "epoch": 43.56948228882834, + "grad_norm": 4.813355445861816, + "learning_rate": 1.2540352146825008e-05, + "loss": 0.1328, + "step": 15990 + }, + { + "epoch": 43.572207084468666, + "grad_norm": 6.177624225616455, + "learning_rate": 1.2539498592561468e-05, + "loss": 0.216, + "step": 15991 + }, + { + "epoch": 43.57493188010899, + "grad_norm": 5.1723432540893555, + "learning_rate": 1.2538645018520396e-05, + "loss": 0.1481, + "step": 15992 + }, + { + "epoch": 43.57765667574932, + "grad_norm": 5.250513553619385, + "learning_rate": 1.2537791424708436e-05, + "loss": 0.3468, + "step": 15993 + }, + { + "epoch": 43.58038147138964, + "grad_norm": 5.463875770568848, + "learning_rate": 1.2536937811132242e-05, + "loss": 0.1758, + "step": 15994 + }, + { + "epoch": 43.583106267029976, + "grad_norm": 5.446907997131348, + "learning_rate": 1.2536084177798453e-05, + "loss": 0.1342, + "step": 15995 + }, + { + "epoch": 43.5858310626703, + "grad_norm": 6.789150238037109, + "learning_rate": 1.2535230524713726e-05, + "loss": 0.1471, + "step": 15996 + }, + { + "epoch": 43.58855585831063, + "grad_norm": 7.316271781921387, + "learning_rate": 1.2534376851884702e-05, + "loss": 0.27, + "step": 15997 + }, + { + "epoch": 43.59128065395095, + "grad_norm": 5.163402080535889, + "learning_rate": 1.2533523159318035e-05, + "loss": 0.1695, + "step": 15998 + }, + { + "epoch": 43.59400544959128, + "grad_norm": 4.516694068908691, + "learning_rate": 1.2532669447020369e-05, + "loss": 0.1947, + "step": 15999 + }, + { + "epoch": 43.596730245231605, + "grad_norm": 6.344399929046631, + "learning_rate": 1.2531815714998356e-05, + "loss": 0.307, + "step": 16000 + }, + { + "epoch": 43.59945504087194, + "grad_norm": 5.544537544250488, + "learning_rate": 1.2530961963258643e-05, + "loss": 0.1917, + "step": 16001 + }, + { + "epoch": 43.60217983651226, + "grad_norm": 7.054203987121582, + "learning_rate": 1.2530108191807884e-05, + "loss": 0.2518, + "step": 16002 + }, + { + "epoch": 43.60490463215259, + "grad_norm": 5.008299350738525, + "learning_rate": 1.252925440065272e-05, + "loss": 0.1638, + "step": 16003 + }, + { + "epoch": 43.607629427792915, + "grad_norm": 5.451460838317871, + "learning_rate": 1.2528400589799805e-05, + "loss": 0.2308, + "step": 16004 + }, + { + "epoch": 43.61035422343324, + "grad_norm": 7.667142868041992, + "learning_rate": 1.2527546759255786e-05, + "loss": 0.1488, + "step": 16005 + }, + { + "epoch": 43.61307901907357, + "grad_norm": 6.472372531890869, + "learning_rate": 1.2526692909027314e-05, + "loss": 0.2041, + "step": 16006 + }, + { + "epoch": 43.6158038147139, + "grad_norm": 4.346190929412842, + "learning_rate": 1.252583903912104e-05, + "loss": 0.2752, + "step": 16007 + }, + { + "epoch": 43.618528610354225, + "grad_norm": 4.9120192527771, + "learning_rate": 1.2524985149543616e-05, + "loss": 0.3718, + "step": 16008 + }, + { + "epoch": 43.62125340599455, + "grad_norm": 4.977303504943848, + "learning_rate": 1.2524131240301684e-05, + "loss": 0.22, + "step": 16009 + }, + { + "epoch": 43.62397820163488, + "grad_norm": 5.490370273590088, + "learning_rate": 1.2523277311401903e-05, + "loss": 0.2609, + "step": 16010 + }, + { + "epoch": 43.6267029972752, + "grad_norm": 9.68083381652832, + "learning_rate": 1.2522423362850917e-05, + "loss": 0.2579, + "step": 16011 + }, + { + "epoch": 43.62942779291553, + "grad_norm": 7.106309413909912, + "learning_rate": 1.2521569394655382e-05, + "loss": 0.4242, + "step": 16012 + }, + { + "epoch": 43.63215258855586, + "grad_norm": 5.843109607696533, + "learning_rate": 1.2520715406821942e-05, + "loss": 0.19, + "step": 16013 + }, + { + "epoch": 43.63487738419619, + "grad_norm": 4.223015785217285, + "learning_rate": 1.2519861399357254e-05, + "loss": 0.1386, + "step": 16014 + }, + { + "epoch": 43.63760217983651, + "grad_norm": 6.382819175720215, + "learning_rate": 1.2519007372267964e-05, + "loss": 0.291, + "step": 16015 + }, + { + "epoch": 43.64032697547684, + "grad_norm": 4.584835529327393, + "learning_rate": 1.2518153325560726e-05, + "loss": 0.1245, + "step": 16016 + }, + { + "epoch": 43.643051771117165, + "grad_norm": 3.7178592681884766, + "learning_rate": 1.2517299259242193e-05, + "loss": 0.1624, + "step": 16017 + }, + { + "epoch": 43.64577656675749, + "grad_norm": 5.389956951141357, + "learning_rate": 1.2516445173319013e-05, + "loss": 0.236, + "step": 16018 + }, + { + "epoch": 43.64850136239782, + "grad_norm": 6.396854400634766, + "learning_rate": 1.2515591067797841e-05, + "loss": 0.2456, + "step": 16019 + }, + { + "epoch": 43.65122615803815, + "grad_norm": 6.409819602966309, + "learning_rate": 1.2514736942685326e-05, + "loss": 0.2351, + "step": 16020 + }, + { + "epoch": 43.653950953678475, + "grad_norm": 4.087258338928223, + "learning_rate": 1.251388279798812e-05, + "loss": 0.1525, + "step": 16021 + }, + { + "epoch": 43.6566757493188, + "grad_norm": 5.1316819190979, + "learning_rate": 1.2513028633712875e-05, + "loss": 0.2031, + "step": 16022 + }, + { + "epoch": 43.65940054495913, + "grad_norm": 7.15573263168335, + "learning_rate": 1.2512174449866243e-05, + "loss": 0.4549, + "step": 16023 + }, + { + "epoch": 43.66212534059945, + "grad_norm": 4.485933780670166, + "learning_rate": 1.251132024645488e-05, + "loss": 0.2953, + "step": 16024 + }, + { + "epoch": 43.664850136239785, + "grad_norm": 4.975935459136963, + "learning_rate": 1.2510466023485435e-05, + "loss": 0.1809, + "step": 16025 + }, + { + "epoch": 43.66757493188011, + "grad_norm": 5.3832688331604, + "learning_rate": 1.2509611780964562e-05, + "loss": 0.2421, + "step": 16026 + }, + { + "epoch": 43.67029972752044, + "grad_norm": 7.378668785095215, + "learning_rate": 1.2508757518898911e-05, + "loss": 0.2202, + "step": 16027 + }, + { + "epoch": 43.67302452316076, + "grad_norm": 5.278179168701172, + "learning_rate": 1.2507903237295138e-05, + "loss": 0.1807, + "step": 16028 + }, + { + "epoch": 43.67574931880109, + "grad_norm": 6.28816032409668, + "learning_rate": 1.2507048936159896e-05, + "loss": 0.1944, + "step": 16029 + }, + { + "epoch": 43.678474114441414, + "grad_norm": 4.760003089904785, + "learning_rate": 1.2506194615499836e-05, + "loss": 0.2402, + "step": 16030 + }, + { + "epoch": 43.68119891008175, + "grad_norm": 6.2029805183410645, + "learning_rate": 1.2505340275321613e-05, + "loss": 0.2573, + "step": 16031 + }, + { + "epoch": 43.68392370572207, + "grad_norm": 4.338624954223633, + "learning_rate": 1.2504485915631883e-05, + "loss": 0.1321, + "step": 16032 + }, + { + "epoch": 43.6866485013624, + "grad_norm": 4.835025310516357, + "learning_rate": 1.2503631536437295e-05, + "loss": 0.1835, + "step": 16033 + }, + { + "epoch": 43.689373297002724, + "grad_norm": 9.827530860900879, + "learning_rate": 1.2502777137744507e-05, + "loss": 0.2545, + "step": 16034 + }, + { + "epoch": 43.69209809264305, + "grad_norm": 5.594376564025879, + "learning_rate": 1.250192271956017e-05, + "loss": 0.1847, + "step": 16035 + }, + { + "epoch": 43.694822888283376, + "grad_norm": 5.1019392013549805, + "learning_rate": 1.250106828189094e-05, + "loss": 0.175, + "step": 16036 + }, + { + "epoch": 43.69754768392371, + "grad_norm": 5.329370021820068, + "learning_rate": 1.2500213824743472e-05, + "loss": 0.2035, + "step": 16037 + }, + { + "epoch": 43.700272479564035, + "grad_norm": 5.356943607330322, + "learning_rate": 1.2499359348124418e-05, + "loss": 0.1966, + "step": 16038 + }, + { + "epoch": 43.70299727520436, + "grad_norm": 5.181354999542236, + "learning_rate": 1.2498504852040433e-05, + "loss": 0.2862, + "step": 16039 + }, + { + "epoch": 43.705722070844686, + "grad_norm": 4.817810535430908, + "learning_rate": 1.2497650336498172e-05, + "loss": 0.1609, + "step": 16040 + }, + { + "epoch": 43.70844686648501, + "grad_norm": 6.273209095001221, + "learning_rate": 1.2496795801504291e-05, + "loss": 0.1707, + "step": 16041 + }, + { + "epoch": 43.71117166212534, + "grad_norm": 4.329726219177246, + "learning_rate": 1.2495941247065445e-05, + "loss": 0.1393, + "step": 16042 + }, + { + "epoch": 43.71389645776567, + "grad_norm": 6.111339092254639, + "learning_rate": 1.2495086673188293e-05, + "loss": 0.2964, + "step": 16043 + }, + { + "epoch": 43.716621253406, + "grad_norm": 4.5158491134643555, + "learning_rate": 1.249423207987948e-05, + "loss": 0.2061, + "step": 16044 + }, + { + "epoch": 43.71934604904632, + "grad_norm": 5.9191083908081055, + "learning_rate": 1.249337746714567e-05, + "loss": 0.2371, + "step": 16045 + }, + { + "epoch": 43.72207084468665, + "grad_norm": 4.54535436630249, + "learning_rate": 1.2492522834993519e-05, + "loss": 0.2207, + "step": 16046 + }, + { + "epoch": 43.724795640326974, + "grad_norm": 4.868076801300049, + "learning_rate": 1.2491668183429679e-05, + "loss": 0.1785, + "step": 16047 + }, + { + "epoch": 43.7275204359673, + "grad_norm": 4.8957977294921875, + "learning_rate": 1.2490813512460806e-05, + "loss": 0.1964, + "step": 16048 + }, + { + "epoch": 43.73024523160763, + "grad_norm": 5.272156715393066, + "learning_rate": 1.2489958822093557e-05, + "loss": 0.1245, + "step": 16049 + }, + { + "epoch": 43.73297002724796, + "grad_norm": 5.2726593017578125, + "learning_rate": 1.2489104112334588e-05, + "loss": 0.1562, + "step": 16050 + }, + { + "epoch": 43.735694822888284, + "grad_norm": 6.89739990234375, + "learning_rate": 1.248824938319056e-05, + "loss": 0.2311, + "step": 16051 + }, + { + "epoch": 43.73841961852861, + "grad_norm": 4.722046852111816, + "learning_rate": 1.2487394634668123e-05, + "loss": 0.1761, + "step": 16052 + }, + { + "epoch": 43.741144414168936, + "grad_norm": 5.488198280334473, + "learning_rate": 1.2486539866773941e-05, + "loss": 0.2041, + "step": 16053 + }, + { + "epoch": 43.74386920980926, + "grad_norm": 5.007774829864502, + "learning_rate": 1.2485685079514663e-05, + "loss": 0.1779, + "step": 16054 + }, + { + "epoch": 43.746594005449595, + "grad_norm": 11.114958763122559, + "learning_rate": 1.2484830272896951e-05, + "loss": 0.2186, + "step": 16055 + }, + { + "epoch": 43.74931880108992, + "grad_norm": 5.780182838439941, + "learning_rate": 1.2483975446927459e-05, + "loss": 0.2337, + "step": 16056 + }, + { + "epoch": 43.752043596730246, + "grad_norm": 6.6061859130859375, + "learning_rate": 1.2483120601612847e-05, + "loss": 0.2101, + "step": 16057 + }, + { + "epoch": 43.75476839237057, + "grad_norm": 6.823513031005859, + "learning_rate": 1.2482265736959769e-05, + "loss": 0.1509, + "step": 16058 + }, + { + "epoch": 43.7574931880109, + "grad_norm": 6.462015151977539, + "learning_rate": 1.248141085297489e-05, + "loss": 0.2858, + "step": 16059 + }, + { + "epoch": 43.76021798365122, + "grad_norm": 4.85947322845459, + "learning_rate": 1.2480555949664859e-05, + "loss": 0.1335, + "step": 16060 + }, + { + "epoch": 43.762942779291556, + "grad_norm": 4.83868932723999, + "learning_rate": 1.247970102703634e-05, + "loss": 0.2706, + "step": 16061 + }, + { + "epoch": 43.76566757493188, + "grad_norm": 6.2221503257751465, + "learning_rate": 1.247884608509599e-05, + "loss": 0.1767, + "step": 16062 + }, + { + "epoch": 43.76839237057221, + "grad_norm": 5.1493988037109375, + "learning_rate": 1.2477991123850468e-05, + "loss": 0.2175, + "step": 16063 + }, + { + "epoch": 43.771117166212534, + "grad_norm": 5.098999500274658, + "learning_rate": 1.2477136143306428e-05, + "loss": 0.1342, + "step": 16064 + }, + { + "epoch": 43.77384196185286, + "grad_norm": 5.399009704589844, + "learning_rate": 1.2476281143470535e-05, + "loss": 0.1434, + "step": 16065 + }, + { + "epoch": 43.776566757493185, + "grad_norm": 7.601125240325928, + "learning_rate": 1.2475426124349436e-05, + "loss": 0.205, + "step": 16066 + }, + { + "epoch": 43.77929155313352, + "grad_norm": 5.856564521789551, + "learning_rate": 1.2474571085949807e-05, + "loss": 0.2831, + "step": 16067 + }, + { + "epoch": 43.782016348773844, + "grad_norm": 5.1694135665893555, + "learning_rate": 1.2473716028278292e-05, + "loss": 0.5207, + "step": 16068 + }, + { + "epoch": 43.78474114441417, + "grad_norm": 4.714412689208984, + "learning_rate": 1.2472860951341561e-05, + "loss": 0.1497, + "step": 16069 + }, + { + "epoch": 43.787465940054496, + "grad_norm": 5.425742149353027, + "learning_rate": 1.2472005855146265e-05, + "loss": 0.2264, + "step": 16070 + }, + { + "epoch": 43.79019073569482, + "grad_norm": 5.301591396331787, + "learning_rate": 1.247115073969907e-05, + "loss": 0.1359, + "step": 16071 + }, + { + "epoch": 43.79291553133515, + "grad_norm": 5.562912940979004, + "learning_rate": 1.2470295605006628e-05, + "loss": 0.2102, + "step": 16072 + }, + { + "epoch": 43.79564032697548, + "grad_norm": 6.005643844604492, + "learning_rate": 1.246944045107561e-05, + "loss": 0.1778, + "step": 16073 + }, + { + "epoch": 43.798365122615806, + "grad_norm": 4.845348358154297, + "learning_rate": 1.2468585277912664e-05, + "loss": 0.1918, + "step": 16074 + }, + { + "epoch": 43.80108991825613, + "grad_norm": 5.073792457580566, + "learning_rate": 1.2467730085524454e-05, + "loss": 0.1407, + "step": 16075 + }, + { + "epoch": 43.80381471389646, + "grad_norm": 5.499170780181885, + "learning_rate": 1.2466874873917646e-05, + "loss": 0.158, + "step": 16076 + }, + { + "epoch": 43.80653950953678, + "grad_norm": 7.507500648498535, + "learning_rate": 1.2466019643098895e-05, + "loss": 0.1994, + "step": 16077 + }, + { + "epoch": 43.80926430517711, + "grad_norm": 4.464300155639648, + "learning_rate": 1.2465164393074859e-05, + "loss": 0.2694, + "step": 16078 + }, + { + "epoch": 43.81198910081744, + "grad_norm": 5.403188228607178, + "learning_rate": 1.2464309123852205e-05, + "loss": 0.1728, + "step": 16079 + }, + { + "epoch": 43.81471389645777, + "grad_norm": 7.665669918060303, + "learning_rate": 1.246345383543759e-05, + "loss": 0.2252, + "step": 16080 + }, + { + "epoch": 43.817438692098094, + "grad_norm": 5.672266960144043, + "learning_rate": 1.2462598527837678e-05, + "loss": 0.2267, + "step": 16081 + }, + { + "epoch": 43.82016348773842, + "grad_norm": 5.895010948181152, + "learning_rate": 1.2461743201059124e-05, + "loss": 0.2448, + "step": 16082 + }, + { + "epoch": 43.822888283378745, + "grad_norm": 7.843247890472412, + "learning_rate": 1.2460887855108597e-05, + "loss": 0.2243, + "step": 16083 + }, + { + "epoch": 43.82561307901907, + "grad_norm": 5.759918212890625, + "learning_rate": 1.2460032489992751e-05, + "loss": 0.1763, + "step": 16084 + }, + { + "epoch": 43.828337874659404, + "grad_norm": 5.617268085479736, + "learning_rate": 1.2459177105718251e-05, + "loss": 0.1667, + "step": 16085 + }, + { + "epoch": 43.83106267029973, + "grad_norm": 4.631982803344727, + "learning_rate": 1.2458321702291762e-05, + "loss": 0.1943, + "step": 16086 + }, + { + "epoch": 43.833787465940055, + "grad_norm": 4.916030406951904, + "learning_rate": 1.2457466279719943e-05, + "loss": 0.1129, + "step": 16087 + }, + { + "epoch": 43.83651226158038, + "grad_norm": 6.239870548248291, + "learning_rate": 1.2456610838009454e-05, + "loss": 0.2857, + "step": 16088 + }, + { + "epoch": 43.83923705722071, + "grad_norm": 6.174760818481445, + "learning_rate": 1.2455755377166958e-05, + "loss": 0.1576, + "step": 16089 + }, + { + "epoch": 43.84196185286103, + "grad_norm": 6.801732063293457, + "learning_rate": 1.245489989719912e-05, + "loss": 0.1155, + "step": 16090 + }, + { + "epoch": 43.844686648501366, + "grad_norm": 5.358292102813721, + "learning_rate": 1.2454044398112602e-05, + "loss": 0.2784, + "step": 16091 + }, + { + "epoch": 43.84741144414169, + "grad_norm": 6.265818119049072, + "learning_rate": 1.245318887991406e-05, + "loss": 0.1893, + "step": 16092 + }, + { + "epoch": 43.85013623978202, + "grad_norm": 4.627772331237793, + "learning_rate": 1.2452333342610166e-05, + "loss": 0.1819, + "step": 16093 + }, + { + "epoch": 43.85286103542234, + "grad_norm": 5.668519496917725, + "learning_rate": 1.2451477786207575e-05, + "loss": 0.2036, + "step": 16094 + }, + { + "epoch": 43.85558583106267, + "grad_norm": 9.2498197555542, + "learning_rate": 1.245062221071296e-05, + "loss": 0.253, + "step": 16095 + }, + { + "epoch": 43.858310626702995, + "grad_norm": 4.812533855438232, + "learning_rate": 1.2449766616132973e-05, + "loss": 0.2204, + "step": 16096 + }, + { + "epoch": 43.86103542234333, + "grad_norm": 5.658326625823975, + "learning_rate": 1.2448911002474287e-05, + "loss": 0.1572, + "step": 16097 + }, + { + "epoch": 43.86376021798365, + "grad_norm": 6.318443298339844, + "learning_rate": 1.2448055369743557e-05, + "loss": 0.1373, + "step": 16098 + }, + { + "epoch": 43.86648501362398, + "grad_norm": 4.787212371826172, + "learning_rate": 1.2447199717947451e-05, + "loss": 0.1609, + "step": 16099 + }, + { + "epoch": 43.869209809264305, + "grad_norm": 5.018313407897949, + "learning_rate": 1.2446344047092633e-05, + "loss": 0.3412, + "step": 16100 + }, + { + "epoch": 43.87193460490463, + "grad_norm": 5.533585071563721, + "learning_rate": 1.2445488357185766e-05, + "loss": 0.1091, + "step": 16101 + }, + { + "epoch": 43.87465940054496, + "grad_norm": 10.251208305358887, + "learning_rate": 1.2444632648233517e-05, + "loss": 0.2603, + "step": 16102 + }, + { + "epoch": 43.87738419618529, + "grad_norm": 6.50205135345459, + "learning_rate": 1.2443776920242542e-05, + "loss": 0.3353, + "step": 16103 + }, + { + "epoch": 43.880108991825615, + "grad_norm": 5.021983623504639, + "learning_rate": 1.2442921173219515e-05, + "loss": 0.199, + "step": 16104 + }, + { + "epoch": 43.88283378746594, + "grad_norm": 7.136135101318359, + "learning_rate": 1.2442065407171098e-05, + "loss": 0.1986, + "step": 16105 + }, + { + "epoch": 43.88555858310627, + "grad_norm": 5.772706985473633, + "learning_rate": 1.2441209622103951e-05, + "loss": 0.1638, + "step": 16106 + }, + { + "epoch": 43.88828337874659, + "grad_norm": 7.06938362121582, + "learning_rate": 1.2440353818024744e-05, + "loss": 0.2592, + "step": 16107 + }, + { + "epoch": 43.89100817438692, + "grad_norm": 5.062612056732178, + "learning_rate": 1.243949799494014e-05, + "loss": 0.2136, + "step": 16108 + }, + { + "epoch": 43.89373297002725, + "grad_norm": 6.993363380432129, + "learning_rate": 1.2438642152856802e-05, + "loss": 0.2269, + "step": 16109 + }, + { + "epoch": 43.89645776566758, + "grad_norm": 7.7213311195373535, + "learning_rate": 1.24377862917814e-05, + "loss": 0.2116, + "step": 16110 + }, + { + "epoch": 43.8991825613079, + "grad_norm": 4.676961898803711, + "learning_rate": 1.2436930411720594e-05, + "loss": 0.1582, + "step": 16111 + }, + { + "epoch": 43.90190735694823, + "grad_norm": 3.7129993438720703, + "learning_rate": 1.2436074512681055e-05, + "loss": 0.1428, + "step": 16112 + }, + { + "epoch": 43.904632152588555, + "grad_norm": 5.535231590270996, + "learning_rate": 1.2435218594669445e-05, + "loss": 0.1777, + "step": 16113 + }, + { + "epoch": 43.90735694822888, + "grad_norm": 5.202457427978516, + "learning_rate": 1.2434362657692432e-05, + "loss": 0.2078, + "step": 16114 + }, + { + "epoch": 43.91008174386921, + "grad_norm": 5.230146884918213, + "learning_rate": 1.2433506701756678e-05, + "loss": 0.2223, + "step": 16115 + }, + { + "epoch": 43.91280653950954, + "grad_norm": 6.026159286499023, + "learning_rate": 1.2432650726868854e-05, + "loss": 0.3477, + "step": 16116 + }, + { + "epoch": 43.915531335149865, + "grad_norm": 6.212592601776123, + "learning_rate": 1.2431794733035625e-05, + "loss": 0.1644, + "step": 16117 + }, + { + "epoch": 43.91825613079019, + "grad_norm": 8.96209716796875, + "learning_rate": 1.2430938720263657e-05, + "loss": 0.2091, + "step": 16118 + }, + { + "epoch": 43.920980926430516, + "grad_norm": 5.667464733123779, + "learning_rate": 1.2430082688559616e-05, + "loss": 0.2952, + "step": 16119 + }, + { + "epoch": 43.92370572207084, + "grad_norm": 5.065408229827881, + "learning_rate": 1.242922663793017e-05, + "loss": 0.245, + "step": 16120 + }, + { + "epoch": 43.926430517711175, + "grad_norm": 6.7920427322387695, + "learning_rate": 1.2428370568381982e-05, + "loss": 0.2838, + "step": 16121 + }, + { + "epoch": 43.9291553133515, + "grad_norm": 5.5842180252075195, + "learning_rate": 1.2427514479921725e-05, + "loss": 0.1599, + "step": 16122 + }, + { + "epoch": 43.93188010899183, + "grad_norm": 6.502938270568848, + "learning_rate": 1.2426658372556062e-05, + "loss": 0.163, + "step": 16123 + }, + { + "epoch": 43.93460490463215, + "grad_norm": 8.820902824401855, + "learning_rate": 1.2425802246291664e-05, + "loss": 0.2465, + "step": 16124 + }, + { + "epoch": 43.93732970027248, + "grad_norm": 5.5153889656066895, + "learning_rate": 1.2424946101135193e-05, + "loss": 0.1917, + "step": 16125 + }, + { + "epoch": 43.940054495912804, + "grad_norm": 7.109150409698486, + "learning_rate": 1.2424089937093324e-05, + "loss": 0.2391, + "step": 16126 + }, + { + "epoch": 43.94277929155314, + "grad_norm": 7.857607841491699, + "learning_rate": 1.2423233754172714e-05, + "loss": 0.1871, + "step": 16127 + }, + { + "epoch": 43.94550408719346, + "grad_norm": 116.6109848022461, + "learning_rate": 1.2422377552380045e-05, + "loss": 0.2427, + "step": 16128 + }, + { + "epoch": 43.94822888283379, + "grad_norm": 6.429569244384766, + "learning_rate": 1.2421521331721974e-05, + "loss": 0.2248, + "step": 16129 + }, + { + "epoch": 43.950953678474114, + "grad_norm": 5.0744781494140625, + "learning_rate": 1.2420665092205173e-05, + "loss": 0.3101, + "step": 16130 + }, + { + "epoch": 43.95367847411444, + "grad_norm": 10.218924522399902, + "learning_rate": 1.2419808833836309e-05, + "loss": 0.221, + "step": 16131 + }, + { + "epoch": 43.956403269754766, + "grad_norm": 9.258928298950195, + "learning_rate": 1.2418952556622055e-05, + "loss": 0.3065, + "step": 16132 + }, + { + "epoch": 43.95912806539509, + "grad_norm": 6.090509414672852, + "learning_rate": 1.2418096260569072e-05, + "loss": 0.156, + "step": 16133 + }, + { + "epoch": 43.961852861035425, + "grad_norm": 6.892738342285156, + "learning_rate": 1.2417239945684036e-05, + "loss": 0.3133, + "step": 16134 + }, + { + "epoch": 43.96457765667575, + "grad_norm": 8.078993797302246, + "learning_rate": 1.241638361197361e-05, + "loss": 0.3408, + "step": 16135 + }, + { + "epoch": 43.967302452316076, + "grad_norm": 14.61220645904541, + "learning_rate": 1.2415527259444471e-05, + "loss": 0.2736, + "step": 16136 + }, + { + "epoch": 43.9700272479564, + "grad_norm": 11.88048267364502, + "learning_rate": 1.2414670888103279e-05, + "loss": 0.4071, + "step": 16137 + }, + { + "epoch": 43.97275204359673, + "grad_norm": 9.614017486572266, + "learning_rate": 1.241381449795671e-05, + "loss": 0.2885, + "step": 16138 + }, + { + "epoch": 43.97547683923706, + "grad_norm": 7.922733306884766, + "learning_rate": 1.2412958089011433e-05, + "loss": 0.2641, + "step": 16139 + }, + { + "epoch": 43.97820163487739, + "grad_norm": 13.481842994689941, + "learning_rate": 1.2412101661274114e-05, + "loss": 0.3297, + "step": 16140 + }, + { + "epoch": 43.98092643051771, + "grad_norm": 9.547430038452148, + "learning_rate": 1.2411245214751426e-05, + "loss": 0.2846, + "step": 16141 + }, + { + "epoch": 43.98365122615804, + "grad_norm": 11.379546165466309, + "learning_rate": 1.2410388749450038e-05, + "loss": 0.3534, + "step": 16142 + }, + { + "epoch": 43.986376021798364, + "grad_norm": 31.17267417907715, + "learning_rate": 1.2409532265376618e-05, + "loss": 0.3415, + "step": 16143 + }, + { + "epoch": 43.98910081743869, + "grad_norm": 10.252547264099121, + "learning_rate": 1.2408675762537838e-05, + "loss": 0.2567, + "step": 16144 + }, + { + "epoch": 43.991825613079016, + "grad_norm": 9.675552368164062, + "learning_rate": 1.240781924094037e-05, + "loss": 0.3126, + "step": 16145 + }, + { + "epoch": 43.99455040871935, + "grad_norm": 15.750492095947266, + "learning_rate": 1.2406962700590884e-05, + "loss": 0.3246, + "step": 16146 + }, + { + "epoch": 43.997275204359674, + "grad_norm": 7.915947437286377, + "learning_rate": 1.2406106141496049e-05, + "loss": 0.1831, + "step": 16147 + }, + { + "epoch": 44.0, + "grad_norm": 7.796821117401123, + "learning_rate": 1.2405249563662539e-05, + "loss": 0.2965, + "step": 16148 + }, + { + "epoch": 44.002724795640326, + "grad_norm": 8.101951599121094, + "learning_rate": 1.2404392967097019e-05, + "loss": 0.2635, + "step": 16149 + }, + { + "epoch": 44.00544959128065, + "grad_norm": 8.145999908447266, + "learning_rate": 1.2403536351806167e-05, + "loss": 0.2394, + "step": 16150 + }, + { + "epoch": 44.00817438692098, + "grad_norm": 8.64932632446289, + "learning_rate": 1.2402679717796651e-05, + "loss": 0.3574, + "step": 16151 + }, + { + "epoch": 44.01089918256131, + "grad_norm": 6.614543437957764, + "learning_rate": 1.240182306507514e-05, + "loss": 0.361, + "step": 16152 + }, + { + "epoch": 44.013623978201636, + "grad_norm": 7.630898952484131, + "learning_rate": 1.2400966393648309e-05, + "loss": 0.3195, + "step": 16153 + }, + { + "epoch": 44.01634877384196, + "grad_norm": 7.651569366455078, + "learning_rate": 1.2400109703522831e-05, + "loss": 0.2422, + "step": 16154 + }, + { + "epoch": 44.01907356948229, + "grad_norm": 5.433675765991211, + "learning_rate": 1.2399252994705373e-05, + "loss": 0.209, + "step": 16155 + }, + { + "epoch": 44.02179836512261, + "grad_norm": 5.823220252990723, + "learning_rate": 1.2398396267202615e-05, + "loss": 0.1415, + "step": 16156 + }, + { + "epoch": 44.02452316076294, + "grad_norm": 7.748629093170166, + "learning_rate": 1.239753952102122e-05, + "loss": 0.2618, + "step": 16157 + }, + { + "epoch": 44.02724795640327, + "grad_norm": 5.98864221572876, + "learning_rate": 1.2396682756167866e-05, + "loss": 0.3019, + "step": 16158 + }, + { + "epoch": 44.0299727520436, + "grad_norm": 5.825252056121826, + "learning_rate": 1.2395825972649222e-05, + "loss": 0.1885, + "step": 16159 + }, + { + "epoch": 44.032697547683924, + "grad_norm": 7.396633148193359, + "learning_rate": 1.2394969170471965e-05, + "loss": 0.3402, + "step": 16160 + }, + { + "epoch": 44.03542234332425, + "grad_norm": 5.753902912139893, + "learning_rate": 1.2394112349642761e-05, + "loss": 0.1355, + "step": 16161 + }, + { + "epoch": 44.038147138964575, + "grad_norm": 5.8221845626831055, + "learning_rate": 1.2393255510168292e-05, + "loss": 0.2352, + "step": 16162 + }, + { + "epoch": 44.0408719346049, + "grad_norm": 7.52283239364624, + "learning_rate": 1.2392398652055222e-05, + "loss": 0.2686, + "step": 16163 + }, + { + "epoch": 44.043596730245234, + "grad_norm": 6.4456467628479, + "learning_rate": 1.2391541775310231e-05, + "loss": 0.3121, + "step": 16164 + }, + { + "epoch": 44.04632152588556, + "grad_norm": 6.80079984664917, + "learning_rate": 1.2390684879939989e-05, + "loss": 0.4465, + "step": 16165 + }, + { + "epoch": 44.049046321525886, + "grad_norm": 5.70070219039917, + "learning_rate": 1.238982796595117e-05, + "loss": 0.3208, + "step": 16166 + }, + { + "epoch": 44.05177111716621, + "grad_norm": 5.9923505783081055, + "learning_rate": 1.2388971033350447e-05, + "loss": 0.1696, + "step": 16167 + }, + { + "epoch": 44.05449591280654, + "grad_norm": 6.572014331817627, + "learning_rate": 1.2388114082144495e-05, + "loss": 0.2166, + "step": 16168 + }, + { + "epoch": 44.05722070844686, + "grad_norm": 6.781308174133301, + "learning_rate": 1.2387257112339987e-05, + "loss": 0.271, + "step": 16169 + }, + { + "epoch": 44.059945504087196, + "grad_norm": 5.984559059143066, + "learning_rate": 1.2386400123943597e-05, + "loss": 0.3424, + "step": 16170 + }, + { + "epoch": 44.06267029972752, + "grad_norm": 6.572991847991943, + "learning_rate": 1.2385543116962002e-05, + "loss": 0.157, + "step": 16171 + }, + { + "epoch": 44.06539509536785, + "grad_norm": 5.872347831726074, + "learning_rate": 1.2384686091401874e-05, + "loss": 0.1674, + "step": 16172 + }, + { + "epoch": 44.06811989100817, + "grad_norm": 5.073558807373047, + "learning_rate": 1.2383829047269884e-05, + "loss": 0.2827, + "step": 16173 + }, + { + "epoch": 44.0708446866485, + "grad_norm": 5.1867170333862305, + "learning_rate": 1.2382971984572714e-05, + "loss": 0.3451, + "step": 16174 + }, + { + "epoch": 44.073569482288825, + "grad_norm": 5.426074028015137, + "learning_rate": 1.2382114903317033e-05, + "loss": 0.1745, + "step": 16175 + }, + { + "epoch": 44.07629427792916, + "grad_norm": 6.267030239105225, + "learning_rate": 1.2381257803509518e-05, + "loss": 0.3035, + "step": 16176 + }, + { + "epoch": 44.079019073569484, + "grad_norm": 8.500021934509277, + "learning_rate": 1.2380400685156844e-05, + "loss": 0.2106, + "step": 16177 + }, + { + "epoch": 44.08174386920981, + "grad_norm": 6.597235679626465, + "learning_rate": 1.2379543548265685e-05, + "loss": 0.2307, + "step": 16178 + }, + { + "epoch": 44.084468664850135, + "grad_norm": 6.0201096534729, + "learning_rate": 1.2378686392842718e-05, + "loss": 0.2329, + "step": 16179 + }, + { + "epoch": 44.08719346049046, + "grad_norm": 5.377299785614014, + "learning_rate": 1.2377829218894618e-05, + "loss": 0.1459, + "step": 16180 + }, + { + "epoch": 44.08991825613079, + "grad_norm": 5.008917331695557, + "learning_rate": 1.237697202642806e-05, + "loss": 0.2108, + "step": 16181 + }, + { + "epoch": 44.09264305177112, + "grad_norm": 6.565011978149414, + "learning_rate": 1.2376114815449723e-05, + "loss": 0.2874, + "step": 16182 + }, + { + "epoch": 44.095367847411445, + "grad_norm": 6.714814186096191, + "learning_rate": 1.2375257585966275e-05, + "loss": 0.2558, + "step": 16183 + }, + { + "epoch": 44.09809264305177, + "grad_norm": 5.044266223907471, + "learning_rate": 1.2374400337984404e-05, + "loss": 0.3174, + "step": 16184 + }, + { + "epoch": 44.1008174386921, + "grad_norm": 7.665246963500977, + "learning_rate": 1.2373543071510774e-05, + "loss": 0.1517, + "step": 16185 + }, + { + "epoch": 44.10354223433242, + "grad_norm": 7.603165149688721, + "learning_rate": 1.2372685786552072e-05, + "loss": 0.1894, + "step": 16186 + }, + { + "epoch": 44.10626702997275, + "grad_norm": 9.16969108581543, + "learning_rate": 1.2371828483114964e-05, + "loss": 0.1768, + "step": 16187 + }, + { + "epoch": 44.10899182561308, + "grad_norm": 6.315141677856445, + "learning_rate": 1.2370971161206136e-05, + "loss": 0.4095, + "step": 16188 + }, + { + "epoch": 44.11171662125341, + "grad_norm": 6.79281759262085, + "learning_rate": 1.237011382083226e-05, + "loss": 0.1776, + "step": 16189 + }, + { + "epoch": 44.11444141689373, + "grad_norm": 5.980787754058838, + "learning_rate": 1.2369256462000015e-05, + "loss": 0.1793, + "step": 16190 + }, + { + "epoch": 44.11716621253406, + "grad_norm": 4.813692569732666, + "learning_rate": 1.2368399084716072e-05, + "loss": 0.2648, + "step": 16191 + }, + { + "epoch": 44.119891008174385, + "grad_norm": 6.074870586395264, + "learning_rate": 1.236754168898712e-05, + "loss": 0.1811, + "step": 16192 + }, + { + "epoch": 44.12261580381471, + "grad_norm": 6.126917839050293, + "learning_rate": 1.2366684274819825e-05, + "loss": 0.1966, + "step": 16193 + }, + { + "epoch": 44.12534059945504, + "grad_norm": 5.153909206390381, + "learning_rate": 1.2365826842220872e-05, + "loss": 0.1499, + "step": 16194 + }, + { + "epoch": 44.12806539509537, + "grad_norm": 5.3130269050598145, + "learning_rate": 1.2364969391196933e-05, + "loss": 0.1913, + "step": 16195 + }, + { + "epoch": 44.130790190735695, + "grad_norm": 6.73169469833374, + "learning_rate": 1.2364111921754686e-05, + "loss": 0.1729, + "step": 16196 + }, + { + "epoch": 44.13351498637602, + "grad_norm": 4.773559093475342, + "learning_rate": 1.2363254433900818e-05, + "loss": 0.1593, + "step": 16197 + }, + { + "epoch": 44.13623978201635, + "grad_norm": 6.7105937004089355, + "learning_rate": 1.2362396927641996e-05, + "loss": 0.1693, + "step": 16198 + }, + { + "epoch": 44.13896457765667, + "grad_norm": 5.667901039123535, + "learning_rate": 1.2361539402984905e-05, + "loss": 0.2905, + "step": 16199 + }, + { + "epoch": 44.141689373297005, + "grad_norm": 5.803109645843506, + "learning_rate": 1.2360681859936222e-05, + "loss": 0.1897, + "step": 16200 + }, + { + "epoch": 44.14441416893733, + "grad_norm": 5.439942836761475, + "learning_rate": 1.2359824298502622e-05, + "loss": 0.1578, + "step": 16201 + }, + { + "epoch": 44.14713896457766, + "grad_norm": 6.289660930633545, + "learning_rate": 1.2358966718690786e-05, + "loss": 0.2778, + "step": 16202 + }, + { + "epoch": 44.14986376021798, + "grad_norm": 4.494592666625977, + "learning_rate": 1.2358109120507393e-05, + "loss": 0.1301, + "step": 16203 + }, + { + "epoch": 44.15258855585831, + "grad_norm": 9.831260681152344, + "learning_rate": 1.2357251503959125e-05, + "loss": 0.1682, + "step": 16204 + }, + { + "epoch": 44.155313351498634, + "grad_norm": 4.6189751625061035, + "learning_rate": 1.2356393869052656e-05, + "loss": 0.2497, + "step": 16205 + }, + { + "epoch": 44.15803814713897, + "grad_norm": 6.3724212646484375, + "learning_rate": 1.2355536215794668e-05, + "loss": 0.247, + "step": 16206 + }, + { + "epoch": 44.16076294277929, + "grad_norm": 6.15195369720459, + "learning_rate": 1.235467854419184e-05, + "loss": 0.2225, + "step": 16207 + }, + { + "epoch": 44.16348773841962, + "grad_norm": 6.59060525894165, + "learning_rate": 1.235382085425085e-05, + "loss": 0.1894, + "step": 16208 + }, + { + "epoch": 44.166212534059945, + "grad_norm": 7.037757396697998, + "learning_rate": 1.2352963145978382e-05, + "loss": 0.2516, + "step": 16209 + }, + { + "epoch": 44.16893732970027, + "grad_norm": 5.91162109375, + "learning_rate": 1.235210541938111e-05, + "loss": 0.1681, + "step": 16210 + }, + { + "epoch": 44.171662125340596, + "grad_norm": 4.856721878051758, + "learning_rate": 1.2351247674465719e-05, + "loss": 0.2594, + "step": 16211 + }, + { + "epoch": 44.17438692098093, + "grad_norm": 6.868969440460205, + "learning_rate": 1.2350389911238884e-05, + "loss": 0.2111, + "step": 16212 + }, + { + "epoch": 44.177111716621255, + "grad_norm": 5.090456962585449, + "learning_rate": 1.2349532129707289e-05, + "loss": 0.223, + "step": 16213 + }, + { + "epoch": 44.17983651226158, + "grad_norm": 5.5267653465271, + "learning_rate": 1.2348674329877613e-05, + "loss": 0.1978, + "step": 16214 + }, + { + "epoch": 44.182561307901906, + "grad_norm": 5.36014986038208, + "learning_rate": 1.2347816511756539e-05, + "loss": 0.1841, + "step": 16215 + }, + { + "epoch": 44.18528610354223, + "grad_norm": 8.039497375488281, + "learning_rate": 1.2346958675350742e-05, + "loss": 0.2234, + "step": 16216 + }, + { + "epoch": 44.18801089918256, + "grad_norm": 5.579095363616943, + "learning_rate": 1.234610082066691e-05, + "loss": 0.2629, + "step": 16217 + }, + { + "epoch": 44.19073569482289, + "grad_norm": 7.914852142333984, + "learning_rate": 1.234524294771172e-05, + "loss": 0.1971, + "step": 16218 + }, + { + "epoch": 44.19346049046322, + "grad_norm": 7.122565746307373, + "learning_rate": 1.2344385056491852e-05, + "loss": 0.2775, + "step": 16219 + }, + { + "epoch": 44.19618528610354, + "grad_norm": 6.786997318267822, + "learning_rate": 1.2343527147013988e-05, + "loss": 0.2078, + "step": 16220 + }, + { + "epoch": 44.19891008174387, + "grad_norm": 5.375175952911377, + "learning_rate": 1.234266921928481e-05, + "loss": 0.1441, + "step": 16221 + }, + { + "epoch": 44.201634877384194, + "grad_norm": 5.61326265335083, + "learning_rate": 1.2341811273310999e-05, + "loss": 0.2092, + "step": 16222 + }, + { + "epoch": 44.20435967302452, + "grad_norm": 6.873278617858887, + "learning_rate": 1.234095330909924e-05, + "loss": 0.4392, + "step": 16223 + }, + { + "epoch": 44.20708446866485, + "grad_norm": 4.88468599319458, + "learning_rate": 1.234009532665621e-05, + "loss": 0.1497, + "step": 16224 + }, + { + "epoch": 44.20980926430518, + "grad_norm": 5.8181352615356445, + "learning_rate": 1.2339237325988595e-05, + "loss": 0.218, + "step": 16225 + }, + { + "epoch": 44.212534059945504, + "grad_norm": 6.216662406921387, + "learning_rate": 1.2338379307103072e-05, + "loss": 0.1904, + "step": 16226 + }, + { + "epoch": 44.21525885558583, + "grad_norm": 4.694410800933838, + "learning_rate": 1.233752127000633e-05, + "loss": 0.1707, + "step": 16227 + }, + { + "epoch": 44.217983651226156, + "grad_norm": 4.57954740524292, + "learning_rate": 1.2336663214705045e-05, + "loss": 0.1731, + "step": 16228 + }, + { + "epoch": 44.22070844686648, + "grad_norm": 9.905463218688965, + "learning_rate": 1.2335805141205901e-05, + "loss": 0.1608, + "step": 16229 + }, + { + "epoch": 44.223433242506815, + "grad_norm": 6.8656005859375, + "learning_rate": 1.2334947049515582e-05, + "loss": 0.4211, + "step": 16230 + }, + { + "epoch": 44.22615803814714, + "grad_norm": 5.616997718811035, + "learning_rate": 1.2334088939640772e-05, + "loss": 0.1646, + "step": 16231 + }, + { + "epoch": 44.228882833787466, + "grad_norm": 8.053744316101074, + "learning_rate": 1.233323081158815e-05, + "loss": 0.2007, + "step": 16232 + }, + { + "epoch": 44.23160762942779, + "grad_norm": 6.566122531890869, + "learning_rate": 1.2332372665364406e-05, + "loss": 0.263, + "step": 16233 + }, + { + "epoch": 44.23433242506812, + "grad_norm": 5.1463165283203125, + "learning_rate": 1.2331514500976216e-05, + "loss": 0.2473, + "step": 16234 + }, + { + "epoch": 44.237057220708444, + "grad_norm": 5.497501850128174, + "learning_rate": 1.2330656318430268e-05, + "loss": 0.1558, + "step": 16235 + }, + { + "epoch": 44.23978201634878, + "grad_norm": 4.741311073303223, + "learning_rate": 1.232979811773324e-05, + "loss": 0.1728, + "step": 16236 + }, + { + "epoch": 44.2425068119891, + "grad_norm": 6.691548824310303, + "learning_rate": 1.2328939898891823e-05, + "loss": 0.2718, + "step": 16237 + }, + { + "epoch": 44.24523160762943, + "grad_norm": 5.722686767578125, + "learning_rate": 1.2328081661912692e-05, + "loss": 0.3028, + "step": 16238 + }, + { + "epoch": 44.247956403269754, + "grad_norm": 6.705719947814941, + "learning_rate": 1.2327223406802542e-05, + "loss": 0.3498, + "step": 16239 + }, + { + "epoch": 44.25068119891008, + "grad_norm": 9.26452922821045, + "learning_rate": 1.2326365133568046e-05, + "loss": 0.1984, + "step": 16240 + }, + { + "epoch": 44.253405994550405, + "grad_norm": 8.045634269714355, + "learning_rate": 1.2325506842215897e-05, + "loss": 0.3474, + "step": 16241 + }, + { + "epoch": 44.25613079019074, + "grad_norm": 4.803380966186523, + "learning_rate": 1.2324648532752775e-05, + "loss": 0.1735, + "step": 16242 + }, + { + "epoch": 44.258855585831064, + "grad_norm": 4.696771621704102, + "learning_rate": 1.2323790205185364e-05, + "loss": 0.2244, + "step": 16243 + }, + { + "epoch": 44.26158038147139, + "grad_norm": 5.288698673248291, + "learning_rate": 1.2322931859520349e-05, + "loss": 0.1474, + "step": 16244 + }, + { + "epoch": 44.264305177111716, + "grad_norm": 6.997115612030029, + "learning_rate": 1.2322073495764418e-05, + "loss": 0.2016, + "step": 16245 + }, + { + "epoch": 44.26702997275204, + "grad_norm": 8.896620750427246, + "learning_rate": 1.232121511392425e-05, + "loss": 0.1961, + "step": 16246 + }, + { + "epoch": 44.26975476839237, + "grad_norm": 5.633690357208252, + "learning_rate": 1.2320356714006534e-05, + "loss": 0.2289, + "step": 16247 + }, + { + "epoch": 44.2724795640327, + "grad_norm": 5.711029052734375, + "learning_rate": 1.2319498296017955e-05, + "loss": 0.1247, + "step": 16248 + }, + { + "epoch": 44.275204359673026, + "grad_norm": 4.915972709655762, + "learning_rate": 1.2318639859965198e-05, + "loss": 0.1993, + "step": 16249 + }, + { + "epoch": 44.27792915531335, + "grad_norm": 5.64224910736084, + "learning_rate": 1.231778140585495e-05, + "loss": 0.1367, + "step": 16250 + }, + { + "epoch": 44.28065395095368, + "grad_norm": 4.77384614944458, + "learning_rate": 1.2316922933693893e-05, + "loss": 0.2323, + "step": 16251 + }, + { + "epoch": 44.283378746594, + "grad_norm": 4.476263046264648, + "learning_rate": 1.2316064443488715e-05, + "loss": 0.1991, + "step": 16252 + }, + { + "epoch": 44.28610354223433, + "grad_norm": 5.16072416305542, + "learning_rate": 1.2315205935246103e-05, + "loss": 0.4493, + "step": 16253 + }, + { + "epoch": 44.28882833787466, + "grad_norm": 6.235977649688721, + "learning_rate": 1.2314347408972742e-05, + "loss": 0.1392, + "step": 16254 + }, + { + "epoch": 44.29155313351499, + "grad_norm": 11.483926773071289, + "learning_rate": 1.2313488864675318e-05, + "loss": 0.245, + "step": 16255 + }, + { + "epoch": 44.294277929155314, + "grad_norm": 4.5253729820251465, + "learning_rate": 1.2312630302360513e-05, + "loss": 0.1809, + "step": 16256 + }, + { + "epoch": 44.29700272479564, + "grad_norm": 5.335109233856201, + "learning_rate": 1.2311771722035022e-05, + "loss": 0.1643, + "step": 16257 + }, + { + "epoch": 44.299727520435965, + "grad_norm": 7.941211700439453, + "learning_rate": 1.2310913123705523e-05, + "loss": 0.2764, + "step": 16258 + }, + { + "epoch": 44.30245231607629, + "grad_norm": 5.2220845222473145, + "learning_rate": 1.2310054507378712e-05, + "loss": 0.2522, + "step": 16259 + }, + { + "epoch": 44.305177111716624, + "grad_norm": 6.244221210479736, + "learning_rate": 1.2309195873061269e-05, + "loss": 0.2413, + "step": 16260 + }, + { + "epoch": 44.30790190735695, + "grad_norm": 5.436784267425537, + "learning_rate": 1.2308337220759883e-05, + "loss": 0.251, + "step": 16261 + }, + { + "epoch": 44.310626702997276, + "grad_norm": 6.853261470794678, + "learning_rate": 1.230747855048124e-05, + "loss": 0.2238, + "step": 16262 + }, + { + "epoch": 44.3133514986376, + "grad_norm": 6.074221134185791, + "learning_rate": 1.230661986223203e-05, + "loss": 0.3987, + "step": 16263 + }, + { + "epoch": 44.31607629427793, + "grad_norm": 5.958846569061279, + "learning_rate": 1.2305761156018936e-05, + "loss": 0.2845, + "step": 16264 + }, + { + "epoch": 44.31880108991825, + "grad_norm": 6.054225444793701, + "learning_rate": 1.230490243184865e-05, + "loss": 0.2574, + "step": 16265 + }, + { + "epoch": 44.321525885558586, + "grad_norm": 5.6045098304748535, + "learning_rate": 1.2304043689727859e-05, + "loss": 0.2519, + "step": 16266 + }, + { + "epoch": 44.32425068119891, + "grad_norm": 6.948996543884277, + "learning_rate": 1.2303184929663248e-05, + "loss": 0.1045, + "step": 16267 + }, + { + "epoch": 44.32697547683924, + "grad_norm": 4.249958038330078, + "learning_rate": 1.2302326151661509e-05, + "loss": 0.2094, + "step": 16268 + }, + { + "epoch": 44.32970027247956, + "grad_norm": 5.515820503234863, + "learning_rate": 1.2301467355729327e-05, + "loss": 0.3183, + "step": 16269 + }, + { + "epoch": 44.33242506811989, + "grad_norm": 6.033924102783203, + "learning_rate": 1.2300608541873391e-05, + "loss": 0.2324, + "step": 16270 + }, + { + "epoch": 44.335149863760215, + "grad_norm": 16.895814895629883, + "learning_rate": 1.229974971010039e-05, + "loss": 0.2255, + "step": 16271 + }, + { + "epoch": 44.33787465940055, + "grad_norm": 5.29602575302124, + "learning_rate": 1.2298890860417013e-05, + "loss": 0.1508, + "step": 16272 + }, + { + "epoch": 44.34059945504087, + "grad_norm": 5.749146938323975, + "learning_rate": 1.2298031992829945e-05, + "loss": 0.2484, + "step": 16273 + }, + { + "epoch": 44.3433242506812, + "grad_norm": 5.419031143188477, + "learning_rate": 1.229717310734588e-05, + "loss": 0.236, + "step": 16274 + }, + { + "epoch": 44.346049046321525, + "grad_norm": 6.744513034820557, + "learning_rate": 1.2296314203971505e-05, + "loss": 0.1292, + "step": 16275 + }, + { + "epoch": 44.34877384196185, + "grad_norm": 5.140876293182373, + "learning_rate": 1.2295455282713509e-05, + "loss": 0.2218, + "step": 16276 + }, + { + "epoch": 44.35149863760218, + "grad_norm": 5.723390579223633, + "learning_rate": 1.229459634357858e-05, + "loss": 0.3446, + "step": 16277 + }, + { + "epoch": 44.35422343324251, + "grad_norm": 4.45698881149292, + "learning_rate": 1.229373738657341e-05, + "loss": 0.1729, + "step": 16278 + }, + { + "epoch": 44.356948228882835, + "grad_norm": 5.501786708831787, + "learning_rate": 1.2292878411704688e-05, + "loss": 0.1649, + "step": 16279 + }, + { + "epoch": 44.35967302452316, + "grad_norm": 5.382435321807861, + "learning_rate": 1.2292019418979098e-05, + "loss": 0.1078, + "step": 16280 + }, + { + "epoch": 44.36239782016349, + "grad_norm": 6.311226844787598, + "learning_rate": 1.2291160408403338e-05, + "loss": 0.2673, + "step": 16281 + }, + { + "epoch": 44.36512261580381, + "grad_norm": 5.9953742027282715, + "learning_rate": 1.2290301379984095e-05, + "loss": 0.1188, + "step": 16282 + }, + { + "epoch": 44.36784741144414, + "grad_norm": 6.1877312660217285, + "learning_rate": 1.2289442333728057e-05, + "loss": 0.2395, + "step": 16283 + }, + { + "epoch": 44.37057220708447, + "grad_norm": 6.551638126373291, + "learning_rate": 1.2288583269641917e-05, + "loss": 0.1718, + "step": 16284 + }, + { + "epoch": 44.3732970027248, + "grad_norm": 5.743000030517578, + "learning_rate": 1.2287724187732364e-05, + "loss": 0.1979, + "step": 16285 + }, + { + "epoch": 44.37602179836512, + "grad_norm": 4.951767921447754, + "learning_rate": 1.2286865088006088e-05, + "loss": 0.1429, + "step": 16286 + }, + { + "epoch": 44.37874659400545, + "grad_norm": 7.207986354827881, + "learning_rate": 1.2286005970469779e-05, + "loss": 0.1797, + "step": 16287 + }, + { + "epoch": 44.381471389645775, + "grad_norm": 5.050862789154053, + "learning_rate": 1.2285146835130133e-05, + "loss": 0.1633, + "step": 16288 + }, + { + "epoch": 44.3841961852861, + "grad_norm": 4.695954322814941, + "learning_rate": 1.2284287681993834e-05, + "loss": 0.2142, + "step": 16289 + }, + { + "epoch": 44.38692098092643, + "grad_norm": 5.752518653869629, + "learning_rate": 1.2283428511067574e-05, + "loss": 0.2671, + "step": 16290 + }, + { + "epoch": 44.38964577656676, + "grad_norm": 4.853794097900391, + "learning_rate": 1.228256932235805e-05, + "loss": 0.2382, + "step": 16291 + }, + { + "epoch": 44.392370572207085, + "grad_norm": 5.388570785522461, + "learning_rate": 1.228171011587195e-05, + "loss": 0.1693, + "step": 16292 + }, + { + "epoch": 44.39509536784741, + "grad_norm": 4.890974998474121, + "learning_rate": 1.228085089161596e-05, + "loss": 0.2088, + "step": 16293 + }, + { + "epoch": 44.39782016348774, + "grad_norm": 4.6638360023498535, + "learning_rate": 1.2279991649596784e-05, + "loss": 0.2171, + "step": 16294 + }, + { + "epoch": 44.40054495912806, + "grad_norm": 5.858438491821289, + "learning_rate": 1.22791323898211e-05, + "loss": 0.3256, + "step": 16295 + }, + { + "epoch": 44.403269754768395, + "grad_norm": 5.6721720695495605, + "learning_rate": 1.2278273112295612e-05, + "loss": 0.2023, + "step": 16296 + }, + { + "epoch": 44.40599455040872, + "grad_norm": 4.828054904937744, + "learning_rate": 1.2277413817027003e-05, + "loss": 0.2213, + "step": 16297 + }, + { + "epoch": 44.40871934604905, + "grad_norm": 4.199804782867432, + "learning_rate": 1.2276554504021969e-05, + "loss": 0.2457, + "step": 16298 + }, + { + "epoch": 44.41144414168937, + "grad_norm": 5.8764142990112305, + "learning_rate": 1.22756951732872e-05, + "loss": 0.3098, + "step": 16299 + }, + { + "epoch": 44.4141689373297, + "grad_norm": 4.359859943389893, + "learning_rate": 1.2274835824829392e-05, + "loss": 0.1701, + "step": 16300 + }, + { + "epoch": 44.416893732970024, + "grad_norm": 16.240520477294922, + "learning_rate": 1.2273976458655233e-05, + "loss": 0.1604, + "step": 16301 + }, + { + "epoch": 44.41961852861036, + "grad_norm": 6.469280242919922, + "learning_rate": 1.2273117074771423e-05, + "loss": 0.138, + "step": 16302 + }, + { + "epoch": 44.42234332425068, + "grad_norm": 3.977710723876953, + "learning_rate": 1.2272257673184646e-05, + "loss": 0.0885, + "step": 16303 + }, + { + "epoch": 44.42506811989101, + "grad_norm": 4.005497455596924, + "learning_rate": 1.2271398253901606e-05, + "loss": 0.1484, + "step": 16304 + }, + { + "epoch": 44.427792915531334, + "grad_norm": 4.929205417633057, + "learning_rate": 1.2270538816928982e-05, + "loss": 0.2453, + "step": 16305 + }, + { + "epoch": 44.43051771117166, + "grad_norm": 5.408425807952881, + "learning_rate": 1.226967936227348e-05, + "loss": 0.1835, + "step": 16306 + }, + { + "epoch": 44.433242506811986, + "grad_norm": 4.860259532928467, + "learning_rate": 1.2268819889941784e-05, + "loss": 0.2817, + "step": 16307 + }, + { + "epoch": 44.43596730245232, + "grad_norm": 5.1819329261779785, + "learning_rate": 1.2267960399940595e-05, + "loss": 0.1383, + "step": 16308 + }, + { + "epoch": 44.438692098092645, + "grad_norm": 6.924758434295654, + "learning_rate": 1.2267100892276602e-05, + "loss": 0.1461, + "step": 16309 + }, + { + "epoch": 44.44141689373297, + "grad_norm": 4.335215091705322, + "learning_rate": 1.2266241366956503e-05, + "loss": 0.1862, + "step": 16310 + }, + { + "epoch": 44.444141689373296, + "grad_norm": 4.81735897064209, + "learning_rate": 1.2265381823986984e-05, + "loss": 0.1676, + "step": 16311 + }, + { + "epoch": 44.44686648501362, + "grad_norm": 4.712780952453613, + "learning_rate": 1.2264522263374747e-05, + "loss": 0.1684, + "step": 16312 + }, + { + "epoch": 44.44959128065395, + "grad_norm": 4.163626194000244, + "learning_rate": 1.2263662685126486e-05, + "loss": 0.1801, + "step": 16313 + }, + { + "epoch": 44.45231607629428, + "grad_norm": 6.2198805809021, + "learning_rate": 1.2262803089248889e-05, + "loss": 0.1632, + "step": 16314 + }, + { + "epoch": 44.45504087193461, + "grad_norm": 6.122025012969971, + "learning_rate": 1.2261943475748657e-05, + "loss": 0.3163, + "step": 16315 + }, + { + "epoch": 44.45776566757493, + "grad_norm": 4.518787384033203, + "learning_rate": 1.226108384463248e-05, + "loss": 0.1251, + "step": 16316 + }, + { + "epoch": 44.46049046321526, + "grad_norm": 5.9850640296936035, + "learning_rate": 1.2260224195907053e-05, + "loss": 0.2348, + "step": 16317 + }, + { + "epoch": 44.463215258855584, + "grad_norm": 5.899969100952148, + "learning_rate": 1.2259364529579076e-05, + "loss": 0.2406, + "step": 16318 + }, + { + "epoch": 44.46594005449591, + "grad_norm": 5.047104358673096, + "learning_rate": 1.2258504845655242e-05, + "loss": 0.1589, + "step": 16319 + }, + { + "epoch": 44.46866485013624, + "grad_norm": 6.053981304168701, + "learning_rate": 1.2257645144142244e-05, + "loss": 0.2739, + "step": 16320 + }, + { + "epoch": 44.47138964577657, + "grad_norm": 6.156033515930176, + "learning_rate": 1.2256785425046776e-05, + "loss": 0.2014, + "step": 16321 + }, + { + "epoch": 44.474114441416894, + "grad_norm": 5.389181137084961, + "learning_rate": 1.2255925688375539e-05, + "loss": 0.2613, + "step": 16322 + }, + { + "epoch": 44.47683923705722, + "grad_norm": 4.212601661682129, + "learning_rate": 1.2255065934135222e-05, + "loss": 0.2288, + "step": 16323 + }, + { + "epoch": 44.479564032697546, + "grad_norm": 5.5055108070373535, + "learning_rate": 1.2254206162332523e-05, + "loss": 0.1921, + "step": 16324 + }, + { + "epoch": 44.48228882833787, + "grad_norm": 4.336231231689453, + "learning_rate": 1.2253346372974142e-05, + "loss": 0.1337, + "step": 16325 + }, + { + "epoch": 44.485013623978205, + "grad_norm": 4.315658092498779, + "learning_rate": 1.2252486566066772e-05, + "loss": 0.1666, + "step": 16326 + }, + { + "epoch": 44.48773841961853, + "grad_norm": 5.385659217834473, + "learning_rate": 1.2251626741617106e-05, + "loss": 0.1505, + "step": 16327 + }, + { + "epoch": 44.490463215258856, + "grad_norm": 5.198558807373047, + "learning_rate": 1.225076689963185e-05, + "loss": 0.2453, + "step": 16328 + }, + { + "epoch": 44.49318801089918, + "grad_norm": 7.6078200340271, + "learning_rate": 1.2249907040117688e-05, + "loss": 0.1817, + "step": 16329 + }, + { + "epoch": 44.49591280653951, + "grad_norm": 7.1719441413879395, + "learning_rate": 1.2249047163081325e-05, + "loss": 0.1521, + "step": 16330 + }, + { + "epoch": 44.49863760217983, + "grad_norm": 4.648802280426025, + "learning_rate": 1.2248187268529453e-05, + "loss": 0.1992, + "step": 16331 + }, + { + "epoch": 44.50136239782017, + "grad_norm": 5.414094924926758, + "learning_rate": 1.2247327356468772e-05, + "loss": 0.1876, + "step": 16332 + }, + { + "epoch": 44.50408719346049, + "grad_norm": 6.786231994628906, + "learning_rate": 1.2246467426905978e-05, + "loss": 0.3367, + "step": 16333 + }, + { + "epoch": 44.50681198910082, + "grad_norm": 7.858244895935059, + "learning_rate": 1.2245607479847767e-05, + "loss": 0.245, + "step": 16334 + }, + { + "epoch": 44.509536784741144, + "grad_norm": 7.821645736694336, + "learning_rate": 1.2244747515300839e-05, + "loss": 0.1359, + "step": 16335 + }, + { + "epoch": 44.51226158038147, + "grad_norm": 11.80642032623291, + "learning_rate": 1.224388753327189e-05, + "loss": 0.1764, + "step": 16336 + }, + { + "epoch": 44.514986376021795, + "grad_norm": 6.316769599914551, + "learning_rate": 1.2243027533767614e-05, + "loss": 0.175, + "step": 16337 + }, + { + "epoch": 44.51771117166213, + "grad_norm": 5.621060371398926, + "learning_rate": 1.2242167516794714e-05, + "loss": 0.1629, + "step": 16338 + }, + { + "epoch": 44.520435967302454, + "grad_norm": 4.951374530792236, + "learning_rate": 1.2241307482359885e-05, + "loss": 0.2068, + "step": 16339 + }, + { + "epoch": 44.52316076294278, + "grad_norm": 5.404215335845947, + "learning_rate": 1.2240447430469829e-05, + "loss": 0.1461, + "step": 16340 + }, + { + "epoch": 44.525885558583106, + "grad_norm": 5.342979431152344, + "learning_rate": 1.2239587361131235e-05, + "loss": 0.1788, + "step": 16341 + }, + { + "epoch": 44.52861035422343, + "grad_norm": 5.920839309692383, + "learning_rate": 1.2238727274350808e-05, + "loss": 0.2077, + "step": 16342 + }, + { + "epoch": 44.53133514986376, + "grad_norm": 4.700316905975342, + "learning_rate": 1.2237867170135244e-05, + "loss": 0.1705, + "step": 16343 + }, + { + "epoch": 44.53405994550409, + "grad_norm": 5.291968822479248, + "learning_rate": 1.2237007048491248e-05, + "loss": 0.2509, + "step": 16344 + }, + { + "epoch": 44.536784741144416, + "grad_norm": 4.686873912811279, + "learning_rate": 1.2236146909425508e-05, + "loss": 0.246, + "step": 16345 + }, + { + "epoch": 44.53950953678474, + "grad_norm": 6.583618640899658, + "learning_rate": 1.223528675294473e-05, + "loss": 0.253, + "step": 16346 + }, + { + "epoch": 44.54223433242507, + "grad_norm": 4.258402347564697, + "learning_rate": 1.223442657905561e-05, + "loss": 0.2042, + "step": 16347 + }, + { + "epoch": 44.54495912806539, + "grad_norm": 5.072122097015381, + "learning_rate": 1.2233566387764847e-05, + "loss": 0.1084, + "step": 16348 + }, + { + "epoch": 44.54768392370572, + "grad_norm": 4.582540512084961, + "learning_rate": 1.2232706179079142e-05, + "loss": 0.165, + "step": 16349 + }, + { + "epoch": 44.55040871934605, + "grad_norm": 5.258549213409424, + "learning_rate": 1.2231845953005192e-05, + "loss": 0.1454, + "step": 16350 + }, + { + "epoch": 44.55313351498638, + "grad_norm": 5.412867546081543, + "learning_rate": 1.2230985709549699e-05, + "loss": 0.2958, + "step": 16351 + }, + { + "epoch": 44.555858310626704, + "grad_norm": 5.269376754760742, + "learning_rate": 1.2230125448719358e-05, + "loss": 0.3327, + "step": 16352 + }, + { + "epoch": 44.55858310626703, + "grad_norm": 5.642248153686523, + "learning_rate": 1.2229265170520876e-05, + "loss": 0.3118, + "step": 16353 + }, + { + "epoch": 44.561307901907355, + "grad_norm": 6.034834384918213, + "learning_rate": 1.2228404874960949e-05, + "loss": 0.2119, + "step": 16354 + }, + { + "epoch": 44.56403269754768, + "grad_norm": 4.387385368347168, + "learning_rate": 1.2227544562046272e-05, + "loss": 0.1628, + "step": 16355 + }, + { + "epoch": 44.566757493188014, + "grad_norm": 7.412023067474365, + "learning_rate": 1.2226684231783551e-05, + "loss": 0.3198, + "step": 16356 + }, + { + "epoch": 44.56948228882834, + "grad_norm": 5.820879936218262, + "learning_rate": 1.2225823884179486e-05, + "loss": 0.2483, + "step": 16357 + }, + { + "epoch": 44.572207084468666, + "grad_norm": 5.885914325714111, + "learning_rate": 1.222496351924078e-05, + "loss": 0.2217, + "step": 16358 + }, + { + "epoch": 44.57493188010899, + "grad_norm": 7.226802349090576, + "learning_rate": 1.2224103136974123e-05, + "loss": 0.2107, + "step": 16359 + }, + { + "epoch": 44.57765667574932, + "grad_norm": 4.522464275360107, + "learning_rate": 1.2223242737386225e-05, + "loss": 0.1055, + "step": 16360 + }, + { + "epoch": 44.58038147138964, + "grad_norm": 4.730563640594482, + "learning_rate": 1.2222382320483785e-05, + "loss": 0.2857, + "step": 16361 + }, + { + "epoch": 44.583106267029976, + "grad_norm": 5.198635101318359, + "learning_rate": 1.2221521886273502e-05, + "loss": 0.1795, + "step": 16362 + }, + { + "epoch": 44.5858310626703, + "grad_norm": 5.904626846313477, + "learning_rate": 1.222066143476208e-05, + "loss": 0.2273, + "step": 16363 + }, + { + "epoch": 44.58855585831063, + "grad_norm": 4.365389823913574, + "learning_rate": 1.2219800965956217e-05, + "loss": 0.1739, + "step": 16364 + }, + { + "epoch": 44.59128065395095, + "grad_norm": 5.098349571228027, + "learning_rate": 1.2218940479862613e-05, + "loss": 0.2538, + "step": 16365 + }, + { + "epoch": 44.59400544959128, + "grad_norm": 5.18057918548584, + "learning_rate": 1.2218079976487976e-05, + "loss": 0.2011, + "step": 16366 + }, + { + "epoch": 44.596730245231605, + "grad_norm": 5.942376613616943, + "learning_rate": 1.2217219455839e-05, + "loss": 0.2401, + "step": 16367 + }, + { + "epoch": 44.59945504087194, + "grad_norm": 5.536251068115234, + "learning_rate": 1.221635891792239e-05, + "loss": 0.1822, + "step": 16368 + }, + { + "epoch": 44.60217983651226, + "grad_norm": 4.777346134185791, + "learning_rate": 1.2215498362744853e-05, + "loss": 0.2757, + "step": 16369 + }, + { + "epoch": 44.60490463215259, + "grad_norm": 6.0716633796691895, + "learning_rate": 1.2214637790313081e-05, + "loss": 0.5032, + "step": 16370 + }, + { + "epoch": 44.607629427792915, + "grad_norm": 4.697019577026367, + "learning_rate": 1.2213777200633786e-05, + "loss": 0.1395, + "step": 16371 + }, + { + "epoch": 44.61035422343324, + "grad_norm": 6.832633972167969, + "learning_rate": 1.221291659371366e-05, + "loss": 0.1398, + "step": 16372 + }, + { + "epoch": 44.61307901907357, + "grad_norm": 4.780966281890869, + "learning_rate": 1.2212055969559415e-05, + "loss": 0.1528, + "step": 16373 + }, + { + "epoch": 44.6158038147139, + "grad_norm": 5.384737491607666, + "learning_rate": 1.2211195328177747e-05, + "loss": 0.2267, + "step": 16374 + }, + { + "epoch": 44.618528610354225, + "grad_norm": 5.076670169830322, + "learning_rate": 1.2210334669575362e-05, + "loss": 0.1704, + "step": 16375 + }, + { + "epoch": 44.62125340599455, + "grad_norm": 4.770692825317383, + "learning_rate": 1.2209473993758957e-05, + "loss": 0.1446, + "step": 16376 + }, + { + "epoch": 44.62397820163488, + "grad_norm": 6.416381359100342, + "learning_rate": 1.2208613300735247e-05, + "loss": 0.2606, + "step": 16377 + }, + { + "epoch": 44.6267029972752, + "grad_norm": 4.535919189453125, + "learning_rate": 1.2207752590510924e-05, + "loss": 0.3067, + "step": 16378 + }, + { + "epoch": 44.62942779291553, + "grad_norm": 5.324057102203369, + "learning_rate": 1.2206891863092697e-05, + "loss": 0.2079, + "step": 16379 + }, + { + "epoch": 44.63215258855586, + "grad_norm": 5.409849643707275, + "learning_rate": 1.2206031118487264e-05, + "loss": 0.2076, + "step": 16380 + }, + { + "epoch": 44.63487738419619, + "grad_norm": 6.793900489807129, + "learning_rate": 1.2205170356701337e-05, + "loss": 0.162, + "step": 16381 + }, + { + "epoch": 44.63760217983651, + "grad_norm": 4.991828441619873, + "learning_rate": 1.220430957774161e-05, + "loss": 0.212, + "step": 16382 + }, + { + "epoch": 44.64032697547684, + "grad_norm": 6.235599040985107, + "learning_rate": 1.220344878161479e-05, + "loss": 0.2661, + "step": 16383 + }, + { + "epoch": 44.643051771117165, + "grad_norm": 4.532994747161865, + "learning_rate": 1.2202587968327584e-05, + "loss": 0.2122, + "step": 16384 + }, + { + "epoch": 44.64577656675749, + "grad_norm": 5.00579833984375, + "learning_rate": 1.2201727137886692e-05, + "loss": 0.2256, + "step": 16385 + }, + { + "epoch": 44.64850136239782, + "grad_norm": 4.9762372970581055, + "learning_rate": 1.220086629029882e-05, + "loss": 0.348, + "step": 16386 + }, + { + "epoch": 44.65122615803815, + "grad_norm": 5.744802474975586, + "learning_rate": 1.2200005425570676e-05, + "loss": 0.268, + "step": 16387 + }, + { + "epoch": 44.653950953678475, + "grad_norm": 4.24283504486084, + "learning_rate": 1.2199144543708957e-05, + "loss": 0.1737, + "step": 16388 + }, + { + "epoch": 44.6566757493188, + "grad_norm": 4.924327850341797, + "learning_rate": 1.2198283644720373e-05, + "loss": 0.2677, + "step": 16389 + }, + { + "epoch": 44.65940054495913, + "grad_norm": 4.337157249450684, + "learning_rate": 1.2197422728611624e-05, + "loss": 0.3367, + "step": 16390 + }, + { + "epoch": 44.66212534059945, + "grad_norm": 5.2622456550598145, + "learning_rate": 1.219656179538942e-05, + "loss": 0.2184, + "step": 16391 + }, + { + "epoch": 44.664850136239785, + "grad_norm": 3.9210143089294434, + "learning_rate": 1.2195700845060462e-05, + "loss": 0.3047, + "step": 16392 + }, + { + "epoch": 44.66757493188011, + "grad_norm": 4.90424108505249, + "learning_rate": 1.2194839877631457e-05, + "loss": 0.1054, + "step": 16393 + }, + { + "epoch": 44.67029972752044, + "grad_norm": 4.5516862869262695, + "learning_rate": 1.2193978893109109e-05, + "loss": 0.2586, + "step": 16394 + }, + { + "epoch": 44.67302452316076, + "grad_norm": 5.143599987030029, + "learning_rate": 1.2193117891500126e-05, + "loss": 0.258, + "step": 16395 + }, + { + "epoch": 44.67574931880109, + "grad_norm": 5.577111721038818, + "learning_rate": 1.2192256872811207e-05, + "loss": 0.1353, + "step": 16396 + }, + { + "epoch": 44.678474114441414, + "grad_norm": 5.602947235107422, + "learning_rate": 1.219139583704907e-05, + "loss": 0.3288, + "step": 16397 + }, + { + "epoch": 44.68119891008175, + "grad_norm": 5.5605082511901855, + "learning_rate": 1.2190534784220405e-05, + "loss": 0.2506, + "step": 16398 + }, + { + "epoch": 44.68392370572207, + "grad_norm": 6.177340507507324, + "learning_rate": 1.2189673714331932e-05, + "loss": 0.167, + "step": 16399 + }, + { + "epoch": 44.6866485013624, + "grad_norm": 4.574554443359375, + "learning_rate": 1.2188812627390345e-05, + "loss": 0.1967, + "step": 16400 + }, + { + "epoch": 44.689373297002724, + "grad_norm": 4.757580757141113, + "learning_rate": 1.218795152340236e-05, + "loss": 0.183, + "step": 16401 + }, + { + "epoch": 44.69209809264305, + "grad_norm": 5.213620185852051, + "learning_rate": 1.2187090402374673e-05, + "loss": 0.3285, + "step": 16402 + }, + { + "epoch": 44.694822888283376, + "grad_norm": 5.771677494049072, + "learning_rate": 1.2186229264314e-05, + "loss": 0.171, + "step": 16403 + }, + { + "epoch": 44.69754768392371, + "grad_norm": 5.553153991699219, + "learning_rate": 1.2185368109227044e-05, + "loss": 0.3119, + "step": 16404 + }, + { + "epoch": 44.700272479564035, + "grad_norm": 4.6227827072143555, + "learning_rate": 1.2184506937120513e-05, + "loss": 0.1755, + "step": 16405 + }, + { + "epoch": 44.70299727520436, + "grad_norm": 4.735884189605713, + "learning_rate": 1.2183645748001109e-05, + "loss": 0.1804, + "step": 16406 + }, + { + "epoch": 44.705722070844686, + "grad_norm": 5.025547981262207, + "learning_rate": 1.2182784541875546e-05, + "loss": 0.177, + "step": 16407 + }, + { + "epoch": 44.70844686648501, + "grad_norm": 8.84172248840332, + "learning_rate": 1.2181923318750523e-05, + "loss": 0.2655, + "step": 16408 + }, + { + "epoch": 44.71117166212534, + "grad_norm": 5.576916694641113, + "learning_rate": 1.2181062078632757e-05, + "loss": 0.2252, + "step": 16409 + }, + { + "epoch": 44.71389645776567, + "grad_norm": 7.395151615142822, + "learning_rate": 1.2180200821528942e-05, + "loss": 0.2293, + "step": 16410 + }, + { + "epoch": 44.716621253406, + "grad_norm": 6.201037883758545, + "learning_rate": 1.2179339547445799e-05, + "loss": 0.214, + "step": 16411 + }, + { + "epoch": 44.71934604904632, + "grad_norm": 4.671193599700928, + "learning_rate": 1.2178478256390028e-05, + "loss": 0.1127, + "step": 16412 + }, + { + "epoch": 44.72207084468665, + "grad_norm": 6.584817409515381, + "learning_rate": 1.2177616948368341e-05, + "loss": 0.2061, + "step": 16413 + }, + { + "epoch": 44.724795640326974, + "grad_norm": 5.561539649963379, + "learning_rate": 1.217675562338744e-05, + "loss": 0.2798, + "step": 16414 + }, + { + "epoch": 44.7275204359673, + "grad_norm": 6.056123733520508, + "learning_rate": 1.2175894281454037e-05, + "loss": 0.2159, + "step": 16415 + }, + { + "epoch": 44.73024523160763, + "grad_norm": 6.623376369476318, + "learning_rate": 1.2175032922574839e-05, + "loss": 0.262, + "step": 16416 + }, + { + "epoch": 44.73297002724796, + "grad_norm": 7.3019537925720215, + "learning_rate": 1.2174171546756557e-05, + "loss": 0.3738, + "step": 16417 + }, + { + "epoch": 44.735694822888284, + "grad_norm": 6.133616924285889, + "learning_rate": 1.2173310154005896e-05, + "loss": 0.1665, + "step": 16418 + }, + { + "epoch": 44.73841961852861, + "grad_norm": 5.614738941192627, + "learning_rate": 1.217244874432956e-05, + "loss": 0.1658, + "step": 16419 + }, + { + "epoch": 44.741144414168936, + "grad_norm": 4.63480806350708, + "learning_rate": 1.2171587317734268e-05, + "loss": 0.1498, + "step": 16420 + }, + { + "epoch": 44.74386920980926, + "grad_norm": 5.289315223693848, + "learning_rate": 1.2170725874226725e-05, + "loss": 0.2081, + "step": 16421 + }, + { + "epoch": 44.746594005449595, + "grad_norm": 4.7408599853515625, + "learning_rate": 1.2169864413813637e-05, + "loss": 0.1478, + "step": 16422 + }, + { + "epoch": 44.74931880108992, + "grad_norm": 6.242374420166016, + "learning_rate": 1.2169002936501717e-05, + "loss": 0.2716, + "step": 16423 + }, + { + "epoch": 44.752043596730246, + "grad_norm": 5.0137434005737305, + "learning_rate": 1.216814144229767e-05, + "loss": 0.2229, + "step": 16424 + }, + { + "epoch": 44.75476839237057, + "grad_norm": 5.0223798751831055, + "learning_rate": 1.2167279931208209e-05, + "loss": 0.1383, + "step": 16425 + }, + { + "epoch": 44.7574931880109, + "grad_norm": 6.727980613708496, + "learning_rate": 1.2166418403240038e-05, + "loss": 0.1514, + "step": 16426 + }, + { + "epoch": 44.76021798365122, + "grad_norm": 7.22456169128418, + "learning_rate": 1.2165556858399874e-05, + "loss": 0.1984, + "step": 16427 + }, + { + "epoch": 44.762942779291556, + "grad_norm": 4.701144695281982, + "learning_rate": 1.216469529669442e-05, + "loss": 0.2101, + "step": 16428 + }, + { + "epoch": 44.76566757493188, + "grad_norm": 5.2383222579956055, + "learning_rate": 1.216383371813039e-05, + "loss": 0.1126, + "step": 16429 + }, + { + "epoch": 44.76839237057221, + "grad_norm": 6.049795627593994, + "learning_rate": 1.2162972122714491e-05, + "loss": 0.2141, + "step": 16430 + }, + { + "epoch": 44.771117166212534, + "grad_norm": 6.866738796234131, + "learning_rate": 1.2162110510453437e-05, + "loss": 0.2691, + "step": 16431 + }, + { + "epoch": 44.77384196185286, + "grad_norm": 6.67152214050293, + "learning_rate": 1.2161248881353936e-05, + "loss": 0.1846, + "step": 16432 + }, + { + "epoch": 44.776566757493185, + "grad_norm": 4.297389984130859, + "learning_rate": 1.2160387235422697e-05, + "loss": 0.3139, + "step": 16433 + }, + { + "epoch": 44.77929155313352, + "grad_norm": 4.853041172027588, + "learning_rate": 1.215952557266643e-05, + "loss": 0.3744, + "step": 16434 + }, + { + "epoch": 44.782016348773844, + "grad_norm": 4.801114559173584, + "learning_rate": 1.2158663893091851e-05, + "loss": 0.192, + "step": 16435 + }, + { + "epoch": 44.78474114441417, + "grad_norm": 3.750229835510254, + "learning_rate": 1.2157802196705666e-05, + "loss": 0.1018, + "step": 16436 + }, + { + "epoch": 44.787465940054496, + "grad_norm": 4.52603006362915, + "learning_rate": 1.2156940483514585e-05, + "loss": 0.1754, + "step": 16437 + }, + { + "epoch": 44.79019073569482, + "grad_norm": 4.756311416625977, + "learning_rate": 1.2156078753525325e-05, + "loss": 0.1699, + "step": 16438 + }, + { + "epoch": 44.79291553133515, + "grad_norm": 5.980393886566162, + "learning_rate": 1.2155217006744588e-05, + "loss": 0.1904, + "step": 16439 + }, + { + "epoch": 44.79564032697548, + "grad_norm": 5.323193073272705, + "learning_rate": 1.2154355243179092e-05, + "loss": 0.2048, + "step": 16440 + }, + { + "epoch": 44.798365122615806, + "grad_norm": 4.5851545333862305, + "learning_rate": 1.215349346283555e-05, + "loss": 0.1346, + "step": 16441 + }, + { + "epoch": 44.80108991825613, + "grad_norm": 4.715217113494873, + "learning_rate": 1.2152631665720667e-05, + "loss": 0.2542, + "step": 16442 + }, + { + "epoch": 44.80381471389646, + "grad_norm": 5.653316974639893, + "learning_rate": 1.215176985184116e-05, + "loss": 0.134, + "step": 16443 + }, + { + "epoch": 44.80653950953678, + "grad_norm": 4.876206874847412, + "learning_rate": 1.2150908021203736e-05, + "loss": 0.3399, + "step": 16444 + }, + { + "epoch": 44.80926430517711, + "grad_norm": 5.213658332824707, + "learning_rate": 1.215004617381511e-05, + "loss": 0.2188, + "step": 16445 + }, + { + "epoch": 44.81198910081744, + "grad_norm": 5.333511829376221, + "learning_rate": 1.2149184309681995e-05, + "loss": 0.2125, + "step": 16446 + }, + { + "epoch": 44.81471389645777, + "grad_norm": 4.946162700653076, + "learning_rate": 1.21483224288111e-05, + "loss": 0.1501, + "step": 16447 + }, + { + "epoch": 44.817438692098094, + "grad_norm": 4.635293960571289, + "learning_rate": 1.2147460531209141e-05, + "loss": 0.137, + "step": 16448 + }, + { + "epoch": 44.82016348773842, + "grad_norm": 4.830501079559326, + "learning_rate": 1.2146598616882828e-05, + "loss": 0.2062, + "step": 16449 + }, + { + "epoch": 44.822888283378745, + "grad_norm": 5.653111457824707, + "learning_rate": 1.2145736685838876e-05, + "loss": 0.1813, + "step": 16450 + }, + { + "epoch": 44.82561307901907, + "grad_norm": 5.251279354095459, + "learning_rate": 1.2144874738083992e-05, + "loss": 0.261, + "step": 16451 + }, + { + "epoch": 44.828337874659404, + "grad_norm": 5.2505388259887695, + "learning_rate": 1.2144012773624893e-05, + "loss": 0.1934, + "step": 16452 + }, + { + "epoch": 44.83106267029973, + "grad_norm": 8.280632019042969, + "learning_rate": 1.2143150792468292e-05, + "loss": 0.1978, + "step": 16453 + }, + { + "epoch": 44.833787465940055, + "grad_norm": 5.335907936096191, + "learning_rate": 1.2142288794620903e-05, + "loss": 0.1751, + "step": 16454 + }, + { + "epoch": 44.83651226158038, + "grad_norm": 5.506390571594238, + "learning_rate": 1.2141426780089436e-05, + "loss": 0.295, + "step": 16455 + }, + { + "epoch": 44.83923705722071, + "grad_norm": 5.114776611328125, + "learning_rate": 1.2140564748880608e-05, + "loss": 0.2163, + "step": 16456 + }, + { + "epoch": 44.84196185286103, + "grad_norm": 5.010404586791992, + "learning_rate": 1.213970270100113e-05, + "loss": 0.305, + "step": 16457 + }, + { + "epoch": 44.844686648501366, + "grad_norm": 6.250791549682617, + "learning_rate": 1.2138840636457716e-05, + "loss": 0.2335, + "step": 16458 + }, + { + "epoch": 44.84741144414169, + "grad_norm": 5.389265060424805, + "learning_rate": 1.213797855525708e-05, + "loss": 0.2307, + "step": 16459 + }, + { + "epoch": 44.85013623978202, + "grad_norm": 5.745802402496338, + "learning_rate": 1.2137116457405938e-05, + "loss": 0.1863, + "step": 16460 + }, + { + "epoch": 44.85286103542234, + "grad_norm": 4.540849208831787, + "learning_rate": 1.2136254342910997e-05, + "loss": 0.2068, + "step": 16461 + }, + { + "epoch": 44.85558583106267, + "grad_norm": 6.162951946258545, + "learning_rate": 1.2135392211778978e-05, + "loss": 0.2772, + "step": 16462 + }, + { + "epoch": 44.858310626702995, + "grad_norm": 5.170132160186768, + "learning_rate": 1.2134530064016594e-05, + "loss": 0.181, + "step": 16463 + }, + { + "epoch": 44.86103542234333, + "grad_norm": 4.901643753051758, + "learning_rate": 1.213366789963056e-05, + "loss": 0.1205, + "step": 16464 + }, + { + "epoch": 44.86376021798365, + "grad_norm": 4.8902363777160645, + "learning_rate": 1.2132805718627588e-05, + "loss": 0.1484, + "step": 16465 + }, + { + "epoch": 44.86648501362398, + "grad_norm": 4.043622016906738, + "learning_rate": 1.2131943521014393e-05, + "loss": 0.099, + "step": 16466 + }, + { + "epoch": 44.869209809264305, + "grad_norm": 5.787082672119141, + "learning_rate": 1.213108130679769e-05, + "loss": 0.1662, + "step": 16467 + }, + { + "epoch": 44.87193460490463, + "grad_norm": 8.555408477783203, + "learning_rate": 1.2130219075984195e-05, + "loss": 0.2985, + "step": 16468 + }, + { + "epoch": 44.87465940054496, + "grad_norm": 4.420747756958008, + "learning_rate": 1.2129356828580623e-05, + "loss": 0.1179, + "step": 16469 + }, + { + "epoch": 44.87738419618529, + "grad_norm": 6.063549518585205, + "learning_rate": 1.212849456459369e-05, + "loss": 0.4112, + "step": 16470 + }, + { + "epoch": 44.880108991825615, + "grad_norm": 5.833211898803711, + "learning_rate": 1.2127632284030101e-05, + "loss": 0.2814, + "step": 16471 + }, + { + "epoch": 44.88283378746594, + "grad_norm": 4.399301528930664, + "learning_rate": 1.212676998689659e-05, + "loss": 0.1431, + "step": 16472 + }, + { + "epoch": 44.88555858310627, + "grad_norm": 5.7322821617126465, + "learning_rate": 1.212590767319986e-05, + "loss": 0.2417, + "step": 16473 + }, + { + "epoch": 44.88828337874659, + "grad_norm": 7.326210021972656, + "learning_rate": 1.2125045342946628e-05, + "loss": 0.1547, + "step": 16474 + }, + { + "epoch": 44.89100817438692, + "grad_norm": 4.27852725982666, + "learning_rate": 1.2124182996143615e-05, + "loss": 0.1268, + "step": 16475 + }, + { + "epoch": 44.89373297002725, + "grad_norm": 5.068663597106934, + "learning_rate": 1.2123320632797531e-05, + "loss": 0.298, + "step": 16476 + }, + { + "epoch": 44.89645776566758, + "grad_norm": 5.224200248718262, + "learning_rate": 1.2122458252915093e-05, + "loss": 0.1547, + "step": 16477 + }, + { + "epoch": 44.8991825613079, + "grad_norm": 5.985930919647217, + "learning_rate": 1.2121595856503018e-05, + "loss": 0.2009, + "step": 16478 + }, + { + "epoch": 44.90190735694823, + "grad_norm": 4.921285152435303, + "learning_rate": 1.2120733443568023e-05, + "loss": 0.1677, + "step": 16479 + }, + { + "epoch": 44.904632152588555, + "grad_norm": 4.74705171585083, + "learning_rate": 1.2119871014116827e-05, + "loss": 0.1077, + "step": 16480 + }, + { + "epoch": 44.90735694822888, + "grad_norm": 4.848055839538574, + "learning_rate": 1.211900856815614e-05, + "loss": 0.1856, + "step": 16481 + }, + { + "epoch": 44.91008174386921, + "grad_norm": 4.837916374206543, + "learning_rate": 1.2118146105692687e-05, + "loss": 0.1507, + "step": 16482 + }, + { + "epoch": 44.91280653950954, + "grad_norm": 7.80957555770874, + "learning_rate": 1.2117283626733176e-05, + "loss": 0.2266, + "step": 16483 + }, + { + "epoch": 44.915531335149865, + "grad_norm": 6.339170932769775, + "learning_rate": 1.2116421131284332e-05, + "loss": 0.2142, + "step": 16484 + }, + { + "epoch": 44.91825613079019, + "grad_norm": 5.276419639587402, + "learning_rate": 1.2115558619352866e-05, + "loss": 0.1582, + "step": 16485 + }, + { + "epoch": 44.920980926430516, + "grad_norm": 4.407070159912109, + "learning_rate": 1.2114696090945499e-05, + "loss": 0.2064, + "step": 16486 + }, + { + "epoch": 44.92370572207084, + "grad_norm": 9.91385269165039, + "learning_rate": 1.2113833546068945e-05, + "loss": 0.2421, + "step": 16487 + }, + { + "epoch": 44.926430517711175, + "grad_norm": 13.311921119689941, + "learning_rate": 1.2112970984729924e-05, + "loss": 0.2019, + "step": 16488 + }, + { + "epoch": 44.9291553133515, + "grad_norm": 6.210605144500732, + "learning_rate": 1.2112108406935152e-05, + "loss": 0.1967, + "step": 16489 + }, + { + "epoch": 44.93188010899183, + "grad_norm": 4.3446574211120605, + "learning_rate": 1.211124581269135e-05, + "loss": 0.3851, + "step": 16490 + }, + { + "epoch": 44.93460490463215, + "grad_norm": 4.927207946777344, + "learning_rate": 1.2110383202005234e-05, + "loss": 0.1999, + "step": 16491 + }, + { + "epoch": 44.93732970027248, + "grad_norm": 5.123676776885986, + "learning_rate": 1.2109520574883519e-05, + "loss": 0.5084, + "step": 16492 + }, + { + "epoch": 44.940054495912804, + "grad_norm": 6.560925006866455, + "learning_rate": 1.2108657931332928e-05, + "loss": 0.2164, + "step": 16493 + }, + { + "epoch": 44.94277929155314, + "grad_norm": 5.3994574546813965, + "learning_rate": 1.2107795271360177e-05, + "loss": 0.2569, + "step": 16494 + }, + { + "epoch": 44.94550408719346, + "grad_norm": 5.85552978515625, + "learning_rate": 1.210693259497198e-05, + "loss": 0.2926, + "step": 16495 + }, + { + "epoch": 44.94822888283379, + "grad_norm": 7.393570423126221, + "learning_rate": 1.2106069902175061e-05, + "loss": 0.211, + "step": 16496 + }, + { + "epoch": 44.950953678474114, + "grad_norm": 6.004249572753906, + "learning_rate": 1.210520719297614e-05, + "loss": 0.1961, + "step": 16497 + }, + { + "epoch": 44.95367847411444, + "grad_norm": 4.975900173187256, + "learning_rate": 1.2104344467381934e-05, + "loss": 0.1602, + "step": 16498 + }, + { + "epoch": 44.956403269754766, + "grad_norm": 5.147679328918457, + "learning_rate": 1.2103481725399158e-05, + "loss": 0.1848, + "step": 16499 + }, + { + "epoch": 44.95912806539509, + "grad_norm": 5.091027736663818, + "learning_rate": 1.2102618967034537e-05, + "loss": 0.2364, + "step": 16500 + }, + { + "epoch": 44.961852861035425, + "grad_norm": 3.759225845336914, + "learning_rate": 1.2101756192294785e-05, + "loss": 0.2279, + "step": 16501 + }, + { + "epoch": 44.96457765667575, + "grad_norm": 5.046459197998047, + "learning_rate": 1.2100893401186624e-05, + "loss": 0.2177, + "step": 16502 + }, + { + "epoch": 44.967302452316076, + "grad_norm": 4.500819206237793, + "learning_rate": 1.2100030593716772e-05, + "loss": 0.1707, + "step": 16503 + }, + { + "epoch": 44.9700272479564, + "grad_norm": 9.605218887329102, + "learning_rate": 1.2099167769891952e-05, + "loss": 0.2307, + "step": 16504 + }, + { + "epoch": 44.97275204359673, + "grad_norm": 28.277524948120117, + "learning_rate": 1.2098304929718875e-05, + "loss": 0.257, + "step": 16505 + }, + { + "epoch": 44.97547683923706, + "grad_norm": 5.641982555389404, + "learning_rate": 1.2097442073204272e-05, + "loss": 0.1846, + "step": 16506 + }, + { + "epoch": 44.97820163487739, + "grad_norm": 5.367890357971191, + "learning_rate": 1.2096579200354857e-05, + "loss": 0.2236, + "step": 16507 + }, + { + "epoch": 44.98092643051771, + "grad_norm": 3.9556329250335693, + "learning_rate": 1.209571631117735e-05, + "loss": 0.2136, + "step": 16508 + }, + { + "epoch": 44.98365122615804, + "grad_norm": 4.4472150802612305, + "learning_rate": 1.2094853405678471e-05, + "loss": 0.1678, + "step": 16509 + }, + { + "epoch": 44.986376021798364, + "grad_norm": 6.31549596786499, + "learning_rate": 1.2093990483864944e-05, + "loss": 0.1811, + "step": 16510 + }, + { + "epoch": 44.98910081743869, + "grad_norm": 6.078292369842529, + "learning_rate": 1.2093127545743482e-05, + "loss": 0.177, + "step": 16511 + }, + { + "epoch": 44.991825613079016, + "grad_norm": 5.6930928230285645, + "learning_rate": 1.2092264591320815e-05, + "loss": 0.2932, + "step": 16512 + }, + { + "epoch": 44.99455040871935, + "grad_norm": 4.938112258911133, + "learning_rate": 1.2091401620603656e-05, + "loss": 0.1919, + "step": 16513 + }, + { + "epoch": 44.997275204359674, + "grad_norm": 6.328670024871826, + "learning_rate": 1.2090538633598728e-05, + "loss": 0.3275, + "step": 16514 + }, + { + "epoch": 45.0, + "grad_norm": 6.109992980957031, + "learning_rate": 1.2089675630312755e-05, + "loss": 0.1832, + "step": 16515 + }, + { + "epoch": 45.002724795640326, + "grad_norm": 5.512378692626953, + "learning_rate": 1.2088812610752449e-05, + "loss": 0.179, + "step": 16516 + }, + { + "epoch": 45.00544959128065, + "grad_norm": 5.3177971839904785, + "learning_rate": 1.2087949574924542e-05, + "loss": 0.155, + "step": 16517 + }, + { + "epoch": 45.00817438692098, + "grad_norm": 4.777791500091553, + "learning_rate": 1.2087086522835754e-05, + "loss": 0.2024, + "step": 16518 + }, + { + "epoch": 45.01089918256131, + "grad_norm": 4.446604251861572, + "learning_rate": 1.2086223454492798e-05, + "loss": 0.1863, + "step": 16519 + }, + { + "epoch": 45.013623978201636, + "grad_norm": 4.505539894104004, + "learning_rate": 1.2085360369902405e-05, + "loss": 0.2233, + "step": 16520 + }, + { + "epoch": 45.01634877384196, + "grad_norm": 6.669691562652588, + "learning_rate": 1.208449726907129e-05, + "loss": 0.2606, + "step": 16521 + }, + { + "epoch": 45.01907356948229, + "grad_norm": 5.373653411865234, + "learning_rate": 1.2083634152006178e-05, + "loss": 0.3221, + "step": 16522 + }, + { + "epoch": 45.02179836512261, + "grad_norm": 5.863643169403076, + "learning_rate": 1.208277101871379e-05, + "loss": 0.2959, + "step": 16523 + }, + { + "epoch": 45.02452316076294, + "grad_norm": 5.832777976989746, + "learning_rate": 1.208190786920085e-05, + "loss": 0.3932, + "step": 16524 + }, + { + "epoch": 45.02724795640327, + "grad_norm": 5.73431396484375, + "learning_rate": 1.2081044703474079e-05, + "loss": 0.2045, + "step": 16525 + }, + { + "epoch": 45.0299727520436, + "grad_norm": 4.735246658325195, + "learning_rate": 1.2080181521540195e-05, + "loss": 0.3188, + "step": 16526 + }, + { + "epoch": 45.032697547683924, + "grad_norm": 6.507968902587891, + "learning_rate": 1.2079318323405926e-05, + "loss": 0.1391, + "step": 16527 + }, + { + "epoch": 45.03542234332425, + "grad_norm": 6.053386211395264, + "learning_rate": 1.2078455109077994e-05, + "loss": 0.2635, + "step": 16528 + }, + { + "epoch": 45.038147138964575, + "grad_norm": 6.033876895904541, + "learning_rate": 1.207759187856312e-05, + "loss": 0.1196, + "step": 16529 + }, + { + "epoch": 45.0408719346049, + "grad_norm": 4.177990913391113, + "learning_rate": 1.2076728631868026e-05, + "loss": 0.1621, + "step": 16530 + }, + { + "epoch": 45.043596730245234, + "grad_norm": 7.85495138168335, + "learning_rate": 1.2075865368999437e-05, + "loss": 0.1633, + "step": 16531 + }, + { + "epoch": 45.04632152588556, + "grad_norm": 4.977965831756592, + "learning_rate": 1.2075002089964077e-05, + "loss": 0.2815, + "step": 16532 + }, + { + "epoch": 45.049046321525886, + "grad_norm": 5.360485076904297, + "learning_rate": 1.2074138794768666e-05, + "loss": 0.1459, + "step": 16533 + }, + { + "epoch": 45.05177111716621, + "grad_norm": 4.5159831047058105, + "learning_rate": 1.2073275483419928e-05, + "loss": 0.2168, + "step": 16534 + }, + { + "epoch": 45.05449591280654, + "grad_norm": 8.731205940246582, + "learning_rate": 1.2072412155924589e-05, + "loss": 0.2906, + "step": 16535 + }, + { + "epoch": 45.05722070844686, + "grad_norm": 4.30543851852417, + "learning_rate": 1.207154881228937e-05, + "loss": 0.1112, + "step": 16536 + }, + { + "epoch": 45.059945504087196, + "grad_norm": 5.078404426574707, + "learning_rate": 1.2070685452520996e-05, + "loss": 0.2499, + "step": 16537 + }, + { + "epoch": 45.06267029972752, + "grad_norm": 4.377470016479492, + "learning_rate": 1.206982207662619e-05, + "loss": 0.1048, + "step": 16538 + }, + { + "epoch": 45.06539509536785, + "grad_norm": 5.7056803703308105, + "learning_rate": 1.2068958684611675e-05, + "loss": 0.2832, + "step": 16539 + }, + { + "epoch": 45.06811989100817, + "grad_norm": 5.156067848205566, + "learning_rate": 1.2068095276484177e-05, + "loss": 0.1302, + "step": 16540 + }, + { + "epoch": 45.0708446866485, + "grad_norm": 7.141348361968994, + "learning_rate": 1.2067231852250421e-05, + "loss": 0.2455, + "step": 16541 + }, + { + "epoch": 45.073569482288825, + "grad_norm": 3.8205201625823975, + "learning_rate": 1.206636841191713e-05, + "loss": 0.1014, + "step": 16542 + }, + { + "epoch": 45.07629427792916, + "grad_norm": 4.64540958404541, + "learning_rate": 1.2065504955491028e-05, + "loss": 0.1048, + "step": 16543 + }, + { + "epoch": 45.079019073569484, + "grad_norm": 5.926222324371338, + "learning_rate": 1.2064641482978835e-05, + "loss": 0.2379, + "step": 16544 + }, + { + "epoch": 45.08174386920981, + "grad_norm": 5.158275604248047, + "learning_rate": 1.206377799438729e-05, + "loss": 0.2085, + "step": 16545 + }, + { + "epoch": 45.084468664850135, + "grad_norm": 15.585972785949707, + "learning_rate": 1.20629144897231e-05, + "loss": 0.2434, + "step": 16546 + }, + { + "epoch": 45.08719346049046, + "grad_norm": 5.83115291595459, + "learning_rate": 1.2062050968993002e-05, + "loss": 0.1738, + "step": 16547 + }, + { + "epoch": 45.08991825613079, + "grad_norm": 7.6292033195495605, + "learning_rate": 1.2061187432203716e-05, + "loss": 0.2433, + "step": 16548 + }, + { + "epoch": 45.09264305177112, + "grad_norm": 8.051736831665039, + "learning_rate": 1.206032387936197e-05, + "loss": 0.1835, + "step": 16549 + }, + { + "epoch": 45.095367847411445, + "grad_norm": 7.657648086547852, + "learning_rate": 1.2059460310474486e-05, + "loss": 0.1468, + "step": 16550 + }, + { + "epoch": 45.09809264305177, + "grad_norm": 7.185408115386963, + "learning_rate": 1.2058596725547993e-05, + "loss": 0.2395, + "step": 16551 + }, + { + "epoch": 45.1008174386921, + "grad_norm": 5.118465900421143, + "learning_rate": 1.2057733124589216e-05, + "loss": 0.1516, + "step": 16552 + }, + { + "epoch": 45.10354223433242, + "grad_norm": 5.896913528442383, + "learning_rate": 1.2056869507604878e-05, + "loss": 0.2349, + "step": 16553 + }, + { + "epoch": 45.10626702997275, + "grad_norm": 7.021651744842529, + "learning_rate": 1.2056005874601706e-05, + "loss": 0.1852, + "step": 16554 + }, + { + "epoch": 45.10899182561308, + "grad_norm": 7.547937393188477, + "learning_rate": 1.205514222558643e-05, + "loss": 0.1539, + "step": 16555 + }, + { + "epoch": 45.11171662125341, + "grad_norm": 5.6526384353637695, + "learning_rate": 1.2054278560565768e-05, + "loss": 0.1286, + "step": 16556 + }, + { + "epoch": 45.11444141689373, + "grad_norm": 4.357674598693848, + "learning_rate": 1.2053414879546453e-05, + "loss": 0.1671, + "step": 16557 + }, + { + "epoch": 45.11716621253406, + "grad_norm": 6.144803047180176, + "learning_rate": 1.2052551182535205e-05, + "loss": 0.2076, + "step": 16558 + }, + { + "epoch": 45.119891008174385, + "grad_norm": 4.0647664070129395, + "learning_rate": 1.2051687469538762e-05, + "loss": 0.1586, + "step": 16559 + }, + { + "epoch": 45.12261580381471, + "grad_norm": 5.348049163818359, + "learning_rate": 1.2050823740563838e-05, + "loss": 0.2232, + "step": 16560 + }, + { + "epoch": 45.12534059945504, + "grad_norm": 4.529613494873047, + "learning_rate": 1.2049959995617166e-05, + "loss": 0.1346, + "step": 16561 + }, + { + "epoch": 45.12806539509537, + "grad_norm": 7.2587151527404785, + "learning_rate": 1.2049096234705471e-05, + "loss": 0.2626, + "step": 16562 + }, + { + "epoch": 45.130790190735695, + "grad_norm": 5.042852401733398, + "learning_rate": 1.2048232457835482e-05, + "loss": 0.2629, + "step": 16563 + }, + { + "epoch": 45.13351498637602, + "grad_norm": 4.998375415802002, + "learning_rate": 1.204736866501392e-05, + "loss": 0.2243, + "step": 16564 + }, + { + "epoch": 45.13623978201635, + "grad_norm": 6.485538959503174, + "learning_rate": 1.204650485624752e-05, + "loss": 0.2776, + "step": 16565 + }, + { + "epoch": 45.13896457765667, + "grad_norm": 4.741646766662598, + "learning_rate": 1.2045641031543008e-05, + "loss": 0.0986, + "step": 16566 + }, + { + "epoch": 45.141689373297005, + "grad_norm": 6.637621879577637, + "learning_rate": 1.2044777190907107e-05, + "loss": 0.1705, + "step": 16567 + }, + { + "epoch": 45.14441416893733, + "grad_norm": 4.802213668823242, + "learning_rate": 1.2043913334346546e-05, + "loss": 0.1882, + "step": 16568 + }, + { + "epoch": 45.14713896457766, + "grad_norm": 6.388574123382568, + "learning_rate": 1.2043049461868057e-05, + "loss": 0.3225, + "step": 16569 + }, + { + "epoch": 45.14986376021798, + "grad_norm": 4.970810413360596, + "learning_rate": 1.2042185573478362e-05, + "loss": 0.1427, + "step": 16570 + }, + { + "epoch": 45.15258855585831, + "grad_norm": 8.400190353393555, + "learning_rate": 1.2041321669184194e-05, + "loss": 0.4492, + "step": 16571 + }, + { + "epoch": 45.155313351498634, + "grad_norm": 5.225356101989746, + "learning_rate": 1.2040457748992275e-05, + "loss": 0.1226, + "step": 16572 + }, + { + "epoch": 45.15803814713897, + "grad_norm": 4.736957550048828, + "learning_rate": 1.203959381290934e-05, + "loss": 0.2009, + "step": 16573 + }, + { + "epoch": 45.16076294277929, + "grad_norm": 4.66796875, + "learning_rate": 1.203872986094211e-05, + "loss": 0.1301, + "step": 16574 + }, + { + "epoch": 45.16348773841962, + "grad_norm": 6.437362194061279, + "learning_rate": 1.2037865893097323e-05, + "loss": 0.2308, + "step": 16575 + }, + { + "epoch": 45.166212534059945, + "grad_norm": 4.844325065612793, + "learning_rate": 1.2037001909381699e-05, + "loss": 0.1716, + "step": 16576 + }, + { + "epoch": 45.16893732970027, + "grad_norm": 5.221934795379639, + "learning_rate": 1.203613790980197e-05, + "loss": 0.1791, + "step": 16577 + }, + { + "epoch": 45.171662125340596, + "grad_norm": 4.624213695526123, + "learning_rate": 1.2035273894364863e-05, + "loss": 0.1102, + "step": 16578 + }, + { + "epoch": 45.17438692098093, + "grad_norm": 4.950865268707275, + "learning_rate": 1.203440986307711e-05, + "loss": 0.1157, + "step": 16579 + }, + { + "epoch": 45.177111716621255, + "grad_norm": 5.598708629608154, + "learning_rate": 1.2033545815945438e-05, + "loss": 0.2494, + "step": 16580 + }, + { + "epoch": 45.17983651226158, + "grad_norm": 4.302317142486572, + "learning_rate": 1.2032681752976578e-05, + "loss": 0.0961, + "step": 16581 + }, + { + "epoch": 45.182561307901906, + "grad_norm": 4.7786946296691895, + "learning_rate": 1.2031817674177255e-05, + "loss": 0.1896, + "step": 16582 + }, + { + "epoch": 45.18528610354223, + "grad_norm": 4.99862003326416, + "learning_rate": 1.2030953579554203e-05, + "loss": 0.1549, + "step": 16583 + }, + { + "epoch": 45.18801089918256, + "grad_norm": 5.704895973205566, + "learning_rate": 1.203008946911415e-05, + "loss": 0.2137, + "step": 16584 + }, + { + "epoch": 45.19073569482289, + "grad_norm": 4.31999397277832, + "learning_rate": 1.2029225342863826e-05, + "loss": 0.1605, + "step": 16585 + }, + { + "epoch": 45.19346049046322, + "grad_norm": 3.9720940589904785, + "learning_rate": 1.202836120080996e-05, + "loss": 0.1321, + "step": 16586 + }, + { + "epoch": 45.19618528610354, + "grad_norm": 5.717876434326172, + "learning_rate": 1.2027497042959281e-05, + "loss": 0.1545, + "step": 16587 + }, + { + "epoch": 45.19891008174387, + "grad_norm": 7.608456134796143, + "learning_rate": 1.2026632869318522e-05, + "loss": 0.1343, + "step": 16588 + }, + { + "epoch": 45.201634877384194, + "grad_norm": 5.579301357269287, + "learning_rate": 1.2025768679894412e-05, + "loss": 0.2828, + "step": 16589 + }, + { + "epoch": 45.20435967302452, + "grad_norm": 4.252120494842529, + "learning_rate": 1.2024904474693679e-05, + "loss": 0.1783, + "step": 16590 + }, + { + "epoch": 45.20708446866485, + "grad_norm": 6.057271480560303, + "learning_rate": 1.2024040253723054e-05, + "loss": 0.2513, + "step": 16591 + }, + { + "epoch": 45.20980926430518, + "grad_norm": 4.746553421020508, + "learning_rate": 1.2023176016989272e-05, + "loss": 0.1571, + "step": 16592 + }, + { + "epoch": 45.212534059945504, + "grad_norm": 5.150763511657715, + "learning_rate": 1.2022311764499057e-05, + "loss": 0.1441, + "step": 16593 + }, + { + "epoch": 45.21525885558583, + "grad_norm": 4.989012241363525, + "learning_rate": 1.2021447496259145e-05, + "loss": 0.1555, + "step": 16594 + }, + { + "epoch": 45.217983651226156, + "grad_norm": 5.327992916107178, + "learning_rate": 1.2020583212276267e-05, + "loss": 0.171, + "step": 16595 + }, + { + "epoch": 45.22070844686648, + "grad_norm": 7.940482139587402, + "learning_rate": 1.2019718912557148e-05, + "loss": 0.1578, + "step": 16596 + }, + { + "epoch": 45.223433242506815, + "grad_norm": 5.864681243896484, + "learning_rate": 1.2018854597108524e-05, + "loss": 0.2566, + "step": 16597 + }, + { + "epoch": 45.22615803814714, + "grad_norm": 6.923911094665527, + "learning_rate": 1.2017990265937127e-05, + "loss": 0.3066, + "step": 16598 + }, + { + "epoch": 45.228882833787466, + "grad_norm": 6.041567802429199, + "learning_rate": 1.2017125919049688e-05, + "loss": 0.1343, + "step": 16599 + }, + { + "epoch": 45.23160762942779, + "grad_norm": 6.406617164611816, + "learning_rate": 1.2016261556452933e-05, + "loss": 0.2468, + "step": 16600 + }, + { + "epoch": 45.23433242506812, + "grad_norm": 5.396008014678955, + "learning_rate": 1.2015397178153601e-05, + "loss": 0.3443, + "step": 16601 + }, + { + "epoch": 45.237057220708444, + "grad_norm": 5.214319705963135, + "learning_rate": 1.2014532784158419e-05, + "loss": 0.1919, + "step": 16602 + }, + { + "epoch": 45.23978201634878, + "grad_norm": 5.351510047912598, + "learning_rate": 1.201366837447412e-05, + "loss": 0.2486, + "step": 16603 + }, + { + "epoch": 45.2425068119891, + "grad_norm": 4.136556148529053, + "learning_rate": 1.2012803949107437e-05, + "loss": 0.1294, + "step": 16604 + }, + { + "epoch": 45.24523160762943, + "grad_norm": 7.471392631530762, + "learning_rate": 1.2011939508065105e-05, + "loss": 0.1367, + "step": 16605 + }, + { + "epoch": 45.247956403269754, + "grad_norm": 5.440866947174072, + "learning_rate": 1.2011075051353848e-05, + "loss": 0.16, + "step": 16606 + }, + { + "epoch": 45.25068119891008, + "grad_norm": 4.633749008178711, + "learning_rate": 1.2010210578980407e-05, + "loss": 0.2055, + "step": 16607 + }, + { + "epoch": 45.253405994550405, + "grad_norm": 7.459175109863281, + "learning_rate": 1.2009346090951507e-05, + "loss": 0.2332, + "step": 16608 + }, + { + "epoch": 45.25613079019074, + "grad_norm": 9.547760009765625, + "learning_rate": 1.2008481587273889e-05, + "loss": 0.1956, + "step": 16609 + }, + { + "epoch": 45.258855585831064, + "grad_norm": 4.923254013061523, + "learning_rate": 1.2007617067954279e-05, + "loss": 0.1647, + "step": 16610 + }, + { + "epoch": 45.26158038147139, + "grad_norm": 5.788157939910889, + "learning_rate": 1.2006752532999408e-05, + "loss": 0.1401, + "step": 16611 + }, + { + "epoch": 45.264305177111716, + "grad_norm": 10.717264175415039, + "learning_rate": 1.2005887982416018e-05, + "loss": 0.2287, + "step": 16612 + }, + { + "epoch": 45.26702997275204, + "grad_norm": 5.1473612785339355, + "learning_rate": 1.2005023416210835e-05, + "loss": 0.2368, + "step": 16613 + }, + { + "epoch": 45.26975476839237, + "grad_norm": 6.619595050811768, + "learning_rate": 1.2004158834390594e-05, + "loss": 0.1329, + "step": 16614 + }, + { + "epoch": 45.2724795640327, + "grad_norm": 3.5936288833618164, + "learning_rate": 1.2003294236962028e-05, + "loss": 0.3637, + "step": 16615 + }, + { + "epoch": 45.275204359673026, + "grad_norm": 4.85862398147583, + "learning_rate": 1.2002429623931874e-05, + "loss": 0.2879, + "step": 16616 + }, + { + "epoch": 45.27792915531335, + "grad_norm": 4.307836532592773, + "learning_rate": 1.2001564995306858e-05, + "loss": 0.1005, + "step": 16617 + }, + { + "epoch": 45.28065395095368, + "grad_norm": 5.3064727783203125, + "learning_rate": 1.2000700351093722e-05, + "loss": 0.303, + "step": 16618 + }, + { + "epoch": 45.283378746594, + "grad_norm": 4.527190208435059, + "learning_rate": 1.1999835691299193e-05, + "loss": 0.2161, + "step": 16619 + }, + { + "epoch": 45.28610354223433, + "grad_norm": 5.368263244628906, + "learning_rate": 1.1998971015930012e-05, + "loss": 0.135, + "step": 16620 + }, + { + "epoch": 45.28882833787466, + "grad_norm": 4.358409404754639, + "learning_rate": 1.1998106324992906e-05, + "loss": 0.2364, + "step": 16621 + }, + { + "epoch": 45.29155313351499, + "grad_norm": 4.781009674072266, + "learning_rate": 1.1997241618494613e-05, + "loss": 0.1104, + "step": 16622 + }, + { + "epoch": 45.294277929155314, + "grad_norm": 5.457147121429443, + "learning_rate": 1.1996376896441867e-05, + "loss": 0.0939, + "step": 16623 + }, + { + "epoch": 45.29700272479564, + "grad_norm": 5.586886405944824, + "learning_rate": 1.1995512158841402e-05, + "loss": 0.2515, + "step": 16624 + }, + { + "epoch": 45.299727520435965, + "grad_norm": 5.703341007232666, + "learning_rate": 1.1994647405699951e-05, + "loss": 0.2366, + "step": 16625 + }, + { + "epoch": 45.30245231607629, + "grad_norm": 5.6486921310424805, + "learning_rate": 1.1993782637024251e-05, + "loss": 0.2428, + "step": 16626 + }, + { + "epoch": 45.305177111716624, + "grad_norm": 5.216177940368652, + "learning_rate": 1.1992917852821035e-05, + "loss": 0.1912, + "step": 16627 + }, + { + "epoch": 45.30790190735695, + "grad_norm": 6.801618576049805, + "learning_rate": 1.1992053053097041e-05, + "loss": 0.1223, + "step": 16628 + }, + { + "epoch": 45.310626702997276, + "grad_norm": 6.861721038818359, + "learning_rate": 1.1991188237859e-05, + "loss": 0.3119, + "step": 16629 + }, + { + "epoch": 45.3133514986376, + "grad_norm": 6.232369899749756, + "learning_rate": 1.199032340711365e-05, + "loss": 0.2049, + "step": 16630 + }, + { + "epoch": 45.31607629427793, + "grad_norm": 5.272371768951416, + "learning_rate": 1.1989458560867726e-05, + "loss": 0.1973, + "step": 16631 + }, + { + "epoch": 45.31880108991825, + "grad_norm": 5.843293190002441, + "learning_rate": 1.1988593699127964e-05, + "loss": 0.1102, + "step": 16632 + }, + { + "epoch": 45.321525885558586, + "grad_norm": 4.8091535568237305, + "learning_rate": 1.1987728821901094e-05, + "loss": 0.1321, + "step": 16633 + }, + { + "epoch": 45.32425068119891, + "grad_norm": 5.556960105895996, + "learning_rate": 1.198686392919386e-05, + "loss": 0.2355, + "step": 16634 + }, + { + "epoch": 45.32697547683924, + "grad_norm": 4.6954426765441895, + "learning_rate": 1.198599902101299e-05, + "loss": 0.2318, + "step": 16635 + }, + { + "epoch": 45.32970027247956, + "grad_norm": 11.321298599243164, + "learning_rate": 1.1985134097365227e-05, + "loss": 0.2587, + "step": 16636 + }, + { + "epoch": 45.33242506811989, + "grad_norm": 7.810074806213379, + "learning_rate": 1.1984269158257303e-05, + "loss": 0.1495, + "step": 16637 + }, + { + "epoch": 45.335149863760215, + "grad_norm": 5.643194198608398, + "learning_rate": 1.1983404203695954e-05, + "loss": 0.2431, + "step": 16638 + }, + { + "epoch": 45.33787465940055, + "grad_norm": 4.987616539001465, + "learning_rate": 1.1982539233687916e-05, + "loss": 0.1606, + "step": 16639 + }, + { + "epoch": 45.34059945504087, + "grad_norm": 6.060144424438477, + "learning_rate": 1.1981674248239927e-05, + "loss": 0.2073, + "step": 16640 + }, + { + "epoch": 45.3433242506812, + "grad_norm": 11.028332710266113, + "learning_rate": 1.1980809247358722e-05, + "loss": 0.181, + "step": 16641 + }, + { + "epoch": 45.346049046321525, + "grad_norm": 4.551525115966797, + "learning_rate": 1.197994423105104e-05, + "loss": 0.3275, + "step": 16642 + }, + { + "epoch": 45.34877384196185, + "grad_norm": 4.677279949188232, + "learning_rate": 1.1979079199323613e-05, + "loss": 0.1158, + "step": 16643 + }, + { + "epoch": 45.35149863760218, + "grad_norm": 15.127598762512207, + "learning_rate": 1.1978214152183186e-05, + "loss": 0.1336, + "step": 16644 + }, + { + "epoch": 45.35422343324251, + "grad_norm": 5.0481648445129395, + "learning_rate": 1.1977349089636484e-05, + "loss": 0.2007, + "step": 16645 + }, + { + "epoch": 45.356948228882835, + "grad_norm": 8.24364185333252, + "learning_rate": 1.1976484011690257e-05, + "loss": 0.2051, + "step": 16646 + }, + { + "epoch": 45.35967302452316, + "grad_norm": 4.717498779296875, + "learning_rate": 1.1975618918351234e-05, + "loss": 0.1411, + "step": 16647 + }, + { + "epoch": 45.36239782016349, + "grad_norm": 9.359580039978027, + "learning_rate": 1.1974753809626157e-05, + "loss": 0.2377, + "step": 16648 + }, + { + "epoch": 45.36512261580381, + "grad_norm": 3.6303634643554688, + "learning_rate": 1.1973888685521755e-05, + "loss": 0.1616, + "step": 16649 + }, + { + "epoch": 45.36784741144414, + "grad_norm": 6.411387920379639, + "learning_rate": 1.1973023546044777e-05, + "loss": 0.1923, + "step": 16650 + }, + { + "epoch": 45.37057220708447, + "grad_norm": 5.722949504852295, + "learning_rate": 1.1972158391201949e-05, + "loss": 0.119, + "step": 16651 + }, + { + "epoch": 45.3732970027248, + "grad_norm": 5.816916465759277, + "learning_rate": 1.197129322100002e-05, + "loss": 0.2458, + "step": 16652 + }, + { + "epoch": 45.37602179836512, + "grad_norm": 6.132981777191162, + "learning_rate": 1.197042803544572e-05, + "loss": 0.195, + "step": 16653 + }, + { + "epoch": 45.37874659400545, + "grad_norm": 6.963262557983398, + "learning_rate": 1.1969562834545794e-05, + "loss": 0.3227, + "step": 16654 + }, + { + "epoch": 45.381471389645775, + "grad_norm": 5.772555351257324, + "learning_rate": 1.1968697618306973e-05, + "loss": 0.223, + "step": 16655 + }, + { + "epoch": 45.3841961852861, + "grad_norm": 4.3310546875, + "learning_rate": 1.1967832386736001e-05, + "loss": 0.2026, + "step": 16656 + }, + { + "epoch": 45.38692098092643, + "grad_norm": 4.356783866882324, + "learning_rate": 1.1966967139839609e-05, + "loss": 0.3471, + "step": 16657 + }, + { + "epoch": 45.38964577656676, + "grad_norm": 5.222243785858154, + "learning_rate": 1.1966101877624545e-05, + "loss": 0.136, + "step": 16658 + }, + { + "epoch": 45.392370572207085, + "grad_norm": 30.365690231323242, + "learning_rate": 1.1965236600097541e-05, + "loss": 0.3697, + "step": 16659 + }, + { + "epoch": 45.39509536784741, + "grad_norm": 7.362423419952393, + "learning_rate": 1.1964371307265334e-05, + "loss": 0.3103, + "step": 16660 + }, + { + "epoch": 45.39782016348774, + "grad_norm": 41.33028793334961, + "learning_rate": 1.196350599913467e-05, + "loss": 0.3573, + "step": 16661 + }, + { + "epoch": 45.40054495912806, + "grad_norm": 5.660735607147217, + "learning_rate": 1.1962640675712284e-05, + "loss": 0.1426, + "step": 16662 + }, + { + "epoch": 45.403269754768395, + "grad_norm": 5.834871292114258, + "learning_rate": 1.1961775337004916e-05, + "loss": 0.2839, + "step": 16663 + }, + { + "epoch": 45.40599455040872, + "grad_norm": 6.210115909576416, + "learning_rate": 1.1960909983019307e-05, + "loss": 0.141, + "step": 16664 + }, + { + "epoch": 45.40871934604905, + "grad_norm": 5.948051452636719, + "learning_rate": 1.1960044613762189e-05, + "loss": 0.1444, + "step": 16665 + }, + { + "epoch": 45.41144414168937, + "grad_norm": 5.73265266418457, + "learning_rate": 1.1959179229240312e-05, + "loss": 0.1241, + "step": 16666 + }, + { + "epoch": 45.4141689373297, + "grad_norm": 5.090624809265137, + "learning_rate": 1.1958313829460406e-05, + "loss": 0.1477, + "step": 16667 + }, + { + "epoch": 45.416893732970024, + "grad_norm": 6.242894649505615, + "learning_rate": 1.1957448414429218e-05, + "loss": 0.1256, + "step": 16668 + }, + { + "epoch": 45.41961852861036, + "grad_norm": 13.589362144470215, + "learning_rate": 1.1956582984153479e-05, + "loss": 0.1658, + "step": 16669 + }, + { + "epoch": 45.42234332425068, + "grad_norm": 5.8010406494140625, + "learning_rate": 1.1955717538639941e-05, + "loss": 0.2329, + "step": 16670 + }, + { + "epoch": 45.42506811989101, + "grad_norm": 5.109614372253418, + "learning_rate": 1.1954852077895335e-05, + "loss": 0.1757, + "step": 16671 + }, + { + "epoch": 45.427792915531334, + "grad_norm": 4.750753879547119, + "learning_rate": 1.1953986601926406e-05, + "loss": 0.155, + "step": 16672 + }, + { + "epoch": 45.43051771117166, + "grad_norm": 8.827396392822266, + "learning_rate": 1.195312111073989e-05, + "loss": 0.197, + "step": 16673 + }, + { + "epoch": 45.433242506811986, + "grad_norm": 6.231132507324219, + "learning_rate": 1.195225560434253e-05, + "loss": 0.1877, + "step": 16674 + }, + { + "epoch": 45.43596730245232, + "grad_norm": 6.299057483673096, + "learning_rate": 1.1951390082741068e-05, + "loss": 0.2544, + "step": 16675 + }, + { + "epoch": 45.438692098092645, + "grad_norm": 5.301882743835449, + "learning_rate": 1.1950524545942241e-05, + "loss": 0.2188, + "step": 16676 + }, + { + "epoch": 45.44141689373297, + "grad_norm": 5.3790106773376465, + "learning_rate": 1.1949658993952793e-05, + "loss": 0.1404, + "step": 16677 + }, + { + "epoch": 45.444141689373296, + "grad_norm": 8.645112991333008, + "learning_rate": 1.1948793426779462e-05, + "loss": 0.2259, + "step": 16678 + }, + { + "epoch": 45.44686648501362, + "grad_norm": 8.512444496154785, + "learning_rate": 1.194792784442899e-05, + "loss": 0.1794, + "step": 16679 + }, + { + "epoch": 45.44959128065395, + "grad_norm": 5.109349250793457, + "learning_rate": 1.1947062246908121e-05, + "loss": 0.1572, + "step": 16680 + }, + { + "epoch": 45.45231607629428, + "grad_norm": 5.574517250061035, + "learning_rate": 1.1946196634223592e-05, + "loss": 0.1516, + "step": 16681 + }, + { + "epoch": 45.45504087193461, + "grad_norm": 8.244447708129883, + "learning_rate": 1.1945331006382148e-05, + "loss": 0.1866, + "step": 16682 + }, + { + "epoch": 45.45776566757493, + "grad_norm": 6.59032678604126, + "learning_rate": 1.1944465363390527e-05, + "loss": 0.1877, + "step": 16683 + }, + { + "epoch": 45.46049046321526, + "grad_norm": 6.2295050621032715, + "learning_rate": 1.1943599705255476e-05, + "loss": 0.176, + "step": 16684 + }, + { + "epoch": 45.463215258855584, + "grad_norm": 26.40064239501953, + "learning_rate": 1.1942734031983727e-05, + "loss": 0.3238, + "step": 16685 + }, + { + "epoch": 45.46594005449591, + "grad_norm": 6.458420276641846, + "learning_rate": 1.1941868343582031e-05, + "loss": 0.2262, + "step": 16686 + }, + { + "epoch": 45.46866485013624, + "grad_norm": 5.881272315979004, + "learning_rate": 1.1941002640057126e-05, + "loss": 0.1857, + "step": 16687 + }, + { + "epoch": 45.47138964577657, + "grad_norm": 9.554805755615234, + "learning_rate": 1.1940136921415757e-05, + "loss": 0.2529, + "step": 16688 + }, + { + "epoch": 45.474114441416894, + "grad_norm": 6.610429286956787, + "learning_rate": 1.1939271187664664e-05, + "loss": 0.1741, + "step": 16689 + }, + { + "epoch": 45.47683923705722, + "grad_norm": 6.144949436187744, + "learning_rate": 1.1938405438810588e-05, + "loss": 0.1192, + "step": 16690 + }, + { + "epoch": 45.479564032697546, + "grad_norm": 6.75967264175415, + "learning_rate": 1.193753967486027e-05, + "loss": 0.2601, + "step": 16691 + }, + { + "epoch": 45.48228882833787, + "grad_norm": 7.9903717041015625, + "learning_rate": 1.1936673895820461e-05, + "loss": 0.2191, + "step": 16692 + }, + { + "epoch": 45.485013623978205, + "grad_norm": 6.284823894500732, + "learning_rate": 1.1935808101697895e-05, + "loss": 0.1932, + "step": 16693 + }, + { + "epoch": 45.48773841961853, + "grad_norm": 6.077003479003906, + "learning_rate": 1.1934942292499316e-05, + "loss": 0.1526, + "step": 16694 + }, + { + "epoch": 45.490463215258856, + "grad_norm": 6.023370742797852, + "learning_rate": 1.1934076468231472e-05, + "loss": 0.2062, + "step": 16695 + }, + { + "epoch": 45.49318801089918, + "grad_norm": 6.809840202331543, + "learning_rate": 1.1933210628901101e-05, + "loss": 0.2429, + "step": 16696 + }, + { + "epoch": 45.49591280653951, + "grad_norm": 9.45288372039795, + "learning_rate": 1.193234477451495e-05, + "loss": 0.1293, + "step": 16697 + }, + { + "epoch": 45.49863760217983, + "grad_norm": 5.4122395515441895, + "learning_rate": 1.1931478905079758e-05, + "loss": 0.1945, + "step": 16698 + }, + { + "epoch": 45.50136239782017, + "grad_norm": 4.952850818634033, + "learning_rate": 1.1930613020602273e-05, + "loss": 0.1848, + "step": 16699 + }, + { + "epoch": 45.50408719346049, + "grad_norm": 8.232172012329102, + "learning_rate": 1.1929747121089232e-05, + "loss": 0.2203, + "step": 16700 + }, + { + "epoch": 45.50681198910082, + "grad_norm": 5.5052900314331055, + "learning_rate": 1.1928881206547385e-05, + "loss": 0.1445, + "step": 16701 + }, + { + "epoch": 45.509536784741144, + "grad_norm": 6.1682820320129395, + "learning_rate": 1.1928015276983473e-05, + "loss": 0.1938, + "step": 16702 + }, + { + "epoch": 45.51226158038147, + "grad_norm": 6.207098007202148, + "learning_rate": 1.192714933240424e-05, + "loss": 0.2524, + "step": 16703 + }, + { + "epoch": 45.514986376021795, + "grad_norm": 4.526002407073975, + "learning_rate": 1.192628337281643e-05, + "loss": 0.1458, + "step": 16704 + }, + { + "epoch": 45.51771117166213, + "grad_norm": 9.20603084564209, + "learning_rate": 1.1925417398226786e-05, + "loss": 0.3266, + "step": 16705 + }, + { + "epoch": 45.520435967302454, + "grad_norm": 4.8588337898254395, + "learning_rate": 1.1924551408642054e-05, + "loss": 0.1795, + "step": 16706 + }, + { + "epoch": 45.52316076294278, + "grad_norm": 11.087041854858398, + "learning_rate": 1.1923685404068978e-05, + "loss": 0.0995, + "step": 16707 + }, + { + "epoch": 45.525885558583106, + "grad_norm": 7.632423400878906, + "learning_rate": 1.1922819384514302e-05, + "loss": 0.1736, + "step": 16708 + }, + { + "epoch": 45.52861035422343, + "grad_norm": 4.280725002288818, + "learning_rate": 1.1921953349984771e-05, + "loss": 0.2495, + "step": 16709 + }, + { + "epoch": 45.53133514986376, + "grad_norm": 4.482978343963623, + "learning_rate": 1.1921087300487128e-05, + "loss": 0.1411, + "step": 16710 + }, + { + "epoch": 45.53405994550409, + "grad_norm": 5.198719024658203, + "learning_rate": 1.1920221236028122e-05, + "loss": 0.2058, + "step": 16711 + }, + { + "epoch": 45.536784741144416, + "grad_norm": 6.219206809997559, + "learning_rate": 1.1919355156614488e-05, + "loss": 0.2802, + "step": 16712 + }, + { + "epoch": 45.53950953678474, + "grad_norm": 8.376551628112793, + "learning_rate": 1.1918489062252982e-05, + "loss": 0.3149, + "step": 16713 + }, + { + "epoch": 45.54223433242507, + "grad_norm": 5.516513824462891, + "learning_rate": 1.1917622952950346e-05, + "loss": 0.1148, + "step": 16714 + }, + { + "epoch": 45.54495912806539, + "grad_norm": 5.855601787567139, + "learning_rate": 1.1916756828713326e-05, + "loss": 0.1591, + "step": 16715 + }, + { + "epoch": 45.54768392370572, + "grad_norm": 6.673274517059326, + "learning_rate": 1.191589068954866e-05, + "loss": 0.225, + "step": 16716 + }, + { + "epoch": 45.55040871934605, + "grad_norm": 5.49294376373291, + "learning_rate": 1.1915024535463102e-05, + "loss": 0.1777, + "step": 16717 + }, + { + "epoch": 45.55313351498638, + "grad_norm": 5.714776515960693, + "learning_rate": 1.1914158366463392e-05, + "loss": 0.1862, + "step": 16718 + }, + { + "epoch": 45.555858310626704, + "grad_norm": 7.998096942901611, + "learning_rate": 1.1913292182556284e-05, + "loss": 0.1626, + "step": 16719 + }, + { + "epoch": 45.55858310626703, + "grad_norm": 4.941965103149414, + "learning_rate": 1.191242598374851e-05, + "loss": 0.2365, + "step": 16720 + }, + { + "epoch": 45.561307901907355, + "grad_norm": 11.13440227508545, + "learning_rate": 1.191155977004683e-05, + "loss": 0.2244, + "step": 16721 + }, + { + "epoch": 45.56403269754768, + "grad_norm": 5.3765034675598145, + "learning_rate": 1.1910693541457983e-05, + "loss": 0.1614, + "step": 16722 + }, + { + "epoch": 45.566757493188014, + "grad_norm": 4.9884467124938965, + "learning_rate": 1.1909827297988716e-05, + "loss": 0.1526, + "step": 16723 + }, + { + "epoch": 45.56948228882834, + "grad_norm": 5.218952655792236, + "learning_rate": 1.1908961039645774e-05, + "loss": 0.283, + "step": 16724 + }, + { + "epoch": 45.572207084468666, + "grad_norm": 5.10790491104126, + "learning_rate": 1.1908094766435906e-05, + "loss": 0.2459, + "step": 16725 + }, + { + "epoch": 45.57493188010899, + "grad_norm": 7.868581295013428, + "learning_rate": 1.190722847836586e-05, + "loss": 0.286, + "step": 16726 + }, + { + "epoch": 45.57765667574932, + "grad_norm": 7.350738525390625, + "learning_rate": 1.1906362175442376e-05, + "loss": 0.2108, + "step": 16727 + }, + { + "epoch": 45.58038147138964, + "grad_norm": 6.340230464935303, + "learning_rate": 1.1905495857672207e-05, + "loss": 0.1519, + "step": 16728 + }, + { + "epoch": 45.583106267029976, + "grad_norm": 5.222556114196777, + "learning_rate": 1.1904629525062094e-05, + "loss": 0.1501, + "step": 16729 + }, + { + "epoch": 45.5858310626703, + "grad_norm": 6.270688056945801, + "learning_rate": 1.190376317761879e-05, + "loss": 0.3152, + "step": 16730 + }, + { + "epoch": 45.58855585831063, + "grad_norm": 5.900198459625244, + "learning_rate": 1.1902896815349041e-05, + "loss": 0.31, + "step": 16731 + }, + { + "epoch": 45.59128065395095, + "grad_norm": 6.09793758392334, + "learning_rate": 1.1902030438259593e-05, + "loss": 0.3577, + "step": 16732 + }, + { + "epoch": 45.59400544959128, + "grad_norm": 6.048053741455078, + "learning_rate": 1.1901164046357192e-05, + "loss": 0.2992, + "step": 16733 + }, + { + "epoch": 45.596730245231605, + "grad_norm": 4.888824939727783, + "learning_rate": 1.1900297639648586e-05, + "loss": 0.231, + "step": 16734 + }, + { + "epoch": 45.59945504087194, + "grad_norm": 6.400858402252197, + "learning_rate": 1.1899431218140525e-05, + "loss": 0.1601, + "step": 16735 + }, + { + "epoch": 45.60217983651226, + "grad_norm": 8.345768928527832, + "learning_rate": 1.1898564781839752e-05, + "loss": 0.2145, + "step": 16736 + }, + { + "epoch": 45.60490463215259, + "grad_norm": 5.117101669311523, + "learning_rate": 1.1897698330753017e-05, + "loss": 0.2896, + "step": 16737 + }, + { + "epoch": 45.607629427792915, + "grad_norm": 5.829264163970947, + "learning_rate": 1.1896831864887071e-05, + "loss": 0.1202, + "step": 16738 + }, + { + "epoch": 45.61035422343324, + "grad_norm": 5.072994709014893, + "learning_rate": 1.189596538424866e-05, + "loss": 0.135, + "step": 16739 + }, + { + "epoch": 45.61307901907357, + "grad_norm": 5.669522762298584, + "learning_rate": 1.189509888884453e-05, + "loss": 0.2648, + "step": 16740 + }, + { + "epoch": 45.6158038147139, + "grad_norm": 6.418872356414795, + "learning_rate": 1.1894232378681432e-05, + "loss": 0.1324, + "step": 16741 + }, + { + "epoch": 45.618528610354225, + "grad_norm": 5.721817493438721, + "learning_rate": 1.1893365853766112e-05, + "loss": 0.1504, + "step": 16742 + }, + { + "epoch": 45.62125340599455, + "grad_norm": 4.870094299316406, + "learning_rate": 1.1892499314105322e-05, + "loss": 0.1526, + "step": 16743 + }, + { + "epoch": 45.62397820163488, + "grad_norm": 4.316743850708008, + "learning_rate": 1.1891632759705806e-05, + "loss": 0.2196, + "step": 16744 + }, + { + "epoch": 45.6267029972752, + "grad_norm": 5.4886698722839355, + "learning_rate": 1.1890766190574317e-05, + "loss": 0.2826, + "step": 16745 + }, + { + "epoch": 45.62942779291553, + "grad_norm": 5.585188388824463, + "learning_rate": 1.1889899606717596e-05, + "loss": 0.24, + "step": 16746 + }, + { + "epoch": 45.63215258855586, + "grad_norm": 5.05691385269165, + "learning_rate": 1.1889033008142405e-05, + "loss": 0.1792, + "step": 16747 + }, + { + "epoch": 45.63487738419619, + "grad_norm": 4.477142810821533, + "learning_rate": 1.188816639485548e-05, + "loss": 0.1701, + "step": 16748 + }, + { + "epoch": 45.63760217983651, + "grad_norm": 5.6869215965271, + "learning_rate": 1.188729976686358e-05, + "loss": 0.3177, + "step": 16749 + }, + { + "epoch": 45.64032697547684, + "grad_norm": 4.94856595993042, + "learning_rate": 1.1886433124173448e-05, + "loss": 0.1924, + "step": 16750 + }, + { + "epoch": 45.643051771117165, + "grad_norm": 6.606828689575195, + "learning_rate": 1.1885566466791838e-05, + "loss": 0.1509, + "step": 16751 + }, + { + "epoch": 45.64577656675749, + "grad_norm": 6.61343240737915, + "learning_rate": 1.1884699794725494e-05, + "loss": 0.2013, + "step": 16752 + }, + { + "epoch": 45.64850136239782, + "grad_norm": 5.412893772125244, + "learning_rate": 1.1883833107981173e-05, + "loss": 0.1584, + "step": 16753 + }, + { + "epoch": 45.65122615803815, + "grad_norm": 6.0776047706604, + "learning_rate": 1.1882966406565615e-05, + "loss": 0.2973, + "step": 16754 + }, + { + "epoch": 45.653950953678475, + "grad_norm": 6.073796272277832, + "learning_rate": 1.1882099690485578e-05, + "loss": 0.1985, + "step": 16755 + }, + { + "epoch": 45.6566757493188, + "grad_norm": 20.35211944580078, + "learning_rate": 1.1881232959747808e-05, + "loss": 0.1966, + "step": 16756 + }, + { + "epoch": 45.65940054495913, + "grad_norm": 5.905616760253906, + "learning_rate": 1.1880366214359058e-05, + "loss": 0.1485, + "step": 16757 + }, + { + "epoch": 45.66212534059945, + "grad_norm": 4.573220252990723, + "learning_rate": 1.1879499454326075e-05, + "loss": 0.0844, + "step": 16758 + }, + { + "epoch": 45.664850136239785, + "grad_norm": 5.227389812469482, + "learning_rate": 1.1878632679655613e-05, + "loss": 0.1249, + "step": 16759 + }, + { + "epoch": 45.66757493188011, + "grad_norm": 4.984939098358154, + "learning_rate": 1.1877765890354416e-05, + "loss": 0.0953, + "step": 16760 + }, + { + "epoch": 45.67029972752044, + "grad_norm": 6.445440769195557, + "learning_rate": 1.1876899086429243e-05, + "loss": 0.2402, + "step": 16761 + }, + { + "epoch": 45.67302452316076, + "grad_norm": 6.42676305770874, + "learning_rate": 1.1876032267886836e-05, + "loss": 0.21, + "step": 16762 + }, + { + "epoch": 45.67574931880109, + "grad_norm": 4.938652515411377, + "learning_rate": 1.1875165434733953e-05, + "loss": 0.2568, + "step": 16763 + }, + { + "epoch": 45.678474114441414, + "grad_norm": 5.695641994476318, + "learning_rate": 1.1874298586977343e-05, + "loss": 0.2105, + "step": 16764 + }, + { + "epoch": 45.68119891008175, + "grad_norm": 20.347829818725586, + "learning_rate": 1.1873431724623754e-05, + "loss": 0.2006, + "step": 16765 + }, + { + "epoch": 45.68392370572207, + "grad_norm": 4.463924407958984, + "learning_rate": 1.1872564847679937e-05, + "loss": 0.122, + "step": 16766 + }, + { + "epoch": 45.6866485013624, + "grad_norm": 5.034438133239746, + "learning_rate": 1.187169795615265e-05, + "loss": 0.3651, + "step": 16767 + }, + { + "epoch": 45.689373297002724, + "grad_norm": 6.706033229827881, + "learning_rate": 1.1870831050048637e-05, + "loss": 0.1983, + "step": 16768 + }, + { + "epoch": 45.69209809264305, + "grad_norm": 5.6929826736450195, + "learning_rate": 1.1869964129374653e-05, + "loss": 0.1591, + "step": 16769 + }, + { + "epoch": 45.694822888283376, + "grad_norm": 27.811521530151367, + "learning_rate": 1.1869097194137447e-05, + "loss": 0.1832, + "step": 16770 + }, + { + "epoch": 45.69754768392371, + "grad_norm": 4.503742218017578, + "learning_rate": 1.1868230244343772e-05, + "loss": 0.1942, + "step": 16771 + }, + { + "epoch": 45.700272479564035, + "grad_norm": 4.524623870849609, + "learning_rate": 1.1867363280000381e-05, + "loss": 0.1455, + "step": 16772 + }, + { + "epoch": 45.70299727520436, + "grad_norm": 10.254136085510254, + "learning_rate": 1.1866496301114024e-05, + "loss": 0.224, + "step": 16773 + }, + { + "epoch": 45.705722070844686, + "grad_norm": 5.565359115600586, + "learning_rate": 1.1865629307691457e-05, + "loss": 0.1702, + "step": 16774 + }, + { + "epoch": 45.70844686648501, + "grad_norm": 5.79984712600708, + "learning_rate": 1.1864762299739425e-05, + "loss": 0.195, + "step": 16775 + }, + { + "epoch": 45.71117166212534, + "grad_norm": 11.521369934082031, + "learning_rate": 1.1863895277264685e-05, + "loss": 0.2612, + "step": 16776 + }, + { + "epoch": 45.71389645776567, + "grad_norm": 4.3823676109313965, + "learning_rate": 1.186302824027399e-05, + "loss": 0.277, + "step": 16777 + }, + { + "epoch": 45.716621253406, + "grad_norm": 5.321345806121826, + "learning_rate": 1.186216118877409e-05, + "loss": 0.2387, + "step": 16778 + }, + { + "epoch": 45.71934604904632, + "grad_norm": 4.756073474884033, + "learning_rate": 1.186129412277174e-05, + "loss": 0.181, + "step": 16779 + }, + { + "epoch": 45.72207084468665, + "grad_norm": 5.8166399002075195, + "learning_rate": 1.186042704227369e-05, + "loss": 0.197, + "step": 16780 + }, + { + "epoch": 45.724795640326974, + "grad_norm": 6.273514270782471, + "learning_rate": 1.1859559947286695e-05, + "loss": 0.2122, + "step": 16781 + }, + { + "epoch": 45.7275204359673, + "grad_norm": 9.926748275756836, + "learning_rate": 1.1858692837817507e-05, + "loss": 0.2679, + "step": 16782 + }, + { + "epoch": 45.73024523160763, + "grad_norm": 5.106124401092529, + "learning_rate": 1.1857825713872877e-05, + "loss": 0.2026, + "step": 16783 + }, + { + "epoch": 45.73297002724796, + "grad_norm": 7.10134744644165, + "learning_rate": 1.1856958575459563e-05, + "loss": 0.2331, + "step": 16784 + }, + { + "epoch": 45.735694822888284, + "grad_norm": 5.939577102661133, + "learning_rate": 1.1856091422584312e-05, + "loss": 0.2202, + "step": 16785 + }, + { + "epoch": 45.73841961852861, + "grad_norm": 9.432857513427734, + "learning_rate": 1.1855224255253885e-05, + "loss": 0.1826, + "step": 16786 + }, + { + "epoch": 45.741144414168936, + "grad_norm": 5.389590263366699, + "learning_rate": 1.185435707347503e-05, + "loss": 0.1651, + "step": 16787 + }, + { + "epoch": 45.74386920980926, + "grad_norm": 5.081847190856934, + "learning_rate": 1.1853489877254498e-05, + "loss": 0.1582, + "step": 16788 + }, + { + "epoch": 45.746594005449595, + "grad_norm": 6.348358631134033, + "learning_rate": 1.1852622666599047e-05, + "loss": 0.2016, + "step": 16789 + }, + { + "epoch": 45.74931880108992, + "grad_norm": 5.817598342895508, + "learning_rate": 1.1851755441515435e-05, + "loss": 0.2261, + "step": 16790 + }, + { + "epoch": 45.752043596730246, + "grad_norm": 5.8689165115356445, + "learning_rate": 1.1850888202010408e-05, + "loss": 0.1593, + "step": 16791 + }, + { + "epoch": 45.75476839237057, + "grad_norm": 4.214691638946533, + "learning_rate": 1.1850020948090725e-05, + "loss": 0.1659, + "step": 16792 + }, + { + "epoch": 45.7574931880109, + "grad_norm": 5.222210884094238, + "learning_rate": 1.1849153679763137e-05, + "loss": 0.1364, + "step": 16793 + }, + { + "epoch": 45.76021798365122, + "grad_norm": 5.477433204650879, + "learning_rate": 1.1848286397034402e-05, + "loss": 0.1772, + "step": 16794 + }, + { + "epoch": 45.762942779291556, + "grad_norm": 5.0489020347595215, + "learning_rate": 1.1847419099911268e-05, + "loss": 0.2861, + "step": 16795 + }, + { + "epoch": 45.76566757493188, + "grad_norm": 8.0861234664917, + "learning_rate": 1.1846551788400497e-05, + "loss": 0.2905, + "step": 16796 + }, + { + "epoch": 45.76839237057221, + "grad_norm": 6.275272369384766, + "learning_rate": 1.1845684462508838e-05, + "loss": 0.2019, + "step": 16797 + }, + { + "epoch": 45.771117166212534, + "grad_norm": 9.220664978027344, + "learning_rate": 1.1844817122243047e-05, + "loss": 0.1202, + "step": 16798 + }, + { + "epoch": 45.77384196185286, + "grad_norm": 6.362813472747803, + "learning_rate": 1.1843949767609879e-05, + "loss": 0.2262, + "step": 16799 + }, + { + "epoch": 45.776566757493185, + "grad_norm": 5.926329135894775, + "learning_rate": 1.1843082398616095e-05, + "loss": 0.3897, + "step": 16800 + }, + { + "epoch": 45.77929155313352, + "grad_norm": 6.0297698974609375, + "learning_rate": 1.1842215015268439e-05, + "loss": 0.1284, + "step": 16801 + }, + { + "epoch": 45.782016348773844, + "grad_norm": 5.359635353088379, + "learning_rate": 1.1841347617573675e-05, + "loss": 0.1297, + "step": 16802 + }, + { + "epoch": 45.78474114441417, + "grad_norm": 5.568722724914551, + "learning_rate": 1.1840480205538553e-05, + "loss": 0.2027, + "step": 16803 + }, + { + "epoch": 45.787465940054496, + "grad_norm": 8.326163291931152, + "learning_rate": 1.1839612779169833e-05, + "loss": 0.1984, + "step": 16804 + }, + { + "epoch": 45.79019073569482, + "grad_norm": 5.921015739440918, + "learning_rate": 1.1838745338474266e-05, + "loss": 0.4049, + "step": 16805 + }, + { + "epoch": 45.79291553133515, + "grad_norm": 12.31640338897705, + "learning_rate": 1.183787788345861e-05, + "loss": 0.1637, + "step": 16806 + }, + { + "epoch": 45.79564032697548, + "grad_norm": 5.65764045715332, + "learning_rate": 1.1837010414129617e-05, + "loss": 0.2375, + "step": 16807 + }, + { + "epoch": 45.798365122615806, + "grad_norm": 4.975269794464111, + "learning_rate": 1.1836142930494053e-05, + "loss": 0.1195, + "step": 16808 + }, + { + "epoch": 45.80108991825613, + "grad_norm": 5.65529727935791, + "learning_rate": 1.1835275432558659e-05, + "loss": 0.1931, + "step": 16809 + }, + { + "epoch": 45.80381471389646, + "grad_norm": 8.044857025146484, + "learning_rate": 1.1834407920330207e-05, + "loss": 0.2065, + "step": 16810 + }, + { + "epoch": 45.80653950953678, + "grad_norm": 5.580800533294678, + "learning_rate": 1.1833540393815438e-05, + "loss": 0.3629, + "step": 16811 + }, + { + "epoch": 45.80926430517711, + "grad_norm": 4.198930263519287, + "learning_rate": 1.183267285302112e-05, + "loss": 0.258, + "step": 16812 + }, + { + "epoch": 45.81198910081744, + "grad_norm": 7.045481204986572, + "learning_rate": 1.1831805297954001e-05, + "loss": 0.1241, + "step": 16813 + }, + { + "epoch": 45.81471389645777, + "grad_norm": 6.636136054992676, + "learning_rate": 1.1830937728620847e-05, + "loss": 0.2276, + "step": 16814 + }, + { + "epoch": 45.817438692098094, + "grad_norm": 5.757200241088867, + "learning_rate": 1.1830070145028404e-05, + "loss": 0.1356, + "step": 16815 + }, + { + "epoch": 45.82016348773842, + "grad_norm": 5.463143348693848, + "learning_rate": 1.1829202547183434e-05, + "loss": 0.1717, + "step": 16816 + }, + { + "epoch": 45.822888283378745, + "grad_norm": 5.030807971954346, + "learning_rate": 1.1828334935092694e-05, + "loss": 0.1357, + "step": 16817 + }, + { + "epoch": 45.82561307901907, + "grad_norm": 9.538846969604492, + "learning_rate": 1.1827467308762943e-05, + "loss": 0.1935, + "step": 16818 + }, + { + "epoch": 45.828337874659404, + "grad_norm": 5.1914963722229, + "learning_rate": 1.1826599668200931e-05, + "loss": 0.2146, + "step": 16819 + }, + { + "epoch": 45.83106267029973, + "grad_norm": 6.6925458908081055, + "learning_rate": 1.1825732013413424e-05, + "loss": 0.286, + "step": 16820 + }, + { + "epoch": 45.833787465940055, + "grad_norm": 4.862399101257324, + "learning_rate": 1.1824864344407172e-05, + "loss": 0.117, + "step": 16821 + }, + { + "epoch": 45.83651226158038, + "grad_norm": 5.300833225250244, + "learning_rate": 1.1823996661188936e-05, + "loss": 0.2113, + "step": 16822 + }, + { + "epoch": 45.83923705722071, + "grad_norm": 5.468568801879883, + "learning_rate": 1.1823128963765472e-05, + "loss": 0.1965, + "step": 16823 + }, + { + "epoch": 45.84196185286103, + "grad_norm": 7.542404651641846, + "learning_rate": 1.1822261252143538e-05, + "loss": 0.1763, + "step": 16824 + }, + { + "epoch": 45.844686648501366, + "grad_norm": 5.1153459548950195, + "learning_rate": 1.1821393526329894e-05, + "loss": 0.1416, + "step": 16825 + }, + { + "epoch": 45.84741144414169, + "grad_norm": 7.301416397094727, + "learning_rate": 1.1820525786331296e-05, + "loss": 0.128, + "step": 16826 + }, + { + "epoch": 45.85013623978202, + "grad_norm": 4.820608615875244, + "learning_rate": 1.18196580321545e-05, + "loss": 0.1388, + "step": 16827 + }, + { + "epoch": 45.85286103542234, + "grad_norm": 5.057580947875977, + "learning_rate": 1.1818790263806265e-05, + "loss": 0.1096, + "step": 16828 + }, + { + "epoch": 45.85558583106267, + "grad_norm": 5.905057907104492, + "learning_rate": 1.1817922481293351e-05, + "loss": 0.1954, + "step": 16829 + }, + { + "epoch": 45.858310626702995, + "grad_norm": 6.665063381195068, + "learning_rate": 1.1817054684622518e-05, + "loss": 0.2183, + "step": 16830 + }, + { + "epoch": 45.86103542234333, + "grad_norm": 5.462371349334717, + "learning_rate": 1.1816186873800519e-05, + "loss": 0.2193, + "step": 16831 + }, + { + "epoch": 45.86376021798365, + "grad_norm": 6.108532905578613, + "learning_rate": 1.1815319048834113e-05, + "loss": 0.3233, + "step": 16832 + }, + { + "epoch": 45.86648501362398, + "grad_norm": 4.892570495605469, + "learning_rate": 1.1814451209730062e-05, + "loss": 0.1703, + "step": 16833 + }, + { + "epoch": 45.869209809264305, + "grad_norm": 4.645022869110107, + "learning_rate": 1.1813583356495126e-05, + "loss": 0.1634, + "step": 16834 + }, + { + "epoch": 45.87193460490463, + "grad_norm": 5.6142578125, + "learning_rate": 1.1812715489136059e-05, + "loss": 0.1651, + "step": 16835 + }, + { + "epoch": 45.87465940054496, + "grad_norm": 4.635265350341797, + "learning_rate": 1.1811847607659623e-05, + "loss": 0.292, + "step": 16836 + }, + { + "epoch": 45.87738419618529, + "grad_norm": 5.443964004516602, + "learning_rate": 1.1810979712072577e-05, + "loss": 0.3624, + "step": 16837 + }, + { + "epoch": 45.880108991825615, + "grad_norm": 6.793909072875977, + "learning_rate": 1.1810111802381679e-05, + "loss": 0.2163, + "step": 16838 + }, + { + "epoch": 45.88283378746594, + "grad_norm": 4.849037170410156, + "learning_rate": 1.1809243878593686e-05, + "loss": 0.2381, + "step": 16839 + }, + { + "epoch": 45.88555858310627, + "grad_norm": 5.565073013305664, + "learning_rate": 1.1808375940715362e-05, + "loss": 0.1832, + "step": 16840 + }, + { + "epoch": 45.88828337874659, + "grad_norm": 6.433823108673096, + "learning_rate": 1.1807507988753461e-05, + "loss": 0.133, + "step": 16841 + }, + { + "epoch": 45.89100817438692, + "grad_norm": 5.564578533172607, + "learning_rate": 1.180664002271475e-05, + "loss": 0.1701, + "step": 16842 + }, + { + "epoch": 45.89373297002725, + "grad_norm": 5.624913215637207, + "learning_rate": 1.1805772042605982e-05, + "loss": 0.1648, + "step": 16843 + }, + { + "epoch": 45.89645776566758, + "grad_norm": 5.615039348602295, + "learning_rate": 1.1804904048433925e-05, + "loss": 0.1364, + "step": 16844 + }, + { + "epoch": 45.8991825613079, + "grad_norm": 4.709343910217285, + "learning_rate": 1.1804036040205326e-05, + "loss": 0.1999, + "step": 16845 + }, + { + "epoch": 45.90190735694823, + "grad_norm": 7.4266557693481445, + "learning_rate": 1.1803168017926958e-05, + "loss": 0.1916, + "step": 16846 + }, + { + "epoch": 45.904632152588555, + "grad_norm": 7.247400283813477, + "learning_rate": 1.1802299981605572e-05, + "loss": 0.1903, + "step": 16847 + }, + { + "epoch": 45.90735694822888, + "grad_norm": 5.782771587371826, + "learning_rate": 1.1801431931247936e-05, + "loss": 0.1388, + "step": 16848 + }, + { + "epoch": 45.91008174386921, + "grad_norm": 6.266892910003662, + "learning_rate": 1.1800563866860802e-05, + "loss": 0.181, + "step": 16849 + }, + { + "epoch": 45.91280653950954, + "grad_norm": 5.285679817199707, + "learning_rate": 1.1799695788450933e-05, + "loss": 0.1858, + "step": 16850 + }, + { + "epoch": 45.915531335149865, + "grad_norm": 7.338531017303467, + "learning_rate": 1.1798827696025094e-05, + "loss": 0.2153, + "step": 16851 + }, + { + "epoch": 45.91825613079019, + "grad_norm": 8.412606239318848, + "learning_rate": 1.1797959589590042e-05, + "loss": 0.2985, + "step": 16852 + }, + { + "epoch": 45.920980926430516, + "grad_norm": 7.390754222869873, + "learning_rate": 1.179709146915254e-05, + "loss": 0.1792, + "step": 16853 + }, + { + "epoch": 45.92370572207084, + "grad_norm": 6.709893226623535, + "learning_rate": 1.1796223334719347e-05, + "loss": 0.357, + "step": 16854 + }, + { + "epoch": 45.926430517711175, + "grad_norm": 5.400599479675293, + "learning_rate": 1.1795355186297223e-05, + "loss": 0.1779, + "step": 16855 + }, + { + "epoch": 45.9291553133515, + "grad_norm": 6.281462669372559, + "learning_rate": 1.1794487023892934e-05, + "loss": 0.1422, + "step": 16856 + }, + { + "epoch": 45.93188010899183, + "grad_norm": 5.297862529754639, + "learning_rate": 1.1793618847513235e-05, + "loss": 0.1678, + "step": 16857 + }, + { + "epoch": 45.93460490463215, + "grad_norm": 5.953853607177734, + "learning_rate": 1.179275065716489e-05, + "loss": 0.2998, + "step": 16858 + }, + { + "epoch": 45.93732970027248, + "grad_norm": 5.778013706207275, + "learning_rate": 1.1791882452854661e-05, + "loss": 0.2167, + "step": 16859 + }, + { + "epoch": 45.940054495912804, + "grad_norm": 5.81217622756958, + "learning_rate": 1.1791014234589308e-05, + "loss": 0.2295, + "step": 16860 + }, + { + "epoch": 45.94277929155314, + "grad_norm": 5.243221759796143, + "learning_rate": 1.1790146002375597e-05, + "loss": 0.2875, + "step": 16861 + }, + { + "epoch": 45.94550408719346, + "grad_norm": 5.780571460723877, + "learning_rate": 1.1789277756220283e-05, + "loss": 0.1198, + "step": 16862 + }, + { + "epoch": 45.94822888283379, + "grad_norm": 8.66849136352539, + "learning_rate": 1.1788409496130133e-05, + "loss": 0.1437, + "step": 16863 + }, + { + "epoch": 45.950953678474114, + "grad_norm": 5.675642013549805, + "learning_rate": 1.178754122211191e-05, + "loss": 0.2999, + "step": 16864 + }, + { + "epoch": 45.95367847411444, + "grad_norm": 6.454855442047119, + "learning_rate": 1.178667293417237e-05, + "loss": 0.2019, + "step": 16865 + }, + { + "epoch": 45.956403269754766, + "grad_norm": 48.437015533447266, + "learning_rate": 1.1785804632318278e-05, + "loss": 0.106, + "step": 16866 + }, + { + "epoch": 45.95912806539509, + "grad_norm": 5.250528812408447, + "learning_rate": 1.1784936316556399e-05, + "loss": 0.1671, + "step": 16867 + }, + { + "epoch": 45.961852861035425, + "grad_norm": 4.772067546844482, + "learning_rate": 1.1784067986893492e-05, + "loss": 0.1622, + "step": 16868 + }, + { + "epoch": 45.96457765667575, + "grad_norm": 17.530364990234375, + "learning_rate": 1.1783199643336324e-05, + "loss": 0.1622, + "step": 16869 + }, + { + "epoch": 45.967302452316076, + "grad_norm": 6.608857154846191, + "learning_rate": 1.1782331285891654e-05, + "loss": 0.3674, + "step": 16870 + }, + { + "epoch": 45.9700272479564, + "grad_norm": 4.463240623474121, + "learning_rate": 1.1781462914566244e-05, + "loss": 0.1687, + "step": 16871 + }, + { + "epoch": 45.97275204359673, + "grad_norm": 5.558890342712402, + "learning_rate": 1.1780594529366856e-05, + "loss": 0.1276, + "step": 16872 + }, + { + "epoch": 45.97547683923706, + "grad_norm": 6.251444339752197, + "learning_rate": 1.177972613030026e-05, + "loss": 0.2368, + "step": 16873 + }, + { + "epoch": 45.97820163487739, + "grad_norm": 7.094636917114258, + "learning_rate": 1.1778857717373208e-05, + "loss": 0.2958, + "step": 16874 + }, + { + "epoch": 45.98092643051771, + "grad_norm": 4.030132293701172, + "learning_rate": 1.1777989290592474e-05, + "loss": 0.083, + "step": 16875 + }, + { + "epoch": 45.98365122615804, + "grad_norm": 4.525312423706055, + "learning_rate": 1.1777120849964814e-05, + "loss": 0.1293, + "step": 16876 + }, + { + "epoch": 45.986376021798364, + "grad_norm": 6.200839042663574, + "learning_rate": 1.1776252395496996e-05, + "loss": 0.2395, + "step": 16877 + }, + { + "epoch": 45.98910081743869, + "grad_norm": 12.559029579162598, + "learning_rate": 1.177538392719578e-05, + "loss": 0.3794, + "step": 16878 + }, + { + "epoch": 45.991825613079016, + "grad_norm": 5.862802505493164, + "learning_rate": 1.1774515445067933e-05, + "loss": 0.1498, + "step": 16879 + }, + { + "epoch": 45.99455040871935, + "grad_norm": 6.752175331115723, + "learning_rate": 1.1773646949120217e-05, + "loss": 0.2217, + "step": 16880 + }, + { + "epoch": 45.997275204359674, + "grad_norm": 7.321381092071533, + "learning_rate": 1.1772778439359393e-05, + "loss": 0.1709, + "step": 16881 + }, + { + "epoch": 46.0, + "grad_norm": 5.0732526779174805, + "learning_rate": 1.177190991579223e-05, + "loss": 0.1394, + "step": 16882 + }, + { + "epoch": 46.002724795640326, + "grad_norm": 5.083871364593506, + "learning_rate": 1.177104137842549e-05, + "loss": 0.1157, + "step": 16883 + }, + { + "epoch": 46.00544959128065, + "grad_norm": 4.938205718994141, + "learning_rate": 1.177017282726593e-05, + "loss": 0.1703, + "step": 16884 + }, + { + "epoch": 46.00817438692098, + "grad_norm": 4.9734673500061035, + "learning_rate": 1.1769304262320329e-05, + "loss": 0.2418, + "step": 16885 + }, + { + "epoch": 46.01089918256131, + "grad_norm": 4.630497932434082, + "learning_rate": 1.1768435683595441e-05, + "loss": 0.1616, + "step": 16886 + }, + { + "epoch": 46.013623978201636, + "grad_norm": 6.0803680419921875, + "learning_rate": 1.1767567091098033e-05, + "loss": 0.1457, + "step": 16887 + }, + { + "epoch": 46.01634877384196, + "grad_norm": 14.960121154785156, + "learning_rate": 1.1766698484834869e-05, + "loss": 0.1541, + "step": 16888 + }, + { + "epoch": 46.01907356948229, + "grad_norm": 7.334306240081787, + "learning_rate": 1.1765829864812714e-05, + "loss": 0.3031, + "step": 16889 + }, + { + "epoch": 46.02179836512261, + "grad_norm": 5.870535373687744, + "learning_rate": 1.1764961231038331e-05, + "loss": 0.197, + "step": 16890 + }, + { + "epoch": 46.02452316076294, + "grad_norm": 4.6464056968688965, + "learning_rate": 1.1764092583518491e-05, + "loss": 0.1464, + "step": 16891 + }, + { + "epoch": 46.02724795640327, + "grad_norm": 5.883876323699951, + "learning_rate": 1.176322392225995e-05, + "loss": 0.1725, + "step": 16892 + }, + { + "epoch": 46.0299727520436, + "grad_norm": 5.208800315856934, + "learning_rate": 1.1762355247269481e-05, + "loss": 0.3002, + "step": 16893 + }, + { + "epoch": 46.032697547683924, + "grad_norm": 5.147244930267334, + "learning_rate": 1.1761486558553843e-05, + "loss": 0.2334, + "step": 16894 + }, + { + "epoch": 46.03542234332425, + "grad_norm": 5.42535924911499, + "learning_rate": 1.1760617856119809e-05, + "loss": 0.224, + "step": 16895 + }, + { + "epoch": 46.038147138964575, + "grad_norm": 4.2400946617126465, + "learning_rate": 1.1759749139974137e-05, + "loss": 0.2851, + "step": 16896 + }, + { + "epoch": 46.0408719346049, + "grad_norm": 4.644554615020752, + "learning_rate": 1.1758880410123596e-05, + "loss": 0.1312, + "step": 16897 + }, + { + "epoch": 46.043596730245234, + "grad_norm": 4.072249889373779, + "learning_rate": 1.175801166657495e-05, + "loss": 0.1893, + "step": 16898 + }, + { + "epoch": 46.04632152588556, + "grad_norm": 5.934253215789795, + "learning_rate": 1.175714290933497e-05, + "loss": 0.2545, + "step": 16899 + }, + { + "epoch": 46.049046321525886, + "grad_norm": 6.599236011505127, + "learning_rate": 1.175627413841041e-05, + "loss": 0.2178, + "step": 16900 + }, + { + "epoch": 46.05177111716621, + "grad_norm": 7.527964115142822, + "learning_rate": 1.1755405353808047e-05, + "loss": 0.1436, + "step": 16901 + }, + { + "epoch": 46.05449591280654, + "grad_norm": 7.0813212394714355, + "learning_rate": 1.1754536555534643e-05, + "loss": 0.1468, + "step": 16902 + }, + { + "epoch": 46.05722070844686, + "grad_norm": 4.541636943817139, + "learning_rate": 1.1753667743596969e-05, + "loss": 0.1627, + "step": 16903 + }, + { + "epoch": 46.059945504087196, + "grad_norm": 5.095037460327148, + "learning_rate": 1.1752798918001782e-05, + "loss": 0.2652, + "step": 16904 + }, + { + "epoch": 46.06267029972752, + "grad_norm": 5.75819206237793, + "learning_rate": 1.1751930078755858e-05, + "loss": 0.1549, + "step": 16905 + }, + { + "epoch": 46.06539509536785, + "grad_norm": 6.596327781677246, + "learning_rate": 1.1751061225865953e-05, + "loss": 0.1703, + "step": 16906 + }, + { + "epoch": 46.06811989100817, + "grad_norm": 5.354146480560303, + "learning_rate": 1.1750192359338845e-05, + "loss": 0.2491, + "step": 16907 + }, + { + "epoch": 46.0708446866485, + "grad_norm": 4.3368754386901855, + "learning_rate": 1.1749323479181291e-05, + "loss": 0.2098, + "step": 16908 + }, + { + "epoch": 46.073569482288825, + "grad_norm": 4.405524730682373, + "learning_rate": 1.1748454585400064e-05, + "loss": 0.113, + "step": 16909 + }, + { + "epoch": 46.07629427792916, + "grad_norm": 5.045307636260986, + "learning_rate": 1.1747585678001929e-05, + "loss": 0.2091, + "step": 16910 + }, + { + "epoch": 46.079019073569484, + "grad_norm": 5.209238052368164, + "learning_rate": 1.1746716756993654e-05, + "loss": 0.2337, + "step": 16911 + }, + { + "epoch": 46.08174386920981, + "grad_norm": 4.878576278686523, + "learning_rate": 1.1745847822382004e-05, + "loss": 0.11, + "step": 16912 + }, + { + "epoch": 46.084468664850135, + "grad_norm": 6.489706516265869, + "learning_rate": 1.174497887417375e-05, + "loss": 0.2975, + "step": 16913 + }, + { + "epoch": 46.08719346049046, + "grad_norm": 5.230531692504883, + "learning_rate": 1.1744109912375652e-05, + "loss": 0.267, + "step": 16914 + }, + { + "epoch": 46.08991825613079, + "grad_norm": 4.458773136138916, + "learning_rate": 1.1743240936994484e-05, + "loss": 0.106, + "step": 16915 + }, + { + "epoch": 46.09264305177112, + "grad_norm": 3.952570915222168, + "learning_rate": 1.1742371948037012e-05, + "loss": 0.1326, + "step": 16916 + }, + { + "epoch": 46.095367847411445, + "grad_norm": 3.6904971599578857, + "learning_rate": 1.1741502945510005e-05, + "loss": 0.1023, + "step": 16917 + }, + { + "epoch": 46.09809264305177, + "grad_norm": 4.737332344055176, + "learning_rate": 1.1740633929420225e-05, + "loss": 0.1231, + "step": 16918 + }, + { + "epoch": 46.1008174386921, + "grad_norm": 5.266089916229248, + "learning_rate": 1.1739764899774447e-05, + "loss": 0.1163, + "step": 16919 + }, + { + "epoch": 46.10354223433242, + "grad_norm": 5.249556064605713, + "learning_rate": 1.1738895856579436e-05, + "loss": 0.203, + "step": 16920 + }, + { + "epoch": 46.10626702997275, + "grad_norm": 5.134702682495117, + "learning_rate": 1.173802679984196e-05, + "loss": 0.1029, + "step": 16921 + }, + { + "epoch": 46.10899182561308, + "grad_norm": 5.852989196777344, + "learning_rate": 1.1737157729568787e-05, + "loss": 0.1935, + "step": 16922 + }, + { + "epoch": 46.11171662125341, + "grad_norm": 12.089111328125, + "learning_rate": 1.1736288645766684e-05, + "loss": 0.1376, + "step": 16923 + }, + { + "epoch": 46.11444141689373, + "grad_norm": 5.578044891357422, + "learning_rate": 1.1735419548442422e-05, + "loss": 0.2012, + "step": 16924 + }, + { + "epoch": 46.11716621253406, + "grad_norm": 7.164999008178711, + "learning_rate": 1.173455043760277e-05, + "loss": 0.156, + "step": 16925 + }, + { + "epoch": 46.119891008174385, + "grad_norm": 5.309410572052002, + "learning_rate": 1.1733681313254492e-05, + "loss": 0.2188, + "step": 16926 + }, + { + "epoch": 46.12261580381471, + "grad_norm": 6.488722324371338, + "learning_rate": 1.1732812175404362e-05, + "loss": 0.2034, + "step": 16927 + }, + { + "epoch": 46.12534059945504, + "grad_norm": 4.2620391845703125, + "learning_rate": 1.1731943024059145e-05, + "loss": 0.1984, + "step": 16928 + }, + { + "epoch": 46.12806539509537, + "grad_norm": 5.6828742027282715, + "learning_rate": 1.1731073859225612e-05, + "loss": 0.2205, + "step": 16929 + }, + { + "epoch": 46.130790190735695, + "grad_norm": 7.540266990661621, + "learning_rate": 1.173020468091053e-05, + "loss": 0.2739, + "step": 16930 + }, + { + "epoch": 46.13351498637602, + "grad_norm": 4.928872108459473, + "learning_rate": 1.1729335489120675e-05, + "loss": 0.1258, + "step": 16931 + }, + { + "epoch": 46.13623978201635, + "grad_norm": 4.395156383514404, + "learning_rate": 1.1728466283862806e-05, + "loss": 0.0999, + "step": 16932 + }, + { + "epoch": 46.13896457765667, + "grad_norm": 4.242887496948242, + "learning_rate": 1.1727597065143699e-05, + "loss": 0.2232, + "step": 16933 + }, + { + "epoch": 46.141689373297005, + "grad_norm": 5.286397457122803, + "learning_rate": 1.1726727832970121e-05, + "loss": 0.1928, + "step": 16934 + }, + { + "epoch": 46.14441416893733, + "grad_norm": 5.503414154052734, + "learning_rate": 1.1725858587348842e-05, + "loss": 0.2134, + "step": 16935 + }, + { + "epoch": 46.14713896457766, + "grad_norm": 5.316442966461182, + "learning_rate": 1.1724989328286633e-05, + "loss": 0.1651, + "step": 16936 + }, + { + "epoch": 46.14986376021798, + "grad_norm": 3.8543577194213867, + "learning_rate": 1.172412005579026e-05, + "loss": 0.1191, + "step": 16937 + }, + { + "epoch": 46.15258855585831, + "grad_norm": 6.987120151519775, + "learning_rate": 1.1723250769866499e-05, + "loss": 0.1891, + "step": 16938 + }, + { + "epoch": 46.155313351498634, + "grad_norm": 4.610313892364502, + "learning_rate": 1.1722381470522116e-05, + "loss": 0.1173, + "step": 16939 + }, + { + "epoch": 46.15803814713897, + "grad_norm": 5.001042366027832, + "learning_rate": 1.1721512157763878e-05, + "loss": 0.151, + "step": 16940 + }, + { + "epoch": 46.16076294277929, + "grad_norm": 5.889011859893799, + "learning_rate": 1.1720642831598563e-05, + "loss": 0.2553, + "step": 16941 + }, + { + "epoch": 46.16348773841962, + "grad_norm": 4.743194103240967, + "learning_rate": 1.1719773492032933e-05, + "loss": 0.2292, + "step": 16942 + }, + { + "epoch": 46.166212534059945, + "grad_norm": 4.329124927520752, + "learning_rate": 1.1718904139073765e-05, + "loss": 0.107, + "step": 16943 + }, + { + "epoch": 46.16893732970027, + "grad_norm": 4.750197887420654, + "learning_rate": 1.1718034772727827e-05, + "loss": 0.1749, + "step": 16944 + }, + { + "epoch": 46.171662125340596, + "grad_norm": 5.156228065490723, + "learning_rate": 1.1717165393001888e-05, + "loss": 0.1928, + "step": 16945 + }, + { + "epoch": 46.17438692098093, + "grad_norm": 4.277947902679443, + "learning_rate": 1.1716295999902722e-05, + "loss": 0.1296, + "step": 16946 + }, + { + "epoch": 46.177111716621255, + "grad_norm": 6.750779151916504, + "learning_rate": 1.1715426593437096e-05, + "loss": 0.2778, + "step": 16947 + }, + { + "epoch": 46.17983651226158, + "grad_norm": 9.903641700744629, + "learning_rate": 1.1714557173611785e-05, + "loss": 0.2106, + "step": 16948 + }, + { + "epoch": 46.182561307901906, + "grad_norm": 4.747694492340088, + "learning_rate": 1.1713687740433557e-05, + "loss": 0.1006, + "step": 16949 + }, + { + "epoch": 46.18528610354223, + "grad_norm": 4.483840465545654, + "learning_rate": 1.1712818293909182e-05, + "loss": 0.2431, + "step": 16950 + }, + { + "epoch": 46.18801089918256, + "grad_norm": 6.454843521118164, + "learning_rate": 1.1711948834045437e-05, + "loss": 0.2097, + "step": 16951 + }, + { + "epoch": 46.19073569482289, + "grad_norm": 5.715302467346191, + "learning_rate": 1.1711079360849086e-05, + "loss": 0.1199, + "step": 16952 + }, + { + "epoch": 46.19346049046322, + "grad_norm": 5.379823207855225, + "learning_rate": 1.1710209874326905e-05, + "loss": 0.2381, + "step": 16953 + }, + { + "epoch": 46.19618528610354, + "grad_norm": 4.871223449707031, + "learning_rate": 1.1709340374485667e-05, + "loss": 0.1482, + "step": 16954 + }, + { + "epoch": 46.19891008174387, + "grad_norm": 5.154715538024902, + "learning_rate": 1.170847086133214e-05, + "loss": 0.2239, + "step": 16955 + }, + { + "epoch": 46.201634877384194, + "grad_norm": 7.11883020401001, + "learning_rate": 1.1707601334873097e-05, + "loss": 0.1468, + "step": 16956 + }, + { + "epoch": 46.20435967302452, + "grad_norm": 5.708817481994629, + "learning_rate": 1.1706731795115309e-05, + "loss": 0.2822, + "step": 16957 + }, + { + "epoch": 46.20708446866485, + "grad_norm": 5.6825971603393555, + "learning_rate": 1.1705862242065549e-05, + "loss": 0.2883, + "step": 16958 + }, + { + "epoch": 46.20980926430518, + "grad_norm": 6.1116766929626465, + "learning_rate": 1.1704992675730588e-05, + "loss": 0.2028, + "step": 16959 + }, + { + "epoch": 46.212534059945504, + "grad_norm": 4.810726642608643, + "learning_rate": 1.17041230961172e-05, + "loss": 0.181, + "step": 16960 + }, + { + "epoch": 46.21525885558583, + "grad_norm": 4.37108850479126, + "learning_rate": 1.1703253503232152e-05, + "loss": 0.1972, + "step": 16961 + }, + { + "epoch": 46.217983651226156, + "grad_norm": 6.069670677185059, + "learning_rate": 1.1702383897082229e-05, + "loss": 0.1389, + "step": 16962 + }, + { + "epoch": 46.22070844686648, + "grad_norm": 4.703593730926514, + "learning_rate": 1.1701514277674186e-05, + "loss": 0.4329, + "step": 16963 + }, + { + "epoch": 46.223433242506815, + "grad_norm": 5.444170951843262, + "learning_rate": 1.1700644645014812e-05, + "loss": 0.1443, + "step": 16964 + }, + { + "epoch": 46.22615803814714, + "grad_norm": 5.546870231628418, + "learning_rate": 1.1699774999110867e-05, + "loss": 0.1891, + "step": 16965 + }, + { + "epoch": 46.228882833787466, + "grad_norm": 4.24921178817749, + "learning_rate": 1.1698905339969133e-05, + "loss": 0.3073, + "step": 16966 + }, + { + "epoch": 46.23160762942779, + "grad_norm": 5.065343856811523, + "learning_rate": 1.1698035667596378e-05, + "loss": 0.1351, + "step": 16967 + }, + { + "epoch": 46.23433242506812, + "grad_norm": 5.259772300720215, + "learning_rate": 1.1697165981999375e-05, + "loss": 0.2985, + "step": 16968 + }, + { + "epoch": 46.237057220708444, + "grad_norm": 12.561153411865234, + "learning_rate": 1.1696296283184896e-05, + "loss": 0.2392, + "step": 16969 + }, + { + "epoch": 46.23978201634878, + "grad_norm": 6.302806854248047, + "learning_rate": 1.1695426571159718e-05, + "loss": 0.2354, + "step": 16970 + }, + { + "epoch": 46.2425068119891, + "grad_norm": 6.131228446960449, + "learning_rate": 1.1694556845930611e-05, + "loss": 0.2924, + "step": 16971 + }, + { + "epoch": 46.24523160762943, + "grad_norm": 4.117089748382568, + "learning_rate": 1.1693687107504352e-05, + "loss": 0.1476, + "step": 16972 + }, + { + "epoch": 46.247956403269754, + "grad_norm": 4.978460311889648, + "learning_rate": 1.169281735588771e-05, + "loss": 0.1621, + "step": 16973 + }, + { + "epoch": 46.25068119891008, + "grad_norm": 7.9032721519470215, + "learning_rate": 1.1691947591087464e-05, + "loss": 0.1782, + "step": 16974 + }, + { + "epoch": 46.253405994550405, + "grad_norm": 5.891063213348389, + "learning_rate": 1.1691077813110383e-05, + "loss": 0.1756, + "step": 16975 + }, + { + "epoch": 46.25613079019074, + "grad_norm": 5.366761207580566, + "learning_rate": 1.1690208021963243e-05, + "loss": 0.4038, + "step": 16976 + }, + { + "epoch": 46.258855585831064, + "grad_norm": 5.27750825881958, + "learning_rate": 1.1689338217652818e-05, + "loss": 0.1177, + "step": 16977 + }, + { + "epoch": 46.26158038147139, + "grad_norm": 5.0216288566589355, + "learning_rate": 1.1688468400185877e-05, + "loss": 0.3339, + "step": 16978 + }, + { + "epoch": 46.264305177111716, + "grad_norm": 4.817869663238525, + "learning_rate": 1.16875985695692e-05, + "loss": 0.0802, + "step": 16979 + }, + { + "epoch": 46.26702997275204, + "grad_norm": 5.414669513702393, + "learning_rate": 1.1686728725809564e-05, + "loss": 0.1339, + "step": 16980 + }, + { + "epoch": 46.26975476839237, + "grad_norm": 5.407716274261475, + "learning_rate": 1.1685858868913736e-05, + "loss": 0.2522, + "step": 16981 + }, + { + "epoch": 46.2724795640327, + "grad_norm": 4.433934688568115, + "learning_rate": 1.1684988998888494e-05, + "loss": 0.2352, + "step": 16982 + }, + { + "epoch": 46.275204359673026, + "grad_norm": 4.624395370483398, + "learning_rate": 1.168411911574061e-05, + "loss": 0.238, + "step": 16983 + }, + { + "epoch": 46.27792915531335, + "grad_norm": 5.083333492279053, + "learning_rate": 1.1683249219476864e-05, + "loss": 0.1794, + "step": 16984 + }, + { + "epoch": 46.28065395095368, + "grad_norm": 5.640879154205322, + "learning_rate": 1.1682379310104023e-05, + "loss": 0.1328, + "step": 16985 + }, + { + "epoch": 46.283378746594, + "grad_norm": 7.7753424644470215, + "learning_rate": 1.1681509387628871e-05, + "loss": 0.1967, + "step": 16986 + }, + { + "epoch": 46.28610354223433, + "grad_norm": 6.597271919250488, + "learning_rate": 1.1680639452058172e-05, + "loss": 0.3071, + "step": 16987 + }, + { + "epoch": 46.28882833787466, + "grad_norm": 4.760594844818115, + "learning_rate": 1.1679769503398712e-05, + "loss": 0.226, + "step": 16988 + }, + { + "epoch": 46.29155313351499, + "grad_norm": 4.12913179397583, + "learning_rate": 1.1678899541657258e-05, + "loss": 0.1955, + "step": 16989 + }, + { + "epoch": 46.294277929155314, + "grad_norm": 5.745121002197266, + "learning_rate": 1.1678029566840593e-05, + "loss": 0.1848, + "step": 16990 + }, + { + "epoch": 46.29700272479564, + "grad_norm": 8.40665054321289, + "learning_rate": 1.1677159578955481e-05, + "loss": 0.1738, + "step": 16991 + }, + { + "epoch": 46.299727520435965, + "grad_norm": 8.361091613769531, + "learning_rate": 1.167628957800871e-05, + "loss": 0.321, + "step": 16992 + }, + { + "epoch": 46.30245231607629, + "grad_norm": 7.860576152801514, + "learning_rate": 1.1675419564007046e-05, + "loss": 0.1078, + "step": 16993 + }, + { + "epoch": 46.305177111716624, + "grad_norm": 5.239068508148193, + "learning_rate": 1.167454953695727e-05, + "loss": 0.1725, + "step": 16994 + }, + { + "epoch": 46.30790190735695, + "grad_norm": 5.734799861907959, + "learning_rate": 1.1673679496866155e-05, + "loss": 0.0986, + "step": 16995 + }, + { + "epoch": 46.310626702997276, + "grad_norm": 12.02059268951416, + "learning_rate": 1.167280944374048e-05, + "loss": 0.1673, + "step": 16996 + }, + { + "epoch": 46.3133514986376, + "grad_norm": 6.198795795440674, + "learning_rate": 1.1671939377587018e-05, + "loss": 0.1999, + "step": 16997 + }, + { + "epoch": 46.31607629427793, + "grad_norm": 6.111451625823975, + "learning_rate": 1.1671069298412548e-05, + "loss": 0.1847, + "step": 16998 + }, + { + "epoch": 46.31880108991825, + "grad_norm": 7.072170734405518, + "learning_rate": 1.167019920622384e-05, + "loss": 0.1806, + "step": 16999 + }, + { + "epoch": 46.321525885558586, + "grad_norm": 6.404435634613037, + "learning_rate": 1.1669329101027677e-05, + "loss": 0.1762, + "step": 17000 + }, + { + "epoch": 46.32425068119891, + "grad_norm": 5.490909576416016, + "learning_rate": 1.166845898283083e-05, + "loss": 0.2574, + "step": 17001 + }, + { + "epoch": 46.32697547683924, + "grad_norm": 4.518784523010254, + "learning_rate": 1.1667588851640084e-05, + "loss": 0.1352, + "step": 17002 + }, + { + "epoch": 46.32970027247956, + "grad_norm": 5.648974895477295, + "learning_rate": 1.1666718707462203e-05, + "loss": 0.1929, + "step": 17003 + }, + { + "epoch": 46.33242506811989, + "grad_norm": 4.958102703094482, + "learning_rate": 1.1665848550303972e-05, + "loss": 0.2085, + "step": 17004 + }, + { + "epoch": 46.335149863760215, + "grad_norm": 5.627400875091553, + "learning_rate": 1.1664978380172167e-05, + "loss": 0.1024, + "step": 17005 + }, + { + "epoch": 46.33787465940055, + "grad_norm": 4.282506465911865, + "learning_rate": 1.1664108197073566e-05, + "loss": 0.1202, + "step": 17006 + }, + { + "epoch": 46.34059945504087, + "grad_norm": 14.788066864013672, + "learning_rate": 1.166323800101494e-05, + "loss": 0.1317, + "step": 17007 + }, + { + "epoch": 46.3433242506812, + "grad_norm": 13.455382347106934, + "learning_rate": 1.1662367792003075e-05, + "loss": 0.1522, + "step": 17008 + }, + { + "epoch": 46.346049046321525, + "grad_norm": 4.96815299987793, + "learning_rate": 1.1661497570044737e-05, + "loss": 0.1612, + "step": 17009 + }, + { + "epoch": 46.34877384196185, + "grad_norm": 7.081682205200195, + "learning_rate": 1.1660627335146714e-05, + "loss": 0.2652, + "step": 17010 + }, + { + "epoch": 46.35149863760218, + "grad_norm": 4.942091941833496, + "learning_rate": 1.1659757087315777e-05, + "loss": 0.1928, + "step": 17011 + }, + { + "epoch": 46.35422343324251, + "grad_norm": 5.042135715484619, + "learning_rate": 1.1658886826558709e-05, + "loss": 0.266, + "step": 17012 + }, + { + "epoch": 46.356948228882835, + "grad_norm": 6.583928108215332, + "learning_rate": 1.1658016552882279e-05, + "loss": 0.2129, + "step": 17013 + }, + { + "epoch": 46.35967302452316, + "grad_norm": 5.138932228088379, + "learning_rate": 1.1657146266293269e-05, + "loss": 0.1226, + "step": 17014 + }, + { + "epoch": 46.36239782016349, + "grad_norm": 5.067035675048828, + "learning_rate": 1.1656275966798458e-05, + "loss": 0.1469, + "step": 17015 + }, + { + "epoch": 46.36512261580381, + "grad_norm": 6.44582986831665, + "learning_rate": 1.1655405654404625e-05, + "loss": 0.3677, + "step": 17016 + }, + { + "epoch": 46.36784741144414, + "grad_norm": 5.958681106567383, + "learning_rate": 1.1654535329118545e-05, + "loss": 0.1352, + "step": 17017 + }, + { + "epoch": 46.37057220708447, + "grad_norm": 5.4483819007873535, + "learning_rate": 1.1653664990947e-05, + "loss": 0.1605, + "step": 17018 + }, + { + "epoch": 46.3732970027248, + "grad_norm": 5.049631595611572, + "learning_rate": 1.165279463989676e-05, + "loss": 0.2097, + "step": 17019 + }, + { + "epoch": 46.37602179836512, + "grad_norm": 6.19951868057251, + "learning_rate": 1.1651924275974613e-05, + "loss": 0.1634, + "step": 17020 + }, + { + "epoch": 46.37874659400545, + "grad_norm": 5.297245979309082, + "learning_rate": 1.165105389918733e-05, + "loss": 0.1602, + "step": 17021 + }, + { + "epoch": 46.381471389645775, + "grad_norm": 5.394540309906006, + "learning_rate": 1.1650183509541693e-05, + "loss": 0.1449, + "step": 17022 + }, + { + "epoch": 46.3841961852861, + "grad_norm": 4.56392765045166, + "learning_rate": 1.1649313107044483e-05, + "loss": 0.1062, + "step": 17023 + }, + { + "epoch": 46.38692098092643, + "grad_norm": 4.668919086456299, + "learning_rate": 1.164844269170247e-05, + "loss": 0.1717, + "step": 17024 + }, + { + "epoch": 46.38964577656676, + "grad_norm": 5.602856636047363, + "learning_rate": 1.1647572263522445e-05, + "loss": 0.1638, + "step": 17025 + }, + { + "epoch": 46.392370572207085, + "grad_norm": 5.524237155914307, + "learning_rate": 1.1646701822511173e-05, + "loss": 0.1851, + "step": 17026 + }, + { + "epoch": 46.39509536784741, + "grad_norm": 9.044189453125, + "learning_rate": 1.1645831368675445e-05, + "loss": 0.1613, + "step": 17027 + }, + { + "epoch": 46.39782016348774, + "grad_norm": 5.674327373504639, + "learning_rate": 1.1644960902022033e-05, + "loss": 0.1425, + "step": 17028 + }, + { + "epoch": 46.40054495912806, + "grad_norm": 4.188699245452881, + "learning_rate": 1.1644090422557719e-05, + "loss": 0.2439, + "step": 17029 + }, + { + "epoch": 46.403269754768395, + "grad_norm": 5.922665119171143, + "learning_rate": 1.1643219930289282e-05, + "loss": 0.1247, + "step": 17030 + }, + { + "epoch": 46.40599455040872, + "grad_norm": 6.207821846008301, + "learning_rate": 1.1642349425223502e-05, + "loss": 0.1871, + "step": 17031 + }, + { + "epoch": 46.40871934604905, + "grad_norm": 5.177120685577393, + "learning_rate": 1.1641478907367157e-05, + "loss": 0.1719, + "step": 17032 + }, + { + "epoch": 46.41144414168937, + "grad_norm": 7.872409820556641, + "learning_rate": 1.1640608376727028e-05, + "loss": 0.0984, + "step": 17033 + }, + { + "epoch": 46.4141689373297, + "grad_norm": 5.78146505355835, + "learning_rate": 1.163973783330989e-05, + "loss": 0.1353, + "step": 17034 + }, + { + "epoch": 46.416893732970024, + "grad_norm": 4.18654727935791, + "learning_rate": 1.1638867277122532e-05, + "loss": 0.1558, + "step": 17035 + }, + { + "epoch": 46.41961852861036, + "grad_norm": 5.658872127532959, + "learning_rate": 1.1637996708171725e-05, + "loss": 0.1506, + "step": 17036 + }, + { + "epoch": 46.42234332425068, + "grad_norm": 4.325180530548096, + "learning_rate": 1.163712612646425e-05, + "loss": 0.2835, + "step": 17037 + }, + { + "epoch": 46.42506811989101, + "grad_norm": 6.2680277824401855, + "learning_rate": 1.1636255532006892e-05, + "loss": 0.1261, + "step": 17038 + }, + { + "epoch": 46.427792915531334, + "grad_norm": 5.596966743469238, + "learning_rate": 1.163538492480643e-05, + "loss": 0.1306, + "step": 17039 + }, + { + "epoch": 46.43051771117166, + "grad_norm": 7.976938724517822, + "learning_rate": 1.1634514304869641e-05, + "loss": 0.2746, + "step": 17040 + }, + { + "epoch": 46.433242506811986, + "grad_norm": 4.647032737731934, + "learning_rate": 1.163364367220331e-05, + "loss": 0.1492, + "step": 17041 + }, + { + "epoch": 46.43596730245232, + "grad_norm": 4.698653221130371, + "learning_rate": 1.1632773026814213e-05, + "loss": 0.2278, + "step": 17042 + }, + { + "epoch": 46.438692098092645, + "grad_norm": 6.693230628967285, + "learning_rate": 1.1631902368709132e-05, + "loss": 0.1462, + "step": 17043 + }, + { + "epoch": 46.44141689373297, + "grad_norm": 5.366065502166748, + "learning_rate": 1.1631031697894846e-05, + "loss": 0.1761, + "step": 17044 + }, + { + "epoch": 46.444141689373296, + "grad_norm": 5.929636001586914, + "learning_rate": 1.1630161014378141e-05, + "loss": 0.1365, + "step": 17045 + }, + { + "epoch": 46.44686648501362, + "grad_norm": 9.201284408569336, + "learning_rate": 1.1629290318165792e-05, + "loss": 0.1515, + "step": 17046 + }, + { + "epoch": 46.44959128065395, + "grad_norm": 6.123513221740723, + "learning_rate": 1.1628419609264582e-05, + "loss": 0.2385, + "step": 17047 + }, + { + "epoch": 46.45231607629428, + "grad_norm": 5.181742191314697, + "learning_rate": 1.1627548887681292e-05, + "loss": 0.113, + "step": 17048 + }, + { + "epoch": 46.45504087193461, + "grad_norm": 5.155125141143799, + "learning_rate": 1.1626678153422708e-05, + "loss": 0.2259, + "step": 17049 + }, + { + "epoch": 46.45776566757493, + "grad_norm": 5.5835371017456055, + "learning_rate": 1.1625807406495605e-05, + "loss": 0.1088, + "step": 17050 + }, + { + "epoch": 46.46049046321526, + "grad_norm": 5.033536434173584, + "learning_rate": 1.1624936646906766e-05, + "loss": 0.1226, + "step": 17051 + }, + { + "epoch": 46.463215258855584, + "grad_norm": 4.7039618492126465, + "learning_rate": 1.1624065874662971e-05, + "loss": 0.0793, + "step": 17052 + }, + { + "epoch": 46.46594005449591, + "grad_norm": 5.142733097076416, + "learning_rate": 1.1623195089771005e-05, + "loss": 0.2472, + "step": 17053 + }, + { + "epoch": 46.46866485013624, + "grad_norm": 4.57804012298584, + "learning_rate": 1.1622324292237645e-05, + "loss": 0.1567, + "step": 17054 + }, + { + "epoch": 46.47138964577657, + "grad_norm": 5.453049182891846, + "learning_rate": 1.162145348206968e-05, + "loss": 0.2081, + "step": 17055 + }, + { + "epoch": 46.474114441416894, + "grad_norm": 7.133620738983154, + "learning_rate": 1.1620582659273882e-05, + "loss": 0.1425, + "step": 17056 + }, + { + "epoch": 46.47683923705722, + "grad_norm": 5.547028541564941, + "learning_rate": 1.1619711823857045e-05, + "loss": 0.1772, + "step": 17057 + }, + { + "epoch": 46.479564032697546, + "grad_norm": 5.2422919273376465, + "learning_rate": 1.161884097582594e-05, + "loss": 0.1627, + "step": 17058 + }, + { + "epoch": 46.48228882833787, + "grad_norm": 4.932727813720703, + "learning_rate": 1.1617970115187356e-05, + "loss": 0.1214, + "step": 17059 + }, + { + "epoch": 46.485013623978205, + "grad_norm": 4.722919464111328, + "learning_rate": 1.1617099241948072e-05, + "loss": 0.1622, + "step": 17060 + }, + { + "epoch": 46.48773841961853, + "grad_norm": 4.650905132293701, + "learning_rate": 1.1616228356114871e-05, + "loss": 0.1286, + "step": 17061 + }, + { + "epoch": 46.490463215258856, + "grad_norm": 6.387599468231201, + "learning_rate": 1.1615357457694534e-05, + "loss": 0.1863, + "step": 17062 + }, + { + "epoch": 46.49318801089918, + "grad_norm": 6.3198113441467285, + "learning_rate": 1.1614486546693848e-05, + "loss": 0.2276, + "step": 17063 + }, + { + "epoch": 46.49591280653951, + "grad_norm": 13.79389762878418, + "learning_rate": 1.1613615623119587e-05, + "loss": 0.1833, + "step": 17064 + }, + { + "epoch": 46.49863760217983, + "grad_norm": 5.718416690826416, + "learning_rate": 1.1612744686978545e-05, + "loss": 0.3176, + "step": 17065 + }, + { + "epoch": 46.50136239782017, + "grad_norm": 4.466360569000244, + "learning_rate": 1.1611873738277499e-05, + "loss": 0.1387, + "step": 17066 + }, + { + "epoch": 46.50408719346049, + "grad_norm": 16.300098419189453, + "learning_rate": 1.1611002777023233e-05, + "loss": 0.2676, + "step": 17067 + }, + { + "epoch": 46.50681198910082, + "grad_norm": 6.630517482757568, + "learning_rate": 1.1610131803222527e-05, + "loss": 0.1631, + "step": 17068 + }, + { + "epoch": 46.509536784741144, + "grad_norm": 6.6345977783203125, + "learning_rate": 1.1609260816882167e-05, + "loss": 0.1563, + "step": 17069 + }, + { + "epoch": 46.51226158038147, + "grad_norm": 6.348479747772217, + "learning_rate": 1.1608389818008933e-05, + "loss": 0.2277, + "step": 17070 + }, + { + "epoch": 46.514986376021795, + "grad_norm": 6.026793003082275, + "learning_rate": 1.1607518806609614e-05, + "loss": 0.1413, + "step": 17071 + }, + { + "epoch": 46.51771117166213, + "grad_norm": 5.881906509399414, + "learning_rate": 1.160664778269099e-05, + "loss": 0.2329, + "step": 17072 + }, + { + "epoch": 46.520435967302454, + "grad_norm": 5.612852573394775, + "learning_rate": 1.1605776746259844e-05, + "loss": 0.2504, + "step": 17073 + }, + { + "epoch": 46.52316076294278, + "grad_norm": 6.368758201599121, + "learning_rate": 1.1604905697322959e-05, + "loss": 0.2357, + "step": 17074 + }, + { + "epoch": 46.525885558583106, + "grad_norm": 4.724337100982666, + "learning_rate": 1.1604034635887123e-05, + "loss": 0.1575, + "step": 17075 + }, + { + "epoch": 46.52861035422343, + "grad_norm": 6.717184543609619, + "learning_rate": 1.1603163561959114e-05, + "loss": 0.2689, + "step": 17076 + }, + { + "epoch": 46.53133514986376, + "grad_norm": 5.42552375793457, + "learning_rate": 1.1602292475545722e-05, + "loss": 0.1152, + "step": 17077 + }, + { + "epoch": 46.53405994550409, + "grad_norm": 6.456541538238525, + "learning_rate": 1.1601421376653725e-05, + "loss": 0.2662, + "step": 17078 + }, + { + "epoch": 46.536784741144416, + "grad_norm": 7.436701774597168, + "learning_rate": 1.1600550265289913e-05, + "loss": 0.2448, + "step": 17079 + }, + { + "epoch": 46.53950953678474, + "grad_norm": 6.276247024536133, + "learning_rate": 1.1599679141461064e-05, + "loss": 0.1249, + "step": 17080 + }, + { + "epoch": 46.54223433242507, + "grad_norm": 5.149324893951416, + "learning_rate": 1.1598808005173967e-05, + "loss": 0.2059, + "step": 17081 + }, + { + "epoch": 46.54495912806539, + "grad_norm": 5.121246814727783, + "learning_rate": 1.15979368564354e-05, + "loss": 0.1415, + "step": 17082 + }, + { + "epoch": 46.54768392370572, + "grad_norm": 3.952131509780884, + "learning_rate": 1.1597065695252158e-05, + "loss": 0.1029, + "step": 17083 + }, + { + "epoch": 46.55040871934605, + "grad_norm": 5.1012282371521, + "learning_rate": 1.1596194521631018e-05, + "loss": 0.1665, + "step": 17084 + }, + { + "epoch": 46.55313351498638, + "grad_norm": 4.166836738586426, + "learning_rate": 1.159532333557877e-05, + "loss": 0.0947, + "step": 17085 + }, + { + "epoch": 46.555858310626704, + "grad_norm": 5.417153835296631, + "learning_rate": 1.159445213710219e-05, + "loss": 0.144, + "step": 17086 + }, + { + "epoch": 46.55858310626703, + "grad_norm": 4.658019065856934, + "learning_rate": 1.159358092620807e-05, + "loss": 0.1058, + "step": 17087 + }, + { + "epoch": 46.561307901907355, + "grad_norm": 6.91645622253418, + "learning_rate": 1.1592709702903193e-05, + "loss": 0.1344, + "step": 17088 + }, + { + "epoch": 46.56403269754768, + "grad_norm": 6.4773406982421875, + "learning_rate": 1.1591838467194345e-05, + "loss": 0.238, + "step": 17089 + }, + { + "epoch": 46.566757493188014, + "grad_norm": 5.077652454376221, + "learning_rate": 1.1590967219088305e-05, + "loss": 0.2961, + "step": 17090 + }, + { + "epoch": 46.56948228882834, + "grad_norm": 7.711599349975586, + "learning_rate": 1.159009595859187e-05, + "loss": 0.2155, + "step": 17091 + }, + { + "epoch": 46.572207084468666, + "grad_norm": 5.8498430252075195, + "learning_rate": 1.1589224685711816e-05, + "loss": 0.1707, + "step": 17092 + }, + { + "epoch": 46.57493188010899, + "grad_norm": 7.059077739715576, + "learning_rate": 1.1588353400454933e-05, + "loss": 0.1457, + "step": 17093 + }, + { + "epoch": 46.57765667574932, + "grad_norm": 4.909677028656006, + "learning_rate": 1.1587482102828002e-05, + "loss": 0.2807, + "step": 17094 + }, + { + "epoch": 46.58038147138964, + "grad_norm": 5.569499492645264, + "learning_rate": 1.1586610792837813e-05, + "loss": 0.3366, + "step": 17095 + }, + { + "epoch": 46.583106267029976, + "grad_norm": 4.240732669830322, + "learning_rate": 1.158573947049115e-05, + "loss": 0.147, + "step": 17096 + }, + { + "epoch": 46.5858310626703, + "grad_norm": 5.880338668823242, + "learning_rate": 1.1584868135794801e-05, + "loss": 0.256, + "step": 17097 + }, + { + "epoch": 46.58855585831063, + "grad_norm": 5.3914875984191895, + "learning_rate": 1.1583996788755548e-05, + "loss": 0.1347, + "step": 17098 + }, + { + "epoch": 46.59128065395095, + "grad_norm": 7.002774715423584, + "learning_rate": 1.1583125429380177e-05, + "loss": 0.1488, + "step": 17099 + }, + { + "epoch": 46.59400544959128, + "grad_norm": 4.866771697998047, + "learning_rate": 1.1582254057675481e-05, + "loss": 0.1221, + "step": 17100 + }, + { + "epoch": 46.596730245231605, + "grad_norm": 5.560983657836914, + "learning_rate": 1.1581382673648238e-05, + "loss": 0.2322, + "step": 17101 + }, + { + "epoch": 46.59945504087194, + "grad_norm": 5.6942620277404785, + "learning_rate": 1.1580511277305238e-05, + "loss": 0.1264, + "step": 17102 + }, + { + "epoch": 46.60217983651226, + "grad_norm": 5.447231769561768, + "learning_rate": 1.1579639868653267e-05, + "loss": 0.1602, + "step": 17103 + }, + { + "epoch": 46.60490463215259, + "grad_norm": 5.0954179763793945, + "learning_rate": 1.1578768447699111e-05, + "loss": 0.2193, + "step": 17104 + }, + { + "epoch": 46.607629427792915, + "grad_norm": 4.641750812530518, + "learning_rate": 1.1577897014449562e-05, + "loss": 0.1765, + "step": 17105 + }, + { + "epoch": 46.61035422343324, + "grad_norm": 4.832330226898193, + "learning_rate": 1.1577025568911395e-05, + "loss": 0.1841, + "step": 17106 + }, + { + "epoch": 46.61307901907357, + "grad_norm": 5.537833213806152, + "learning_rate": 1.1576154111091407e-05, + "loss": 0.257, + "step": 17107 + }, + { + "epoch": 46.6158038147139, + "grad_norm": 7.282318115234375, + "learning_rate": 1.157528264099638e-05, + "loss": 0.2022, + "step": 17108 + }, + { + "epoch": 46.618528610354225, + "grad_norm": 9.270844459533691, + "learning_rate": 1.1574411158633105e-05, + "loss": 0.2586, + "step": 17109 + }, + { + "epoch": 46.62125340599455, + "grad_norm": 5.545162677764893, + "learning_rate": 1.1573539664008367e-05, + "loss": 0.1764, + "step": 17110 + }, + { + "epoch": 46.62397820163488, + "grad_norm": 4.650853633880615, + "learning_rate": 1.157266815712895e-05, + "loss": 0.0835, + "step": 17111 + }, + { + "epoch": 46.6267029972752, + "grad_norm": 6.177081108093262, + "learning_rate": 1.1571796638001644e-05, + "loss": 0.1656, + "step": 17112 + }, + { + "epoch": 46.62942779291553, + "grad_norm": 6.224137306213379, + "learning_rate": 1.1570925106633237e-05, + "loss": 0.1861, + "step": 17113 + }, + { + "epoch": 46.63215258855586, + "grad_norm": 7.899147987365723, + "learning_rate": 1.1570053563030516e-05, + "loss": 0.1234, + "step": 17114 + }, + { + "epoch": 46.63487738419619, + "grad_norm": 4.292054176330566, + "learning_rate": 1.156918200720027e-05, + "loss": 0.1391, + "step": 17115 + }, + { + "epoch": 46.63760217983651, + "grad_norm": 6.130233287811279, + "learning_rate": 1.1568310439149281e-05, + "loss": 0.1378, + "step": 17116 + }, + { + "epoch": 46.64032697547684, + "grad_norm": 5.36210823059082, + "learning_rate": 1.1567438858884344e-05, + "loss": 0.2174, + "step": 17117 + }, + { + "epoch": 46.643051771117165, + "grad_norm": 4.932548999786377, + "learning_rate": 1.1566567266412243e-05, + "loss": 0.2543, + "step": 17118 + }, + { + "epoch": 46.64577656675749, + "grad_norm": 10.372445106506348, + "learning_rate": 1.1565695661739767e-05, + "loss": 0.2312, + "step": 17119 + }, + { + "epoch": 46.64850136239782, + "grad_norm": 6.825093746185303, + "learning_rate": 1.1564824044873704e-05, + "loss": 0.1279, + "step": 17120 + }, + { + "epoch": 46.65122615803815, + "grad_norm": 6.031970500946045, + "learning_rate": 1.156395241582084e-05, + "loss": 0.1711, + "step": 17121 + }, + { + "epoch": 46.653950953678475, + "grad_norm": 4.9874162673950195, + "learning_rate": 1.1563080774587967e-05, + "loss": 0.1428, + "step": 17122 + }, + { + "epoch": 46.6566757493188, + "grad_norm": 5.995129585266113, + "learning_rate": 1.1562209121181869e-05, + "loss": 0.1624, + "step": 17123 + }, + { + "epoch": 46.65940054495913, + "grad_norm": 4.370136737823486, + "learning_rate": 1.1561337455609336e-05, + "loss": 0.1771, + "step": 17124 + }, + { + "epoch": 46.66212534059945, + "grad_norm": 5.784974575042725, + "learning_rate": 1.1560465777877159e-05, + "loss": 0.3389, + "step": 17125 + }, + { + "epoch": 46.664850136239785, + "grad_norm": 5.641836643218994, + "learning_rate": 1.1559594087992126e-05, + "loss": 0.1953, + "step": 17126 + }, + { + "epoch": 46.66757493188011, + "grad_norm": 4.9505839347839355, + "learning_rate": 1.1558722385961022e-05, + "loss": 0.1016, + "step": 17127 + }, + { + "epoch": 46.67029972752044, + "grad_norm": 6.375181198120117, + "learning_rate": 1.1557850671790638e-05, + "loss": 0.4016, + "step": 17128 + }, + { + "epoch": 46.67302452316076, + "grad_norm": 6.434603214263916, + "learning_rate": 1.1556978945487764e-05, + "loss": 0.2028, + "step": 17129 + }, + { + "epoch": 46.67574931880109, + "grad_norm": 5.105738162994385, + "learning_rate": 1.1556107207059191e-05, + "loss": 0.1713, + "step": 17130 + }, + { + "epoch": 46.678474114441414, + "grad_norm": 6.207189083099365, + "learning_rate": 1.15552354565117e-05, + "loss": 0.2828, + "step": 17131 + }, + { + "epoch": 46.68119891008175, + "grad_norm": 5.005661487579346, + "learning_rate": 1.1554363693852088e-05, + "loss": 0.3001, + "step": 17132 + }, + { + "epoch": 46.68392370572207, + "grad_norm": 4.64664888381958, + "learning_rate": 1.155349191908714e-05, + "loss": 0.1309, + "step": 17133 + }, + { + "epoch": 46.6866485013624, + "grad_norm": 5.883870601654053, + "learning_rate": 1.1552620132223649e-05, + "loss": 0.1508, + "step": 17134 + }, + { + "epoch": 46.689373297002724, + "grad_norm": 6.420288562774658, + "learning_rate": 1.1551748333268402e-05, + "loss": 0.1644, + "step": 17135 + }, + { + "epoch": 46.69209809264305, + "grad_norm": 7.443354606628418, + "learning_rate": 1.155087652222819e-05, + "loss": 0.2949, + "step": 17136 + }, + { + "epoch": 46.694822888283376, + "grad_norm": 4.831696510314941, + "learning_rate": 1.1550004699109797e-05, + "loss": 0.1808, + "step": 17137 + }, + { + "epoch": 46.69754768392371, + "grad_norm": 5.709593772888184, + "learning_rate": 1.1549132863920023e-05, + "loss": 0.2093, + "step": 17138 + }, + { + "epoch": 46.700272479564035, + "grad_norm": 4.546253204345703, + "learning_rate": 1.154826101666565e-05, + "loss": 0.1078, + "step": 17139 + }, + { + "epoch": 46.70299727520436, + "grad_norm": 6.26744270324707, + "learning_rate": 1.154738915735347e-05, + "loss": 0.2678, + "step": 17140 + }, + { + "epoch": 46.705722070844686, + "grad_norm": 4.443904399871826, + "learning_rate": 1.1546517285990272e-05, + "loss": 0.1163, + "step": 17141 + }, + { + "epoch": 46.70844686648501, + "grad_norm": 6.217555522918701, + "learning_rate": 1.1545645402582845e-05, + "loss": 0.2317, + "step": 17142 + }, + { + "epoch": 46.71117166212534, + "grad_norm": 5.766835689544678, + "learning_rate": 1.1544773507137985e-05, + "loss": 0.1799, + "step": 17143 + }, + { + "epoch": 46.71389645776567, + "grad_norm": 5.947284698486328, + "learning_rate": 1.1543901599662476e-05, + "loss": 0.1737, + "step": 17144 + }, + { + "epoch": 46.716621253406, + "grad_norm": 5.5444254875183105, + "learning_rate": 1.1543029680163114e-05, + "loss": 0.1088, + "step": 17145 + }, + { + "epoch": 46.71934604904632, + "grad_norm": 5.982610702514648, + "learning_rate": 1.1542157748646687e-05, + "loss": 0.1342, + "step": 17146 + }, + { + "epoch": 46.72207084468665, + "grad_norm": 5.010898113250732, + "learning_rate": 1.1541285805119981e-05, + "loss": 0.2159, + "step": 17147 + }, + { + "epoch": 46.724795640326974, + "grad_norm": 5.242317199707031, + "learning_rate": 1.1540413849589795e-05, + "loss": 0.2223, + "step": 17148 + }, + { + "epoch": 46.7275204359673, + "grad_norm": 5.874389171600342, + "learning_rate": 1.1539541882062912e-05, + "loss": 0.1629, + "step": 17149 + }, + { + "epoch": 46.73024523160763, + "grad_norm": 5.2313151359558105, + "learning_rate": 1.1538669902546128e-05, + "loss": 0.1995, + "step": 17150 + }, + { + "epoch": 46.73297002724796, + "grad_norm": 4.858578681945801, + "learning_rate": 1.153779791104623e-05, + "loss": 0.2223, + "step": 17151 + }, + { + "epoch": 46.735694822888284, + "grad_norm": 6.7911601066589355, + "learning_rate": 1.1536925907570017e-05, + "loss": 0.1924, + "step": 17152 + }, + { + "epoch": 46.73841961852861, + "grad_norm": 5.80068302154541, + "learning_rate": 1.1536053892124271e-05, + "loss": 0.1387, + "step": 17153 + }, + { + "epoch": 46.741144414168936, + "grad_norm": 6.854654788970947, + "learning_rate": 1.1535181864715787e-05, + "loss": 0.2084, + "step": 17154 + }, + { + "epoch": 46.74386920980926, + "grad_norm": 6.12240743637085, + "learning_rate": 1.1534309825351355e-05, + "loss": 0.1462, + "step": 17155 + }, + { + "epoch": 46.746594005449595, + "grad_norm": 4.873581409454346, + "learning_rate": 1.153343777403777e-05, + "loss": 0.2224, + "step": 17156 + }, + { + "epoch": 46.74931880108992, + "grad_norm": 4.991065502166748, + "learning_rate": 1.153256571078182e-05, + "loss": 0.3822, + "step": 17157 + }, + { + "epoch": 46.752043596730246, + "grad_norm": 5.345722198486328, + "learning_rate": 1.1531693635590297e-05, + "loss": 0.1559, + "step": 17158 + }, + { + "epoch": 46.75476839237057, + "grad_norm": 4.802318096160889, + "learning_rate": 1.153082154846999e-05, + "loss": 0.0878, + "step": 17159 + }, + { + "epoch": 46.7574931880109, + "grad_norm": 16.177759170532227, + "learning_rate": 1.15299494494277e-05, + "loss": 0.1817, + "step": 17160 + }, + { + "epoch": 46.76021798365122, + "grad_norm": 5.017428874969482, + "learning_rate": 1.152907733847021e-05, + "loss": 0.1373, + "step": 17161 + }, + { + "epoch": 46.762942779291556, + "grad_norm": 4.417322635650635, + "learning_rate": 1.1528205215604315e-05, + "loss": 0.1326, + "step": 17162 + }, + { + "epoch": 46.76566757493188, + "grad_norm": 5.657163143157959, + "learning_rate": 1.1527333080836807e-05, + "loss": 0.2708, + "step": 17163 + }, + { + "epoch": 46.76839237057221, + "grad_norm": 6.762208461761475, + "learning_rate": 1.152646093417448e-05, + "loss": 0.1091, + "step": 17164 + }, + { + "epoch": 46.771117166212534, + "grad_norm": 7.414045333862305, + "learning_rate": 1.1525588775624122e-05, + "loss": 0.1453, + "step": 17165 + }, + { + "epoch": 46.77384196185286, + "grad_norm": 4.256861209869385, + "learning_rate": 1.1524716605192527e-05, + "loss": 0.1232, + "step": 17166 + }, + { + "epoch": 46.776566757493185, + "grad_norm": 6.971860885620117, + "learning_rate": 1.152384442288649e-05, + "loss": 0.131, + "step": 17167 + }, + { + "epoch": 46.77929155313352, + "grad_norm": 5.602042198181152, + "learning_rate": 1.1522972228712799e-05, + "loss": 0.1672, + "step": 17168 + }, + { + "epoch": 46.782016348773844, + "grad_norm": 5.54409122467041, + "learning_rate": 1.1522100022678251e-05, + "loss": 0.2248, + "step": 17169 + }, + { + "epoch": 46.78474114441417, + "grad_norm": 4.696835994720459, + "learning_rate": 1.1521227804789638e-05, + "loss": 0.3056, + "step": 17170 + }, + { + "epoch": 46.787465940054496, + "grad_norm": 10.720602035522461, + "learning_rate": 1.1520355575053752e-05, + "loss": 0.2274, + "step": 17171 + }, + { + "epoch": 46.79019073569482, + "grad_norm": 5.531253337860107, + "learning_rate": 1.1519483333477385e-05, + "loss": 0.1606, + "step": 17172 + }, + { + "epoch": 46.79291553133515, + "grad_norm": 5.234531879425049, + "learning_rate": 1.151861108006733e-05, + "loss": 0.201, + "step": 17173 + }, + { + "epoch": 46.79564032697548, + "grad_norm": 7.15482759475708, + "learning_rate": 1.1517738814830383e-05, + "loss": 0.1566, + "step": 17174 + }, + { + "epoch": 46.798365122615806, + "grad_norm": 8.959362983703613, + "learning_rate": 1.1516866537773332e-05, + "loss": 0.2745, + "step": 17175 + }, + { + "epoch": 46.80108991825613, + "grad_norm": 11.96219539642334, + "learning_rate": 1.1515994248902976e-05, + "loss": 0.2502, + "step": 17176 + }, + { + "epoch": 46.80381471389646, + "grad_norm": 4.936633110046387, + "learning_rate": 1.1515121948226102e-05, + "loss": 0.1515, + "step": 17177 + }, + { + "epoch": 46.80653950953678, + "grad_norm": 6.5064568519592285, + "learning_rate": 1.1514249635749511e-05, + "loss": 0.2102, + "step": 17178 + }, + { + "epoch": 46.80926430517711, + "grad_norm": 7.871065139770508, + "learning_rate": 1.1513377311479989e-05, + "loss": 0.1696, + "step": 17179 + }, + { + "epoch": 46.81198910081744, + "grad_norm": 5.331688404083252, + "learning_rate": 1.1512504975424338e-05, + "loss": 0.1754, + "step": 17180 + }, + { + "epoch": 46.81471389645777, + "grad_norm": 5.36503791809082, + "learning_rate": 1.1511632627589343e-05, + "loss": 0.1506, + "step": 17181 + }, + { + "epoch": 46.817438692098094, + "grad_norm": 4.530533790588379, + "learning_rate": 1.1510760267981803e-05, + "loss": 0.4418, + "step": 17182 + }, + { + "epoch": 46.82016348773842, + "grad_norm": 4.749527931213379, + "learning_rate": 1.1509887896608509e-05, + "loss": 0.1638, + "step": 17183 + }, + { + "epoch": 46.822888283378745, + "grad_norm": 5.135331153869629, + "learning_rate": 1.150901551347626e-05, + "loss": 0.208, + "step": 17184 + }, + { + "epoch": 46.82561307901907, + "grad_norm": 6.572135925292969, + "learning_rate": 1.1508143118591843e-05, + "loss": 0.2513, + "step": 17185 + }, + { + "epoch": 46.828337874659404, + "grad_norm": 5.860957622528076, + "learning_rate": 1.1507270711962057e-05, + "loss": 0.2179, + "step": 17186 + }, + { + "epoch": 46.83106267029973, + "grad_norm": 4.241574764251709, + "learning_rate": 1.1506398293593697e-05, + "loss": 0.1535, + "step": 17187 + }, + { + "epoch": 46.833787465940055, + "grad_norm": 5.161186695098877, + "learning_rate": 1.1505525863493554e-05, + "loss": 0.1632, + "step": 17188 + }, + { + "epoch": 46.83651226158038, + "grad_norm": 5.187852382659912, + "learning_rate": 1.1504653421668424e-05, + "loss": 0.2404, + "step": 17189 + }, + { + "epoch": 46.83923705722071, + "grad_norm": 5.943875312805176, + "learning_rate": 1.1503780968125105e-05, + "loss": 0.2124, + "step": 17190 + }, + { + "epoch": 46.84196185286103, + "grad_norm": 8.500675201416016, + "learning_rate": 1.1502908502870382e-05, + "loss": 0.3095, + "step": 17191 + }, + { + "epoch": 46.844686648501366, + "grad_norm": 5.175501346588135, + "learning_rate": 1.1502036025911061e-05, + "loss": 0.1518, + "step": 17192 + }, + { + "epoch": 46.84741144414169, + "grad_norm": 6.077765941619873, + "learning_rate": 1.150116353725393e-05, + "loss": 0.148, + "step": 17193 + }, + { + "epoch": 46.85013623978202, + "grad_norm": 5.665741443634033, + "learning_rate": 1.1500291036905784e-05, + "loss": 0.1457, + "step": 17194 + }, + { + "epoch": 46.85286103542234, + "grad_norm": 5.57317590713501, + "learning_rate": 1.1499418524873422e-05, + "loss": 0.3059, + "step": 17195 + }, + { + "epoch": 46.85558583106267, + "grad_norm": 6.533044338226318, + "learning_rate": 1.1498546001163638e-05, + "loss": 0.1403, + "step": 17196 + }, + { + "epoch": 46.858310626702995, + "grad_norm": 6.13126802444458, + "learning_rate": 1.1497673465783224e-05, + "loss": 0.2343, + "step": 17197 + }, + { + "epoch": 46.86103542234333, + "grad_norm": 5.1407060623168945, + "learning_rate": 1.1496800918738977e-05, + "loss": 0.1411, + "step": 17198 + }, + { + "epoch": 46.86376021798365, + "grad_norm": 8.173460960388184, + "learning_rate": 1.1495928360037691e-05, + "loss": 0.3423, + "step": 17199 + }, + { + "epoch": 46.86648501362398, + "grad_norm": 55.221885681152344, + "learning_rate": 1.1495055789686167e-05, + "loss": 0.2487, + "step": 17200 + }, + { + "epoch": 46.869209809264305, + "grad_norm": 7.013250827789307, + "learning_rate": 1.1494183207691194e-05, + "loss": 0.2019, + "step": 17201 + }, + { + "epoch": 46.87193460490463, + "grad_norm": 6.132880687713623, + "learning_rate": 1.149331061405957e-05, + "loss": 0.3039, + "step": 17202 + }, + { + "epoch": 46.87465940054496, + "grad_norm": 5.015172481536865, + "learning_rate": 1.1492438008798093e-05, + "loss": 0.2782, + "step": 17203 + }, + { + "epoch": 46.87738419618529, + "grad_norm": 6.557510852813721, + "learning_rate": 1.1491565391913555e-05, + "loss": 0.2694, + "step": 17204 + }, + { + "epoch": 46.880108991825615, + "grad_norm": 5.464590549468994, + "learning_rate": 1.1490692763412757e-05, + "loss": 0.439, + "step": 17205 + }, + { + "epoch": 46.88283378746594, + "grad_norm": 6.250936985015869, + "learning_rate": 1.1489820123302487e-05, + "loss": 0.1631, + "step": 17206 + }, + { + "epoch": 46.88555858310627, + "grad_norm": 5.934758186340332, + "learning_rate": 1.148894747158955e-05, + "loss": 0.186, + "step": 17207 + }, + { + "epoch": 46.88828337874659, + "grad_norm": 6.300573825836182, + "learning_rate": 1.1488074808280736e-05, + "loss": 0.2138, + "step": 17208 + }, + { + "epoch": 46.89100817438692, + "grad_norm": 4.808372497558594, + "learning_rate": 1.1487202133382844e-05, + "loss": 0.1864, + "step": 17209 + }, + { + "epoch": 46.89373297002725, + "grad_norm": 6.009509086608887, + "learning_rate": 1.1486329446902669e-05, + "loss": 0.1864, + "step": 17210 + }, + { + "epoch": 46.89645776566758, + "grad_norm": 5.693976402282715, + "learning_rate": 1.1485456748847006e-05, + "loss": 0.2315, + "step": 17211 + }, + { + "epoch": 46.8991825613079, + "grad_norm": 5.321122646331787, + "learning_rate": 1.1484584039222655e-05, + "loss": 0.313, + "step": 17212 + }, + { + "epoch": 46.90190735694823, + "grad_norm": 5.934122085571289, + "learning_rate": 1.1483711318036414e-05, + "loss": 0.1433, + "step": 17213 + }, + { + "epoch": 46.904632152588555, + "grad_norm": 5.832672119140625, + "learning_rate": 1.1482838585295076e-05, + "loss": 0.156, + "step": 17214 + }, + { + "epoch": 46.90735694822888, + "grad_norm": 6.689321041107178, + "learning_rate": 1.1481965841005438e-05, + "loss": 0.2502, + "step": 17215 + }, + { + "epoch": 46.91008174386921, + "grad_norm": 6.460909843444824, + "learning_rate": 1.1481093085174298e-05, + "loss": 0.2513, + "step": 17216 + }, + { + "epoch": 46.91280653950954, + "grad_norm": 6.603307247161865, + "learning_rate": 1.1480220317808453e-05, + "loss": 0.3076, + "step": 17217 + }, + { + "epoch": 46.915531335149865, + "grad_norm": 7.377344131469727, + "learning_rate": 1.1479347538914698e-05, + "loss": 0.2427, + "step": 17218 + }, + { + "epoch": 46.91825613079019, + "grad_norm": 4.96650505065918, + "learning_rate": 1.1478474748499833e-05, + "loss": 0.1482, + "step": 17219 + }, + { + "epoch": 46.920980926430516, + "grad_norm": 6.873035907745361, + "learning_rate": 1.1477601946570651e-05, + "loss": 0.2652, + "step": 17220 + }, + { + "epoch": 46.92370572207084, + "grad_norm": 5.6309309005737305, + "learning_rate": 1.147672913313396e-05, + "loss": 0.185, + "step": 17221 + }, + { + "epoch": 46.926430517711175, + "grad_norm": 5.095126152038574, + "learning_rate": 1.1475856308196544e-05, + "loss": 0.204, + "step": 17222 + }, + { + "epoch": 46.9291553133515, + "grad_norm": 6.1172966957092285, + "learning_rate": 1.1474983471765211e-05, + "loss": 0.2061, + "step": 17223 + }, + { + "epoch": 46.93188010899183, + "grad_norm": 8.968783378601074, + "learning_rate": 1.147411062384675e-05, + "loss": 0.258, + "step": 17224 + }, + { + "epoch": 46.93460490463215, + "grad_norm": 8.455772399902344, + "learning_rate": 1.1473237764447967e-05, + "loss": 0.1856, + "step": 17225 + }, + { + "epoch": 46.93732970027248, + "grad_norm": 5.343738555908203, + "learning_rate": 1.1472364893575651e-05, + "loss": 0.1199, + "step": 17226 + }, + { + "epoch": 46.940054495912804, + "grad_norm": 5.777643203735352, + "learning_rate": 1.1471492011236609e-05, + "loss": 0.2207, + "step": 17227 + }, + { + "epoch": 46.94277929155314, + "grad_norm": 6.920644283294678, + "learning_rate": 1.1470619117437629e-05, + "loss": 0.2204, + "step": 17228 + }, + { + "epoch": 46.94550408719346, + "grad_norm": 7.075724124908447, + "learning_rate": 1.146974621218552e-05, + "loss": 0.2559, + "step": 17229 + }, + { + "epoch": 46.94822888283379, + "grad_norm": 6.458963871002197, + "learning_rate": 1.1468873295487073e-05, + "loss": 0.2609, + "step": 17230 + }, + { + "epoch": 46.950953678474114, + "grad_norm": 8.322772979736328, + "learning_rate": 1.1468000367349088e-05, + "loss": 0.1818, + "step": 17231 + }, + { + "epoch": 46.95367847411444, + "grad_norm": 5.9607672691345215, + "learning_rate": 1.1467127427778364e-05, + "loss": 0.1233, + "step": 17232 + }, + { + "epoch": 46.956403269754766, + "grad_norm": 4.860105991363525, + "learning_rate": 1.14662544767817e-05, + "loss": 0.2093, + "step": 17233 + }, + { + "epoch": 46.95912806539509, + "grad_norm": 9.473416328430176, + "learning_rate": 1.146538151436589e-05, + "loss": 0.1582, + "step": 17234 + }, + { + "epoch": 46.961852861035425, + "grad_norm": 13.880687713623047, + "learning_rate": 1.1464508540537738e-05, + "loss": 0.2226, + "step": 17235 + }, + { + "epoch": 46.96457765667575, + "grad_norm": 4.40953254699707, + "learning_rate": 1.1463635555304038e-05, + "loss": 0.1368, + "step": 17236 + }, + { + "epoch": 46.967302452316076, + "grad_norm": 5.262019157409668, + "learning_rate": 1.1462762558671594e-05, + "loss": 0.1339, + "step": 17237 + }, + { + "epoch": 46.9700272479564, + "grad_norm": 4.952602386474609, + "learning_rate": 1.14618895506472e-05, + "loss": 0.239, + "step": 17238 + }, + { + "epoch": 46.97275204359673, + "grad_norm": 6.291650772094727, + "learning_rate": 1.1461016531237661e-05, + "loss": 0.138, + "step": 17239 + }, + { + "epoch": 46.97547683923706, + "grad_norm": 4.404817581176758, + "learning_rate": 1.1460143500449769e-05, + "loss": 0.3566, + "step": 17240 + }, + { + "epoch": 46.97820163487739, + "grad_norm": 6.670058250427246, + "learning_rate": 1.145927045829033e-05, + "loss": 0.2422, + "step": 17241 + }, + { + "epoch": 46.98092643051771, + "grad_norm": 3.762319564819336, + "learning_rate": 1.1458397404766138e-05, + "loss": 0.1222, + "step": 17242 + }, + { + "epoch": 46.98365122615804, + "grad_norm": 5.879096508026123, + "learning_rate": 1.1457524339883994e-05, + "loss": 0.2251, + "step": 17243 + }, + { + "epoch": 46.986376021798364, + "grad_norm": 5.028500556945801, + "learning_rate": 1.1456651263650695e-05, + "loss": 0.1746, + "step": 17244 + }, + { + "epoch": 46.98910081743869, + "grad_norm": 4.749955177307129, + "learning_rate": 1.1455778176073045e-05, + "loss": 0.1785, + "step": 17245 + }, + { + "epoch": 46.991825613079016, + "grad_norm": 5.498077869415283, + "learning_rate": 1.1454905077157839e-05, + "loss": 0.123, + "step": 17246 + }, + { + "epoch": 46.99455040871935, + "grad_norm": 4.786930561065674, + "learning_rate": 1.1454031966911883e-05, + "loss": 0.1777, + "step": 17247 + }, + { + "epoch": 46.997275204359674, + "grad_norm": 5.84864616394043, + "learning_rate": 1.1453158845341969e-05, + "loss": 0.1277, + "step": 17248 + }, + { + "epoch": 47.0, + "grad_norm": 4.433199882507324, + "learning_rate": 1.1452285712454905e-05, + "loss": 0.0942, + "step": 17249 + }, + { + "epoch": 47.002724795640326, + "grad_norm": 5.735518932342529, + "learning_rate": 1.1451412568257484e-05, + "loss": 0.1767, + "step": 17250 + }, + { + "epoch": 47.00544959128065, + "grad_norm": 4.625182151794434, + "learning_rate": 1.1450539412756509e-05, + "loss": 0.1015, + "step": 17251 + }, + { + "epoch": 47.00817438692098, + "grad_norm": 18.605335235595703, + "learning_rate": 1.144966624595878e-05, + "loss": 0.1508, + "step": 17252 + }, + { + "epoch": 47.01089918256131, + "grad_norm": 6.5579142570495605, + "learning_rate": 1.1448793067871095e-05, + "loss": 0.1519, + "step": 17253 + }, + { + "epoch": 47.013623978201636, + "grad_norm": 6.73146390914917, + "learning_rate": 1.1447919878500255e-05, + "loss": 0.1431, + "step": 17254 + }, + { + "epoch": 47.01634877384196, + "grad_norm": 10.806292533874512, + "learning_rate": 1.1447046677853066e-05, + "loss": 0.3581, + "step": 17255 + }, + { + "epoch": 47.01907356948229, + "grad_norm": 7.758955478668213, + "learning_rate": 1.1446173465936322e-05, + "loss": 0.2293, + "step": 17256 + }, + { + "epoch": 47.02179836512261, + "grad_norm": 5.246854305267334, + "learning_rate": 1.1445300242756827e-05, + "loss": 0.1232, + "step": 17257 + }, + { + "epoch": 47.02452316076294, + "grad_norm": 4.2169389724731445, + "learning_rate": 1.144442700832138e-05, + "loss": 0.1807, + "step": 17258 + }, + { + "epoch": 47.02724795640327, + "grad_norm": 5.507205486297607, + "learning_rate": 1.1443553762636781e-05, + "loss": 0.1362, + "step": 17259 + }, + { + "epoch": 47.0299727520436, + "grad_norm": 6.601847171783447, + "learning_rate": 1.1442680505709832e-05, + "loss": 0.1526, + "step": 17260 + }, + { + "epoch": 47.032697547683924, + "grad_norm": 4.276211738586426, + "learning_rate": 1.1441807237547336e-05, + "loss": 0.1558, + "step": 17261 + }, + { + "epoch": 47.03542234332425, + "grad_norm": 4.014583110809326, + "learning_rate": 1.1440933958156087e-05, + "loss": 0.1796, + "step": 17262 + }, + { + "epoch": 47.038147138964575, + "grad_norm": 9.991283416748047, + "learning_rate": 1.1440060667542891e-05, + "loss": 0.1512, + "step": 17263 + }, + { + "epoch": 47.0408719346049, + "grad_norm": 4.610074520111084, + "learning_rate": 1.143918736571455e-05, + "loss": 0.1224, + "step": 17264 + }, + { + "epoch": 47.043596730245234, + "grad_norm": 5.848897457122803, + "learning_rate": 1.1438314052677865e-05, + "loss": 0.1876, + "step": 17265 + }, + { + "epoch": 47.04632152588556, + "grad_norm": 6.770817756652832, + "learning_rate": 1.1437440728439637e-05, + "loss": 0.1305, + "step": 17266 + }, + { + "epoch": 47.049046321525886, + "grad_norm": 7.044491291046143, + "learning_rate": 1.1436567393006668e-05, + "loss": 0.204, + "step": 17267 + }, + { + "epoch": 47.05177111716621, + "grad_norm": 5.467977046966553, + "learning_rate": 1.1435694046385755e-05, + "loss": 0.1817, + "step": 17268 + }, + { + "epoch": 47.05449591280654, + "grad_norm": 5.026775360107422, + "learning_rate": 1.1434820688583706e-05, + "loss": 0.1329, + "step": 17269 + }, + { + "epoch": 47.05722070844686, + "grad_norm": 6.125763416290283, + "learning_rate": 1.1433947319607318e-05, + "loss": 0.1733, + "step": 17270 + }, + { + "epoch": 47.059945504087196, + "grad_norm": 6.257920742034912, + "learning_rate": 1.1433073939463393e-05, + "loss": 0.152, + "step": 17271 + }, + { + "epoch": 47.06267029972752, + "grad_norm": 7.099124908447266, + "learning_rate": 1.1432200548158738e-05, + "loss": 0.2168, + "step": 17272 + }, + { + "epoch": 47.06539509536785, + "grad_norm": 6.816453456878662, + "learning_rate": 1.1431327145700149e-05, + "loss": 0.2618, + "step": 17273 + }, + { + "epoch": 47.06811989100817, + "grad_norm": 5.101950168609619, + "learning_rate": 1.143045373209443e-05, + "loss": 0.1437, + "step": 17274 + }, + { + "epoch": 47.0708446866485, + "grad_norm": 17.04148292541504, + "learning_rate": 1.1429580307348385e-05, + "loss": 0.1967, + "step": 17275 + }, + { + "epoch": 47.073569482288825, + "grad_norm": 5.364077091217041, + "learning_rate": 1.142870687146881e-05, + "loss": 0.1554, + "step": 17276 + }, + { + "epoch": 47.07629427792916, + "grad_norm": 6.201749324798584, + "learning_rate": 1.1427833424462517e-05, + "loss": 0.19, + "step": 17277 + }, + { + "epoch": 47.079019073569484, + "grad_norm": 5.364887714385986, + "learning_rate": 1.1426959966336302e-05, + "loss": 0.2224, + "step": 17278 + }, + { + "epoch": 47.08174386920981, + "grad_norm": 7.636233806610107, + "learning_rate": 1.1426086497096966e-05, + "loss": 0.1855, + "step": 17279 + }, + { + "epoch": 47.084468664850135, + "grad_norm": 5.564447402954102, + "learning_rate": 1.1425213016751317e-05, + "loss": 0.1315, + "step": 17280 + }, + { + "epoch": 47.08719346049046, + "grad_norm": 4.97089958190918, + "learning_rate": 1.1424339525306154e-05, + "loss": 0.1413, + "step": 17281 + }, + { + "epoch": 47.08991825613079, + "grad_norm": 4.3761091232299805, + "learning_rate": 1.1423466022768283e-05, + "loss": 0.1186, + "step": 17282 + }, + { + "epoch": 47.09264305177112, + "grad_norm": 15.600180625915527, + "learning_rate": 1.14225925091445e-05, + "loss": 0.2701, + "step": 17283 + }, + { + "epoch": 47.095367847411445, + "grad_norm": 5.563814640045166, + "learning_rate": 1.1421718984441617e-05, + "loss": 0.2928, + "step": 17284 + }, + { + "epoch": 47.09809264305177, + "grad_norm": 6.132524490356445, + "learning_rate": 1.1420845448666429e-05, + "loss": 0.3414, + "step": 17285 + }, + { + "epoch": 47.1008174386921, + "grad_norm": 4.493549346923828, + "learning_rate": 1.1419971901825743e-05, + "loss": 0.2024, + "step": 17286 + }, + { + "epoch": 47.10354223433242, + "grad_norm": 11.406949043273926, + "learning_rate": 1.1419098343926363e-05, + "loss": 0.2807, + "step": 17287 + }, + { + "epoch": 47.10626702997275, + "grad_norm": 15.65683364868164, + "learning_rate": 1.1418224774975088e-05, + "loss": 0.1355, + "step": 17288 + }, + { + "epoch": 47.10899182561308, + "grad_norm": 6.96215295791626, + "learning_rate": 1.1417351194978725e-05, + "loss": 0.316, + "step": 17289 + }, + { + "epoch": 47.11171662125341, + "grad_norm": 8.716181755065918, + "learning_rate": 1.1416477603944078e-05, + "loss": 0.17, + "step": 17290 + }, + { + "epoch": 47.11444141689373, + "grad_norm": 5.2091217041015625, + "learning_rate": 1.1415604001877949e-05, + "loss": 0.2232, + "step": 17291 + }, + { + "epoch": 47.11716621253406, + "grad_norm": 11.852521896362305, + "learning_rate": 1.1414730388787143e-05, + "loss": 0.1593, + "step": 17292 + }, + { + "epoch": 47.119891008174385, + "grad_norm": 6.9596757888793945, + "learning_rate": 1.1413856764678459e-05, + "loss": 0.1775, + "step": 17293 + }, + { + "epoch": 47.12261580381471, + "grad_norm": 4.772704601287842, + "learning_rate": 1.1412983129558706e-05, + "loss": 0.2445, + "step": 17294 + }, + { + "epoch": 47.12534059945504, + "grad_norm": 6.12083625793457, + "learning_rate": 1.1412109483434683e-05, + "loss": 0.1868, + "step": 17295 + }, + { + "epoch": 47.12806539509537, + "grad_norm": 6.204431533813477, + "learning_rate": 1.1411235826313201e-05, + "loss": 0.2229, + "step": 17296 + }, + { + "epoch": 47.130790190735695, + "grad_norm": 5.632849216461182, + "learning_rate": 1.1410362158201054e-05, + "loss": 0.3334, + "step": 17297 + }, + { + "epoch": 47.13351498637602, + "grad_norm": 8.755095481872559, + "learning_rate": 1.1409488479105058e-05, + "loss": 0.1777, + "step": 17298 + }, + { + "epoch": 47.13623978201635, + "grad_norm": 4.300026893615723, + "learning_rate": 1.1408614789032007e-05, + "loss": 0.1565, + "step": 17299 + }, + { + "epoch": 47.13896457765667, + "grad_norm": 5.8478803634643555, + "learning_rate": 1.1407741087988713e-05, + "loss": 0.1355, + "step": 17300 + }, + { + "epoch": 47.141689373297005, + "grad_norm": 9.44076919555664, + "learning_rate": 1.1406867375981975e-05, + "loss": 0.2481, + "step": 17301 + }, + { + "epoch": 47.14441416893733, + "grad_norm": 5.266812801361084, + "learning_rate": 1.1405993653018599e-05, + "loss": 0.1623, + "step": 17302 + }, + { + "epoch": 47.14713896457766, + "grad_norm": 4.535799026489258, + "learning_rate": 1.1405119919105387e-05, + "loss": 0.1985, + "step": 17303 + }, + { + "epoch": 47.14986376021798, + "grad_norm": 6.18609094619751, + "learning_rate": 1.1404246174249152e-05, + "loss": 0.1531, + "step": 17304 + }, + { + "epoch": 47.15258855585831, + "grad_norm": 4.408097743988037, + "learning_rate": 1.1403372418456687e-05, + "loss": 0.2456, + "step": 17305 + }, + { + "epoch": 47.155313351498634, + "grad_norm": 5.561338901519775, + "learning_rate": 1.1402498651734806e-05, + "loss": 0.1267, + "step": 17306 + }, + { + "epoch": 47.15803814713897, + "grad_norm": 5.082563877105713, + "learning_rate": 1.1401624874090309e-05, + "loss": 0.1825, + "step": 17307 + }, + { + "epoch": 47.16076294277929, + "grad_norm": 5.351593494415283, + "learning_rate": 1.1400751085530006e-05, + "loss": 0.1378, + "step": 17308 + }, + { + "epoch": 47.16348773841962, + "grad_norm": 8.034741401672363, + "learning_rate": 1.1399877286060695e-05, + "loss": 0.1617, + "step": 17309 + }, + { + "epoch": 47.166212534059945, + "grad_norm": 10.069036483764648, + "learning_rate": 1.1399003475689187e-05, + "loss": 0.125, + "step": 17310 + }, + { + "epoch": 47.16893732970027, + "grad_norm": 4.9894490242004395, + "learning_rate": 1.1398129654422284e-05, + "loss": 0.2234, + "step": 17311 + }, + { + "epoch": 47.171662125340596, + "grad_norm": 5.806913375854492, + "learning_rate": 1.1397255822266794e-05, + "loss": 0.1104, + "step": 17312 + }, + { + "epoch": 47.17438692098093, + "grad_norm": 13.047809600830078, + "learning_rate": 1.1396381979229518e-05, + "loss": 0.2257, + "step": 17313 + }, + { + "epoch": 47.177111716621255, + "grad_norm": 6.9155168533325195, + "learning_rate": 1.1395508125317266e-05, + "loss": 0.1387, + "step": 17314 + }, + { + "epoch": 47.17983651226158, + "grad_norm": 4.971002578735352, + "learning_rate": 1.1394634260536839e-05, + "loss": 0.1436, + "step": 17315 + }, + { + "epoch": 47.182561307901906, + "grad_norm": 14.82128620147705, + "learning_rate": 1.1393760384895047e-05, + "loss": 0.1135, + "step": 17316 + }, + { + "epoch": 47.18528610354223, + "grad_norm": 6.719625949859619, + "learning_rate": 1.1392886498398695e-05, + "loss": 0.1841, + "step": 17317 + }, + { + "epoch": 47.18801089918256, + "grad_norm": 4.952080249786377, + "learning_rate": 1.1392012601054588e-05, + "loss": 0.1434, + "step": 17318 + }, + { + "epoch": 47.19073569482289, + "grad_norm": 5.241774082183838, + "learning_rate": 1.1391138692869528e-05, + "loss": 0.1313, + "step": 17319 + }, + { + "epoch": 47.19346049046322, + "grad_norm": 5.519021987915039, + "learning_rate": 1.1390264773850329e-05, + "loss": 0.1473, + "step": 17320 + }, + { + "epoch": 47.19618528610354, + "grad_norm": 10.155780792236328, + "learning_rate": 1.1389390844003789e-05, + "loss": 0.199, + "step": 17321 + }, + { + "epoch": 47.19891008174387, + "grad_norm": 7.600268840789795, + "learning_rate": 1.138851690333672e-05, + "loss": 0.2099, + "step": 17322 + }, + { + "epoch": 47.201634877384194, + "grad_norm": 5.401339530944824, + "learning_rate": 1.1387642951855925e-05, + "loss": 0.2131, + "step": 17323 + }, + { + "epoch": 47.20435967302452, + "grad_norm": 5.1407365798950195, + "learning_rate": 1.1386768989568213e-05, + "loss": 0.1204, + "step": 17324 + }, + { + "epoch": 47.20708446866485, + "grad_norm": 7.2260422706604, + "learning_rate": 1.1385895016480387e-05, + "loss": 0.1996, + "step": 17325 + }, + { + "epoch": 47.20980926430518, + "grad_norm": 8.958779335021973, + "learning_rate": 1.1385021032599257e-05, + "loss": 0.1553, + "step": 17326 + }, + { + "epoch": 47.212534059945504, + "grad_norm": 4.629421710968018, + "learning_rate": 1.1384147037931625e-05, + "loss": 0.0848, + "step": 17327 + }, + { + "epoch": 47.21525885558583, + "grad_norm": 7.2963128089904785, + "learning_rate": 1.1383273032484302e-05, + "loss": 0.2914, + "step": 17328 + }, + { + "epoch": 47.217983651226156, + "grad_norm": 8.382322311401367, + "learning_rate": 1.1382399016264093e-05, + "loss": 0.1498, + "step": 17329 + }, + { + "epoch": 47.22070844686648, + "grad_norm": 4.128012657165527, + "learning_rate": 1.1381524989277807e-05, + "loss": 0.2148, + "step": 17330 + }, + { + "epoch": 47.223433242506815, + "grad_norm": 4.981644630432129, + "learning_rate": 1.1380650951532243e-05, + "loss": 0.1136, + "step": 17331 + }, + { + "epoch": 47.22615803814714, + "grad_norm": 5.655073165893555, + "learning_rate": 1.137977690303422e-05, + "loss": 0.393, + "step": 17332 + }, + { + "epoch": 47.228882833787466, + "grad_norm": 4.699531078338623, + "learning_rate": 1.1378902843790538e-05, + "loss": 0.3039, + "step": 17333 + }, + { + "epoch": 47.23160762942779, + "grad_norm": 6.343612194061279, + "learning_rate": 1.1378028773808003e-05, + "loss": 0.1774, + "step": 17334 + }, + { + "epoch": 47.23433242506812, + "grad_norm": 5.021273136138916, + "learning_rate": 1.1377154693093426e-05, + "loss": 0.0888, + "step": 17335 + }, + { + "epoch": 47.237057220708444, + "grad_norm": 4.948480129241943, + "learning_rate": 1.1376280601653613e-05, + "loss": 0.1255, + "step": 17336 + }, + { + "epoch": 47.23978201634878, + "grad_norm": 5.859848976135254, + "learning_rate": 1.1375406499495367e-05, + "loss": 0.3579, + "step": 17337 + }, + { + "epoch": 47.2425068119891, + "grad_norm": 7.666250705718994, + "learning_rate": 1.1374532386625506e-05, + "loss": 0.1589, + "step": 17338 + }, + { + "epoch": 47.24523160762943, + "grad_norm": 7.62019157409668, + "learning_rate": 1.1373658263050824e-05, + "loss": 0.2307, + "step": 17339 + }, + { + "epoch": 47.247956403269754, + "grad_norm": 7.805665969848633, + "learning_rate": 1.1372784128778138e-05, + "loss": 0.274, + "step": 17340 + }, + { + "epoch": 47.25068119891008, + "grad_norm": 5.220042705535889, + "learning_rate": 1.1371909983814253e-05, + "loss": 0.2284, + "step": 17341 + }, + { + "epoch": 47.253405994550405, + "grad_norm": 5.222188949584961, + "learning_rate": 1.1371035828165979e-05, + "loss": 0.2258, + "step": 17342 + }, + { + "epoch": 47.25613079019074, + "grad_norm": 4.879983425140381, + "learning_rate": 1.1370161661840122e-05, + "loss": 0.2649, + "step": 17343 + }, + { + "epoch": 47.258855585831064, + "grad_norm": 4.29693603515625, + "learning_rate": 1.136928748484349e-05, + "loss": 0.2224, + "step": 17344 + }, + { + "epoch": 47.26158038147139, + "grad_norm": 6.894303321838379, + "learning_rate": 1.1368413297182892e-05, + "loss": 0.2061, + "step": 17345 + }, + { + "epoch": 47.264305177111716, + "grad_norm": 4.151698589324951, + "learning_rate": 1.1367539098865134e-05, + "loss": 0.1359, + "step": 17346 + }, + { + "epoch": 47.26702997275204, + "grad_norm": 7.282924175262451, + "learning_rate": 1.1366664889897025e-05, + "loss": 0.1911, + "step": 17347 + }, + { + "epoch": 47.26975476839237, + "grad_norm": 11.262412071228027, + "learning_rate": 1.1365790670285372e-05, + "loss": 0.2117, + "step": 17348 + }, + { + "epoch": 47.2724795640327, + "grad_norm": 5.026998519897461, + "learning_rate": 1.136491644003699e-05, + "loss": 0.127, + "step": 17349 + }, + { + "epoch": 47.275204359673026, + "grad_norm": 4.999397277832031, + "learning_rate": 1.1364042199158681e-05, + "loss": 0.134, + "step": 17350 + }, + { + "epoch": 47.27792915531335, + "grad_norm": 5.330348491668701, + "learning_rate": 1.1363167947657252e-05, + "loss": 0.1223, + "step": 17351 + }, + { + "epoch": 47.28065395095368, + "grad_norm": 5.6617865562438965, + "learning_rate": 1.1362293685539518e-05, + "loss": 0.1256, + "step": 17352 + }, + { + "epoch": 47.283378746594, + "grad_norm": 6.341552257537842, + "learning_rate": 1.1361419412812284e-05, + "loss": 0.1729, + "step": 17353 + }, + { + "epoch": 47.28610354223433, + "grad_norm": 6.309276580810547, + "learning_rate": 1.1360545129482361e-05, + "loss": 0.2233, + "step": 17354 + }, + { + "epoch": 47.28882833787466, + "grad_norm": 4.976595401763916, + "learning_rate": 1.1359670835556554e-05, + "loss": 0.1524, + "step": 17355 + }, + { + "epoch": 47.29155313351499, + "grad_norm": 4.946108341217041, + "learning_rate": 1.1358796531041676e-05, + "loss": 0.1253, + "step": 17356 + }, + { + "epoch": 47.294277929155314, + "grad_norm": 5.250059604644775, + "learning_rate": 1.1357922215944533e-05, + "loss": 0.123, + "step": 17357 + }, + { + "epoch": 47.29700272479564, + "grad_norm": 9.978639602661133, + "learning_rate": 1.1357047890271935e-05, + "loss": 0.3298, + "step": 17358 + }, + { + "epoch": 47.299727520435965, + "grad_norm": 5.052424907684326, + "learning_rate": 1.1356173554030692e-05, + "loss": 0.113, + "step": 17359 + }, + { + "epoch": 47.30245231607629, + "grad_norm": 7.464874744415283, + "learning_rate": 1.1355299207227612e-05, + "loss": 0.2352, + "step": 17360 + }, + { + "epoch": 47.305177111716624, + "grad_norm": 7.263399600982666, + "learning_rate": 1.135442484986951e-05, + "loss": 0.1648, + "step": 17361 + }, + { + "epoch": 47.30790190735695, + "grad_norm": 8.095212936401367, + "learning_rate": 1.1353550481963188e-05, + "loss": 0.1867, + "step": 17362 + }, + { + "epoch": 47.310626702997276, + "grad_norm": 6.417571544647217, + "learning_rate": 1.1352676103515456e-05, + "loss": 0.1455, + "step": 17363 + }, + { + "epoch": 47.3133514986376, + "grad_norm": 15.318137168884277, + "learning_rate": 1.135180171453313e-05, + "loss": 0.226, + "step": 17364 + }, + { + "epoch": 47.31607629427793, + "grad_norm": 4.018860340118408, + "learning_rate": 1.1350927315023012e-05, + "loss": 0.1905, + "step": 17365 + }, + { + "epoch": 47.31880108991825, + "grad_norm": 4.7360968589782715, + "learning_rate": 1.1350052904991917e-05, + "loss": 0.2281, + "step": 17366 + }, + { + "epoch": 47.321525885558586, + "grad_norm": 6.059764862060547, + "learning_rate": 1.1349178484446655e-05, + "loss": 0.2661, + "step": 17367 + }, + { + "epoch": 47.32425068119891, + "grad_norm": 5.604198455810547, + "learning_rate": 1.1348304053394032e-05, + "loss": 0.1767, + "step": 17368 + }, + { + "epoch": 47.32697547683924, + "grad_norm": 4.785433292388916, + "learning_rate": 1.1347429611840863e-05, + "loss": 0.1619, + "step": 17369 + }, + { + "epoch": 47.32970027247956, + "grad_norm": 6.601691246032715, + "learning_rate": 1.1346555159793956e-05, + "loss": 0.4151, + "step": 17370 + }, + { + "epoch": 47.33242506811989, + "grad_norm": 8.255234718322754, + "learning_rate": 1.134568069726012e-05, + "loss": 0.1947, + "step": 17371 + }, + { + "epoch": 47.335149863760215, + "grad_norm": 4.329376697540283, + "learning_rate": 1.1344806224246164e-05, + "loss": 0.0924, + "step": 17372 + }, + { + "epoch": 47.33787465940055, + "grad_norm": 7.335381984710693, + "learning_rate": 1.13439317407589e-05, + "loss": 0.2743, + "step": 17373 + }, + { + "epoch": 47.34059945504087, + "grad_norm": 5.078884601593018, + "learning_rate": 1.134305724680514e-05, + "loss": 0.1332, + "step": 17374 + }, + { + "epoch": 47.3433242506812, + "grad_norm": 5.090694427490234, + "learning_rate": 1.1342182742391693e-05, + "loss": 0.2632, + "step": 17375 + }, + { + "epoch": 47.346049046321525, + "grad_norm": 7.320001125335693, + "learning_rate": 1.1341308227525372e-05, + "loss": 0.1552, + "step": 17376 + }, + { + "epoch": 47.34877384196185, + "grad_norm": 8.654484748840332, + "learning_rate": 1.1340433702212986e-05, + "loss": 0.2031, + "step": 17377 + }, + { + "epoch": 47.35149863760218, + "grad_norm": 4.913638114929199, + "learning_rate": 1.1339559166461343e-05, + "loss": 0.2018, + "step": 17378 + }, + { + "epoch": 47.35422343324251, + "grad_norm": 5.031498432159424, + "learning_rate": 1.1338684620277259e-05, + "loss": 0.1499, + "step": 17379 + }, + { + "epoch": 47.356948228882835, + "grad_norm": 5.879524230957031, + "learning_rate": 1.1337810063667539e-05, + "loss": 0.1839, + "step": 17380 + }, + { + "epoch": 47.35967302452316, + "grad_norm": 6.057834148406982, + "learning_rate": 1.1336935496639e-05, + "loss": 0.2018, + "step": 17381 + }, + { + "epoch": 47.36239782016349, + "grad_norm": 5.919984817504883, + "learning_rate": 1.1336060919198449e-05, + "loss": 0.1179, + "step": 17382 + }, + { + "epoch": 47.36512261580381, + "grad_norm": 5.599321365356445, + "learning_rate": 1.1335186331352697e-05, + "loss": 0.0937, + "step": 17383 + }, + { + "epoch": 47.36784741144414, + "grad_norm": 5.7660369873046875, + "learning_rate": 1.1334311733108558e-05, + "loss": 0.1562, + "step": 17384 + }, + { + "epoch": 47.37057220708447, + "grad_norm": 5.741179466247559, + "learning_rate": 1.1333437124472844e-05, + "loss": 0.1245, + "step": 17385 + }, + { + "epoch": 47.3732970027248, + "grad_norm": 6.793684005737305, + "learning_rate": 1.1332562505452363e-05, + "loss": 0.2028, + "step": 17386 + }, + { + "epoch": 47.37602179836512, + "grad_norm": 6.103033542633057, + "learning_rate": 1.1331687876053929e-05, + "loss": 0.1651, + "step": 17387 + }, + { + "epoch": 47.37874659400545, + "grad_norm": 7.7717719078063965, + "learning_rate": 1.1330813236284353e-05, + "loss": 0.1776, + "step": 17388 + }, + { + "epoch": 47.381471389645775, + "grad_norm": 6.243279933929443, + "learning_rate": 1.1329938586150445e-05, + "loss": 0.2212, + "step": 17389 + }, + { + "epoch": 47.3841961852861, + "grad_norm": 6.319809436798096, + "learning_rate": 1.1329063925659018e-05, + "loss": 0.1883, + "step": 17390 + }, + { + "epoch": 47.38692098092643, + "grad_norm": 7.187377452850342, + "learning_rate": 1.1328189254816883e-05, + "loss": 0.1503, + "step": 17391 + }, + { + "epoch": 47.38964577656676, + "grad_norm": 4.905011177062988, + "learning_rate": 1.1327314573630855e-05, + "loss": 0.1894, + "step": 17392 + }, + { + "epoch": 47.392370572207085, + "grad_norm": 7.594850540161133, + "learning_rate": 1.1326439882107745e-05, + "loss": 0.2032, + "step": 17393 + }, + { + "epoch": 47.39509536784741, + "grad_norm": 4.616300106048584, + "learning_rate": 1.132556518025436e-05, + "loss": 0.2928, + "step": 17394 + }, + { + "epoch": 47.39782016348774, + "grad_norm": 6.146267414093018, + "learning_rate": 1.132469046807752e-05, + "loss": 0.1833, + "step": 17395 + }, + { + "epoch": 47.40054495912806, + "grad_norm": 6.339707851409912, + "learning_rate": 1.132381574558403e-05, + "loss": 0.2174, + "step": 17396 + }, + { + "epoch": 47.403269754768395, + "grad_norm": 6.550048828125, + "learning_rate": 1.1322941012780707e-05, + "loss": 0.2267, + "step": 17397 + }, + { + "epoch": 47.40599455040872, + "grad_norm": 6.415716171264648, + "learning_rate": 1.1322066269674364e-05, + "loss": 0.183, + "step": 17398 + }, + { + "epoch": 47.40871934604905, + "grad_norm": 4.894993782043457, + "learning_rate": 1.132119151627181e-05, + "loss": 0.1251, + "step": 17399 + }, + { + "epoch": 47.41144414168937, + "grad_norm": 7.787525653839111, + "learning_rate": 1.1320316752579854e-05, + "loss": 0.1692, + "step": 17400 + }, + { + "epoch": 47.4141689373297, + "grad_norm": 4.8304443359375, + "learning_rate": 1.1319441978605319e-05, + "loss": 0.3152, + "step": 17401 + }, + { + "epoch": 47.416893732970024, + "grad_norm": 5.751040935516357, + "learning_rate": 1.131856719435501e-05, + "loss": 0.1759, + "step": 17402 + }, + { + "epoch": 47.41961852861036, + "grad_norm": 4.539827346801758, + "learning_rate": 1.1317692399835746e-05, + "loss": 0.3914, + "step": 17403 + }, + { + "epoch": 47.42234332425068, + "grad_norm": 5.309699058532715, + "learning_rate": 1.1316817595054333e-05, + "loss": 0.1444, + "step": 17404 + }, + { + "epoch": 47.42506811989101, + "grad_norm": 5.834379196166992, + "learning_rate": 1.1315942780017589e-05, + "loss": 0.2961, + "step": 17405 + }, + { + "epoch": 47.427792915531334, + "grad_norm": 6.645628929138184, + "learning_rate": 1.1315067954732322e-05, + "loss": 0.4054, + "step": 17406 + }, + { + "epoch": 47.43051771117166, + "grad_norm": 5.270048141479492, + "learning_rate": 1.131419311920535e-05, + "loss": 0.1968, + "step": 17407 + }, + { + "epoch": 47.433242506811986, + "grad_norm": 10.516953468322754, + "learning_rate": 1.131331827344348e-05, + "loss": 0.3111, + "step": 17408 + }, + { + "epoch": 47.43596730245232, + "grad_norm": 4.475905895233154, + "learning_rate": 1.1312443417453535e-05, + "loss": 0.0942, + "step": 17409 + }, + { + "epoch": 47.438692098092645, + "grad_norm": 5.827042579650879, + "learning_rate": 1.131156855124232e-05, + "loss": 0.2352, + "step": 17410 + }, + { + "epoch": 47.44141689373297, + "grad_norm": 5.595770835876465, + "learning_rate": 1.1310693674816655e-05, + "loss": 0.2271, + "step": 17411 + }, + { + "epoch": 47.444141689373296, + "grad_norm": 4.498119831085205, + "learning_rate": 1.1309818788183347e-05, + "loss": 0.1723, + "step": 17412 + }, + { + "epoch": 47.44686648501362, + "grad_norm": 5.491279602050781, + "learning_rate": 1.1308943891349213e-05, + "loss": 0.1805, + "step": 17413 + }, + { + "epoch": 47.44959128065395, + "grad_norm": 5.263021469116211, + "learning_rate": 1.1308068984321066e-05, + "loss": 0.1742, + "step": 17414 + }, + { + "epoch": 47.45231607629428, + "grad_norm": 5.425411224365234, + "learning_rate": 1.130719406710572e-05, + "loss": 0.133, + "step": 17415 + }, + { + "epoch": 47.45504087193461, + "grad_norm": 4.812409400939941, + "learning_rate": 1.130631913970999e-05, + "loss": 0.2897, + "step": 17416 + }, + { + "epoch": 47.45776566757493, + "grad_norm": 4.713386535644531, + "learning_rate": 1.1305444202140685e-05, + "loss": 0.2036, + "step": 17417 + }, + { + "epoch": 47.46049046321526, + "grad_norm": 5.480905532836914, + "learning_rate": 1.1304569254404623e-05, + "loss": 0.1172, + "step": 17418 + }, + { + "epoch": 47.463215258855584, + "grad_norm": 8.589835166931152, + "learning_rate": 1.130369429650862e-05, + "loss": 0.1477, + "step": 17419 + }, + { + "epoch": 47.46594005449591, + "grad_norm": 6.506086349487305, + "learning_rate": 1.1302819328459487e-05, + "loss": 0.2017, + "step": 17420 + }, + { + "epoch": 47.46866485013624, + "grad_norm": 6.886260032653809, + "learning_rate": 1.130194435026404e-05, + "loss": 0.2262, + "step": 17421 + }, + { + "epoch": 47.47138964577657, + "grad_norm": 5.667884349822998, + "learning_rate": 1.1301069361929092e-05, + "loss": 0.126, + "step": 17422 + }, + { + "epoch": 47.474114441416894, + "grad_norm": 4.748784065246582, + "learning_rate": 1.1300194363461456e-05, + "loss": 0.1147, + "step": 17423 + }, + { + "epoch": 47.47683923705722, + "grad_norm": 6.0897722244262695, + "learning_rate": 1.129931935486795e-05, + "loss": 0.1983, + "step": 17424 + }, + { + "epoch": 47.479564032697546, + "grad_norm": 6.235533237457275, + "learning_rate": 1.1298444336155388e-05, + "loss": 0.1375, + "step": 17425 + }, + { + "epoch": 47.48228882833787, + "grad_norm": 5.98510217666626, + "learning_rate": 1.1297569307330576e-05, + "loss": 0.1994, + "step": 17426 + }, + { + "epoch": 47.485013623978205, + "grad_norm": 5.428730487823486, + "learning_rate": 1.1296694268400343e-05, + "loss": 0.1193, + "step": 17427 + }, + { + "epoch": 47.48773841961853, + "grad_norm": 5.673888683319092, + "learning_rate": 1.1295819219371494e-05, + "loss": 0.2798, + "step": 17428 + }, + { + "epoch": 47.490463215258856, + "grad_norm": 12.204548835754395, + "learning_rate": 1.1294944160250849e-05, + "loss": 0.3595, + "step": 17429 + }, + { + "epoch": 47.49318801089918, + "grad_norm": 5.644983291625977, + "learning_rate": 1.129406909104522e-05, + "loss": 0.1491, + "step": 17430 + }, + { + "epoch": 47.49591280653951, + "grad_norm": 7.090771675109863, + "learning_rate": 1.1293194011761421e-05, + "loss": 0.2103, + "step": 17431 + }, + { + "epoch": 47.49863760217983, + "grad_norm": 5.9541916847229, + "learning_rate": 1.1292318922406268e-05, + "loss": 0.1831, + "step": 17432 + }, + { + "epoch": 47.50136239782017, + "grad_norm": 4.507806777954102, + "learning_rate": 1.129144382298658e-05, + "loss": 0.1984, + "step": 17433 + }, + { + "epoch": 47.50408719346049, + "grad_norm": 5.049549102783203, + "learning_rate": 1.1290568713509166e-05, + "loss": 0.209, + "step": 17434 + }, + { + "epoch": 47.50681198910082, + "grad_norm": 5.580391883850098, + "learning_rate": 1.1289693593980843e-05, + "loss": 0.1354, + "step": 17435 + }, + { + "epoch": 47.509536784741144, + "grad_norm": 10.421479225158691, + "learning_rate": 1.1288818464408433e-05, + "loss": 0.1727, + "step": 17436 + }, + { + "epoch": 47.51226158038147, + "grad_norm": 10.88788890838623, + "learning_rate": 1.1287943324798744e-05, + "loss": 0.1282, + "step": 17437 + }, + { + "epoch": 47.514986376021795, + "grad_norm": 5.003871440887451, + "learning_rate": 1.1287068175158594e-05, + "loss": 0.1301, + "step": 17438 + }, + { + "epoch": 47.51771117166213, + "grad_norm": 5.405365943908691, + "learning_rate": 1.1286193015494797e-05, + "loss": 0.4263, + "step": 17439 + }, + { + "epoch": 47.520435967302454, + "grad_norm": 5.518341064453125, + "learning_rate": 1.128531784581417e-05, + "loss": 0.1235, + "step": 17440 + }, + { + "epoch": 47.52316076294278, + "grad_norm": 5.502331733703613, + "learning_rate": 1.1284442666123532e-05, + "loss": 0.126, + "step": 17441 + }, + { + "epoch": 47.525885558583106, + "grad_norm": 6.106025218963623, + "learning_rate": 1.1283567476429693e-05, + "loss": 0.123, + "step": 17442 + }, + { + "epoch": 47.52861035422343, + "grad_norm": 5.299657344818115, + "learning_rate": 1.1282692276739473e-05, + "loss": 0.1493, + "step": 17443 + }, + { + "epoch": 47.53133514986376, + "grad_norm": 6.045785903930664, + "learning_rate": 1.1281817067059689e-05, + "loss": 0.1349, + "step": 17444 + }, + { + "epoch": 47.53405994550409, + "grad_norm": 5.7348527908325195, + "learning_rate": 1.128094184739715e-05, + "loss": 0.1582, + "step": 17445 + }, + { + "epoch": 47.536784741144416, + "grad_norm": 4.512693405151367, + "learning_rate": 1.128006661775868e-05, + "loss": 0.1694, + "step": 17446 + }, + { + "epoch": 47.53950953678474, + "grad_norm": 6.702103137969971, + "learning_rate": 1.1279191378151094e-05, + "loss": 0.1433, + "step": 17447 + }, + { + "epoch": 47.54223433242507, + "grad_norm": 6.371593475341797, + "learning_rate": 1.1278316128581205e-05, + "loss": 0.3932, + "step": 17448 + }, + { + "epoch": 47.54495912806539, + "grad_norm": 5.314506530761719, + "learning_rate": 1.1277440869055829e-05, + "loss": 0.1245, + "step": 17449 + }, + { + "epoch": 47.54768392370572, + "grad_norm": 8.911656379699707, + "learning_rate": 1.1276565599581786e-05, + "loss": 0.2033, + "step": 17450 + }, + { + "epoch": 47.55040871934605, + "grad_norm": 4.4906005859375, + "learning_rate": 1.1275690320165891e-05, + "loss": 0.169, + "step": 17451 + }, + { + "epoch": 47.55313351498638, + "grad_norm": 5.4205474853515625, + "learning_rate": 1.1274815030814962e-05, + "loss": 0.1658, + "step": 17452 + }, + { + "epoch": 47.555858310626704, + "grad_norm": 5.942286014556885, + "learning_rate": 1.1273939731535814e-05, + "loss": 0.2132, + "step": 17453 + }, + { + "epoch": 47.55858310626703, + "grad_norm": 5.758001804351807, + "learning_rate": 1.1273064422335266e-05, + "loss": 0.1875, + "step": 17454 + }, + { + "epoch": 47.561307901907355, + "grad_norm": 5.243936538696289, + "learning_rate": 1.127218910322013e-05, + "loss": 0.1523, + "step": 17455 + }, + { + "epoch": 47.56403269754768, + "grad_norm": 9.450494766235352, + "learning_rate": 1.127131377419723e-05, + "loss": 0.1725, + "step": 17456 + }, + { + "epoch": 47.566757493188014, + "grad_norm": 6.759274482727051, + "learning_rate": 1.1270438435273376e-05, + "loss": 0.3017, + "step": 17457 + }, + { + "epoch": 47.56948228882834, + "grad_norm": 6.860689163208008, + "learning_rate": 1.1269563086455393e-05, + "loss": 0.1928, + "step": 17458 + }, + { + "epoch": 47.572207084468666, + "grad_norm": 8.381548881530762, + "learning_rate": 1.126868772775009e-05, + "loss": 0.1584, + "step": 17459 + }, + { + "epoch": 47.57493188010899, + "grad_norm": 8.353500366210938, + "learning_rate": 1.1267812359164286e-05, + "loss": 0.1151, + "step": 17460 + }, + { + "epoch": 47.57765667574932, + "grad_norm": 10.234742164611816, + "learning_rate": 1.1266936980704801e-05, + "loss": 0.1353, + "step": 17461 + }, + { + "epoch": 47.58038147138964, + "grad_norm": 5.291065692901611, + "learning_rate": 1.1266061592378455e-05, + "loss": 0.2135, + "step": 17462 + }, + { + "epoch": 47.583106267029976, + "grad_norm": 8.350508689880371, + "learning_rate": 1.1265186194192058e-05, + "loss": 0.117, + "step": 17463 + }, + { + "epoch": 47.5858310626703, + "grad_norm": 6.17387580871582, + "learning_rate": 1.1264310786152434e-05, + "loss": 0.1594, + "step": 17464 + }, + { + "epoch": 47.58855585831063, + "grad_norm": 5.931378364562988, + "learning_rate": 1.1263435368266397e-05, + "loss": 0.147, + "step": 17465 + }, + { + "epoch": 47.59128065395095, + "grad_norm": 6.011143684387207, + "learning_rate": 1.1262559940540769e-05, + "loss": 0.3531, + "step": 17466 + }, + { + "epoch": 47.59400544959128, + "grad_norm": 6.663870811462402, + "learning_rate": 1.1261684502982363e-05, + "loss": 0.1823, + "step": 17467 + }, + { + "epoch": 47.596730245231605, + "grad_norm": 5.473087310791016, + "learning_rate": 1.1260809055597996e-05, + "loss": 0.3148, + "step": 17468 + }, + { + "epoch": 47.59945504087194, + "grad_norm": 5.8604416847229, + "learning_rate": 1.125993359839449e-05, + "loss": 0.1427, + "step": 17469 + }, + { + "epoch": 47.60217983651226, + "grad_norm": 5.006176471710205, + "learning_rate": 1.1259058131378665e-05, + "loss": 0.1764, + "step": 17470 + }, + { + "epoch": 47.60490463215259, + "grad_norm": 6.329784393310547, + "learning_rate": 1.125818265455733e-05, + "loss": 0.1748, + "step": 17471 + }, + { + "epoch": 47.607629427792915, + "grad_norm": 5.836141109466553, + "learning_rate": 1.1257307167937315e-05, + "loss": 0.2063, + "step": 17472 + }, + { + "epoch": 47.61035422343324, + "grad_norm": 5.373903274536133, + "learning_rate": 1.1256431671525428e-05, + "loss": 0.1913, + "step": 17473 + }, + { + "epoch": 47.61307901907357, + "grad_norm": 6.745926380157471, + "learning_rate": 1.1255556165328494e-05, + "loss": 0.2, + "step": 17474 + }, + { + "epoch": 47.6158038147139, + "grad_norm": 4.685171127319336, + "learning_rate": 1.125468064935333e-05, + "loss": 0.099, + "step": 17475 + }, + { + "epoch": 47.618528610354225, + "grad_norm": 4.967680931091309, + "learning_rate": 1.1253805123606752e-05, + "loss": 0.1854, + "step": 17476 + }, + { + "epoch": 47.62125340599455, + "grad_norm": 6.480405330657959, + "learning_rate": 1.1252929588095576e-05, + "loss": 0.116, + "step": 17477 + }, + { + "epoch": 47.62397820163488, + "grad_norm": 7.122380256652832, + "learning_rate": 1.1252054042826627e-05, + "loss": 0.2554, + "step": 17478 + }, + { + "epoch": 47.6267029972752, + "grad_norm": 6.015350341796875, + "learning_rate": 1.1251178487806725e-05, + "loss": 0.2606, + "step": 17479 + }, + { + "epoch": 47.62942779291553, + "grad_norm": 6.103729724884033, + "learning_rate": 1.1250302923042684e-05, + "loss": 0.131, + "step": 17480 + }, + { + "epoch": 47.63215258855586, + "grad_norm": 4.799370765686035, + "learning_rate": 1.1249427348541322e-05, + "loss": 0.1053, + "step": 17481 + }, + { + "epoch": 47.63487738419619, + "grad_norm": 4.938962936401367, + "learning_rate": 1.124855176430946e-05, + "loss": 0.0967, + "step": 17482 + }, + { + "epoch": 47.63760217983651, + "grad_norm": 5.413734436035156, + "learning_rate": 1.1247676170353918e-05, + "loss": 0.1881, + "step": 17483 + }, + { + "epoch": 47.64032697547684, + "grad_norm": 6.096156597137451, + "learning_rate": 1.1246800566681517e-05, + "loss": 0.1828, + "step": 17484 + }, + { + "epoch": 47.643051771117165, + "grad_norm": 4.924108028411865, + "learning_rate": 1.124592495329907e-05, + "loss": 0.2259, + "step": 17485 + }, + { + "epoch": 47.64577656675749, + "grad_norm": 5.234230041503906, + "learning_rate": 1.1245049330213398e-05, + "loss": 0.1552, + "step": 17486 + }, + { + "epoch": 47.64850136239782, + "grad_norm": 4.4490275382995605, + "learning_rate": 1.1244173697431324e-05, + "loss": 0.2035, + "step": 17487 + }, + { + "epoch": 47.65122615803815, + "grad_norm": 5.975407600402832, + "learning_rate": 1.1243298054959666e-05, + "loss": 0.2455, + "step": 17488 + }, + { + "epoch": 47.653950953678475, + "grad_norm": 6.0566205978393555, + "learning_rate": 1.1242422402805242e-05, + "loss": 0.2092, + "step": 17489 + }, + { + "epoch": 47.6566757493188, + "grad_norm": 5.6127729415893555, + "learning_rate": 1.1241546740974874e-05, + "loss": 0.1373, + "step": 17490 + }, + { + "epoch": 47.65940054495913, + "grad_norm": 5.423619270324707, + "learning_rate": 1.1240671069475377e-05, + "loss": 0.2289, + "step": 17491 + }, + { + "epoch": 47.66212534059945, + "grad_norm": 5.537922382354736, + "learning_rate": 1.1239795388313578e-05, + "loss": 0.1996, + "step": 17492 + }, + { + "epoch": 47.664850136239785, + "grad_norm": 5.652258396148682, + "learning_rate": 1.1238919697496287e-05, + "loss": 0.2054, + "step": 17493 + }, + { + "epoch": 47.66757493188011, + "grad_norm": 4.688675880432129, + "learning_rate": 1.123804399703033e-05, + "loss": 0.1739, + "step": 17494 + }, + { + "epoch": 47.67029972752044, + "grad_norm": 4.451544284820557, + "learning_rate": 1.1237168286922528e-05, + "loss": 0.1129, + "step": 17495 + }, + { + "epoch": 47.67302452316076, + "grad_norm": 15.768667221069336, + "learning_rate": 1.1236292567179702e-05, + "loss": 0.2325, + "step": 17496 + }, + { + "epoch": 47.67574931880109, + "grad_norm": 4.785447597503662, + "learning_rate": 1.1235416837808663e-05, + "loss": 0.137, + "step": 17497 + }, + { + "epoch": 47.678474114441414, + "grad_norm": 4.1190996170043945, + "learning_rate": 1.1234541098816244e-05, + "loss": 0.1097, + "step": 17498 + }, + { + "epoch": 47.68119891008175, + "grad_norm": 6.4247822761535645, + "learning_rate": 1.1233665350209253e-05, + "loss": 0.1627, + "step": 17499 + }, + { + "epoch": 47.68392370572207, + "grad_norm": 5.705071926116943, + "learning_rate": 1.123278959199452e-05, + "loss": 0.1465, + "step": 17500 + }, + { + "epoch": 47.6866485013624, + "grad_norm": 5.82485818862915, + "learning_rate": 1.1231913824178859e-05, + "loss": 0.1548, + "step": 17501 + }, + { + "epoch": 47.689373297002724, + "grad_norm": 4.3881964683532715, + "learning_rate": 1.1231038046769094e-05, + "loss": 0.1803, + "step": 17502 + }, + { + "epoch": 47.69209809264305, + "grad_norm": 5.945643424987793, + "learning_rate": 1.1230162259772041e-05, + "loss": 0.196, + "step": 17503 + }, + { + "epoch": 47.694822888283376, + "grad_norm": 5.282832145690918, + "learning_rate": 1.1229286463194529e-05, + "loss": 0.1717, + "step": 17504 + }, + { + "epoch": 47.69754768392371, + "grad_norm": 5.0459113121032715, + "learning_rate": 1.1228410657043369e-05, + "loss": 0.1257, + "step": 17505 + }, + { + "epoch": 47.700272479564035, + "grad_norm": 5.307849884033203, + "learning_rate": 1.1227534841325392e-05, + "loss": 0.1627, + "step": 17506 + }, + { + "epoch": 47.70299727520436, + "grad_norm": 4.829582214355469, + "learning_rate": 1.1226659016047408e-05, + "loss": 0.203, + "step": 17507 + }, + { + "epoch": 47.705722070844686, + "grad_norm": 5.935482501983643, + "learning_rate": 1.1225783181216245e-05, + "loss": 0.2103, + "step": 17508 + }, + { + "epoch": 47.70844686648501, + "grad_norm": 5.641786098480225, + "learning_rate": 1.1224907336838722e-05, + "loss": 0.3269, + "step": 17509 + }, + { + "epoch": 47.71117166212534, + "grad_norm": 5.684382438659668, + "learning_rate": 1.1224031482921662e-05, + "loss": 0.1154, + "step": 17510 + }, + { + "epoch": 47.71389645776567, + "grad_norm": 14.90807819366455, + "learning_rate": 1.122315561947188e-05, + "loss": 0.1667, + "step": 17511 + }, + { + "epoch": 47.716621253406, + "grad_norm": 4.395716190338135, + "learning_rate": 1.1222279746496203e-05, + "loss": 0.107, + "step": 17512 + }, + { + "epoch": 47.71934604904632, + "grad_norm": 4.7664008140563965, + "learning_rate": 1.1221403864001452e-05, + "loss": 0.2012, + "step": 17513 + }, + { + "epoch": 47.72207084468665, + "grad_norm": 5.558382034301758, + "learning_rate": 1.1220527971994447e-05, + "loss": 0.2555, + "step": 17514 + }, + { + "epoch": 47.724795640326974, + "grad_norm": 4.383884906768799, + "learning_rate": 1.1219652070482007e-05, + "loss": 0.1831, + "step": 17515 + }, + { + "epoch": 47.7275204359673, + "grad_norm": 4.921212673187256, + "learning_rate": 1.1218776159470962e-05, + "loss": 0.1973, + "step": 17516 + }, + { + "epoch": 47.73024523160763, + "grad_norm": 7.012421607971191, + "learning_rate": 1.121790023896812e-05, + "loss": 0.3093, + "step": 17517 + }, + { + "epoch": 47.73297002724796, + "grad_norm": 3.847579002380371, + "learning_rate": 1.1217024308980316e-05, + "loss": 0.0867, + "step": 17518 + }, + { + "epoch": 47.735694822888284, + "grad_norm": 5.985230922698975, + "learning_rate": 1.1216148369514361e-05, + "loss": 0.2108, + "step": 17519 + }, + { + "epoch": 47.73841961852861, + "grad_norm": 4.878545761108398, + "learning_rate": 1.1215272420577084e-05, + "loss": 0.1246, + "step": 17520 + }, + { + "epoch": 47.741144414168936, + "grad_norm": 5.384594440460205, + "learning_rate": 1.1214396462175306e-05, + "loss": 0.2503, + "step": 17521 + }, + { + "epoch": 47.74386920980926, + "grad_norm": 4.4147748947143555, + "learning_rate": 1.1213520494315844e-05, + "loss": 0.1209, + "step": 17522 + }, + { + "epoch": 47.746594005449595, + "grad_norm": 5.7944512367248535, + "learning_rate": 1.1212644517005527e-05, + "loss": 0.1086, + "step": 17523 + }, + { + "epoch": 47.74931880108992, + "grad_norm": 4.662676811218262, + "learning_rate": 1.121176853025117e-05, + "loss": 0.1195, + "step": 17524 + }, + { + "epoch": 47.752043596730246, + "grad_norm": 7.815180778503418, + "learning_rate": 1.1210892534059599e-05, + "loss": 0.2545, + "step": 17525 + }, + { + "epoch": 47.75476839237057, + "grad_norm": 9.577667236328125, + "learning_rate": 1.121001652843764e-05, + "loss": 0.2967, + "step": 17526 + }, + { + "epoch": 47.7574931880109, + "grad_norm": 4.301311492919922, + "learning_rate": 1.1209140513392108e-05, + "loss": 0.2221, + "step": 17527 + }, + { + "epoch": 47.76021798365122, + "grad_norm": 6.129922389984131, + "learning_rate": 1.120826448892983e-05, + "loss": 0.3099, + "step": 17528 + }, + { + "epoch": 47.762942779291556, + "grad_norm": 4.257871627807617, + "learning_rate": 1.1207388455057623e-05, + "loss": 0.1592, + "step": 17529 + }, + { + "epoch": 47.76566757493188, + "grad_norm": 5.939739227294922, + "learning_rate": 1.1206512411782318e-05, + "loss": 0.2376, + "step": 17530 + }, + { + "epoch": 47.76839237057221, + "grad_norm": 6.521246910095215, + "learning_rate": 1.1205636359110733e-05, + "loss": 0.1876, + "step": 17531 + }, + { + "epoch": 47.771117166212534, + "grad_norm": 5.632286548614502, + "learning_rate": 1.1204760297049688e-05, + "loss": 0.2123, + "step": 17532 + }, + { + "epoch": 47.77384196185286, + "grad_norm": 6.878013610839844, + "learning_rate": 1.1203884225606012e-05, + "loss": 0.1777, + "step": 17533 + }, + { + "epoch": 47.776566757493185, + "grad_norm": 6.377793312072754, + "learning_rate": 1.1203008144786523e-05, + "loss": 0.1919, + "step": 17534 + }, + { + "epoch": 47.77929155313352, + "grad_norm": 5.528269290924072, + "learning_rate": 1.1202132054598045e-05, + "loss": 0.1104, + "step": 17535 + }, + { + "epoch": 47.782016348773844, + "grad_norm": 8.225494384765625, + "learning_rate": 1.1201255955047401e-05, + "loss": 0.1152, + "step": 17536 + }, + { + "epoch": 47.78474114441417, + "grad_norm": 6.01784086227417, + "learning_rate": 1.1200379846141414e-05, + "loss": 0.1954, + "step": 17537 + }, + { + "epoch": 47.787465940054496, + "grad_norm": 7.055092811584473, + "learning_rate": 1.1199503727886906e-05, + "loss": 0.1979, + "step": 17538 + }, + { + "epoch": 47.79019073569482, + "grad_norm": 5.262936592102051, + "learning_rate": 1.1198627600290705e-05, + "loss": 0.2109, + "step": 17539 + }, + { + "epoch": 47.79291553133515, + "grad_norm": 4.87378454208374, + "learning_rate": 1.119775146335963e-05, + "loss": 0.1322, + "step": 17540 + }, + { + "epoch": 47.79564032697548, + "grad_norm": 10.3624906539917, + "learning_rate": 1.1196875317100507e-05, + "loss": 0.308, + "step": 17541 + }, + { + "epoch": 47.798365122615806, + "grad_norm": 5.652101039886475, + "learning_rate": 1.1195999161520152e-05, + "loss": 0.2001, + "step": 17542 + }, + { + "epoch": 47.80108991825613, + "grad_norm": 8.375594139099121, + "learning_rate": 1.1195122996625399e-05, + "loss": 0.1048, + "step": 17543 + }, + { + "epoch": 47.80381471389646, + "grad_norm": 4.651740550994873, + "learning_rate": 1.1194246822423063e-05, + "loss": 0.1327, + "step": 17544 + }, + { + "epoch": 47.80653950953678, + "grad_norm": 4.437902450561523, + "learning_rate": 1.1193370638919976e-05, + "loss": 0.199, + "step": 17545 + }, + { + "epoch": 47.80926430517711, + "grad_norm": 25.399202346801758, + "learning_rate": 1.119249444612295e-05, + "loss": 0.2416, + "step": 17546 + }, + { + "epoch": 47.81198910081744, + "grad_norm": 7.21932315826416, + "learning_rate": 1.119161824403882e-05, + "loss": 0.2107, + "step": 17547 + }, + { + "epoch": 47.81471389645777, + "grad_norm": 5.15492057800293, + "learning_rate": 1.1190742032674404e-05, + "loss": 0.1763, + "step": 17548 + }, + { + "epoch": 47.817438692098094, + "grad_norm": 4.759138584136963, + "learning_rate": 1.118986581203653e-05, + "loss": 0.2657, + "step": 17549 + }, + { + "epoch": 47.82016348773842, + "grad_norm": 4.424410343170166, + "learning_rate": 1.1188989582132016e-05, + "loss": 0.1495, + "step": 17550 + }, + { + "epoch": 47.822888283378745, + "grad_norm": 5.128902912139893, + "learning_rate": 1.1188113342967692e-05, + "loss": 0.25, + "step": 17551 + }, + { + "epoch": 47.82561307901907, + "grad_norm": 6.951042175292969, + "learning_rate": 1.1187237094550378e-05, + "loss": 0.1469, + "step": 17552 + }, + { + "epoch": 47.828337874659404, + "grad_norm": 5.308253288269043, + "learning_rate": 1.1186360836886903e-05, + "loss": 0.1671, + "step": 17553 + }, + { + "epoch": 47.83106267029973, + "grad_norm": 5.095129489898682, + "learning_rate": 1.1185484569984082e-05, + "loss": 0.1024, + "step": 17554 + }, + { + "epoch": 47.833787465940055, + "grad_norm": 5.261958599090576, + "learning_rate": 1.1184608293848748e-05, + "loss": 0.1865, + "step": 17555 + }, + { + "epoch": 47.83651226158038, + "grad_norm": 6.035133361816406, + "learning_rate": 1.1183732008487723e-05, + "loss": 0.1757, + "step": 17556 + }, + { + "epoch": 47.83923705722071, + "grad_norm": 5.6396565437316895, + "learning_rate": 1.1182855713907831e-05, + "loss": 0.1738, + "step": 17557 + }, + { + "epoch": 47.84196185286103, + "grad_norm": 8.060161590576172, + "learning_rate": 1.1181979410115897e-05, + "loss": 0.2106, + "step": 17558 + }, + { + "epoch": 47.844686648501366, + "grad_norm": 10.053136825561523, + "learning_rate": 1.1181103097118748e-05, + "loss": 0.1968, + "step": 17559 + }, + { + "epoch": 47.84741144414169, + "grad_norm": 5.771396160125732, + "learning_rate": 1.1180226774923204e-05, + "loss": 0.2558, + "step": 17560 + }, + { + "epoch": 47.85013623978202, + "grad_norm": 7.158561706542969, + "learning_rate": 1.1179350443536092e-05, + "loss": 0.2619, + "step": 17561 + }, + { + "epoch": 47.85286103542234, + "grad_norm": 7.704658508300781, + "learning_rate": 1.1178474102964236e-05, + "loss": 0.196, + "step": 17562 + }, + { + "epoch": 47.85558583106267, + "grad_norm": 5.428753852844238, + "learning_rate": 1.117759775321446e-05, + "loss": 0.1781, + "step": 17563 + }, + { + "epoch": 47.858310626702995, + "grad_norm": 4.305299282073975, + "learning_rate": 1.1176721394293593e-05, + "loss": 0.1271, + "step": 17564 + }, + { + "epoch": 47.86103542234333, + "grad_norm": 7.138521194458008, + "learning_rate": 1.1175845026208458e-05, + "loss": 0.2738, + "step": 17565 + }, + { + "epoch": 47.86376021798365, + "grad_norm": 6.107406139373779, + "learning_rate": 1.1174968648965878e-05, + "loss": 0.1829, + "step": 17566 + }, + { + "epoch": 47.86648501362398, + "grad_norm": 5.503721714019775, + "learning_rate": 1.1174092262572682e-05, + "loss": 0.2099, + "step": 17567 + }, + { + "epoch": 47.869209809264305, + "grad_norm": 5.220943450927734, + "learning_rate": 1.1173215867035692e-05, + "loss": 0.0943, + "step": 17568 + }, + { + "epoch": 47.87193460490463, + "grad_norm": 9.411043167114258, + "learning_rate": 1.1172339462361735e-05, + "loss": 0.1556, + "step": 17569 + }, + { + "epoch": 47.87465940054496, + "grad_norm": 5.23283576965332, + "learning_rate": 1.1171463048557636e-05, + "loss": 0.1575, + "step": 17570 + }, + { + "epoch": 47.87738419618529, + "grad_norm": 4.6045026779174805, + "learning_rate": 1.117058662563022e-05, + "loss": 0.1449, + "step": 17571 + }, + { + "epoch": 47.880108991825615, + "grad_norm": 4.9127678871154785, + "learning_rate": 1.1169710193586312e-05, + "loss": 0.1686, + "step": 17572 + }, + { + "epoch": 47.88283378746594, + "grad_norm": 5.103357791900635, + "learning_rate": 1.1168833752432739e-05, + "loss": 0.1299, + "step": 17573 + }, + { + "epoch": 47.88555858310627, + "grad_norm": 6.955219745635986, + "learning_rate": 1.1167957302176327e-05, + "loss": 0.167, + "step": 17574 + }, + { + "epoch": 47.88828337874659, + "grad_norm": 5.665987491607666, + "learning_rate": 1.1167080842823904e-05, + "loss": 0.2096, + "step": 17575 + }, + { + "epoch": 47.89100817438692, + "grad_norm": 5.6638054847717285, + "learning_rate": 1.1166204374382287e-05, + "loss": 0.2489, + "step": 17576 + }, + { + "epoch": 47.89373297002725, + "grad_norm": 4.14143705368042, + "learning_rate": 1.1165327896858314e-05, + "loss": 0.2216, + "step": 17577 + }, + { + "epoch": 47.89645776566758, + "grad_norm": 5.11337947845459, + "learning_rate": 1.1164451410258801e-05, + "loss": 0.285, + "step": 17578 + }, + { + "epoch": 47.8991825613079, + "grad_norm": 5.634405136108398, + "learning_rate": 1.116357491459058e-05, + "loss": 0.163, + "step": 17579 + }, + { + "epoch": 47.90190735694823, + "grad_norm": 4.708236217498779, + "learning_rate": 1.1162698409860471e-05, + "loss": 0.2005, + "step": 17580 + }, + { + "epoch": 47.904632152588555, + "grad_norm": 13.555902481079102, + "learning_rate": 1.1161821896075309e-05, + "loss": 0.1329, + "step": 17581 + }, + { + "epoch": 47.90735694822888, + "grad_norm": 3.5687427520751953, + "learning_rate": 1.1160945373241914e-05, + "loss": 0.1467, + "step": 17582 + }, + { + "epoch": 47.91008174386921, + "grad_norm": 6.148223876953125, + "learning_rate": 1.1160068841367113e-05, + "loss": 0.1637, + "step": 17583 + }, + { + "epoch": 47.91280653950954, + "grad_norm": 5.446135520935059, + "learning_rate": 1.1159192300457733e-05, + "loss": 0.1921, + "step": 17584 + }, + { + "epoch": 47.915531335149865, + "grad_norm": 3.317143678665161, + "learning_rate": 1.1158315750520603e-05, + "loss": 0.1658, + "step": 17585 + }, + { + "epoch": 47.91825613079019, + "grad_norm": 8.444612503051758, + "learning_rate": 1.1157439191562545e-05, + "loss": 0.1204, + "step": 17586 + }, + { + "epoch": 47.920980926430516, + "grad_norm": 4.2756547927856445, + "learning_rate": 1.1156562623590391e-05, + "loss": 0.2194, + "step": 17587 + }, + { + "epoch": 47.92370572207084, + "grad_norm": 5.209869861602783, + "learning_rate": 1.1155686046610958e-05, + "loss": 0.1105, + "step": 17588 + }, + { + "epoch": 47.926430517711175, + "grad_norm": 4.758162975311279, + "learning_rate": 1.1154809460631084e-05, + "loss": 0.1089, + "step": 17589 + }, + { + "epoch": 47.9291553133515, + "grad_norm": 5.233775615692139, + "learning_rate": 1.1153932865657588e-05, + "loss": 0.111, + "step": 17590 + }, + { + "epoch": 47.93188010899183, + "grad_norm": 5.705069065093994, + "learning_rate": 1.1153056261697303e-05, + "loss": 0.3223, + "step": 17591 + }, + { + "epoch": 47.93460490463215, + "grad_norm": 6.418481826782227, + "learning_rate": 1.1152179648757053e-05, + "loss": 0.1835, + "step": 17592 + }, + { + "epoch": 47.93732970027248, + "grad_norm": 6.488126754760742, + "learning_rate": 1.1151303026843664e-05, + "loss": 0.2548, + "step": 17593 + }, + { + "epoch": 47.940054495912804, + "grad_norm": 4.554354667663574, + "learning_rate": 1.1150426395963964e-05, + "loss": 0.1249, + "step": 17594 + }, + { + "epoch": 47.94277929155314, + "grad_norm": 5.311594486236572, + "learning_rate": 1.1149549756124782e-05, + "loss": 0.1586, + "step": 17595 + }, + { + "epoch": 47.94550408719346, + "grad_norm": 6.385234355926514, + "learning_rate": 1.1148673107332942e-05, + "loss": 0.1875, + "step": 17596 + }, + { + "epoch": 47.94822888283379, + "grad_norm": 4.108850479125977, + "learning_rate": 1.1147796449595274e-05, + "loss": 0.2056, + "step": 17597 + }, + { + "epoch": 47.950953678474114, + "grad_norm": 5.044709205627441, + "learning_rate": 1.1146919782918601e-05, + "loss": 0.1718, + "step": 17598 + }, + { + "epoch": 47.95367847411444, + "grad_norm": 4.59542989730835, + "learning_rate": 1.1146043107309754e-05, + "loss": 0.1536, + "step": 17599 + }, + { + "epoch": 47.956403269754766, + "grad_norm": 11.871831893920898, + "learning_rate": 1.1145166422775562e-05, + "loss": 0.2989, + "step": 17600 + }, + { + "epoch": 47.95912806539509, + "grad_norm": 4.525768280029297, + "learning_rate": 1.1144289729322853e-05, + "loss": 0.2321, + "step": 17601 + }, + { + "epoch": 47.961852861035425, + "grad_norm": 5.020235061645508, + "learning_rate": 1.1143413026958448e-05, + "loss": 0.1179, + "step": 17602 + }, + { + "epoch": 47.96457765667575, + "grad_norm": 6.464372634887695, + "learning_rate": 1.1142536315689183e-05, + "loss": 0.2007, + "step": 17603 + }, + { + "epoch": 47.967302452316076, + "grad_norm": 4.812226295471191, + "learning_rate": 1.1141659595521879e-05, + "loss": 0.1165, + "step": 17604 + }, + { + "epoch": 47.9700272479564, + "grad_norm": 5.447220325469971, + "learning_rate": 1.1140782866463369e-05, + "loss": 0.1425, + "step": 17605 + }, + { + "epoch": 47.97275204359673, + "grad_norm": 5.454530239105225, + "learning_rate": 1.1139906128520476e-05, + "loss": 0.2015, + "step": 17606 + }, + { + "epoch": 47.97547683923706, + "grad_norm": 6.178712368011475, + "learning_rate": 1.1139029381700033e-05, + "loss": 0.1644, + "step": 17607 + }, + { + "epoch": 47.97820163487739, + "grad_norm": 4.985306739807129, + "learning_rate": 1.1138152626008864e-05, + "loss": 0.2515, + "step": 17608 + }, + { + "epoch": 47.98092643051771, + "grad_norm": 5.267483234405518, + "learning_rate": 1.1137275861453801e-05, + "loss": 0.1962, + "step": 17609 + }, + { + "epoch": 47.98365122615804, + "grad_norm": 7.079397201538086, + "learning_rate": 1.113639908804167e-05, + "loss": 0.1802, + "step": 17610 + }, + { + "epoch": 47.986376021798364, + "grad_norm": 4.777469158172607, + "learning_rate": 1.1135522305779298e-05, + "loss": 0.1946, + "step": 17611 + }, + { + "epoch": 47.98910081743869, + "grad_norm": 5.747976303100586, + "learning_rate": 1.1134645514673514e-05, + "loss": 0.4596, + "step": 17612 + }, + { + "epoch": 47.991825613079016, + "grad_norm": 5.1898698806762695, + "learning_rate": 1.1133768714731152e-05, + "loss": 0.094, + "step": 17613 + }, + { + "epoch": 47.99455040871935, + "grad_norm": 4.5456390380859375, + "learning_rate": 1.113289190595903e-05, + "loss": 0.1426, + "step": 17614 + }, + { + "epoch": 47.997275204359674, + "grad_norm": 4.944077968597412, + "learning_rate": 1.1132015088363985e-05, + "loss": 0.2636, + "step": 17615 + }, + { + "epoch": 48.0, + "grad_norm": 5.0380401611328125, + "learning_rate": 1.1131138261952845e-05, + "loss": 0.1395, + "step": 17616 + }, + { + "epoch": 48.002724795640326, + "grad_norm": 23.600337982177734, + "learning_rate": 1.1130261426732433e-05, + "loss": 0.2574, + "step": 17617 + }, + { + "epoch": 48.00544959128065, + "grad_norm": 4.308071613311768, + "learning_rate": 1.1129384582709584e-05, + "loss": 0.2789, + "step": 17618 + }, + { + "epoch": 48.00817438692098, + "grad_norm": 5.865283012390137, + "learning_rate": 1.1128507729891123e-05, + "loss": 0.1063, + "step": 17619 + }, + { + "epoch": 48.01089918256131, + "grad_norm": 6.204005718231201, + "learning_rate": 1.1127630868283881e-05, + "loss": 0.224, + "step": 17620 + }, + { + "epoch": 48.013623978201636, + "grad_norm": 7.709722518920898, + "learning_rate": 1.1126753997894683e-05, + "loss": 0.3526, + "step": 17621 + }, + { + "epoch": 48.01634877384196, + "grad_norm": 4.147298336029053, + "learning_rate": 1.1125877118730363e-05, + "loss": 0.1381, + "step": 17622 + }, + { + "epoch": 48.01907356948229, + "grad_norm": 3.798046350479126, + "learning_rate": 1.112500023079775e-05, + "loss": 0.2069, + "step": 17623 + }, + { + "epoch": 48.02179836512261, + "grad_norm": 5.765188694000244, + "learning_rate": 1.1124123334103671e-05, + "loss": 0.1226, + "step": 17624 + }, + { + "epoch": 48.02452316076294, + "grad_norm": 4.516467094421387, + "learning_rate": 1.1123246428654953e-05, + "loss": 0.1196, + "step": 17625 + }, + { + "epoch": 48.02724795640327, + "grad_norm": 5.7083845138549805, + "learning_rate": 1.1122369514458431e-05, + "loss": 0.2256, + "step": 17626 + }, + { + "epoch": 48.0299727520436, + "grad_norm": 4.721480369567871, + "learning_rate": 1.112149259152093e-05, + "loss": 0.0924, + "step": 17627 + }, + { + "epoch": 48.032697547683924, + "grad_norm": 6.462025165557861, + "learning_rate": 1.112061565984928e-05, + "loss": 0.1297, + "step": 17628 + }, + { + "epoch": 48.03542234332425, + "grad_norm": 4.309183597564697, + "learning_rate": 1.1119738719450312e-05, + "loss": 0.2081, + "step": 17629 + }, + { + "epoch": 48.038147138964575, + "grad_norm": 6.586560249328613, + "learning_rate": 1.1118861770330857e-05, + "loss": 0.1908, + "step": 17630 + }, + { + "epoch": 48.0408719346049, + "grad_norm": 4.4471659660339355, + "learning_rate": 1.1117984812497739e-05, + "loss": 0.1516, + "step": 17631 + }, + { + "epoch": 48.043596730245234, + "grad_norm": 4.485964775085449, + "learning_rate": 1.1117107845957793e-05, + "loss": 0.1233, + "step": 17632 + }, + { + "epoch": 48.04632152588556, + "grad_norm": 6.085051536560059, + "learning_rate": 1.1116230870717846e-05, + "loss": 0.2802, + "step": 17633 + }, + { + "epoch": 48.049046321525886, + "grad_norm": 7.2233991622924805, + "learning_rate": 1.1115353886784732e-05, + "loss": 0.2454, + "step": 17634 + }, + { + "epoch": 48.05177111716621, + "grad_norm": 4.020181179046631, + "learning_rate": 1.1114476894165273e-05, + "loss": 0.2004, + "step": 17635 + }, + { + "epoch": 48.05449591280654, + "grad_norm": 4.400680065155029, + "learning_rate": 1.1113599892866309e-05, + "loss": 0.0985, + "step": 17636 + }, + { + "epoch": 48.05722070844686, + "grad_norm": 4.079622268676758, + "learning_rate": 1.1112722882894662e-05, + "loss": 0.1791, + "step": 17637 + }, + { + "epoch": 48.059945504087196, + "grad_norm": 4.532163143157959, + "learning_rate": 1.1111845864257166e-05, + "loss": 0.1177, + "step": 17638 + }, + { + "epoch": 48.06267029972752, + "grad_norm": 5.875760555267334, + "learning_rate": 1.111096883696065e-05, + "loss": 0.2561, + "step": 17639 + }, + { + "epoch": 48.06539509536785, + "grad_norm": 4.709860324859619, + "learning_rate": 1.1110091801011944e-05, + "loss": 0.1643, + "step": 17640 + }, + { + "epoch": 48.06811989100817, + "grad_norm": 6.544802188873291, + "learning_rate": 1.1109214756417876e-05, + "loss": 0.1373, + "step": 17641 + }, + { + "epoch": 48.0708446866485, + "grad_norm": 3.946495532989502, + "learning_rate": 1.1108337703185283e-05, + "loss": 0.2344, + "step": 17642 + }, + { + "epoch": 48.073569482288825, + "grad_norm": 3.775704860687256, + "learning_rate": 1.1107460641320991e-05, + "loss": 0.1107, + "step": 17643 + }, + { + "epoch": 48.07629427792916, + "grad_norm": 5.911627769470215, + "learning_rate": 1.110658357083183e-05, + "loss": 0.1627, + "step": 17644 + }, + { + "epoch": 48.079019073569484, + "grad_norm": 5.471261501312256, + "learning_rate": 1.1105706491724633e-05, + "loss": 0.3694, + "step": 17645 + }, + { + "epoch": 48.08174386920981, + "grad_norm": 4.470165729522705, + "learning_rate": 1.110482940400623e-05, + "loss": 0.1108, + "step": 17646 + }, + { + "epoch": 48.084468664850135, + "grad_norm": 4.8588786125183105, + "learning_rate": 1.110395230768345e-05, + "loss": 0.1053, + "step": 17647 + }, + { + "epoch": 48.08719346049046, + "grad_norm": 7.981325149536133, + "learning_rate": 1.1103075202763125e-05, + "loss": 0.2082, + "step": 17648 + }, + { + "epoch": 48.08991825613079, + "grad_norm": 5.377898693084717, + "learning_rate": 1.1102198089252083e-05, + "loss": 0.1289, + "step": 17649 + }, + { + "epoch": 48.09264305177112, + "grad_norm": 4.502743244171143, + "learning_rate": 1.1101320967157164e-05, + "loss": 0.3021, + "step": 17650 + }, + { + "epoch": 48.095367847411445, + "grad_norm": 3.802295446395874, + "learning_rate": 1.1100443836485187e-05, + "loss": 0.0957, + "step": 17651 + }, + { + "epoch": 48.09809264305177, + "grad_norm": 5.665125846862793, + "learning_rate": 1.1099566697242992e-05, + "loss": 0.1497, + "step": 17652 + }, + { + "epoch": 48.1008174386921, + "grad_norm": 4.261890888214111, + "learning_rate": 1.1098689549437406e-05, + "loss": 0.137, + "step": 17653 + }, + { + "epoch": 48.10354223433242, + "grad_norm": 5.558714389801025, + "learning_rate": 1.1097812393075262e-05, + "loss": 0.2521, + "step": 17654 + }, + { + "epoch": 48.10626702997275, + "grad_norm": 4.837158203125, + "learning_rate": 1.1096935228163387e-05, + "loss": 0.0972, + "step": 17655 + }, + { + "epoch": 48.10899182561308, + "grad_norm": 5.561313629150391, + "learning_rate": 1.1096058054708624e-05, + "loss": 0.2004, + "step": 17656 + }, + { + "epoch": 48.11171662125341, + "grad_norm": 6.110978126525879, + "learning_rate": 1.1095180872717789e-05, + "loss": 0.2212, + "step": 17657 + }, + { + "epoch": 48.11444141689373, + "grad_norm": 4.91227388381958, + "learning_rate": 1.109430368219772e-05, + "loss": 0.1553, + "step": 17658 + }, + { + "epoch": 48.11716621253406, + "grad_norm": 5.304751873016357, + "learning_rate": 1.109342648315525e-05, + "loss": 0.0942, + "step": 17659 + }, + { + "epoch": 48.119891008174385, + "grad_norm": 6.523604869842529, + "learning_rate": 1.1092549275597213e-05, + "loss": 0.2844, + "step": 17660 + }, + { + "epoch": 48.12261580381471, + "grad_norm": 4.470745086669922, + "learning_rate": 1.1091672059530434e-05, + "loss": 0.1423, + "step": 17661 + }, + { + "epoch": 48.12534059945504, + "grad_norm": 4.966081142425537, + "learning_rate": 1.1090794834961751e-05, + "loss": 0.2176, + "step": 17662 + }, + { + "epoch": 48.12806539509537, + "grad_norm": 4.370601177215576, + "learning_rate": 1.108991760189799e-05, + "loss": 0.1076, + "step": 17663 + }, + { + "epoch": 48.130790190735695, + "grad_norm": 4.971834182739258, + "learning_rate": 1.1089040360345991e-05, + "loss": 0.1852, + "step": 17664 + }, + { + "epoch": 48.13351498637602, + "grad_norm": 3.0083553791046143, + "learning_rate": 1.1088163110312576e-05, + "loss": 0.1391, + "step": 17665 + }, + { + "epoch": 48.13623978201635, + "grad_norm": 5.607665538787842, + "learning_rate": 1.108728585180458e-05, + "loss": 0.3079, + "step": 17666 + }, + { + "epoch": 48.13896457765667, + "grad_norm": 4.5860595703125, + "learning_rate": 1.1086408584828841e-05, + "loss": 0.1729, + "step": 17667 + }, + { + "epoch": 48.141689373297005, + "grad_norm": 6.232942581176758, + "learning_rate": 1.1085531309392186e-05, + "loss": 0.086, + "step": 17668 + }, + { + "epoch": 48.14441416893733, + "grad_norm": 5.38991641998291, + "learning_rate": 1.1084654025501446e-05, + "loss": 0.1033, + "step": 17669 + }, + { + "epoch": 48.14713896457766, + "grad_norm": 4.217653751373291, + "learning_rate": 1.1083776733163459e-05, + "loss": 0.12, + "step": 17670 + }, + { + "epoch": 48.14986376021798, + "grad_norm": 3.475024938583374, + "learning_rate": 1.108289943238505e-05, + "loss": 0.1121, + "step": 17671 + }, + { + "epoch": 48.15258855585831, + "grad_norm": 4.399120807647705, + "learning_rate": 1.108202212317306e-05, + "loss": 0.1247, + "step": 17672 + }, + { + "epoch": 48.155313351498634, + "grad_norm": 5.111778736114502, + "learning_rate": 1.1081144805534311e-05, + "loss": 0.2277, + "step": 17673 + }, + { + "epoch": 48.15803814713897, + "grad_norm": 5.794163227081299, + "learning_rate": 1.1080267479475644e-05, + "loss": 0.2108, + "step": 17674 + }, + { + "epoch": 48.16076294277929, + "grad_norm": 5.117379665374756, + "learning_rate": 1.1079390145003886e-05, + "loss": 0.124, + "step": 17675 + }, + { + "epoch": 48.16348773841962, + "grad_norm": 4.971923351287842, + "learning_rate": 1.1078512802125876e-05, + "loss": 0.2581, + "step": 17676 + }, + { + "epoch": 48.166212534059945, + "grad_norm": 4.8347368240356445, + "learning_rate": 1.1077635450848439e-05, + "loss": 0.169, + "step": 17677 + }, + { + "epoch": 48.16893732970027, + "grad_norm": 4.8003249168396, + "learning_rate": 1.1076758091178417e-05, + "loss": 0.2206, + "step": 17678 + }, + { + "epoch": 48.171662125340596, + "grad_norm": 4.9459004402160645, + "learning_rate": 1.1075880723122632e-05, + "loss": 0.1044, + "step": 17679 + }, + { + "epoch": 48.17438692098093, + "grad_norm": 4.366501331329346, + "learning_rate": 1.1075003346687927e-05, + "loss": 0.1245, + "step": 17680 + }, + { + "epoch": 48.177111716621255, + "grad_norm": 5.24885368347168, + "learning_rate": 1.1074125961881128e-05, + "loss": 0.3014, + "step": 17681 + }, + { + "epoch": 48.17983651226158, + "grad_norm": 4.298219203948975, + "learning_rate": 1.1073248568709073e-05, + "loss": 0.1314, + "step": 17682 + }, + { + "epoch": 48.182561307901906, + "grad_norm": 4.7655439376831055, + "learning_rate": 1.1072371167178591e-05, + "loss": 0.2176, + "step": 17683 + }, + { + "epoch": 48.18528610354223, + "grad_norm": 4.6595845222473145, + "learning_rate": 1.1071493757296515e-05, + "loss": 0.1591, + "step": 17684 + }, + { + "epoch": 48.18801089918256, + "grad_norm": 5.491793632507324, + "learning_rate": 1.1070616339069683e-05, + "loss": 0.3436, + "step": 17685 + }, + { + "epoch": 48.19073569482289, + "grad_norm": 3.7247369289398193, + "learning_rate": 1.1069738912504924e-05, + "loss": 0.0642, + "step": 17686 + }, + { + "epoch": 48.19346049046322, + "grad_norm": 4.61937952041626, + "learning_rate": 1.1068861477609072e-05, + "loss": 0.1947, + "step": 17687 + }, + { + "epoch": 48.19618528610354, + "grad_norm": 5.518864154815674, + "learning_rate": 1.1067984034388963e-05, + "loss": 0.1409, + "step": 17688 + }, + { + "epoch": 48.19891008174387, + "grad_norm": 4.456373691558838, + "learning_rate": 1.1067106582851427e-05, + "loss": 0.1544, + "step": 17689 + }, + { + "epoch": 48.201634877384194, + "grad_norm": 6.588265419006348, + "learning_rate": 1.1066229123003302e-05, + "loss": 0.2329, + "step": 17690 + }, + { + "epoch": 48.20435967302452, + "grad_norm": 4.4196457862854, + "learning_rate": 1.1065351654851417e-05, + "loss": 0.115, + "step": 17691 + }, + { + "epoch": 48.20708446866485, + "grad_norm": 8.519316673278809, + "learning_rate": 1.1064474178402607e-05, + "loss": 0.2761, + "step": 17692 + }, + { + "epoch": 48.20980926430518, + "grad_norm": 4.9979963302612305, + "learning_rate": 1.106359669366371e-05, + "loss": 0.1371, + "step": 17693 + }, + { + "epoch": 48.212534059945504, + "grad_norm": 4.272399425506592, + "learning_rate": 1.1062719200641551e-05, + "loss": 0.191, + "step": 17694 + }, + { + "epoch": 48.21525885558583, + "grad_norm": 3.858732223510742, + "learning_rate": 1.1061841699342975e-05, + "loss": 0.1189, + "step": 17695 + }, + { + "epoch": 48.217983651226156, + "grad_norm": 4.810211181640625, + "learning_rate": 1.1060964189774804e-05, + "loss": 0.0938, + "step": 17696 + }, + { + "epoch": 48.22070844686648, + "grad_norm": 4.097233772277832, + "learning_rate": 1.106008667194388e-05, + "loss": 0.1729, + "step": 17697 + }, + { + "epoch": 48.223433242506815, + "grad_norm": 5.586561679840088, + "learning_rate": 1.1059209145857038e-05, + "loss": 0.1512, + "step": 17698 + }, + { + "epoch": 48.22615803814714, + "grad_norm": 5.138467311859131, + "learning_rate": 1.1058331611521105e-05, + "loss": 0.1904, + "step": 17699 + }, + { + "epoch": 48.228882833787466, + "grad_norm": 7.284699440002441, + "learning_rate": 1.1057454068942923e-05, + "loss": 0.1239, + "step": 17700 + }, + { + "epoch": 48.23160762942779, + "grad_norm": 4.594121932983398, + "learning_rate": 1.105657651812932e-05, + "loss": 0.2418, + "step": 17701 + }, + { + "epoch": 48.23433242506812, + "grad_norm": 5.351985454559326, + "learning_rate": 1.1055698959087133e-05, + "loss": 0.0924, + "step": 17702 + }, + { + "epoch": 48.237057220708444, + "grad_norm": 3.99371600151062, + "learning_rate": 1.10548213918232e-05, + "loss": 0.0705, + "step": 17703 + }, + { + "epoch": 48.23978201634878, + "grad_norm": 4.211036205291748, + "learning_rate": 1.1053943816344348e-05, + "loss": 0.3535, + "step": 17704 + }, + { + "epoch": 48.2425068119891, + "grad_norm": 5.788252830505371, + "learning_rate": 1.1053066232657419e-05, + "loss": 0.1866, + "step": 17705 + }, + { + "epoch": 48.24523160762943, + "grad_norm": 4.31191349029541, + "learning_rate": 1.1052188640769242e-05, + "loss": 0.1199, + "step": 17706 + }, + { + "epoch": 48.247956403269754, + "grad_norm": 4.442556381225586, + "learning_rate": 1.1051311040686654e-05, + "loss": 0.2192, + "step": 17707 + }, + { + "epoch": 48.25068119891008, + "grad_norm": 4.344634056091309, + "learning_rate": 1.105043343241649e-05, + "loss": 0.1389, + "step": 17708 + }, + { + "epoch": 48.253405994550405, + "grad_norm": 6.456859111785889, + "learning_rate": 1.1049555815965583e-05, + "loss": 0.2467, + "step": 17709 + }, + { + "epoch": 48.25613079019074, + "grad_norm": 4.2649993896484375, + "learning_rate": 1.1048678191340766e-05, + "loss": 0.1074, + "step": 17710 + }, + { + "epoch": 48.258855585831064, + "grad_norm": 6.091101169586182, + "learning_rate": 1.1047800558548885e-05, + "loss": 0.3346, + "step": 17711 + }, + { + "epoch": 48.26158038147139, + "grad_norm": 5.986828804016113, + "learning_rate": 1.1046922917596761e-05, + "loss": 0.2379, + "step": 17712 + }, + { + "epoch": 48.264305177111716, + "grad_norm": 3.8978688716888428, + "learning_rate": 1.1046045268491237e-05, + "loss": 0.1309, + "step": 17713 + }, + { + "epoch": 48.26702997275204, + "grad_norm": 13.23773193359375, + "learning_rate": 1.1045167611239145e-05, + "loss": 0.2822, + "step": 17714 + }, + { + "epoch": 48.26975476839237, + "grad_norm": 4.466581344604492, + "learning_rate": 1.1044289945847325e-05, + "loss": 0.1192, + "step": 17715 + }, + { + "epoch": 48.2724795640327, + "grad_norm": 4.531101226806641, + "learning_rate": 1.1043412272322605e-05, + "loss": 0.3405, + "step": 17716 + }, + { + "epoch": 48.275204359673026, + "grad_norm": 3.8679039478302, + "learning_rate": 1.1042534590671825e-05, + "loss": 0.2082, + "step": 17717 + }, + { + "epoch": 48.27792915531335, + "grad_norm": 4.445958614349365, + "learning_rate": 1.1041656900901816e-05, + "loss": 0.2833, + "step": 17718 + }, + { + "epoch": 48.28065395095368, + "grad_norm": 4.962905406951904, + "learning_rate": 1.104077920301942e-05, + "loss": 0.1478, + "step": 17719 + }, + { + "epoch": 48.283378746594, + "grad_norm": 5.9054951667785645, + "learning_rate": 1.1039901497031466e-05, + "loss": 0.1653, + "step": 17720 + }, + { + "epoch": 48.28610354223433, + "grad_norm": 5.974760055541992, + "learning_rate": 1.1039023782944798e-05, + "loss": 0.0797, + "step": 17721 + }, + { + "epoch": 48.28882833787466, + "grad_norm": 6.065160274505615, + "learning_rate": 1.1038146060766241e-05, + "loss": 0.1601, + "step": 17722 + }, + { + "epoch": 48.29155313351499, + "grad_norm": 5.21046781539917, + "learning_rate": 1.103726833050264e-05, + "loss": 0.2534, + "step": 17723 + }, + { + "epoch": 48.294277929155314, + "grad_norm": 5.575509548187256, + "learning_rate": 1.1036390592160824e-05, + "loss": 0.2999, + "step": 17724 + }, + { + "epoch": 48.29700272479564, + "grad_norm": 4.694852828979492, + "learning_rate": 1.1035512845747633e-05, + "loss": 0.3159, + "step": 17725 + }, + { + "epoch": 48.299727520435965, + "grad_norm": 5.344362735748291, + "learning_rate": 1.1034635091269899e-05, + "loss": 0.1761, + "step": 17726 + }, + { + "epoch": 48.30245231607629, + "grad_norm": 4.941341400146484, + "learning_rate": 1.1033757328734461e-05, + "loss": 0.2184, + "step": 17727 + }, + { + "epoch": 48.305177111716624, + "grad_norm": 3.8010690212249756, + "learning_rate": 1.1032879558148152e-05, + "loss": 0.1603, + "step": 17728 + }, + { + "epoch": 48.30790190735695, + "grad_norm": 4.248983383178711, + "learning_rate": 1.1032001779517816e-05, + "loss": 0.2535, + "step": 17729 + }, + { + "epoch": 48.310626702997276, + "grad_norm": 6.031062126159668, + "learning_rate": 1.1031123992850279e-05, + "loss": 0.117, + "step": 17730 + }, + { + "epoch": 48.3133514986376, + "grad_norm": 3.9195001125335693, + "learning_rate": 1.1030246198152386e-05, + "loss": 0.0703, + "step": 17731 + }, + { + "epoch": 48.31607629427793, + "grad_norm": 4.528135776519775, + "learning_rate": 1.1029368395430964e-05, + "loss": 0.0937, + "step": 17732 + }, + { + "epoch": 48.31880108991825, + "grad_norm": 5.599699974060059, + "learning_rate": 1.1028490584692856e-05, + "loss": 0.1284, + "step": 17733 + }, + { + "epoch": 48.321525885558586, + "grad_norm": 4.686074733734131, + "learning_rate": 1.1027612765944895e-05, + "loss": 0.1411, + "step": 17734 + }, + { + "epoch": 48.32425068119891, + "grad_norm": 5.885397434234619, + "learning_rate": 1.102673493919392e-05, + "loss": 0.1282, + "step": 17735 + }, + { + "epoch": 48.32697547683924, + "grad_norm": 4.175334930419922, + "learning_rate": 1.1025857104446765e-05, + "loss": 0.1643, + "step": 17736 + }, + { + "epoch": 48.32970027247956, + "grad_norm": 6.086652755737305, + "learning_rate": 1.1024979261710271e-05, + "loss": 0.1401, + "step": 17737 + }, + { + "epoch": 48.33242506811989, + "grad_norm": 6.760055065155029, + "learning_rate": 1.1024101410991268e-05, + "loss": 0.1443, + "step": 17738 + }, + { + "epoch": 48.335149863760215, + "grad_norm": 4.661835670471191, + "learning_rate": 1.1023223552296601e-05, + "loss": 0.3518, + "step": 17739 + }, + { + "epoch": 48.33787465940055, + "grad_norm": 5.910048961639404, + "learning_rate": 1.1022345685633095e-05, + "loss": 0.1884, + "step": 17740 + }, + { + "epoch": 48.34059945504087, + "grad_norm": 4.59259557723999, + "learning_rate": 1.10214678110076e-05, + "loss": 0.1301, + "step": 17741 + }, + { + "epoch": 48.3433242506812, + "grad_norm": 4.3317341804504395, + "learning_rate": 1.1020589928426944e-05, + "loss": 0.1671, + "step": 17742 + }, + { + "epoch": 48.346049046321525, + "grad_norm": 4.421215534210205, + "learning_rate": 1.1019712037897967e-05, + "loss": 0.2242, + "step": 17743 + }, + { + "epoch": 48.34877384196185, + "grad_norm": 4.629679203033447, + "learning_rate": 1.1018834139427503e-05, + "loss": 0.1191, + "step": 17744 + }, + { + "epoch": 48.35149863760218, + "grad_norm": 3.6511409282684326, + "learning_rate": 1.1017956233022394e-05, + "loss": 0.0969, + "step": 17745 + }, + { + "epoch": 48.35422343324251, + "grad_norm": 4.725893020629883, + "learning_rate": 1.1017078318689473e-05, + "loss": 0.1221, + "step": 17746 + }, + { + "epoch": 48.356948228882835, + "grad_norm": 4.646679401397705, + "learning_rate": 1.1016200396435581e-05, + "loss": 0.1594, + "step": 17747 + }, + { + "epoch": 48.35967302452316, + "grad_norm": 4.431085586547852, + "learning_rate": 1.1015322466267552e-05, + "loss": 0.165, + "step": 17748 + }, + { + "epoch": 48.36239782016349, + "grad_norm": 6.013887882232666, + "learning_rate": 1.1014444528192225e-05, + "loss": 0.2449, + "step": 17749 + }, + { + "epoch": 48.36512261580381, + "grad_norm": 4.200595378875732, + "learning_rate": 1.1013566582216436e-05, + "loss": 0.0898, + "step": 17750 + }, + { + "epoch": 48.36784741144414, + "grad_norm": 5.01737117767334, + "learning_rate": 1.1012688628347024e-05, + "loss": 0.0877, + "step": 17751 + }, + { + "epoch": 48.37057220708447, + "grad_norm": 4.337869167327881, + "learning_rate": 1.1011810666590824e-05, + "loss": 0.1086, + "step": 17752 + }, + { + "epoch": 48.3732970027248, + "grad_norm": 4.994279861450195, + "learning_rate": 1.1010932696954675e-05, + "loss": 0.1671, + "step": 17753 + }, + { + "epoch": 48.37602179836512, + "grad_norm": 3.789541721343994, + "learning_rate": 1.1010054719445414e-05, + "loss": 0.224, + "step": 17754 + }, + { + "epoch": 48.37874659400545, + "grad_norm": 5.507375240325928, + "learning_rate": 1.1009176734069881e-05, + "loss": 0.2105, + "step": 17755 + }, + { + "epoch": 48.381471389645775, + "grad_norm": 4.9275126457214355, + "learning_rate": 1.1008298740834911e-05, + "loss": 0.1468, + "step": 17756 + }, + { + "epoch": 48.3841961852861, + "grad_norm": 5.050284385681152, + "learning_rate": 1.1007420739747345e-05, + "loss": 0.2736, + "step": 17757 + }, + { + "epoch": 48.38692098092643, + "grad_norm": 6.128137111663818, + "learning_rate": 1.1006542730814017e-05, + "loss": 0.1295, + "step": 17758 + }, + { + "epoch": 48.38964577656676, + "grad_norm": 4.414264678955078, + "learning_rate": 1.1005664714041768e-05, + "loss": 0.2319, + "step": 17759 + }, + { + "epoch": 48.392370572207085, + "grad_norm": 4.139552116394043, + "learning_rate": 1.1004786689437433e-05, + "loss": 0.191, + "step": 17760 + }, + { + "epoch": 48.39509536784741, + "grad_norm": 5.218533039093018, + "learning_rate": 1.1003908657007851e-05, + "loss": 0.1057, + "step": 17761 + }, + { + "epoch": 48.39782016348774, + "grad_norm": 5.753410339355469, + "learning_rate": 1.100303061675986e-05, + "loss": 0.1035, + "step": 17762 + }, + { + "epoch": 48.40054495912806, + "grad_norm": 4.692521095275879, + "learning_rate": 1.1002152568700302e-05, + "loss": 0.1673, + "step": 17763 + }, + { + "epoch": 48.403269754768395, + "grad_norm": 4.142365455627441, + "learning_rate": 1.1001274512836011e-05, + "loss": 0.1165, + "step": 17764 + }, + { + "epoch": 48.40599455040872, + "grad_norm": 5.406883239746094, + "learning_rate": 1.1000396449173826e-05, + "loss": 0.314, + "step": 17765 + }, + { + "epoch": 48.40871934604905, + "grad_norm": 4.213931083679199, + "learning_rate": 1.0999518377720587e-05, + "loss": 0.1259, + "step": 17766 + }, + { + "epoch": 48.41144414168937, + "grad_norm": 4.824357986450195, + "learning_rate": 1.099864029848313e-05, + "loss": 0.1755, + "step": 17767 + }, + { + "epoch": 48.4141689373297, + "grad_norm": 4.123696804046631, + "learning_rate": 1.0997762211468292e-05, + "loss": 0.2553, + "step": 17768 + }, + { + "epoch": 48.416893732970024, + "grad_norm": 8.818885803222656, + "learning_rate": 1.0996884116682918e-05, + "loss": 0.2187, + "step": 17769 + }, + { + "epoch": 48.41961852861036, + "grad_norm": 4.484251499176025, + "learning_rate": 1.099600601413384e-05, + "loss": 0.1441, + "step": 17770 + }, + { + "epoch": 48.42234332425068, + "grad_norm": 4.239068031311035, + "learning_rate": 1.09951279038279e-05, + "loss": 0.223, + "step": 17771 + }, + { + "epoch": 48.42506811989101, + "grad_norm": 4.117552280426025, + "learning_rate": 1.0994249785771938e-05, + "loss": 0.2856, + "step": 17772 + }, + { + "epoch": 48.427792915531334, + "grad_norm": 6.538234233856201, + "learning_rate": 1.0993371659972786e-05, + "loss": 0.2195, + "step": 17773 + }, + { + "epoch": 48.43051771117166, + "grad_norm": 3.74076509475708, + "learning_rate": 1.0992493526437288e-05, + "loss": 0.1529, + "step": 17774 + }, + { + "epoch": 48.433242506811986, + "grad_norm": 4.483790874481201, + "learning_rate": 1.0991615385172288e-05, + "loss": 0.1295, + "step": 17775 + }, + { + "epoch": 48.43596730245232, + "grad_norm": 4.919607639312744, + "learning_rate": 1.0990737236184615e-05, + "loss": 0.1698, + "step": 17776 + }, + { + "epoch": 48.438692098092645, + "grad_norm": 5.5300140380859375, + "learning_rate": 1.0989859079481114e-05, + "loss": 0.1996, + "step": 17777 + }, + { + "epoch": 48.44141689373297, + "grad_norm": 8.211633682250977, + "learning_rate": 1.098898091506862e-05, + "loss": 0.1651, + "step": 17778 + }, + { + "epoch": 48.444141689373296, + "grad_norm": 5.996046543121338, + "learning_rate": 1.0988102742953975e-05, + "loss": 0.2726, + "step": 17779 + }, + { + "epoch": 48.44686648501362, + "grad_norm": 4.44057035446167, + "learning_rate": 1.0987224563144018e-05, + "loss": 0.0924, + "step": 17780 + }, + { + "epoch": 48.44959128065395, + "grad_norm": 5.444934844970703, + "learning_rate": 1.098634637564559e-05, + "loss": 0.1428, + "step": 17781 + }, + { + "epoch": 48.45231607629428, + "grad_norm": 3.993893623352051, + "learning_rate": 1.0985468180465525e-05, + "loss": 0.1146, + "step": 17782 + }, + { + "epoch": 48.45504087193461, + "grad_norm": 4.247274875640869, + "learning_rate": 1.0984589977610669e-05, + "loss": 0.195, + "step": 17783 + }, + { + "epoch": 48.45776566757493, + "grad_norm": 4.251191139221191, + "learning_rate": 1.0983711767087856e-05, + "loss": 0.1395, + "step": 17784 + }, + { + "epoch": 48.46049046321526, + "grad_norm": 4.462006092071533, + "learning_rate": 1.0982833548903926e-05, + "loss": 0.1132, + "step": 17785 + }, + { + "epoch": 48.463215258855584, + "grad_norm": 3.7238845825195312, + "learning_rate": 1.0981955323065723e-05, + "loss": 0.1435, + "step": 17786 + }, + { + "epoch": 48.46594005449591, + "grad_norm": 4.878916263580322, + "learning_rate": 1.098107708958008e-05, + "loss": 0.2097, + "step": 17787 + }, + { + "epoch": 48.46866485013624, + "grad_norm": 5.452115058898926, + "learning_rate": 1.0980198848453843e-05, + "loss": 0.1718, + "step": 17788 + }, + { + "epoch": 48.47138964577657, + "grad_norm": 4.800817966461182, + "learning_rate": 1.0979320599693848e-05, + "loss": 0.1466, + "step": 17789 + }, + { + "epoch": 48.474114441416894, + "grad_norm": 3.7360053062438965, + "learning_rate": 1.0978442343306936e-05, + "loss": 0.2216, + "step": 17790 + }, + { + "epoch": 48.47683923705722, + "grad_norm": 3.831552505493164, + "learning_rate": 1.0977564079299946e-05, + "loss": 0.1302, + "step": 17791 + }, + { + "epoch": 48.479564032697546, + "grad_norm": 3.7697205543518066, + "learning_rate": 1.0976685807679719e-05, + "loss": 0.2297, + "step": 17792 + }, + { + "epoch": 48.48228882833787, + "grad_norm": 6.190758228302002, + "learning_rate": 1.0975807528453093e-05, + "loss": 0.1273, + "step": 17793 + }, + { + "epoch": 48.485013623978205, + "grad_norm": 4.133101940155029, + "learning_rate": 1.0974929241626912e-05, + "loss": 0.2018, + "step": 17794 + }, + { + "epoch": 48.48773841961853, + "grad_norm": 5.943972110748291, + "learning_rate": 1.0974050947208012e-05, + "loss": 0.1339, + "step": 17795 + }, + { + "epoch": 48.490463215258856, + "grad_norm": 7.384430408477783, + "learning_rate": 1.0973172645203235e-05, + "loss": 0.1288, + "step": 17796 + }, + { + "epoch": 48.49318801089918, + "grad_norm": 4.5868377685546875, + "learning_rate": 1.0972294335619418e-05, + "loss": 0.0871, + "step": 17797 + }, + { + "epoch": 48.49591280653951, + "grad_norm": 4.389998912811279, + "learning_rate": 1.0971416018463406e-05, + "loss": 0.1223, + "step": 17798 + }, + { + "epoch": 48.49863760217983, + "grad_norm": 3.918980598449707, + "learning_rate": 1.0970537693742038e-05, + "loss": 0.2619, + "step": 17799 + }, + { + "epoch": 48.50136239782017, + "grad_norm": 4.901152610778809, + "learning_rate": 1.0969659361462153e-05, + "loss": 0.1312, + "step": 17800 + }, + { + "epoch": 48.50408719346049, + "grad_norm": 4.2105865478515625, + "learning_rate": 1.0968781021630593e-05, + "loss": 0.198, + "step": 17801 + }, + { + "epoch": 48.50681198910082, + "grad_norm": 6.870593070983887, + "learning_rate": 1.0967902674254199e-05, + "loss": 0.1419, + "step": 17802 + }, + { + "epoch": 48.509536784741144, + "grad_norm": 4.70383358001709, + "learning_rate": 1.0967024319339806e-05, + "loss": 0.1556, + "step": 17803 + }, + { + "epoch": 48.51226158038147, + "grad_norm": 4.624796390533447, + "learning_rate": 1.0966145956894259e-05, + "loss": 0.1064, + "step": 17804 + }, + { + "epoch": 48.514986376021795, + "grad_norm": 5.43842077255249, + "learning_rate": 1.0965267586924399e-05, + "loss": 0.2489, + "step": 17805 + }, + { + "epoch": 48.51771117166213, + "grad_norm": 4.296053886413574, + "learning_rate": 1.096438920943707e-05, + "loss": 0.219, + "step": 17806 + }, + { + "epoch": 48.520435967302454, + "grad_norm": 3.50492000579834, + "learning_rate": 1.0963510824439102e-05, + "loss": 0.1002, + "step": 17807 + }, + { + "epoch": 48.52316076294278, + "grad_norm": 5.498265266418457, + "learning_rate": 1.096263243193735e-05, + "loss": 0.1517, + "step": 17808 + }, + { + "epoch": 48.525885558583106, + "grad_norm": 4.727783203125, + "learning_rate": 1.0961754031938643e-05, + "loss": 0.2114, + "step": 17809 + }, + { + "epoch": 48.52861035422343, + "grad_norm": 5.354934215545654, + "learning_rate": 1.096087562444983e-05, + "loss": 0.1706, + "step": 17810 + }, + { + "epoch": 48.53133514986376, + "grad_norm": 4.985727787017822, + "learning_rate": 1.0959997209477747e-05, + "loss": 0.1196, + "step": 17811 + }, + { + "epoch": 48.53405994550409, + "grad_norm": 4.712111473083496, + "learning_rate": 1.0959118787029236e-05, + "loss": 0.1507, + "step": 17812 + }, + { + "epoch": 48.536784741144416, + "grad_norm": 6.8252058029174805, + "learning_rate": 1.0958240357111136e-05, + "loss": 0.2059, + "step": 17813 + }, + { + "epoch": 48.53950953678474, + "grad_norm": 4.87732458114624, + "learning_rate": 1.0957361919730293e-05, + "loss": 0.1522, + "step": 17814 + }, + { + "epoch": 48.54223433242507, + "grad_norm": 3.610193967819214, + "learning_rate": 1.095648347489355e-05, + "loss": 0.1651, + "step": 17815 + }, + { + "epoch": 48.54495912806539, + "grad_norm": 5.8085551261901855, + "learning_rate": 1.095560502260774e-05, + "loss": 0.127, + "step": 17816 + }, + { + "epoch": 48.54768392370572, + "grad_norm": 3.7117836475372314, + "learning_rate": 1.0954726562879709e-05, + "loss": 0.0835, + "step": 17817 + }, + { + "epoch": 48.55040871934605, + "grad_norm": 3.1796491146087646, + "learning_rate": 1.0953848095716302e-05, + "loss": 0.0797, + "step": 17818 + }, + { + "epoch": 48.55313351498638, + "grad_norm": 4.152004241943359, + "learning_rate": 1.0952969621124354e-05, + "loss": 0.1352, + "step": 17819 + }, + { + "epoch": 48.555858310626704, + "grad_norm": 7.578192710876465, + "learning_rate": 1.095209113911071e-05, + "loss": 0.2625, + "step": 17820 + }, + { + "epoch": 48.55858310626703, + "grad_norm": 4.083261013031006, + "learning_rate": 1.0951212649682208e-05, + "loss": 0.0693, + "step": 17821 + }, + { + "epoch": 48.561307901907355, + "grad_norm": 4.408059120178223, + "learning_rate": 1.0950334152845697e-05, + "loss": 0.2066, + "step": 17822 + }, + { + "epoch": 48.56403269754768, + "grad_norm": 5.4838547706604, + "learning_rate": 1.094945564860801e-05, + "loss": 0.138, + "step": 17823 + }, + { + "epoch": 48.566757493188014, + "grad_norm": 4.158769607543945, + "learning_rate": 1.0948577136975998e-05, + "loss": 0.2052, + "step": 17824 + }, + { + "epoch": 48.56948228882834, + "grad_norm": 6.033012866973877, + "learning_rate": 1.0947698617956493e-05, + "loss": 0.1823, + "step": 17825 + }, + { + "epoch": 48.572207084468666, + "grad_norm": 4.139128684997559, + "learning_rate": 1.0946820091556345e-05, + "loss": 0.2572, + "step": 17826 + }, + { + "epoch": 48.57493188010899, + "grad_norm": 4.893764495849609, + "learning_rate": 1.0945941557782389e-05, + "loss": 0.1458, + "step": 17827 + }, + { + "epoch": 48.57765667574932, + "grad_norm": 4.853830337524414, + "learning_rate": 1.0945063016641475e-05, + "loss": 0.1359, + "step": 17828 + }, + { + "epoch": 48.58038147138964, + "grad_norm": 4.356120586395264, + "learning_rate": 1.0944184468140438e-05, + "loss": 0.2207, + "step": 17829 + }, + { + "epoch": 48.583106267029976, + "grad_norm": 4.447303295135498, + "learning_rate": 1.0943305912286122e-05, + "loss": 0.218, + "step": 17830 + }, + { + "epoch": 48.5858310626703, + "grad_norm": 4.7632246017456055, + "learning_rate": 1.0942427349085369e-05, + "loss": 0.1986, + "step": 17831 + }, + { + "epoch": 48.58855585831063, + "grad_norm": 5.0486860275268555, + "learning_rate": 1.0941548778545026e-05, + "loss": 0.2096, + "step": 17832 + }, + { + "epoch": 48.59128065395095, + "grad_norm": 4.926656246185303, + "learning_rate": 1.0940670200671927e-05, + "loss": 0.1386, + "step": 17833 + }, + { + "epoch": 48.59400544959128, + "grad_norm": 6.114628791809082, + "learning_rate": 1.0939791615472925e-05, + "loss": 0.1548, + "step": 17834 + }, + { + "epoch": 48.596730245231605, + "grad_norm": 4.695802211761475, + "learning_rate": 1.093891302295485e-05, + "loss": 0.131, + "step": 17835 + }, + { + "epoch": 48.59945504087194, + "grad_norm": 4.727912902832031, + "learning_rate": 1.0938034423124556e-05, + "loss": 0.2326, + "step": 17836 + }, + { + "epoch": 48.60217983651226, + "grad_norm": 5.18319845199585, + "learning_rate": 1.0937155815988876e-05, + "loss": 0.135, + "step": 17837 + }, + { + "epoch": 48.60490463215259, + "grad_norm": 4.774102210998535, + "learning_rate": 1.0936277201554659e-05, + "loss": 0.1554, + "step": 17838 + }, + { + "epoch": 48.607629427792915, + "grad_norm": 4.480764389038086, + "learning_rate": 1.093539857982874e-05, + "loss": 0.0951, + "step": 17839 + }, + { + "epoch": 48.61035422343324, + "grad_norm": 5.493941307067871, + "learning_rate": 1.0934519950817975e-05, + "loss": 0.145, + "step": 17840 + }, + { + "epoch": 48.61307901907357, + "grad_norm": 12.467942237854004, + "learning_rate": 1.0933641314529194e-05, + "loss": 0.1568, + "step": 17841 + }, + { + "epoch": 48.6158038147139, + "grad_norm": 4.472496509552002, + "learning_rate": 1.0932762670969245e-05, + "loss": 0.3599, + "step": 17842 + }, + { + "epoch": 48.618528610354225, + "grad_norm": 4.142789840698242, + "learning_rate": 1.093188402014497e-05, + "loss": 0.1164, + "step": 17843 + }, + { + "epoch": 48.62125340599455, + "grad_norm": 11.64066219329834, + "learning_rate": 1.0931005362063215e-05, + "loss": 0.0925, + "step": 17844 + }, + { + "epoch": 48.62397820163488, + "grad_norm": 4.357254505157471, + "learning_rate": 1.0930126696730817e-05, + "loss": 0.1776, + "step": 17845 + }, + { + "epoch": 48.6267029972752, + "grad_norm": 4.873206615447998, + "learning_rate": 1.0929248024154623e-05, + "loss": 0.114, + "step": 17846 + }, + { + "epoch": 48.62942779291553, + "grad_norm": 3.566783905029297, + "learning_rate": 1.0928369344341475e-05, + "loss": 0.0887, + "step": 17847 + }, + { + "epoch": 48.63215258855586, + "grad_norm": 4.783731460571289, + "learning_rate": 1.0927490657298217e-05, + "loss": 0.3098, + "step": 17848 + }, + { + "epoch": 48.63487738419619, + "grad_norm": 9.20406436920166, + "learning_rate": 1.092661196303169e-05, + "loss": 0.1396, + "step": 17849 + }, + { + "epoch": 48.63760217983651, + "grad_norm": 5.053576469421387, + "learning_rate": 1.092573326154874e-05, + "loss": 0.1924, + "step": 17850 + }, + { + "epoch": 48.64032697547684, + "grad_norm": 6.097115516662598, + "learning_rate": 1.092485455285621e-05, + "loss": 0.188, + "step": 17851 + }, + { + "epoch": 48.643051771117165, + "grad_norm": 4.562507629394531, + "learning_rate": 1.0923975836960945e-05, + "loss": 0.1523, + "step": 17852 + }, + { + "epoch": 48.64577656675749, + "grad_norm": 5.5145063400268555, + "learning_rate": 1.092309711386978e-05, + "loss": 0.2023, + "step": 17853 + }, + { + "epoch": 48.64850136239782, + "grad_norm": 3.9514994621276855, + "learning_rate": 1.0922218383589571e-05, + "loss": 0.147, + "step": 17854 + }, + { + "epoch": 48.65122615803815, + "grad_norm": 4.680118083953857, + "learning_rate": 1.0921339646127149e-05, + "loss": 0.2202, + "step": 17855 + }, + { + "epoch": 48.653950953678475, + "grad_norm": 5.517587184906006, + "learning_rate": 1.0920460901489367e-05, + "loss": 0.2085, + "step": 17856 + }, + { + "epoch": 48.6566757493188, + "grad_norm": 4.694092750549316, + "learning_rate": 1.0919582149683063e-05, + "loss": 0.1227, + "step": 17857 + }, + { + "epoch": 48.65940054495913, + "grad_norm": 4.772033214569092, + "learning_rate": 1.0918703390715085e-05, + "loss": 0.1051, + "step": 17858 + }, + { + "epoch": 48.66212534059945, + "grad_norm": 4.644705772399902, + "learning_rate": 1.0917824624592275e-05, + "loss": 0.1581, + "step": 17859 + }, + { + "epoch": 48.664850136239785, + "grad_norm": 8.996315956115723, + "learning_rate": 1.0916945851321472e-05, + "loss": 0.137, + "step": 17860 + }, + { + "epoch": 48.66757493188011, + "grad_norm": 3.949974775314331, + "learning_rate": 1.0916067070909526e-05, + "loss": 0.2643, + "step": 17861 + }, + { + "epoch": 48.67029972752044, + "grad_norm": 5.861550807952881, + "learning_rate": 1.0915188283363282e-05, + "loss": 0.2017, + "step": 17862 + }, + { + "epoch": 48.67302452316076, + "grad_norm": 5.690976142883301, + "learning_rate": 1.0914309488689578e-05, + "loss": 0.2188, + "step": 17863 + }, + { + "epoch": 48.67574931880109, + "grad_norm": 4.927664279937744, + "learning_rate": 1.0913430686895261e-05, + "loss": 0.0955, + "step": 17864 + }, + { + "epoch": 48.678474114441414, + "grad_norm": 4.175412654876709, + "learning_rate": 1.0912551877987179e-05, + "loss": 0.1394, + "step": 17865 + }, + { + "epoch": 48.68119891008175, + "grad_norm": 7.90694522857666, + "learning_rate": 1.0911673061972168e-05, + "loss": 0.3055, + "step": 17866 + }, + { + "epoch": 48.68392370572207, + "grad_norm": 5.071043968200684, + "learning_rate": 1.0910794238857082e-05, + "loss": 0.2462, + "step": 17867 + }, + { + "epoch": 48.6866485013624, + "grad_norm": 3.9485936164855957, + "learning_rate": 1.0909915408648755e-05, + "loss": 0.1552, + "step": 17868 + }, + { + "epoch": 48.689373297002724, + "grad_norm": 4.367345809936523, + "learning_rate": 1.0909036571354037e-05, + "loss": 0.0789, + "step": 17869 + }, + { + "epoch": 48.69209809264305, + "grad_norm": 6.0083417892456055, + "learning_rate": 1.0908157726979772e-05, + "loss": 0.2444, + "step": 17870 + }, + { + "epoch": 48.694822888283376, + "grad_norm": 4.69628381729126, + "learning_rate": 1.0907278875532805e-05, + "loss": 0.2709, + "step": 17871 + }, + { + "epoch": 48.69754768392371, + "grad_norm": 5.077993392944336, + "learning_rate": 1.0906400017019976e-05, + "loss": 0.1828, + "step": 17872 + }, + { + "epoch": 48.700272479564035, + "grad_norm": 8.109603881835938, + "learning_rate": 1.0905521151448132e-05, + "loss": 0.194, + "step": 17873 + }, + { + "epoch": 48.70299727520436, + "grad_norm": 4.917482852935791, + "learning_rate": 1.0904642278824122e-05, + "loss": 0.1781, + "step": 17874 + }, + { + "epoch": 48.705722070844686, + "grad_norm": 7.983536243438721, + "learning_rate": 1.0903763399154787e-05, + "loss": 0.1718, + "step": 17875 + }, + { + "epoch": 48.70844686648501, + "grad_norm": 4.195606708526611, + "learning_rate": 1.0902884512446972e-05, + "loss": 0.1059, + "step": 17876 + }, + { + "epoch": 48.71117166212534, + "grad_norm": 4.410258769989014, + "learning_rate": 1.090200561870752e-05, + "loss": 0.1021, + "step": 17877 + }, + { + "epoch": 48.71389645776567, + "grad_norm": 4.368112087249756, + "learning_rate": 1.0901126717943277e-05, + "loss": 0.1574, + "step": 17878 + }, + { + "epoch": 48.716621253406, + "grad_norm": 3.8354806900024414, + "learning_rate": 1.0900247810161091e-05, + "loss": 0.1346, + "step": 17879 + }, + { + "epoch": 48.71934604904632, + "grad_norm": 3.4195239543914795, + "learning_rate": 1.0899368895367802e-05, + "loss": 0.1244, + "step": 17880 + }, + { + "epoch": 48.72207084468665, + "grad_norm": 4.415281295776367, + "learning_rate": 1.0898489973570256e-05, + "loss": 0.1332, + "step": 17881 + }, + { + "epoch": 48.724795640326974, + "grad_norm": 6.313999652862549, + "learning_rate": 1.0897611044775299e-05, + "loss": 0.155, + "step": 17882 + }, + { + "epoch": 48.7275204359673, + "grad_norm": 5.8819804191589355, + "learning_rate": 1.0896732108989775e-05, + "loss": 0.1077, + "step": 17883 + }, + { + "epoch": 48.73024523160763, + "grad_norm": 5.503526210784912, + "learning_rate": 1.0895853166220534e-05, + "loss": 0.1199, + "step": 17884 + }, + { + "epoch": 48.73297002724796, + "grad_norm": 5.5648369789123535, + "learning_rate": 1.0894974216474415e-05, + "loss": 0.1902, + "step": 17885 + }, + { + "epoch": 48.735694822888284, + "grad_norm": 6.182637691497803, + "learning_rate": 1.0894095259758267e-05, + "loss": 0.1331, + "step": 17886 + }, + { + "epoch": 48.73841961852861, + "grad_norm": 5.193334579467773, + "learning_rate": 1.0893216296078932e-05, + "loss": 0.2414, + "step": 17887 + }, + { + "epoch": 48.741144414168936, + "grad_norm": 4.44490909576416, + "learning_rate": 1.0892337325443259e-05, + "loss": 0.2874, + "step": 17888 + }, + { + "epoch": 48.74386920980926, + "grad_norm": 4.241389274597168, + "learning_rate": 1.089145834785809e-05, + "loss": 0.2356, + "step": 17889 + }, + { + "epoch": 48.746594005449595, + "grad_norm": 4.388084888458252, + "learning_rate": 1.0890579363330271e-05, + "loss": 0.1595, + "step": 17890 + }, + { + "epoch": 48.74931880108992, + "grad_norm": 5.427707672119141, + "learning_rate": 1.0889700371866651e-05, + "loss": 0.4053, + "step": 17891 + }, + { + "epoch": 48.752043596730246, + "grad_norm": 4.970544815063477, + "learning_rate": 1.0888821373474073e-05, + "loss": 0.1579, + "step": 17892 + }, + { + "epoch": 48.75476839237057, + "grad_norm": 3.7840118408203125, + "learning_rate": 1.0887942368159384e-05, + "loss": 0.1369, + "step": 17893 + }, + { + "epoch": 48.7574931880109, + "grad_norm": 4.346770763397217, + "learning_rate": 1.0887063355929426e-05, + "loss": 0.0802, + "step": 17894 + }, + { + "epoch": 48.76021798365122, + "grad_norm": 4.558623313903809, + "learning_rate": 1.0886184336791047e-05, + "loss": 0.2136, + "step": 17895 + }, + { + "epoch": 48.762942779291556, + "grad_norm": 4.797070026397705, + "learning_rate": 1.0885305310751095e-05, + "loss": 0.0827, + "step": 17896 + }, + { + "epoch": 48.76566757493188, + "grad_norm": 4.973506450653076, + "learning_rate": 1.0884426277816413e-05, + "loss": 0.1287, + "step": 17897 + }, + { + "epoch": 48.76839237057221, + "grad_norm": 5.083658218383789, + "learning_rate": 1.0883547237993846e-05, + "loss": 0.2286, + "step": 17898 + }, + { + "epoch": 48.771117166212534, + "grad_norm": 5.547389507293701, + "learning_rate": 1.0882668191290242e-05, + "loss": 0.2499, + "step": 17899 + }, + { + "epoch": 48.77384196185286, + "grad_norm": 4.125782012939453, + "learning_rate": 1.0881789137712446e-05, + "loss": 0.1324, + "step": 17900 + }, + { + "epoch": 48.776566757493185, + "grad_norm": 4.395590782165527, + "learning_rate": 1.0880910077267308e-05, + "loss": 0.1084, + "step": 17901 + }, + { + "epoch": 48.77929155313352, + "grad_norm": 4.682062149047852, + "learning_rate": 1.0880031009961667e-05, + "loss": 0.2002, + "step": 17902 + }, + { + "epoch": 48.782016348773844, + "grad_norm": 4.319581508636475, + "learning_rate": 1.0879151935802376e-05, + "loss": 0.1735, + "step": 17903 + }, + { + "epoch": 48.78474114441417, + "grad_norm": 4.89421272277832, + "learning_rate": 1.0878272854796274e-05, + "loss": 0.2112, + "step": 17904 + }, + { + "epoch": 48.787465940054496, + "grad_norm": 3.7251944541931152, + "learning_rate": 1.0877393766950217e-05, + "loss": 0.0972, + "step": 17905 + }, + { + "epoch": 48.79019073569482, + "grad_norm": 4.159662246704102, + "learning_rate": 1.0876514672271041e-05, + "loss": 0.1897, + "step": 17906 + }, + { + "epoch": 48.79291553133515, + "grad_norm": 5.107697486877441, + "learning_rate": 1.0875635570765596e-05, + "loss": 0.3254, + "step": 17907 + }, + { + "epoch": 48.79564032697548, + "grad_norm": 4.411425590515137, + "learning_rate": 1.0874756462440732e-05, + "loss": 0.1898, + "step": 17908 + }, + { + "epoch": 48.798365122615806, + "grad_norm": 3.6324493885040283, + "learning_rate": 1.0873877347303295e-05, + "loss": 0.1586, + "step": 17909 + }, + { + "epoch": 48.80108991825613, + "grad_norm": 5.099329948425293, + "learning_rate": 1.0872998225360126e-05, + "loss": 0.1069, + "step": 17910 + }, + { + "epoch": 48.80381471389646, + "grad_norm": 4.622508525848389, + "learning_rate": 1.0872119096618074e-05, + "loss": 0.1519, + "step": 17911 + }, + { + "epoch": 48.80653950953678, + "grad_norm": 5.181702136993408, + "learning_rate": 1.0871239961083987e-05, + "loss": 0.1398, + "step": 17912 + }, + { + "epoch": 48.80926430517711, + "grad_norm": 3.86995792388916, + "learning_rate": 1.0870360818764716e-05, + "loss": 0.1343, + "step": 17913 + }, + { + "epoch": 48.81198910081744, + "grad_norm": 4.519218444824219, + "learning_rate": 1.0869481669667097e-05, + "loss": 0.1195, + "step": 17914 + }, + { + "epoch": 48.81471389645777, + "grad_norm": 7.27349853515625, + "learning_rate": 1.0868602513797989e-05, + "loss": 0.2016, + "step": 17915 + }, + { + "epoch": 48.817438692098094, + "grad_norm": 3.614105701446533, + "learning_rate": 1.0867723351164223e-05, + "loss": 0.2255, + "step": 17916 + }, + { + "epoch": 48.82016348773842, + "grad_norm": 4.0133442878723145, + "learning_rate": 1.0866844181772662e-05, + "loss": 0.1782, + "step": 17917 + }, + { + "epoch": 48.822888283378745, + "grad_norm": 4.203430652618408, + "learning_rate": 1.0865965005630147e-05, + "loss": 0.1177, + "step": 17918 + }, + { + "epoch": 48.82561307901907, + "grad_norm": 4.711203575134277, + "learning_rate": 1.0865085822743521e-05, + "loss": 0.1313, + "step": 17919 + }, + { + "epoch": 48.828337874659404, + "grad_norm": 6.362487316131592, + "learning_rate": 1.0864206633119637e-05, + "loss": 0.3236, + "step": 17920 + }, + { + "epoch": 48.83106267029973, + "grad_norm": 4.486247539520264, + "learning_rate": 1.0863327436765342e-05, + "loss": 0.211, + "step": 17921 + }, + { + "epoch": 48.833787465940055, + "grad_norm": 5.597450256347656, + "learning_rate": 1.0862448233687475e-05, + "loss": 0.1327, + "step": 17922 + }, + { + "epoch": 48.83651226158038, + "grad_norm": 5.655049800872803, + "learning_rate": 1.0861569023892893e-05, + "loss": 0.139, + "step": 17923 + }, + { + "epoch": 48.83923705722071, + "grad_norm": 4.612045764923096, + "learning_rate": 1.0860689807388437e-05, + "loss": 0.1858, + "step": 17924 + }, + { + "epoch": 48.84196185286103, + "grad_norm": 6.127689838409424, + "learning_rate": 1.0859810584180956e-05, + "loss": 0.207, + "step": 17925 + }, + { + "epoch": 48.844686648501366, + "grad_norm": 4.130288600921631, + "learning_rate": 1.0858931354277299e-05, + "loss": 0.1206, + "step": 17926 + }, + { + "epoch": 48.84741144414169, + "grad_norm": 4.735872268676758, + "learning_rate": 1.0858052117684312e-05, + "loss": 0.1348, + "step": 17927 + }, + { + "epoch": 48.85013623978202, + "grad_norm": 4.604114532470703, + "learning_rate": 1.0857172874408844e-05, + "loss": 0.2167, + "step": 17928 + }, + { + "epoch": 48.85286103542234, + "grad_norm": 4.775600910186768, + "learning_rate": 1.0856293624457741e-05, + "loss": 0.3827, + "step": 17929 + }, + { + "epoch": 48.85558583106267, + "grad_norm": 3.6267833709716797, + "learning_rate": 1.0855414367837848e-05, + "loss": 0.0815, + "step": 17930 + }, + { + "epoch": 48.858310626702995, + "grad_norm": 4.787769317626953, + "learning_rate": 1.0854535104556019e-05, + "loss": 0.0944, + "step": 17931 + }, + { + "epoch": 48.86103542234333, + "grad_norm": 5.059425354003906, + "learning_rate": 1.0853655834619096e-05, + "loss": 0.1597, + "step": 17932 + }, + { + "epoch": 48.86376021798365, + "grad_norm": 4.373810768127441, + "learning_rate": 1.0852776558033928e-05, + "loss": 0.1992, + "step": 17933 + }, + { + "epoch": 48.86648501362398, + "grad_norm": 8.81373405456543, + "learning_rate": 1.0851897274807368e-05, + "loss": 0.2454, + "step": 17934 + }, + { + "epoch": 48.869209809264305, + "grad_norm": 4.95613431930542, + "learning_rate": 1.0851017984946255e-05, + "loss": 0.1094, + "step": 17935 + }, + { + "epoch": 48.87193460490463, + "grad_norm": 4.967520713806152, + "learning_rate": 1.0850138688457441e-05, + "loss": 0.1375, + "step": 17936 + }, + { + "epoch": 48.87465940054496, + "grad_norm": 6.082039833068848, + "learning_rate": 1.0849259385347779e-05, + "loss": 0.2957, + "step": 17937 + }, + { + "epoch": 48.87738419618529, + "grad_norm": 4.3331685066223145, + "learning_rate": 1.0848380075624107e-05, + "loss": 0.2389, + "step": 17938 + }, + { + "epoch": 48.880108991825615, + "grad_norm": 6.027491092681885, + "learning_rate": 1.0847500759293284e-05, + "loss": 0.1063, + "step": 17939 + }, + { + "epoch": 48.88283378746594, + "grad_norm": 3.9232709407806396, + "learning_rate": 1.0846621436362146e-05, + "loss": 0.1005, + "step": 17940 + }, + { + "epoch": 48.88555858310627, + "grad_norm": 3.850847005844116, + "learning_rate": 1.0845742106837553e-05, + "loss": 0.1297, + "step": 17941 + }, + { + "epoch": 48.88828337874659, + "grad_norm": 8.043157577514648, + "learning_rate": 1.0844862770726344e-05, + "loss": 0.1501, + "step": 17942 + }, + { + "epoch": 48.89100817438692, + "grad_norm": 4.68732213973999, + "learning_rate": 1.0843983428035372e-05, + "loss": 0.1081, + "step": 17943 + }, + { + "epoch": 48.89373297002725, + "grad_norm": 4.118488311767578, + "learning_rate": 1.0843104078771485e-05, + "loss": 0.0933, + "step": 17944 + }, + { + "epoch": 48.89645776566758, + "grad_norm": 4.96099853515625, + "learning_rate": 1.0842224722941528e-05, + "loss": 0.0891, + "step": 17945 + }, + { + "epoch": 48.8991825613079, + "grad_norm": 5.396556854248047, + "learning_rate": 1.0841345360552356e-05, + "loss": 0.174, + "step": 17946 + }, + { + "epoch": 48.90190735694823, + "grad_norm": 4.59935998916626, + "learning_rate": 1.084046599161081e-05, + "loss": 0.0983, + "step": 17947 + }, + { + "epoch": 48.904632152588555, + "grad_norm": 5.52337121963501, + "learning_rate": 1.0839586616123743e-05, + "loss": 0.2061, + "step": 17948 + }, + { + "epoch": 48.90735694822888, + "grad_norm": 4.852114677429199, + "learning_rate": 1.0838707234098003e-05, + "loss": 0.1496, + "step": 17949 + }, + { + "epoch": 48.91008174386921, + "grad_norm": 5.507870197296143, + "learning_rate": 1.0837827845540438e-05, + "loss": 0.1866, + "step": 17950 + }, + { + "epoch": 48.91280653950954, + "grad_norm": 6.330488681793213, + "learning_rate": 1.0836948450457894e-05, + "loss": 0.1924, + "step": 17951 + }, + { + "epoch": 48.915531335149865, + "grad_norm": 4.366691589355469, + "learning_rate": 1.0836069048857228e-05, + "loss": 0.1955, + "step": 17952 + }, + { + "epoch": 48.91825613079019, + "grad_norm": 5.374604225158691, + "learning_rate": 1.0835189640745279e-05, + "loss": 0.1514, + "step": 17953 + }, + { + "epoch": 48.920980926430516, + "grad_norm": 4.547908306121826, + "learning_rate": 1.08343102261289e-05, + "loss": 0.2376, + "step": 17954 + }, + { + "epoch": 48.92370572207084, + "grad_norm": 4.376667022705078, + "learning_rate": 1.0833430805014942e-05, + "loss": 0.0857, + "step": 17955 + }, + { + "epoch": 48.926430517711175, + "grad_norm": 4.054291725158691, + "learning_rate": 1.0832551377410252e-05, + "loss": 0.2339, + "step": 17956 + }, + { + "epoch": 48.9291553133515, + "grad_norm": 8.085643768310547, + "learning_rate": 1.0831671943321675e-05, + "loss": 0.1084, + "step": 17957 + }, + { + "epoch": 48.93188010899183, + "grad_norm": 7.077549457550049, + "learning_rate": 1.0830792502756067e-05, + "loss": 0.1158, + "step": 17958 + }, + { + "epoch": 48.93460490463215, + "grad_norm": 4.296553611755371, + "learning_rate": 1.0829913055720268e-05, + "loss": 0.1128, + "step": 17959 + }, + { + "epoch": 48.93732970027248, + "grad_norm": 6.046850204467773, + "learning_rate": 1.082903360222114e-05, + "loss": 0.2121, + "step": 17960 + }, + { + "epoch": 48.940054495912804, + "grad_norm": 4.763850212097168, + "learning_rate": 1.0828154142265521e-05, + "loss": 0.2364, + "step": 17961 + }, + { + "epoch": 48.94277929155314, + "grad_norm": 4.865629196166992, + "learning_rate": 1.0827274675860266e-05, + "loss": 0.1177, + "step": 17962 + }, + { + "epoch": 48.94550408719346, + "grad_norm": 3.9033432006835938, + "learning_rate": 1.0826395203012223e-05, + "loss": 0.0955, + "step": 17963 + }, + { + "epoch": 48.94822888283379, + "grad_norm": 4.03185510635376, + "learning_rate": 1.0825515723728241e-05, + "loss": 0.1818, + "step": 17964 + }, + { + "epoch": 48.950953678474114, + "grad_norm": 6.728121757507324, + "learning_rate": 1.0824636238015167e-05, + "loss": 0.2241, + "step": 17965 + }, + { + "epoch": 48.95367847411444, + "grad_norm": 4.339187145233154, + "learning_rate": 1.0823756745879853e-05, + "loss": 0.1173, + "step": 17966 + }, + { + "epoch": 48.956403269754766, + "grad_norm": 4.03483247756958, + "learning_rate": 1.0822877247329148e-05, + "loss": 0.1961, + "step": 17967 + }, + { + "epoch": 48.95912806539509, + "grad_norm": 6.427977561950684, + "learning_rate": 1.0821997742369901e-05, + "loss": 0.1114, + "step": 17968 + }, + { + "epoch": 48.961852861035425, + "grad_norm": 5.688981533050537, + "learning_rate": 1.0821118231008963e-05, + "loss": 0.1795, + "step": 17969 + }, + { + "epoch": 48.96457765667575, + "grad_norm": 3.970400094985962, + "learning_rate": 1.0820238713253184e-05, + "loss": 0.0742, + "step": 17970 + }, + { + "epoch": 48.967302452316076, + "grad_norm": 4.422605991363525, + "learning_rate": 1.0819359189109409e-05, + "loss": 0.2069, + "step": 17971 + }, + { + "epoch": 48.9700272479564, + "grad_norm": 5.416562557220459, + "learning_rate": 1.0818479658584495e-05, + "loss": 0.1225, + "step": 17972 + }, + { + "epoch": 48.97275204359673, + "grad_norm": 4.591360092163086, + "learning_rate": 1.0817600121685283e-05, + "loss": 0.1456, + "step": 17973 + }, + { + "epoch": 48.97547683923706, + "grad_norm": 5.2208099365234375, + "learning_rate": 1.0816720578418634e-05, + "loss": 0.1883, + "step": 17974 + }, + { + "epoch": 48.97820163487739, + "grad_norm": 4.898530006408691, + "learning_rate": 1.0815841028791385e-05, + "loss": 0.117, + "step": 17975 + }, + { + "epoch": 48.98092643051771, + "grad_norm": 4.976808547973633, + "learning_rate": 1.0814961472810395e-05, + "loss": 0.1436, + "step": 17976 + }, + { + "epoch": 48.98365122615804, + "grad_norm": 5.774075508117676, + "learning_rate": 1.081408191048251e-05, + "loss": 0.1706, + "step": 17977 + }, + { + "epoch": 48.986376021798364, + "grad_norm": 6.600642681121826, + "learning_rate": 1.0813202341814583e-05, + "loss": 0.1776, + "step": 17978 + }, + { + "epoch": 48.98910081743869, + "grad_norm": 6.6657185554504395, + "learning_rate": 1.081232276681346e-05, + "loss": 0.2789, + "step": 17979 + }, + { + "epoch": 48.991825613079016, + "grad_norm": 3.7275452613830566, + "learning_rate": 1.0811443185485998e-05, + "loss": 0.12, + "step": 17980 + }, + { + "epoch": 48.99455040871935, + "grad_norm": 4.625736236572266, + "learning_rate": 1.0810563597839039e-05, + "loss": 0.2359, + "step": 17981 + }, + { + "epoch": 48.997275204359674, + "grad_norm": 4.443175792694092, + "learning_rate": 1.0809684003879438e-05, + "loss": 0.1874, + "step": 17982 + }, + { + "epoch": 49.0, + "grad_norm": 5.10296106338501, + "learning_rate": 1.0808804403614044e-05, + "loss": 0.1693, + "step": 17983 + }, + { + "epoch": 49.002724795640326, + "grad_norm": 4.369555950164795, + "learning_rate": 1.0807924797049707e-05, + "loss": 0.3171, + "step": 17984 + }, + { + "epoch": 49.00544959128065, + "grad_norm": 4.7278056144714355, + "learning_rate": 1.0807045184193274e-05, + "loss": 0.2289, + "step": 17985 + }, + { + "epoch": 49.00817438692098, + "grad_norm": 4.353641986846924, + "learning_rate": 1.0806165565051606e-05, + "loss": 0.1017, + "step": 17986 + }, + { + "epoch": 49.01089918256131, + "grad_norm": 4.177628517150879, + "learning_rate": 1.0805285939631543e-05, + "loss": 0.2429, + "step": 17987 + }, + { + "epoch": 49.013623978201636, + "grad_norm": 4.302578449249268, + "learning_rate": 1.0804406307939938e-05, + "loss": 0.2183, + "step": 17988 + }, + { + "epoch": 49.01634877384196, + "grad_norm": 4.035937786102295, + "learning_rate": 1.0803526669983644e-05, + "loss": 0.1412, + "step": 17989 + }, + { + "epoch": 49.01907356948229, + "grad_norm": 4.200725078582764, + "learning_rate": 1.0802647025769511e-05, + "loss": 0.2043, + "step": 17990 + }, + { + "epoch": 49.02179836512261, + "grad_norm": 5.639614582061768, + "learning_rate": 1.0801767375304388e-05, + "loss": 0.3566, + "step": 17991 + }, + { + "epoch": 49.02452316076294, + "grad_norm": 4.2248945236206055, + "learning_rate": 1.0800887718595127e-05, + "loss": 0.1866, + "step": 17992 + }, + { + "epoch": 49.02724795640327, + "grad_norm": 4.550290584564209, + "learning_rate": 1.0800008055648574e-05, + "loss": 0.1476, + "step": 17993 + }, + { + "epoch": 49.0299727520436, + "grad_norm": 5.263301849365234, + "learning_rate": 1.0799128386471589e-05, + "loss": 0.1947, + "step": 17994 + }, + { + "epoch": 49.032697547683924, + "grad_norm": 5.180984020233154, + "learning_rate": 1.0798248711071016e-05, + "loss": 0.2674, + "step": 17995 + }, + { + "epoch": 49.03542234332425, + "grad_norm": 5.652591228485107, + "learning_rate": 1.0797369029453708e-05, + "loss": 0.1565, + "step": 17996 + }, + { + "epoch": 49.038147138964575, + "grad_norm": 8.383416175842285, + "learning_rate": 1.0796489341626515e-05, + "loss": 0.1568, + "step": 17997 + }, + { + "epoch": 49.0408719346049, + "grad_norm": 4.705984592437744, + "learning_rate": 1.0795609647596292e-05, + "loss": 0.2035, + "step": 17998 + }, + { + "epoch": 49.043596730245234, + "grad_norm": 4.038379669189453, + "learning_rate": 1.0794729947369881e-05, + "loss": 0.1252, + "step": 17999 + }, + { + "epoch": 49.04632152588556, + "grad_norm": 3.832319974899292, + "learning_rate": 1.0793850240954145e-05, + "loss": 0.0876, + "step": 18000 + }, + { + "epoch": 49.049046321525886, + "grad_norm": 4.551717758178711, + "learning_rate": 1.0792970528355925e-05, + "loss": 0.2588, + "step": 18001 + }, + { + "epoch": 49.05177111716621, + "grad_norm": 5.047624111175537, + "learning_rate": 1.0792090809582077e-05, + "loss": 0.1498, + "step": 18002 + }, + { + "epoch": 49.05449591280654, + "grad_norm": 3.703632354736328, + "learning_rate": 1.0791211084639448e-05, + "loss": 0.073, + "step": 18003 + }, + { + "epoch": 49.05722070844686, + "grad_norm": 4.088559150695801, + "learning_rate": 1.0790331353534898e-05, + "loss": 0.1275, + "step": 18004 + }, + { + "epoch": 49.059945504087196, + "grad_norm": 4.196995258331299, + "learning_rate": 1.0789451616275268e-05, + "loss": 0.1185, + "step": 18005 + }, + { + "epoch": 49.06267029972752, + "grad_norm": 4.991589546203613, + "learning_rate": 1.078857187286742e-05, + "loss": 0.1148, + "step": 18006 + }, + { + "epoch": 49.06539509536785, + "grad_norm": 4.610150337219238, + "learning_rate": 1.0787692123318193e-05, + "loss": 0.1873, + "step": 18007 + }, + { + "epoch": 49.06811989100817, + "grad_norm": 3.9155521392822266, + "learning_rate": 1.0786812367634452e-05, + "loss": 0.0902, + "step": 18008 + }, + { + "epoch": 49.0708446866485, + "grad_norm": 5.252546310424805, + "learning_rate": 1.0785932605823035e-05, + "loss": 0.1207, + "step": 18009 + }, + { + "epoch": 49.073569482288825, + "grad_norm": 8.474834442138672, + "learning_rate": 1.0785052837890805e-05, + "loss": 0.1332, + "step": 18010 + }, + { + "epoch": 49.07629427792916, + "grad_norm": 5.846328258514404, + "learning_rate": 1.0784173063844606e-05, + "loss": 0.2301, + "step": 18011 + }, + { + "epoch": 49.079019073569484, + "grad_norm": 5.642576217651367, + "learning_rate": 1.0783293283691292e-05, + "loss": 0.1465, + "step": 18012 + }, + { + "epoch": 49.08174386920981, + "grad_norm": 3.442023992538452, + "learning_rate": 1.0782413497437716e-05, + "loss": 0.1454, + "step": 18013 + }, + { + "epoch": 49.084468664850135, + "grad_norm": 3.6676108837127686, + "learning_rate": 1.078153370509073e-05, + "loss": 0.0996, + "step": 18014 + }, + { + "epoch": 49.08719346049046, + "grad_norm": 3.262950897216797, + "learning_rate": 1.0780653906657183e-05, + "loss": 0.0632, + "step": 18015 + }, + { + "epoch": 49.08991825613079, + "grad_norm": 7.376670837402344, + "learning_rate": 1.0779774102143932e-05, + "loss": 0.1095, + "step": 18016 + }, + { + "epoch": 49.09264305177112, + "grad_norm": 4.342564582824707, + "learning_rate": 1.0778894291557822e-05, + "loss": 0.1534, + "step": 18017 + }, + { + "epoch": 49.095367847411445, + "grad_norm": 3.993922233581543, + "learning_rate": 1.077801447490571e-05, + "loss": 0.0923, + "step": 18018 + }, + { + "epoch": 49.09809264305177, + "grad_norm": 4.462991714477539, + "learning_rate": 1.0777134652194444e-05, + "loss": 0.1785, + "step": 18019 + }, + { + "epoch": 49.1008174386921, + "grad_norm": 3.691136360168457, + "learning_rate": 1.077625482343088e-05, + "loss": 0.1676, + "step": 18020 + }, + { + "epoch": 49.10354223433242, + "grad_norm": 4.868034839630127, + "learning_rate": 1.077537498862187e-05, + "loss": 0.2172, + "step": 18021 + }, + { + "epoch": 49.10626702997275, + "grad_norm": 4.317085266113281, + "learning_rate": 1.077449514777426e-05, + "loss": 0.107, + "step": 18022 + }, + { + "epoch": 49.10899182561308, + "grad_norm": 4.479748725891113, + "learning_rate": 1.0773615300894908e-05, + "loss": 0.2292, + "step": 18023 + }, + { + "epoch": 49.11171662125341, + "grad_norm": 4.770779609680176, + "learning_rate": 1.0772735447990669e-05, + "loss": 0.0942, + "step": 18024 + }, + { + "epoch": 49.11444141689373, + "grad_norm": 4.341066837310791, + "learning_rate": 1.0771855589068387e-05, + "loss": 0.152, + "step": 18025 + }, + { + "epoch": 49.11716621253406, + "grad_norm": 4.202481269836426, + "learning_rate": 1.0770975724134922e-05, + "loss": 0.137, + "step": 18026 + }, + { + "epoch": 49.119891008174385, + "grad_norm": 4.304060935974121, + "learning_rate": 1.077009585319712e-05, + "loss": 0.0935, + "step": 18027 + }, + { + "epoch": 49.12261580381471, + "grad_norm": 4.502399444580078, + "learning_rate": 1.0769215976261838e-05, + "loss": 0.157, + "step": 18028 + }, + { + "epoch": 49.12534059945504, + "grad_norm": 3.793384313583374, + "learning_rate": 1.0768336093335928e-05, + "loss": 0.0881, + "step": 18029 + }, + { + "epoch": 49.12806539509537, + "grad_norm": 5.380351543426514, + "learning_rate": 1.0767456204426236e-05, + "loss": 0.1699, + "step": 18030 + }, + { + "epoch": 49.130790190735695, + "grad_norm": 3.9379515647888184, + "learning_rate": 1.0766576309539624e-05, + "loss": 0.086, + "step": 18031 + }, + { + "epoch": 49.13351498637602, + "grad_norm": 4.494139194488525, + "learning_rate": 1.076569640868294e-05, + "loss": 0.1696, + "step": 18032 + }, + { + "epoch": 49.13623978201635, + "grad_norm": 4.4707932472229, + "learning_rate": 1.0764816501863038e-05, + "loss": 0.1769, + "step": 18033 + }, + { + "epoch": 49.13896457765667, + "grad_norm": 3.2799689769744873, + "learning_rate": 1.0763936589086765e-05, + "loss": 0.1579, + "step": 18034 + }, + { + "epoch": 49.141689373297005, + "grad_norm": 4.310459136962891, + "learning_rate": 1.0763056670360983e-05, + "loss": 0.1066, + "step": 18035 + }, + { + "epoch": 49.14441416893733, + "grad_norm": 7.240693092346191, + "learning_rate": 1.0762176745692536e-05, + "loss": 0.2024, + "step": 18036 + }, + { + "epoch": 49.14713896457766, + "grad_norm": 5.299901485443115, + "learning_rate": 1.0761296815088286e-05, + "loss": 0.2777, + "step": 18037 + }, + { + "epoch": 49.14986376021798, + "grad_norm": 5.850484371185303, + "learning_rate": 1.0760416878555078e-05, + "loss": 0.2594, + "step": 18038 + }, + { + "epoch": 49.15258855585831, + "grad_norm": 4.424598693847656, + "learning_rate": 1.075953693609977e-05, + "loss": 0.1136, + "step": 18039 + }, + { + "epoch": 49.155313351498634, + "grad_norm": 4.08601188659668, + "learning_rate": 1.075865698772921e-05, + "loss": 0.2056, + "step": 18040 + }, + { + "epoch": 49.15803814713897, + "grad_norm": 5.298847675323486, + "learning_rate": 1.0757777033450257e-05, + "loss": 0.1508, + "step": 18041 + }, + { + "epoch": 49.16076294277929, + "grad_norm": 3.9473395347595215, + "learning_rate": 1.0756897073269758e-05, + "loss": 0.0882, + "step": 18042 + }, + { + "epoch": 49.16348773841962, + "grad_norm": 3.3817026615142822, + "learning_rate": 1.0756017107194569e-05, + "loss": 0.0952, + "step": 18043 + }, + { + "epoch": 49.166212534059945, + "grad_norm": 4.317387104034424, + "learning_rate": 1.0755137135231544e-05, + "loss": 0.2264, + "step": 18044 + }, + { + "epoch": 49.16893732970027, + "grad_norm": 5.175841331481934, + "learning_rate": 1.0754257157387536e-05, + "loss": 0.3095, + "step": 18045 + }, + { + "epoch": 49.171662125340596, + "grad_norm": 5.526827335357666, + "learning_rate": 1.0753377173669394e-05, + "loss": 0.1276, + "step": 18046 + }, + { + "epoch": 49.17438692098093, + "grad_norm": 5.604735851287842, + "learning_rate": 1.075249718408398e-05, + "loss": 0.197, + "step": 18047 + }, + { + "epoch": 49.177111716621255, + "grad_norm": 4.368131160736084, + "learning_rate": 1.075161718863814e-05, + "loss": 0.1844, + "step": 18048 + }, + { + "epoch": 49.17983651226158, + "grad_norm": 4.580317974090576, + "learning_rate": 1.0750737187338729e-05, + "loss": 0.1741, + "step": 18049 + }, + { + "epoch": 49.182561307901906, + "grad_norm": 4.791848659515381, + "learning_rate": 1.0749857180192603e-05, + "loss": 0.1884, + "step": 18050 + }, + { + "epoch": 49.18528610354223, + "grad_norm": 4.375580310821533, + "learning_rate": 1.0748977167206611e-05, + "loss": 0.1462, + "step": 18051 + }, + { + "epoch": 49.18801089918256, + "grad_norm": 3.8808562755584717, + "learning_rate": 1.0748097148387609e-05, + "loss": 0.1322, + "step": 18052 + }, + { + "epoch": 49.19073569482289, + "grad_norm": 4.329455375671387, + "learning_rate": 1.0747217123742453e-05, + "loss": 0.1538, + "step": 18053 + }, + { + "epoch": 49.19346049046322, + "grad_norm": 7.597806930541992, + "learning_rate": 1.0746337093277987e-05, + "loss": 0.3893, + "step": 18054 + }, + { + "epoch": 49.19618528610354, + "grad_norm": 5.23726749420166, + "learning_rate": 1.0745457057001079e-05, + "loss": 0.0787, + "step": 18055 + }, + { + "epoch": 49.19891008174387, + "grad_norm": 4.245670795440674, + "learning_rate": 1.0744577014918574e-05, + "loss": 0.2025, + "step": 18056 + }, + { + "epoch": 49.201634877384194, + "grad_norm": 4.973139762878418, + "learning_rate": 1.0743696967037327e-05, + "loss": 0.2124, + "step": 18057 + }, + { + "epoch": 49.20435967302452, + "grad_norm": 5.1174187660217285, + "learning_rate": 1.074281691336419e-05, + "loss": 0.2098, + "step": 18058 + }, + { + "epoch": 49.20708446866485, + "grad_norm": 4.663021564483643, + "learning_rate": 1.0741936853906023e-05, + "loss": 0.1087, + "step": 18059 + }, + { + "epoch": 49.20980926430518, + "grad_norm": 3.7342076301574707, + "learning_rate": 1.0741056788669671e-05, + "loss": 0.2342, + "step": 18060 + }, + { + "epoch": 49.212534059945504, + "grad_norm": 4.790356159210205, + "learning_rate": 1.0740176717661997e-05, + "loss": 0.1091, + "step": 18061 + }, + { + "epoch": 49.21525885558583, + "grad_norm": 5.599277496337891, + "learning_rate": 1.0739296640889844e-05, + "loss": 0.222, + "step": 18062 + }, + { + "epoch": 49.217983651226156, + "grad_norm": 4.795881271362305, + "learning_rate": 1.073841655836008e-05, + "loss": 0.302, + "step": 18063 + }, + { + "epoch": 49.22070844686648, + "grad_norm": 4.898931980133057, + "learning_rate": 1.0737536470079545e-05, + "loss": 0.2092, + "step": 18064 + }, + { + "epoch": 49.223433242506815, + "grad_norm": 4.329406261444092, + "learning_rate": 1.0736656376055106e-05, + "loss": 0.0806, + "step": 18065 + }, + { + "epoch": 49.22615803814714, + "grad_norm": 4.139956474304199, + "learning_rate": 1.0735776276293605e-05, + "loss": 0.2472, + "step": 18066 + }, + { + "epoch": 49.228882833787466, + "grad_norm": 7.229269027709961, + "learning_rate": 1.0734896170801907e-05, + "loss": 0.1951, + "step": 18067 + }, + { + "epoch": 49.23160762942779, + "grad_norm": 3.936602830886841, + "learning_rate": 1.0734016059586858e-05, + "loss": 0.0831, + "step": 18068 + }, + { + "epoch": 49.23433242506812, + "grad_norm": 5.162415504455566, + "learning_rate": 1.0733135942655318e-05, + "loss": 0.2105, + "step": 18069 + }, + { + "epoch": 49.237057220708444, + "grad_norm": 5.241152286529541, + "learning_rate": 1.0732255820014137e-05, + "loss": 0.1564, + "step": 18070 + }, + { + "epoch": 49.23978201634878, + "grad_norm": 3.9510488510131836, + "learning_rate": 1.073137569167017e-05, + "loss": 0.3114, + "step": 18071 + }, + { + "epoch": 49.2425068119891, + "grad_norm": 4.706510543823242, + "learning_rate": 1.0730495557630275e-05, + "loss": 0.0815, + "step": 18072 + }, + { + "epoch": 49.24523160762943, + "grad_norm": 5.237221717834473, + "learning_rate": 1.0729615417901305e-05, + "loss": 0.3302, + "step": 18073 + }, + { + "epoch": 49.247956403269754, + "grad_norm": 4.733431339263916, + "learning_rate": 1.072873527249011e-05, + "loss": 0.2856, + "step": 18074 + }, + { + "epoch": 49.25068119891008, + "grad_norm": 6.3101043701171875, + "learning_rate": 1.0727855121403551e-05, + "loss": 0.165, + "step": 18075 + }, + { + "epoch": 49.253405994550405, + "grad_norm": 3.8238027095794678, + "learning_rate": 1.0726974964648478e-05, + "loss": 0.1038, + "step": 18076 + }, + { + "epoch": 49.25613079019074, + "grad_norm": 6.8419084548950195, + "learning_rate": 1.072609480223175e-05, + "loss": 0.1189, + "step": 18077 + }, + { + "epoch": 49.258855585831064, + "grad_norm": 4.807248592376709, + "learning_rate": 1.0725214634160217e-05, + "loss": 0.099, + "step": 18078 + }, + { + "epoch": 49.26158038147139, + "grad_norm": 3.048029661178589, + "learning_rate": 1.0724334460440735e-05, + "loss": 0.1367, + "step": 18079 + }, + { + "epoch": 49.264305177111716, + "grad_norm": 4.009759426116943, + "learning_rate": 1.0723454281080161e-05, + "loss": 0.1014, + "step": 18080 + }, + { + "epoch": 49.26702997275204, + "grad_norm": 6.9584126472473145, + "learning_rate": 1.072257409608535e-05, + "loss": 0.1801, + "step": 18081 + }, + { + "epoch": 49.26975476839237, + "grad_norm": 3.863007068634033, + "learning_rate": 1.072169390546315e-05, + "loss": 0.0648, + "step": 18082 + }, + { + "epoch": 49.2724795640327, + "grad_norm": 8.388815879821777, + "learning_rate": 1.0720813709220427e-05, + "loss": 0.1313, + "step": 18083 + }, + { + "epoch": 49.275204359673026, + "grad_norm": 4.568418502807617, + "learning_rate": 1.0719933507364027e-05, + "loss": 0.145, + "step": 18084 + }, + { + "epoch": 49.27792915531335, + "grad_norm": 3.9196252822875977, + "learning_rate": 1.071905329990081e-05, + "loss": 0.1087, + "step": 18085 + }, + { + "epoch": 49.28065395095368, + "grad_norm": 4.317632675170898, + "learning_rate": 1.0718173086837626e-05, + "loss": 0.1917, + "step": 18086 + }, + { + "epoch": 49.283378746594, + "grad_norm": 6.338841915130615, + "learning_rate": 1.0717292868181335e-05, + "loss": 0.1705, + "step": 18087 + }, + { + "epoch": 49.28610354223433, + "grad_norm": 4.756075859069824, + "learning_rate": 1.0716412643938788e-05, + "loss": 0.396, + "step": 18088 + }, + { + "epoch": 49.28882833787466, + "grad_norm": 4.442616939544678, + "learning_rate": 1.0715532414116844e-05, + "loss": 0.1386, + "step": 18089 + }, + { + "epoch": 49.29155313351499, + "grad_norm": 4.1272783279418945, + "learning_rate": 1.0714652178722357e-05, + "loss": 0.0948, + "step": 18090 + }, + { + "epoch": 49.294277929155314, + "grad_norm": 4.293083667755127, + "learning_rate": 1.0713771937762183e-05, + "loss": 0.0735, + "step": 18091 + }, + { + "epoch": 49.29700272479564, + "grad_norm": 6.48081636428833, + "learning_rate": 1.0712891691243174e-05, + "loss": 0.148, + "step": 18092 + }, + { + "epoch": 49.299727520435965, + "grad_norm": 5.072357177734375, + "learning_rate": 1.0712011439172189e-05, + "loss": 0.2161, + "step": 18093 + }, + { + "epoch": 49.30245231607629, + "grad_norm": 5.972768783569336, + "learning_rate": 1.071113118155608e-05, + "loss": 0.2425, + "step": 18094 + }, + { + "epoch": 49.305177111716624, + "grad_norm": 4.665791034698486, + "learning_rate": 1.0710250918401709e-05, + "loss": 0.1129, + "step": 18095 + }, + { + "epoch": 49.30790190735695, + "grad_norm": 5.621108531951904, + "learning_rate": 1.070937064971592e-05, + "loss": 0.1445, + "step": 18096 + }, + { + "epoch": 49.310626702997276, + "grad_norm": 5.065195560455322, + "learning_rate": 1.0708490375505577e-05, + "loss": 0.1042, + "step": 18097 + }, + { + "epoch": 49.3133514986376, + "grad_norm": 5.798933506011963, + "learning_rate": 1.0707610095777534e-05, + "loss": 0.1124, + "step": 18098 + }, + { + "epoch": 49.31607629427793, + "grad_norm": 3.935114622116089, + "learning_rate": 1.070672981053865e-05, + "loss": 0.1385, + "step": 18099 + }, + { + "epoch": 49.31880108991825, + "grad_norm": 4.582058906555176, + "learning_rate": 1.0705849519795772e-05, + "loss": 0.1604, + "step": 18100 + }, + { + "epoch": 49.321525885558586, + "grad_norm": 4.798512935638428, + "learning_rate": 1.0704969223555766e-05, + "loss": 0.0866, + "step": 18101 + }, + { + "epoch": 49.32425068119891, + "grad_norm": 3.550732135772705, + "learning_rate": 1.0704088921825477e-05, + "loss": 0.0992, + "step": 18102 + }, + { + "epoch": 49.32697547683924, + "grad_norm": 3.969743490219116, + "learning_rate": 1.0703208614611772e-05, + "loss": 0.127, + "step": 18103 + }, + { + "epoch": 49.32970027247956, + "grad_norm": 5.467886924743652, + "learning_rate": 1.0702328301921495e-05, + "loss": 0.1953, + "step": 18104 + }, + { + "epoch": 49.33242506811989, + "grad_norm": 4.552988052368164, + "learning_rate": 1.0701447983761508e-05, + "loss": 0.2266, + "step": 18105 + }, + { + "epoch": 49.335149863760215, + "grad_norm": 4.883590221405029, + "learning_rate": 1.0700567660138672e-05, + "loss": 0.1233, + "step": 18106 + }, + { + "epoch": 49.33787465940055, + "grad_norm": 7.797180652618408, + "learning_rate": 1.0699687331059834e-05, + "loss": 0.234, + "step": 18107 + }, + { + "epoch": 49.34059945504087, + "grad_norm": 4.586651802062988, + "learning_rate": 1.0698806996531855e-05, + "loss": 0.1167, + "step": 18108 + }, + { + "epoch": 49.3433242506812, + "grad_norm": 4.137990474700928, + "learning_rate": 1.0697926656561588e-05, + "loss": 0.2158, + "step": 18109 + }, + { + "epoch": 49.346049046321525, + "grad_norm": 4.418461322784424, + "learning_rate": 1.069704631115589e-05, + "loss": 0.1901, + "step": 18110 + }, + { + "epoch": 49.34877384196185, + "grad_norm": 5.157928943634033, + "learning_rate": 1.069616596032162e-05, + "loss": 0.2292, + "step": 18111 + }, + { + "epoch": 49.35149863760218, + "grad_norm": 3.745630979537964, + "learning_rate": 1.069528560406563e-05, + "loss": 0.2967, + "step": 18112 + }, + { + "epoch": 49.35422343324251, + "grad_norm": 9.908339500427246, + "learning_rate": 1.069440524239478e-05, + "loss": 0.1697, + "step": 18113 + }, + { + "epoch": 49.356948228882835, + "grad_norm": 4.503567218780518, + "learning_rate": 1.0693524875315924e-05, + "loss": 0.1747, + "step": 18114 + }, + { + "epoch": 49.35967302452316, + "grad_norm": 4.296820163726807, + "learning_rate": 1.0692644502835915e-05, + "loss": 0.0885, + "step": 18115 + }, + { + "epoch": 49.36239782016349, + "grad_norm": 3.2776989936828613, + "learning_rate": 1.0691764124961618e-05, + "loss": 0.2318, + "step": 18116 + }, + { + "epoch": 49.36512261580381, + "grad_norm": 5.114651679992676, + "learning_rate": 1.0690883741699882e-05, + "loss": 0.2653, + "step": 18117 + }, + { + "epoch": 49.36784741144414, + "grad_norm": 8.092615127563477, + "learning_rate": 1.0690003353057567e-05, + "loss": 0.0964, + "step": 18118 + }, + { + "epoch": 49.37057220708447, + "grad_norm": 4.071983337402344, + "learning_rate": 1.0689122959041524e-05, + "loss": 0.3459, + "step": 18119 + }, + { + "epoch": 49.3732970027248, + "grad_norm": 4.370309829711914, + "learning_rate": 1.068824255965862e-05, + "loss": 0.2297, + "step": 18120 + }, + { + "epoch": 49.37602179836512, + "grad_norm": 4.2969207763671875, + "learning_rate": 1.0687362154915699e-05, + "loss": 0.1268, + "step": 18121 + }, + { + "epoch": 49.37874659400545, + "grad_norm": 4.603678226470947, + "learning_rate": 1.0686481744819626e-05, + "loss": 0.1205, + "step": 18122 + }, + { + "epoch": 49.381471389645775, + "grad_norm": 4.215365886688232, + "learning_rate": 1.0685601329377255e-05, + "loss": 0.2, + "step": 18123 + }, + { + "epoch": 49.3841961852861, + "grad_norm": 4.711794376373291, + "learning_rate": 1.0684720908595445e-05, + "loss": 0.2561, + "step": 18124 + }, + { + "epoch": 49.38692098092643, + "grad_norm": 4.6763691902160645, + "learning_rate": 1.0683840482481046e-05, + "loss": 0.184, + "step": 18125 + }, + { + "epoch": 49.38964577656676, + "grad_norm": 5.492859840393066, + "learning_rate": 1.0682960051040924e-05, + "loss": 0.143, + "step": 18126 + }, + { + "epoch": 49.392370572207085, + "grad_norm": 5.027314186096191, + "learning_rate": 1.068207961428193e-05, + "loss": 0.1715, + "step": 18127 + }, + { + "epoch": 49.39509536784741, + "grad_norm": 3.5511410236358643, + "learning_rate": 1.0681199172210923e-05, + "loss": 0.106, + "step": 18128 + }, + { + "epoch": 49.39782016348774, + "grad_norm": 5.608665466308594, + "learning_rate": 1.0680318724834758e-05, + "loss": 0.2715, + "step": 18129 + }, + { + "epoch": 49.40054495912806, + "grad_norm": 5.252490997314453, + "learning_rate": 1.0679438272160292e-05, + "loss": 0.1136, + "step": 18130 + }, + { + "epoch": 49.403269754768395, + "grad_norm": 16.229663848876953, + "learning_rate": 1.067855781419438e-05, + "loss": 0.251, + "step": 18131 + }, + { + "epoch": 49.40599455040872, + "grad_norm": 4.906930446624756, + "learning_rate": 1.0677677350943885e-05, + "loss": 0.1255, + "step": 18132 + }, + { + "epoch": 49.40871934604905, + "grad_norm": 4.8139777183532715, + "learning_rate": 1.0676796882415658e-05, + "loss": 0.0892, + "step": 18133 + }, + { + "epoch": 49.41144414168937, + "grad_norm": 4.291130065917969, + "learning_rate": 1.0675916408616562e-05, + "loss": 0.1425, + "step": 18134 + }, + { + "epoch": 49.4141689373297, + "grad_norm": 5.100659370422363, + "learning_rate": 1.0675035929553448e-05, + "loss": 0.1028, + "step": 18135 + }, + { + "epoch": 49.416893732970024, + "grad_norm": 6.584331035614014, + "learning_rate": 1.0674155445233179e-05, + "loss": 0.1488, + "step": 18136 + }, + { + "epoch": 49.41961852861036, + "grad_norm": 6.058783531188965, + "learning_rate": 1.0673274955662604e-05, + "loss": 0.1697, + "step": 18137 + }, + { + "epoch": 49.42234332425068, + "grad_norm": 4.610739231109619, + "learning_rate": 1.067239446084859e-05, + "loss": 0.2024, + "step": 18138 + }, + { + "epoch": 49.42506811989101, + "grad_norm": 5.838510036468506, + "learning_rate": 1.0671513960797988e-05, + "loss": 0.1562, + "step": 18139 + }, + { + "epoch": 49.427792915531334, + "grad_norm": 3.6795663833618164, + "learning_rate": 1.0670633455517656e-05, + "loss": 0.1504, + "step": 18140 + }, + { + "epoch": 49.43051771117166, + "grad_norm": 3.164093255996704, + "learning_rate": 1.0669752945014452e-05, + "loss": 0.0783, + "step": 18141 + }, + { + "epoch": 49.433242506811986, + "grad_norm": 4.077607154846191, + "learning_rate": 1.0668872429295236e-05, + "loss": 0.1422, + "step": 18142 + }, + { + "epoch": 49.43596730245232, + "grad_norm": 3.4083364009857178, + "learning_rate": 1.0667991908366861e-05, + "loss": 0.0929, + "step": 18143 + }, + { + "epoch": 49.438692098092645, + "grad_norm": 3.873018980026245, + "learning_rate": 1.0667111382236187e-05, + "loss": 0.1183, + "step": 18144 + }, + { + "epoch": 49.44141689373297, + "grad_norm": 4.201215744018555, + "learning_rate": 1.0666230850910071e-05, + "loss": 0.1714, + "step": 18145 + }, + { + "epoch": 49.444141689373296, + "grad_norm": 4.790209770202637, + "learning_rate": 1.0665350314395373e-05, + "loss": 0.1645, + "step": 18146 + }, + { + "epoch": 49.44686648501362, + "grad_norm": 4.523641586303711, + "learning_rate": 1.0664469772698945e-05, + "loss": 0.0816, + "step": 18147 + }, + { + "epoch": 49.44959128065395, + "grad_norm": 5.0345258712768555, + "learning_rate": 1.0663589225827648e-05, + "loss": 0.1731, + "step": 18148 + }, + { + "epoch": 49.45231607629428, + "grad_norm": 3.8730554580688477, + "learning_rate": 1.066270867378834e-05, + "loss": 0.1498, + "step": 18149 + }, + { + "epoch": 49.45504087193461, + "grad_norm": 4.271957874298096, + "learning_rate": 1.0661828116587878e-05, + "loss": 0.1517, + "step": 18150 + }, + { + "epoch": 49.45776566757493, + "grad_norm": 8.417770385742188, + "learning_rate": 1.066094755423312e-05, + "loss": 0.0968, + "step": 18151 + }, + { + "epoch": 49.46049046321526, + "grad_norm": 4.589767932891846, + "learning_rate": 1.0660066986730925e-05, + "loss": 0.2009, + "step": 18152 + }, + { + "epoch": 49.463215258855584, + "grad_norm": 5.2906413078308105, + "learning_rate": 1.0659186414088148e-05, + "loss": 0.1702, + "step": 18153 + }, + { + "epoch": 49.46594005449591, + "grad_norm": 5.601592063903809, + "learning_rate": 1.0658305836311651e-05, + "loss": 0.1856, + "step": 18154 + }, + { + "epoch": 49.46866485013624, + "grad_norm": 6.945178031921387, + "learning_rate": 1.0657425253408287e-05, + "loss": 0.2302, + "step": 18155 + }, + { + "epoch": 49.47138964577657, + "grad_norm": 4.493739128112793, + "learning_rate": 1.0656544665384918e-05, + "loss": 0.0931, + "step": 18156 + }, + { + "epoch": 49.474114441416894, + "grad_norm": 7.880306720733643, + "learning_rate": 1.0655664072248395e-05, + "loss": 0.0797, + "step": 18157 + }, + { + "epoch": 49.47683923705722, + "grad_norm": 4.8007707595825195, + "learning_rate": 1.0654783474005587e-05, + "loss": 0.1721, + "step": 18158 + }, + { + "epoch": 49.479564032697546, + "grad_norm": 6.430230617523193, + "learning_rate": 1.0653902870663344e-05, + "loss": 0.0995, + "step": 18159 + }, + { + "epoch": 49.48228882833787, + "grad_norm": 4.005404472351074, + "learning_rate": 1.0653022262228527e-05, + "loss": 0.2804, + "step": 18160 + }, + { + "epoch": 49.485013623978205, + "grad_norm": 6.052149772644043, + "learning_rate": 1.0652141648707994e-05, + "loss": 0.2013, + "step": 18161 + }, + { + "epoch": 49.48773841961853, + "grad_norm": 4.363229751586914, + "learning_rate": 1.0651261030108603e-05, + "loss": 0.1064, + "step": 18162 + }, + { + "epoch": 49.490463215258856, + "grad_norm": 4.8147759437561035, + "learning_rate": 1.065038040643721e-05, + "loss": 0.1154, + "step": 18163 + }, + { + "epoch": 49.49318801089918, + "grad_norm": 6.709095478057861, + "learning_rate": 1.064949977770068e-05, + "loss": 0.2924, + "step": 18164 + }, + { + "epoch": 49.49591280653951, + "grad_norm": 4.5668840408325195, + "learning_rate": 1.064861914390586e-05, + "loss": 0.0771, + "step": 18165 + }, + { + "epoch": 49.49863760217983, + "grad_norm": 4.888486862182617, + "learning_rate": 1.064773850505962e-05, + "loss": 0.2727, + "step": 18166 + }, + { + "epoch": 49.50136239782017, + "grad_norm": 5.187841892242432, + "learning_rate": 1.0646857861168811e-05, + "loss": 0.2116, + "step": 18167 + }, + { + "epoch": 49.50408719346049, + "grad_norm": 4.599339485168457, + "learning_rate": 1.0645977212240297e-05, + "loss": 0.207, + "step": 18168 + }, + { + "epoch": 49.50681198910082, + "grad_norm": 4.81515645980835, + "learning_rate": 1.064509655828093e-05, + "loss": 0.2151, + "step": 18169 + }, + { + "epoch": 49.509536784741144, + "grad_norm": 4.856693744659424, + "learning_rate": 1.0644215899297574e-05, + "loss": 0.2136, + "step": 18170 + }, + { + "epoch": 49.51226158038147, + "grad_norm": 4.939047813415527, + "learning_rate": 1.0643335235297084e-05, + "loss": 0.0968, + "step": 18171 + }, + { + "epoch": 49.514986376021795, + "grad_norm": 6.327423095703125, + "learning_rate": 1.0642454566286319e-05, + "loss": 0.2723, + "step": 18172 + }, + { + "epoch": 49.51771117166213, + "grad_norm": 5.196204662322998, + "learning_rate": 1.064157389227214e-05, + "loss": 0.2142, + "step": 18173 + }, + { + "epoch": 49.520435967302454, + "grad_norm": 5.256061553955078, + "learning_rate": 1.0640693213261404e-05, + "loss": 0.1198, + "step": 18174 + }, + { + "epoch": 49.52316076294278, + "grad_norm": 3.857426404953003, + "learning_rate": 1.0639812529260967e-05, + "loss": 0.0641, + "step": 18175 + }, + { + "epoch": 49.525885558583106, + "grad_norm": 5.198551654815674, + "learning_rate": 1.0638931840277696e-05, + "loss": 0.1856, + "step": 18176 + }, + { + "epoch": 49.52861035422343, + "grad_norm": 4.237199306488037, + "learning_rate": 1.063805114631844e-05, + "loss": 0.166, + "step": 18177 + }, + { + "epoch": 49.53133514986376, + "grad_norm": 3.5271968841552734, + "learning_rate": 1.0637170447390063e-05, + "loss": 0.065, + "step": 18178 + }, + { + "epoch": 49.53405994550409, + "grad_norm": 3.8488316535949707, + "learning_rate": 1.0636289743499424e-05, + "loss": 0.1502, + "step": 18179 + }, + { + "epoch": 49.536784741144416, + "grad_norm": 12.370738983154297, + "learning_rate": 1.0635409034653383e-05, + "loss": 0.1002, + "step": 18180 + }, + { + "epoch": 49.53950953678474, + "grad_norm": 6.158624649047852, + "learning_rate": 1.0634528320858792e-05, + "loss": 0.1541, + "step": 18181 + }, + { + "epoch": 49.54223433242507, + "grad_norm": 4.370608806610107, + "learning_rate": 1.0633647602122521e-05, + "loss": 0.0896, + "step": 18182 + }, + { + "epoch": 49.54495912806539, + "grad_norm": 4.981345176696777, + "learning_rate": 1.0632766878451416e-05, + "loss": 0.2075, + "step": 18183 + }, + { + "epoch": 49.54768392370572, + "grad_norm": 8.145125389099121, + "learning_rate": 1.0631886149852347e-05, + "loss": 0.1988, + "step": 18184 + }, + { + "epoch": 49.55040871934605, + "grad_norm": 12.380273818969727, + "learning_rate": 1.0631005416332168e-05, + "loss": 0.1242, + "step": 18185 + }, + { + "epoch": 49.55313351498638, + "grad_norm": 4.580547332763672, + "learning_rate": 1.063012467789774e-05, + "loss": 0.2128, + "step": 18186 + }, + { + "epoch": 49.555858310626704, + "grad_norm": 6.241352558135986, + "learning_rate": 1.0629243934555919e-05, + "loss": 0.1936, + "step": 18187 + }, + { + "epoch": 49.55858310626703, + "grad_norm": 4.160164833068848, + "learning_rate": 1.062836318631357e-05, + "loss": 0.1873, + "step": 18188 + }, + { + "epoch": 49.561307901907355, + "grad_norm": 6.1277995109558105, + "learning_rate": 1.0627482433177547e-05, + "loss": 0.3317, + "step": 18189 + }, + { + "epoch": 49.56403269754768, + "grad_norm": 4.253282070159912, + "learning_rate": 1.0626601675154713e-05, + "loss": 0.1541, + "step": 18190 + }, + { + "epoch": 49.566757493188014, + "grad_norm": 4.2864766120910645, + "learning_rate": 1.0625720912251923e-05, + "loss": 0.1371, + "step": 18191 + }, + { + "epoch": 49.56948228882834, + "grad_norm": 9.15553092956543, + "learning_rate": 1.0624840144476036e-05, + "loss": 0.1497, + "step": 18192 + }, + { + "epoch": 49.572207084468666, + "grad_norm": 5.953794479370117, + "learning_rate": 1.0623959371833918e-05, + "loss": 0.1323, + "step": 18193 + }, + { + "epoch": 49.57493188010899, + "grad_norm": 6.5279459953308105, + "learning_rate": 1.0623078594332424e-05, + "loss": 0.1452, + "step": 18194 + }, + { + "epoch": 49.57765667574932, + "grad_norm": 9.369184494018555, + "learning_rate": 1.0622197811978414e-05, + "loss": 0.1026, + "step": 18195 + }, + { + "epoch": 49.58038147138964, + "grad_norm": 4.457242012023926, + "learning_rate": 1.0621317024778747e-05, + "loss": 0.2238, + "step": 18196 + }, + { + "epoch": 49.583106267029976, + "grad_norm": 8.569912910461426, + "learning_rate": 1.062043623274028e-05, + "loss": 0.1649, + "step": 18197 + }, + { + "epoch": 49.5858310626703, + "grad_norm": 4.9559736251831055, + "learning_rate": 1.0619555435869881e-05, + "loss": 0.0911, + "step": 18198 + }, + { + "epoch": 49.58855585831063, + "grad_norm": 4.798398017883301, + "learning_rate": 1.0618674634174402e-05, + "loss": 0.1421, + "step": 18199 + }, + { + "epoch": 49.59128065395095, + "grad_norm": 5.347679615020752, + "learning_rate": 1.0617793827660703e-05, + "loss": 0.1805, + "step": 18200 + }, + { + "epoch": 49.59400544959128, + "grad_norm": 3.8213841915130615, + "learning_rate": 1.0616913016335648e-05, + "loss": 0.0836, + "step": 18201 + }, + { + "epoch": 49.596730245231605, + "grad_norm": 5.150428295135498, + "learning_rate": 1.0616032200206094e-05, + "loss": 0.1916, + "step": 18202 + }, + { + "epoch": 49.59945504087194, + "grad_norm": 4.489078521728516, + "learning_rate": 1.0615151379278901e-05, + "loss": 0.1812, + "step": 18203 + }, + { + "epoch": 49.60217983651226, + "grad_norm": 4.463815689086914, + "learning_rate": 1.0614270553560928e-05, + "loss": 0.0996, + "step": 18204 + }, + { + "epoch": 49.60490463215259, + "grad_norm": 9.333776473999023, + "learning_rate": 1.0613389723059037e-05, + "loss": 0.1649, + "step": 18205 + }, + { + "epoch": 49.607629427792915, + "grad_norm": 3.7884669303894043, + "learning_rate": 1.0612508887780085e-05, + "loss": 0.1649, + "step": 18206 + }, + { + "epoch": 49.61035422343324, + "grad_norm": 4.525467872619629, + "learning_rate": 1.0611628047730935e-05, + "loss": 0.1861, + "step": 18207 + }, + { + "epoch": 49.61307901907357, + "grad_norm": 7.235852241516113, + "learning_rate": 1.0610747202918442e-05, + "loss": 0.13, + "step": 18208 + }, + { + "epoch": 49.6158038147139, + "grad_norm": 9.90200138092041, + "learning_rate": 1.0609866353349474e-05, + "loss": 0.1544, + "step": 18209 + }, + { + "epoch": 49.618528610354225, + "grad_norm": 4.8709869384765625, + "learning_rate": 1.0608985499030884e-05, + "loss": 0.0988, + "step": 18210 + }, + { + "epoch": 49.62125340599455, + "grad_norm": 6.361578941345215, + "learning_rate": 1.0608104639969535e-05, + "loss": 0.1463, + "step": 18211 + }, + { + "epoch": 49.62397820163488, + "grad_norm": 6.684064865112305, + "learning_rate": 1.0607223776172287e-05, + "loss": 0.2931, + "step": 18212 + }, + { + "epoch": 49.6267029972752, + "grad_norm": 4.376237869262695, + "learning_rate": 1.0606342907645998e-05, + "loss": 0.1451, + "step": 18213 + }, + { + "epoch": 49.62942779291553, + "grad_norm": 5.746951580047607, + "learning_rate": 1.0605462034397532e-05, + "loss": 0.16, + "step": 18214 + }, + { + "epoch": 49.63215258855586, + "grad_norm": 4.049665927886963, + "learning_rate": 1.060458115643375e-05, + "loss": 0.2061, + "step": 18215 + }, + { + "epoch": 49.63487738419619, + "grad_norm": 5.825301170349121, + "learning_rate": 1.0603700273761504e-05, + "loss": 0.1265, + "step": 18216 + }, + { + "epoch": 49.63760217983651, + "grad_norm": 3.50651478767395, + "learning_rate": 1.060281938638766e-05, + "loss": 0.0803, + "step": 18217 + }, + { + "epoch": 49.64032697547684, + "grad_norm": 3.667231559753418, + "learning_rate": 1.060193849431908e-05, + "loss": 0.1276, + "step": 18218 + }, + { + "epoch": 49.643051771117165, + "grad_norm": 4.3791327476501465, + "learning_rate": 1.0601057597562623e-05, + "loss": 0.2172, + "step": 18219 + }, + { + "epoch": 49.64577656675749, + "grad_norm": 5.698973178863525, + "learning_rate": 1.0600176696125146e-05, + "loss": 0.1031, + "step": 18220 + }, + { + "epoch": 49.64850136239782, + "grad_norm": 7.409605979919434, + "learning_rate": 1.0599295790013515e-05, + "loss": 0.1568, + "step": 18221 + }, + { + "epoch": 49.65122615803815, + "grad_norm": 5.001932144165039, + "learning_rate": 1.0598414879234587e-05, + "loss": 0.2364, + "step": 18222 + }, + { + "epoch": 49.653950953678475, + "grad_norm": 4.489975929260254, + "learning_rate": 1.0597533963795223e-05, + "loss": 0.093, + "step": 18223 + }, + { + "epoch": 49.6566757493188, + "grad_norm": 6.3259596824646, + "learning_rate": 1.0596653043702283e-05, + "loss": 0.1477, + "step": 18224 + }, + { + "epoch": 49.65940054495913, + "grad_norm": 7.116461277008057, + "learning_rate": 1.0595772118962631e-05, + "loss": 0.3108, + "step": 18225 + }, + { + "epoch": 49.66212534059945, + "grad_norm": 4.958671569824219, + "learning_rate": 1.0594891189583119e-05, + "loss": 0.0998, + "step": 18226 + }, + { + "epoch": 49.664850136239785, + "grad_norm": 15.675604820251465, + "learning_rate": 1.059401025557062e-05, + "loss": 0.1984, + "step": 18227 + }, + { + "epoch": 49.66757493188011, + "grad_norm": 6.726870536804199, + "learning_rate": 1.0593129316931985e-05, + "loss": 0.1522, + "step": 18228 + }, + { + "epoch": 49.67029972752044, + "grad_norm": 5.004068374633789, + "learning_rate": 1.0592248373674078e-05, + "loss": 0.2209, + "step": 18229 + }, + { + "epoch": 49.67302452316076, + "grad_norm": 4.550838470458984, + "learning_rate": 1.059136742580376e-05, + "loss": 0.0881, + "step": 18230 + }, + { + "epoch": 49.67574931880109, + "grad_norm": 4.816982746124268, + "learning_rate": 1.0590486473327894e-05, + "loss": 0.1794, + "step": 18231 + }, + { + "epoch": 49.678474114441414, + "grad_norm": 5.47058629989624, + "learning_rate": 1.0589605516253333e-05, + "loss": 0.2464, + "step": 18232 + }, + { + "epoch": 49.68119891008175, + "grad_norm": 6.425475120544434, + "learning_rate": 1.058872455458695e-05, + "loss": 0.1028, + "step": 18233 + }, + { + "epoch": 49.68392370572207, + "grad_norm": 5.621904373168945, + "learning_rate": 1.0587843588335592e-05, + "loss": 0.2819, + "step": 18234 + }, + { + "epoch": 49.6866485013624, + "grad_norm": 4.362329959869385, + "learning_rate": 1.058696261750613e-05, + "loss": 0.1758, + "step": 18235 + }, + { + "epoch": 49.689373297002724, + "grad_norm": 6.487398147583008, + "learning_rate": 1.0586081642105423e-05, + "loss": 0.2571, + "step": 18236 + }, + { + "epoch": 49.69209809264305, + "grad_norm": 5.748312473297119, + "learning_rate": 1.0585200662140334e-05, + "loss": 0.3426, + "step": 18237 + }, + { + "epoch": 49.694822888283376, + "grad_norm": 4.671896934509277, + "learning_rate": 1.0584319677617716e-05, + "loss": 0.1777, + "step": 18238 + }, + { + "epoch": 49.69754768392371, + "grad_norm": 4.370096206665039, + "learning_rate": 1.0583438688544438e-05, + "loss": 0.1786, + "step": 18239 + }, + { + "epoch": 49.700272479564035, + "grad_norm": 4.892489433288574, + "learning_rate": 1.0582557694927356e-05, + "loss": 0.139, + "step": 18240 + }, + { + "epoch": 49.70299727520436, + "grad_norm": 4.985652923583984, + "learning_rate": 1.0581676696773336e-05, + "loss": 0.3533, + "step": 18241 + }, + { + "epoch": 49.705722070844686, + "grad_norm": 7.21626615524292, + "learning_rate": 1.0580795694089234e-05, + "loss": 0.1689, + "step": 18242 + }, + { + "epoch": 49.70844686648501, + "grad_norm": 3.7203969955444336, + "learning_rate": 1.0579914686881914e-05, + "loss": 0.0635, + "step": 18243 + }, + { + "epoch": 49.71117166212534, + "grad_norm": 4.61190128326416, + "learning_rate": 1.0579033675158236e-05, + "loss": 0.1296, + "step": 18244 + }, + { + "epoch": 49.71389645776567, + "grad_norm": 4.63526725769043, + "learning_rate": 1.0578152658925066e-05, + "loss": 0.2572, + "step": 18245 + }, + { + "epoch": 49.716621253406, + "grad_norm": 5.661147117614746, + "learning_rate": 1.0577271638189261e-05, + "loss": 0.2119, + "step": 18246 + }, + { + "epoch": 49.71934604904632, + "grad_norm": 5.838468074798584, + "learning_rate": 1.0576390612957683e-05, + "loss": 0.1644, + "step": 18247 + }, + { + "epoch": 49.72207084468665, + "grad_norm": 4.0203962326049805, + "learning_rate": 1.057550958323719e-05, + "loss": 0.0692, + "step": 18248 + }, + { + "epoch": 49.724795640326974, + "grad_norm": 5.284526824951172, + "learning_rate": 1.0574628549034653e-05, + "loss": 0.1809, + "step": 18249 + }, + { + "epoch": 49.7275204359673, + "grad_norm": 5.219470024108887, + "learning_rate": 1.0573747510356923e-05, + "loss": 0.1761, + "step": 18250 + }, + { + "epoch": 49.73024523160763, + "grad_norm": 4.994770526885986, + "learning_rate": 1.0572866467210865e-05, + "loss": 0.157, + "step": 18251 + }, + { + "epoch": 49.73297002724796, + "grad_norm": 6.430014610290527, + "learning_rate": 1.0571985419603343e-05, + "loss": 0.259, + "step": 18252 + }, + { + "epoch": 49.735694822888284, + "grad_norm": 6.348018646240234, + "learning_rate": 1.0571104367541218e-05, + "loss": 0.2008, + "step": 18253 + }, + { + "epoch": 49.73841961852861, + "grad_norm": 4.19774866104126, + "learning_rate": 1.0570223311031349e-05, + "loss": 0.1261, + "step": 18254 + }, + { + "epoch": 49.741144414168936, + "grad_norm": 4.381269931793213, + "learning_rate": 1.0569342250080601e-05, + "loss": 0.0822, + "step": 18255 + }, + { + "epoch": 49.74386920980926, + "grad_norm": 5.628778457641602, + "learning_rate": 1.0568461184695833e-05, + "loss": 0.2369, + "step": 18256 + }, + { + "epoch": 49.746594005449595, + "grad_norm": 5.383265495300293, + "learning_rate": 1.056758011488391e-05, + "loss": 0.2278, + "step": 18257 + }, + { + "epoch": 49.74931880108992, + "grad_norm": 4.400010108947754, + "learning_rate": 1.0566699040651687e-05, + "loss": 0.1128, + "step": 18258 + }, + { + "epoch": 49.752043596730246, + "grad_norm": 6.867877006530762, + "learning_rate": 1.0565817962006033e-05, + "loss": 0.2063, + "step": 18259 + }, + { + "epoch": 49.75476839237057, + "grad_norm": 3.7297110557556152, + "learning_rate": 1.0564936878953804e-05, + "loss": 0.1872, + "step": 18260 + }, + { + "epoch": 49.7574931880109, + "grad_norm": 6.1977858543396, + "learning_rate": 1.0564055791501867e-05, + "loss": 0.2369, + "step": 18261 + }, + { + "epoch": 49.76021798365122, + "grad_norm": 5.163815975189209, + "learning_rate": 1.056317469965708e-05, + "loss": 0.1626, + "step": 18262 + }, + { + "epoch": 49.762942779291556, + "grad_norm": 4.913216590881348, + "learning_rate": 1.0562293603426309e-05, + "loss": 0.1421, + "step": 18263 + }, + { + "epoch": 49.76566757493188, + "grad_norm": 4.714107513427734, + "learning_rate": 1.0561412502816411e-05, + "loss": 0.1879, + "step": 18264 + }, + { + "epoch": 49.76839237057221, + "grad_norm": 5.038058757781982, + "learning_rate": 1.0560531397834253e-05, + "loss": 0.2115, + "step": 18265 + }, + { + "epoch": 49.771117166212534, + "grad_norm": 13.269697189331055, + "learning_rate": 1.055965028848669e-05, + "loss": 0.1234, + "step": 18266 + }, + { + "epoch": 49.77384196185286, + "grad_norm": 4.1821699142456055, + "learning_rate": 1.0558769174780595e-05, + "loss": 0.0749, + "step": 18267 + }, + { + "epoch": 49.776566757493185, + "grad_norm": 6.874485969543457, + "learning_rate": 1.055788805672282e-05, + "loss": 0.2055, + "step": 18268 + }, + { + "epoch": 49.77929155313352, + "grad_norm": 4.795389175415039, + "learning_rate": 1.0557006934320232e-05, + "loss": 0.1236, + "step": 18269 + }, + { + "epoch": 49.782016348773844, + "grad_norm": 13.366247177124023, + "learning_rate": 1.0556125807579691e-05, + "loss": 0.2072, + "step": 18270 + }, + { + "epoch": 49.78474114441417, + "grad_norm": 3.8460803031921387, + "learning_rate": 1.0555244676508058e-05, + "loss": 0.0697, + "step": 18271 + }, + { + "epoch": 49.787465940054496, + "grad_norm": 4.661848545074463, + "learning_rate": 1.05543635411122e-05, + "loss": 0.1132, + "step": 18272 + }, + { + "epoch": 49.79019073569482, + "grad_norm": 11.662322998046875, + "learning_rate": 1.0553482401398979e-05, + "loss": 0.1519, + "step": 18273 + }, + { + "epoch": 49.79291553133515, + "grad_norm": 7.327706336975098, + "learning_rate": 1.055260125737525e-05, + "loss": 0.0829, + "step": 18274 + }, + { + "epoch": 49.79564032697548, + "grad_norm": 6.02321195602417, + "learning_rate": 1.0551720109047883e-05, + "loss": 0.1618, + "step": 18275 + }, + { + "epoch": 49.798365122615806, + "grad_norm": 5.443646430969238, + "learning_rate": 1.0550838956423737e-05, + "loss": 0.0948, + "step": 18276 + }, + { + "epoch": 49.80108991825613, + "grad_norm": 4.680039405822754, + "learning_rate": 1.0549957799509674e-05, + "loss": 0.2436, + "step": 18277 + }, + { + "epoch": 49.80381471389646, + "grad_norm": 4.676031589508057, + "learning_rate": 1.0549076638312558e-05, + "loss": 0.28, + "step": 18278 + }, + { + "epoch": 49.80653950953678, + "grad_norm": 4.422796249389648, + "learning_rate": 1.0548195472839251e-05, + "loss": 0.2487, + "step": 18279 + }, + { + "epoch": 49.80926430517711, + "grad_norm": 6.870621204376221, + "learning_rate": 1.0547314303096617e-05, + "loss": 0.116, + "step": 18280 + }, + { + "epoch": 49.81198910081744, + "grad_norm": 5.2428154945373535, + "learning_rate": 1.0546433129091514e-05, + "loss": 0.1182, + "step": 18281 + }, + { + "epoch": 49.81471389645777, + "grad_norm": 4.760616779327393, + "learning_rate": 1.0545551950830808e-05, + "loss": 0.1925, + "step": 18282 + }, + { + "epoch": 49.817438692098094, + "grad_norm": 5.274930000305176, + "learning_rate": 1.054467076832136e-05, + "loss": 0.1249, + "step": 18283 + }, + { + "epoch": 49.82016348773842, + "grad_norm": 4.147454738616943, + "learning_rate": 1.0543789581570037e-05, + "loss": 0.097, + "step": 18284 + }, + { + "epoch": 49.822888283378745, + "grad_norm": 4.724230766296387, + "learning_rate": 1.0542908390583694e-05, + "loss": 0.1272, + "step": 18285 + }, + { + "epoch": 49.82561307901907, + "grad_norm": 3.691598653793335, + "learning_rate": 1.0542027195369202e-05, + "loss": 0.1959, + "step": 18286 + }, + { + "epoch": 49.828337874659404, + "grad_norm": 4.603728771209717, + "learning_rate": 1.0541145995933416e-05, + "loss": 0.124, + "step": 18287 + }, + { + "epoch": 49.83106267029973, + "grad_norm": 5.445811748504639, + "learning_rate": 1.0540264792283205e-05, + "loss": 0.0962, + "step": 18288 + }, + { + "epoch": 49.833787465940055, + "grad_norm": 3.8996129035949707, + "learning_rate": 1.0539383584425428e-05, + "loss": 0.1087, + "step": 18289 + }, + { + "epoch": 49.83651226158038, + "grad_norm": 5.699887752532959, + "learning_rate": 1.053850237236695e-05, + "loss": 0.1406, + "step": 18290 + }, + { + "epoch": 49.83923705722071, + "grad_norm": 6.749419212341309, + "learning_rate": 1.0537621156114633e-05, + "loss": 0.2279, + "step": 18291 + }, + { + "epoch": 49.84196185286103, + "grad_norm": 12.689628601074219, + "learning_rate": 1.053673993567534e-05, + "loss": 0.15, + "step": 18292 + }, + { + "epoch": 49.844686648501366, + "grad_norm": 5.9806742668151855, + "learning_rate": 1.0535858711055931e-05, + "loss": 0.2104, + "step": 18293 + }, + { + "epoch": 49.84741144414169, + "grad_norm": 4.2488017082214355, + "learning_rate": 1.0534977482263274e-05, + "loss": 0.1174, + "step": 18294 + }, + { + "epoch": 49.85013623978202, + "grad_norm": 4.2461771965026855, + "learning_rate": 1.0534096249304226e-05, + "loss": 0.1724, + "step": 18295 + }, + { + "epoch": 49.85286103542234, + "grad_norm": 4.024528503417969, + "learning_rate": 1.0533215012185659e-05, + "loss": 0.2053, + "step": 18296 + }, + { + "epoch": 49.85558583106267, + "grad_norm": 4.433617115020752, + "learning_rate": 1.0532333770914427e-05, + "loss": 0.1113, + "step": 18297 + }, + { + "epoch": 49.858310626702995, + "grad_norm": 3.990469455718994, + "learning_rate": 1.0531452525497398e-05, + "loss": 0.1112, + "step": 18298 + }, + { + "epoch": 49.86103542234333, + "grad_norm": 5.256641387939453, + "learning_rate": 1.0530571275941433e-05, + "loss": 0.1691, + "step": 18299 + }, + { + "epoch": 49.86376021798365, + "grad_norm": 4.690814971923828, + "learning_rate": 1.0529690022253398e-05, + "loss": 0.1937, + "step": 18300 + }, + { + "epoch": 49.86648501362398, + "grad_norm": 4.61068868637085, + "learning_rate": 1.0528808764440152e-05, + "loss": 0.1708, + "step": 18301 + }, + { + "epoch": 49.869209809264305, + "grad_norm": 5.555260181427002, + "learning_rate": 1.052792750250856e-05, + "loss": 0.2876, + "step": 18302 + }, + { + "epoch": 49.87193460490463, + "grad_norm": 23.923898696899414, + "learning_rate": 1.0527046236465485e-05, + "loss": 0.2312, + "step": 18303 + }, + { + "epoch": 49.87465940054496, + "grad_norm": 4.177738189697266, + "learning_rate": 1.0526164966317796e-05, + "loss": 0.219, + "step": 18304 + }, + { + "epoch": 49.87738419618529, + "grad_norm": 5.994362831115723, + "learning_rate": 1.0525283692072346e-05, + "loss": 0.1716, + "step": 18305 + }, + { + "epoch": 49.880108991825615, + "grad_norm": 5.897968769073486, + "learning_rate": 1.0524402413736005e-05, + "loss": 0.1874, + "step": 18306 + }, + { + "epoch": 49.88283378746594, + "grad_norm": 9.682744026184082, + "learning_rate": 1.0523521131315636e-05, + "loss": 0.1946, + "step": 18307 + }, + { + "epoch": 49.88555858310627, + "grad_norm": 4.334563732147217, + "learning_rate": 1.0522639844818102e-05, + "loss": 0.1312, + "step": 18308 + }, + { + "epoch": 49.88828337874659, + "grad_norm": 4.382263660430908, + "learning_rate": 1.0521758554250263e-05, + "loss": 0.1112, + "step": 18309 + }, + { + "epoch": 49.89100817438692, + "grad_norm": 3.9178307056427, + "learning_rate": 1.0520877259618986e-05, + "loss": 0.0924, + "step": 18310 + }, + { + "epoch": 49.89373297002725, + "grad_norm": 4.639375686645508, + "learning_rate": 1.0519995960931136e-05, + "loss": 0.1725, + "step": 18311 + }, + { + "epoch": 49.89645776566758, + "grad_norm": 4.992181777954102, + "learning_rate": 1.051911465819357e-05, + "loss": 0.1519, + "step": 18312 + }, + { + "epoch": 49.8991825613079, + "grad_norm": 6.2513275146484375, + "learning_rate": 1.0518233351413155e-05, + "loss": 0.0841, + "step": 18313 + }, + { + "epoch": 49.90190735694823, + "grad_norm": 4.794405937194824, + "learning_rate": 1.0517352040596762e-05, + "loss": 0.3198, + "step": 18314 + }, + { + "epoch": 49.904632152588555, + "grad_norm": 4.1200032234191895, + "learning_rate": 1.0516470725751242e-05, + "loss": 0.1155, + "step": 18315 + }, + { + "epoch": 49.90735694822888, + "grad_norm": 5.223155975341797, + "learning_rate": 1.0515589406883469e-05, + "loss": 0.1609, + "step": 18316 + }, + { + "epoch": 49.91008174386921, + "grad_norm": 4.886833667755127, + "learning_rate": 1.05147080840003e-05, + "loss": 0.3186, + "step": 18317 + }, + { + "epoch": 49.91280653950954, + "grad_norm": 5.794650077819824, + "learning_rate": 1.0513826757108603e-05, + "loss": 0.0866, + "step": 18318 + }, + { + "epoch": 49.915531335149865, + "grad_norm": 4.465744972229004, + "learning_rate": 1.0512945426215234e-05, + "loss": 0.1001, + "step": 18319 + }, + { + "epoch": 49.91825613079019, + "grad_norm": 9.17824935913086, + "learning_rate": 1.0512064091327067e-05, + "loss": 0.0945, + "step": 18320 + }, + { + "epoch": 49.920980926430516, + "grad_norm": 6.776849746704102, + "learning_rate": 1.0511182752450959e-05, + "loss": 0.1981, + "step": 18321 + }, + { + "epoch": 49.92370572207084, + "grad_norm": 5.3896098136901855, + "learning_rate": 1.0510301409593779e-05, + "loss": 0.1399, + "step": 18322 + }, + { + "epoch": 49.926430517711175, + "grad_norm": 3.8560609817504883, + "learning_rate": 1.0509420062762388e-05, + "loss": 0.1679, + "step": 18323 + }, + { + "epoch": 49.9291553133515, + "grad_norm": 5.350097179412842, + "learning_rate": 1.0508538711963649e-05, + "loss": 0.2121, + "step": 18324 + }, + { + "epoch": 49.93188010899183, + "grad_norm": 4.888600826263428, + "learning_rate": 1.0507657357204426e-05, + "loss": 0.1259, + "step": 18325 + }, + { + "epoch": 49.93460490463215, + "grad_norm": 3.7617251873016357, + "learning_rate": 1.0506775998491587e-05, + "loss": 0.1737, + "step": 18326 + }, + { + "epoch": 49.93732970027248, + "grad_norm": 5.460902214050293, + "learning_rate": 1.050589463583199e-05, + "loss": 0.1618, + "step": 18327 + }, + { + "epoch": 49.940054495912804, + "grad_norm": 7.914155960083008, + "learning_rate": 1.0505013269232503e-05, + "loss": 0.2932, + "step": 18328 + }, + { + "epoch": 49.94277929155314, + "grad_norm": 6.479796886444092, + "learning_rate": 1.0504131898699985e-05, + "loss": 0.119, + "step": 18329 + }, + { + "epoch": 49.94550408719346, + "grad_norm": 4.8925628662109375, + "learning_rate": 1.0503250524241308e-05, + "loss": 0.2076, + "step": 18330 + }, + { + "epoch": 49.94822888283379, + "grad_norm": 4.879620552062988, + "learning_rate": 1.0502369145863332e-05, + "loss": 0.1089, + "step": 18331 + }, + { + "epoch": 49.950953678474114, + "grad_norm": 5.510569095611572, + "learning_rate": 1.0501487763572921e-05, + "loss": 0.1811, + "step": 18332 + }, + { + "epoch": 49.95367847411444, + "grad_norm": 5.198431968688965, + "learning_rate": 1.0500606377376938e-05, + "loss": 0.2939, + "step": 18333 + }, + { + "epoch": 49.956403269754766, + "grad_norm": 5.519257545471191, + "learning_rate": 1.0499724987282251e-05, + "loss": 0.1253, + "step": 18334 + }, + { + "epoch": 49.95912806539509, + "grad_norm": 4.976462364196777, + "learning_rate": 1.049884359329572e-05, + "loss": 0.2019, + "step": 18335 + }, + { + "epoch": 49.961852861035425, + "grad_norm": 4.999112606048584, + "learning_rate": 1.0497962195424214e-05, + "loss": 0.1197, + "step": 18336 + }, + { + "epoch": 49.96457765667575, + "grad_norm": 4.481200218200684, + "learning_rate": 1.049708079367459e-05, + "loss": 0.082, + "step": 18337 + }, + { + "epoch": 49.967302452316076, + "grad_norm": 5.327234268188477, + "learning_rate": 1.0496199388053718e-05, + "loss": 0.1496, + "step": 18338 + }, + { + "epoch": 49.9700272479564, + "grad_norm": 5.957428455352783, + "learning_rate": 1.0495317978568462e-05, + "loss": 0.1545, + "step": 18339 + }, + { + "epoch": 49.97275204359673, + "grad_norm": 4.346925735473633, + "learning_rate": 1.0494436565225688e-05, + "loss": 0.1513, + "step": 18340 + }, + { + "epoch": 49.97547683923706, + "grad_norm": 4.060068607330322, + "learning_rate": 1.0493555148032253e-05, + "loss": 0.1498, + "step": 18341 + }, + { + "epoch": 49.97820163487739, + "grad_norm": 6.395273685455322, + "learning_rate": 1.0492673726995031e-05, + "loss": 0.2749, + "step": 18342 + }, + { + "epoch": 49.98092643051771, + "grad_norm": 7.144204139709473, + "learning_rate": 1.0491792302120879e-05, + "loss": 0.1537, + "step": 18343 + }, + { + "epoch": 49.98365122615804, + "grad_norm": 4.112253665924072, + "learning_rate": 1.0490910873416667e-05, + "loss": 0.1762, + "step": 18344 + }, + { + "epoch": 49.986376021798364, + "grad_norm": 5.929678916931152, + "learning_rate": 1.0490029440889254e-05, + "loss": 0.1125, + "step": 18345 + }, + { + "epoch": 49.98910081743869, + "grad_norm": 5.074626445770264, + "learning_rate": 1.0489148004545506e-05, + "loss": 0.1712, + "step": 18346 + }, + { + "epoch": 49.991825613079016, + "grad_norm": 5.8632612228393555, + "learning_rate": 1.0488266564392293e-05, + "loss": 0.1416, + "step": 18347 + }, + { + "epoch": 49.99455040871935, + "grad_norm": 4.237979888916016, + "learning_rate": 1.0487385120436475e-05, + "loss": 0.177, + "step": 18348 + }, + { + "epoch": 49.997275204359674, + "grad_norm": 5.096149444580078, + "learning_rate": 1.0486503672684915e-05, + "loss": 0.1208, + "step": 18349 + }, + { + "epoch": 50.0, + "grad_norm": 5.351661205291748, + "learning_rate": 1.0485622221144485e-05, + "loss": 0.175, + "step": 18350 + }, + { + "epoch": 50.002724795640326, + "grad_norm": 4.498886585235596, + "learning_rate": 1.048474076582204e-05, + "loss": 0.1241, + "step": 18351 + }, + { + "epoch": 50.00544959128065, + "grad_norm": 4.655673503875732, + "learning_rate": 1.0483859306724451e-05, + "loss": 0.2254, + "step": 18352 + }, + { + "epoch": 50.00817438692098, + "grad_norm": 4.227473735809326, + "learning_rate": 1.0482977843858581e-05, + "loss": 0.2683, + "step": 18353 + }, + { + "epoch": 50.01089918256131, + "grad_norm": 9.067605018615723, + "learning_rate": 1.0482096377231297e-05, + "loss": 0.1116, + "step": 18354 + }, + { + "epoch": 50.013623978201636, + "grad_norm": 5.1989874839782715, + "learning_rate": 1.0481214906849459e-05, + "loss": 0.1028, + "step": 18355 + }, + { + "epoch": 50.01634877384196, + "grad_norm": 3.9210336208343506, + "learning_rate": 1.0480333432719936e-05, + "loss": 0.1528, + "step": 18356 + }, + { + "epoch": 50.01907356948229, + "grad_norm": 4.288864612579346, + "learning_rate": 1.0479451954849594e-05, + "loss": 0.2224, + "step": 18357 + }, + { + "epoch": 50.02179836512261, + "grad_norm": 3.425851345062256, + "learning_rate": 1.0478570473245293e-05, + "loss": 0.0959, + "step": 18358 + }, + { + "epoch": 50.02452316076294, + "grad_norm": 5.149254322052002, + "learning_rate": 1.0477688987913898e-05, + "loss": 0.0959, + "step": 18359 + }, + { + "epoch": 50.02724795640327, + "grad_norm": 4.205198287963867, + "learning_rate": 1.0476807498862282e-05, + "loss": 0.0985, + "step": 18360 + }, + { + "epoch": 50.0299727520436, + "grad_norm": 4.834911823272705, + "learning_rate": 1.04759260060973e-05, + "loss": 0.192, + "step": 18361 + }, + { + "epoch": 50.032697547683924, + "grad_norm": 3.771606683731079, + "learning_rate": 1.0475044509625827e-05, + "loss": 0.0944, + "step": 18362 + }, + { + "epoch": 50.03542234332425, + "grad_norm": 5.029878616333008, + "learning_rate": 1.0474163009454718e-05, + "loss": 0.0996, + "step": 18363 + }, + { + "epoch": 50.038147138964575, + "grad_norm": 3.8827707767486572, + "learning_rate": 1.0473281505590844e-05, + "loss": 0.0865, + "step": 18364 + }, + { + "epoch": 50.0408719346049, + "grad_norm": 4.6911773681640625, + "learning_rate": 1.047239999804107e-05, + "loss": 0.1315, + "step": 18365 + }, + { + "epoch": 50.043596730245234, + "grad_norm": 9.542468070983887, + "learning_rate": 1.0471518486812258e-05, + "loss": 0.2691, + "step": 18366 + }, + { + "epoch": 50.04632152588556, + "grad_norm": 5.197531700134277, + "learning_rate": 1.0470636971911277e-05, + "loss": 0.2597, + "step": 18367 + }, + { + "epoch": 50.049046321525886, + "grad_norm": 4.857045650482178, + "learning_rate": 1.0469755453344989e-05, + "loss": 0.1893, + "step": 18368 + }, + { + "epoch": 50.05177111716621, + "grad_norm": 4.129888534545898, + "learning_rate": 1.0468873931120263e-05, + "loss": 0.1494, + "step": 18369 + }, + { + "epoch": 50.05449591280654, + "grad_norm": 5.007657527923584, + "learning_rate": 1.0467992405243959e-05, + "loss": 0.2078, + "step": 18370 + }, + { + "epoch": 50.05722070844686, + "grad_norm": 4.791961193084717, + "learning_rate": 1.0467110875722945e-05, + "loss": 0.1493, + "step": 18371 + }, + { + "epoch": 50.059945504087196, + "grad_norm": 4.589936256408691, + "learning_rate": 1.0466229342564087e-05, + "loss": 0.1173, + "step": 18372 + }, + { + "epoch": 50.06267029972752, + "grad_norm": 4.196911811828613, + "learning_rate": 1.0465347805774253e-05, + "loss": 0.1584, + "step": 18373 + }, + { + "epoch": 50.06539509536785, + "grad_norm": 4.869670867919922, + "learning_rate": 1.0464466265360303e-05, + "loss": 0.2005, + "step": 18374 + }, + { + "epoch": 50.06811989100817, + "grad_norm": 3.5600781440734863, + "learning_rate": 1.0463584721329105e-05, + "loss": 0.2594, + "step": 18375 + }, + { + "epoch": 50.0708446866485, + "grad_norm": 4.4433979988098145, + "learning_rate": 1.0462703173687523e-05, + "loss": 0.229, + "step": 18376 + }, + { + "epoch": 50.073569482288825, + "grad_norm": 4.804118633270264, + "learning_rate": 1.0461821622442425e-05, + "loss": 0.2624, + "step": 18377 + }, + { + "epoch": 50.07629427792916, + "grad_norm": 4.39185094833374, + "learning_rate": 1.0460940067600676e-05, + "loss": 0.0922, + "step": 18378 + }, + { + "epoch": 50.079019073569484, + "grad_norm": 6.641062259674072, + "learning_rate": 1.046005850916914e-05, + "loss": 0.09, + "step": 18379 + }, + { + "epoch": 50.08174386920981, + "grad_norm": 4.962137699127197, + "learning_rate": 1.0459176947154682e-05, + "loss": 0.1016, + "step": 18380 + }, + { + "epoch": 50.084468664850135, + "grad_norm": 5.6916279792785645, + "learning_rate": 1.0458295381564168e-05, + "loss": 0.1782, + "step": 18381 + }, + { + "epoch": 50.08719346049046, + "grad_norm": 3.9860925674438477, + "learning_rate": 1.0457413812404461e-05, + "loss": 0.2467, + "step": 18382 + }, + { + "epoch": 50.08991825613079, + "grad_norm": 9.179952621459961, + "learning_rate": 1.0456532239682438e-05, + "loss": 0.1843, + "step": 18383 + }, + { + "epoch": 50.09264305177112, + "grad_norm": 4.272060394287109, + "learning_rate": 1.0455650663404953e-05, + "loss": 0.1184, + "step": 18384 + }, + { + "epoch": 50.095367847411445, + "grad_norm": 5.147090911865234, + "learning_rate": 1.0454769083578876e-05, + "loss": 0.1671, + "step": 18385 + }, + { + "epoch": 50.09809264305177, + "grad_norm": 4.8225836753845215, + "learning_rate": 1.0453887500211068e-05, + "loss": 0.0667, + "step": 18386 + }, + { + "epoch": 50.1008174386921, + "grad_norm": 4.201931476593018, + "learning_rate": 1.0453005913308405e-05, + "loss": 0.099, + "step": 18387 + }, + { + "epoch": 50.10354223433242, + "grad_norm": 5.505147457122803, + "learning_rate": 1.0452124322877741e-05, + "loss": 0.0965, + "step": 18388 + }, + { + "epoch": 50.10626702997275, + "grad_norm": 6.157524108886719, + "learning_rate": 1.045124272892595e-05, + "loss": 0.2204, + "step": 18389 + }, + { + "epoch": 50.10899182561308, + "grad_norm": 4.28139066696167, + "learning_rate": 1.0450361131459894e-05, + "loss": 0.2364, + "step": 18390 + }, + { + "epoch": 50.11171662125341, + "grad_norm": 5.012563228607178, + "learning_rate": 1.0449479530486441e-05, + "loss": 0.1196, + "step": 18391 + }, + { + "epoch": 50.11444141689373, + "grad_norm": 4.472416877746582, + "learning_rate": 1.0448597926012456e-05, + "loss": 0.2205, + "step": 18392 + }, + { + "epoch": 50.11716621253406, + "grad_norm": 5.370371341705322, + "learning_rate": 1.0447716318044807e-05, + "loss": 0.1321, + "step": 18393 + }, + { + "epoch": 50.119891008174385, + "grad_norm": 6.545853137969971, + "learning_rate": 1.0446834706590354e-05, + "loss": 0.0559, + "step": 18394 + }, + { + "epoch": 50.12261580381471, + "grad_norm": 5.600507736206055, + "learning_rate": 1.044595309165597e-05, + "loss": 0.1398, + "step": 18395 + }, + { + "epoch": 50.12534059945504, + "grad_norm": 6.128230094909668, + "learning_rate": 1.0445071473248514e-05, + "loss": 0.145, + "step": 18396 + }, + { + "epoch": 50.12806539509537, + "grad_norm": 4.690159797668457, + "learning_rate": 1.0444189851374857e-05, + "loss": 0.2394, + "step": 18397 + }, + { + "epoch": 50.130790190735695, + "grad_norm": 4.9555487632751465, + "learning_rate": 1.0443308226041862e-05, + "loss": 0.1515, + "step": 18398 + }, + { + "epoch": 50.13351498637602, + "grad_norm": 4.733140468597412, + "learning_rate": 1.04424265972564e-05, + "loss": 0.1177, + "step": 18399 + }, + { + "epoch": 50.13623978201635, + "grad_norm": 4.880582332611084, + "learning_rate": 1.0441544965025332e-05, + "loss": 0.1291, + "step": 18400 + }, + { + "epoch": 50.13896457765667, + "grad_norm": 3.9399352073669434, + "learning_rate": 1.044066332935553e-05, + "loss": 0.0717, + "step": 18401 + }, + { + "epoch": 50.141689373297005, + "grad_norm": 7.9581708908081055, + "learning_rate": 1.0439781690253851e-05, + "loss": 0.1258, + "step": 18402 + }, + { + "epoch": 50.14441416893733, + "grad_norm": 5.133094787597656, + "learning_rate": 1.043890004772717e-05, + "loss": 0.0825, + "step": 18403 + }, + { + "epoch": 50.14713896457766, + "grad_norm": 3.9729957580566406, + "learning_rate": 1.0438018401782347e-05, + "loss": 0.1867, + "step": 18404 + }, + { + "epoch": 50.14986376021798, + "grad_norm": 3.989093542098999, + "learning_rate": 1.0437136752426254e-05, + "loss": 0.2117, + "step": 18405 + }, + { + "epoch": 50.15258855585831, + "grad_norm": 4.257974624633789, + "learning_rate": 1.0436255099665746e-05, + "loss": 0.2167, + "step": 18406 + }, + { + "epoch": 50.155313351498634, + "grad_norm": 4.502657413482666, + "learning_rate": 1.0435373443507706e-05, + "loss": 0.1782, + "step": 18407 + }, + { + "epoch": 50.15803814713897, + "grad_norm": 5.227933406829834, + "learning_rate": 1.0434491783958986e-05, + "loss": 0.1995, + "step": 18408 + }, + { + "epoch": 50.16076294277929, + "grad_norm": 9.845762252807617, + "learning_rate": 1.0433610121026463e-05, + "loss": 0.1165, + "step": 18409 + }, + { + "epoch": 50.16348773841962, + "grad_norm": 4.153945446014404, + "learning_rate": 1.0432728454716996e-05, + "loss": 0.1055, + "step": 18410 + }, + { + "epoch": 50.166212534059945, + "grad_norm": 5.337934970855713, + "learning_rate": 1.0431846785037454e-05, + "loss": 0.2107, + "step": 18411 + }, + { + "epoch": 50.16893732970027, + "grad_norm": 4.0061750411987305, + "learning_rate": 1.0430965111994701e-05, + "loss": 0.091, + "step": 18412 + }, + { + "epoch": 50.171662125340596, + "grad_norm": 67.78372192382812, + "learning_rate": 1.0430083435595611e-05, + "loss": 0.1771, + "step": 18413 + }, + { + "epoch": 50.17438692098093, + "grad_norm": 4.743940830230713, + "learning_rate": 1.0429201755847041e-05, + "loss": 0.0999, + "step": 18414 + }, + { + "epoch": 50.177111716621255, + "grad_norm": 4.93541145324707, + "learning_rate": 1.042832007275586e-05, + "loss": 0.1944, + "step": 18415 + }, + { + "epoch": 50.17983651226158, + "grad_norm": 5.489130020141602, + "learning_rate": 1.0427438386328936e-05, + "loss": 0.1787, + "step": 18416 + }, + { + "epoch": 50.182561307901906, + "grad_norm": 4.149992942810059, + "learning_rate": 1.042655669657314e-05, + "loss": 0.1445, + "step": 18417 + }, + { + "epoch": 50.18528610354223, + "grad_norm": 5.850244045257568, + "learning_rate": 1.0425675003495333e-05, + "loss": 0.0969, + "step": 18418 + }, + { + "epoch": 50.18801089918256, + "grad_norm": 5.269390106201172, + "learning_rate": 1.0424793307102381e-05, + "loss": 0.1114, + "step": 18419 + }, + { + "epoch": 50.19073569482289, + "grad_norm": 7.50940465927124, + "learning_rate": 1.0423911607401152e-05, + "loss": 0.2189, + "step": 18420 + }, + { + "epoch": 50.19346049046322, + "grad_norm": 5.363705635070801, + "learning_rate": 1.0423029904398515e-05, + "loss": 0.1729, + "step": 18421 + }, + { + "epoch": 50.19618528610354, + "grad_norm": 5.508678436279297, + "learning_rate": 1.0422148198101334e-05, + "loss": 0.1864, + "step": 18422 + }, + { + "epoch": 50.19891008174387, + "grad_norm": 8.772170066833496, + "learning_rate": 1.0421266488516478e-05, + "loss": 0.3508, + "step": 18423 + }, + { + "epoch": 50.201634877384194, + "grad_norm": 6.351077079772949, + "learning_rate": 1.0420384775650806e-05, + "loss": 0.1513, + "step": 18424 + }, + { + "epoch": 50.20435967302452, + "grad_norm": 8.251812934875488, + "learning_rate": 1.0419503059511197e-05, + "loss": 0.1293, + "step": 18425 + }, + { + "epoch": 50.20708446866485, + "grad_norm": 4.953874111175537, + "learning_rate": 1.0418621340104509e-05, + "loss": 0.1023, + "step": 18426 + }, + { + "epoch": 50.20980926430518, + "grad_norm": 4.948370456695557, + "learning_rate": 1.0417739617437615e-05, + "loss": 0.117, + "step": 18427 + }, + { + "epoch": 50.212534059945504, + "grad_norm": 6.658825397491455, + "learning_rate": 1.0416857891517374e-05, + "loss": 0.1379, + "step": 18428 + }, + { + "epoch": 50.21525885558583, + "grad_norm": 5.551758289337158, + "learning_rate": 1.041597616235066e-05, + "loss": 0.1382, + "step": 18429 + }, + { + "epoch": 50.217983651226156, + "grad_norm": 6.4018683433532715, + "learning_rate": 1.0415094429944334e-05, + "loss": 0.2777, + "step": 18430 + }, + { + "epoch": 50.22070844686648, + "grad_norm": 6.368010997772217, + "learning_rate": 1.041421269430527e-05, + "loss": 0.1227, + "step": 18431 + }, + { + "epoch": 50.223433242506815, + "grad_norm": 7.071566581726074, + "learning_rate": 1.0413330955440328e-05, + "loss": 0.1889, + "step": 18432 + }, + { + "epoch": 50.22615803814714, + "grad_norm": 4.986183166503906, + "learning_rate": 1.0412449213356377e-05, + "loss": 0.1167, + "step": 18433 + }, + { + "epoch": 50.228882833787466, + "grad_norm": 6.3849029541015625, + "learning_rate": 1.0411567468060288e-05, + "loss": 0.2268, + "step": 18434 + }, + { + "epoch": 50.23160762942779, + "grad_norm": 7.67453145980835, + "learning_rate": 1.0410685719558921e-05, + "loss": 0.0973, + "step": 18435 + }, + { + "epoch": 50.23433242506812, + "grad_norm": 11.306721687316895, + "learning_rate": 1.040980396785915e-05, + "loss": 0.1166, + "step": 18436 + }, + { + "epoch": 50.237057220708444, + "grad_norm": 5.158883094787598, + "learning_rate": 1.0408922212967839e-05, + "loss": 0.1354, + "step": 18437 + }, + { + "epoch": 50.23978201634878, + "grad_norm": 5.250732898712158, + "learning_rate": 1.0408040454891852e-05, + "loss": 0.095, + "step": 18438 + }, + { + "epoch": 50.2425068119891, + "grad_norm": 5.08771276473999, + "learning_rate": 1.0407158693638065e-05, + "loss": 0.2626, + "step": 18439 + }, + { + "epoch": 50.24523160762943, + "grad_norm": 6.133188724517822, + "learning_rate": 1.0406276929213332e-05, + "loss": 0.2383, + "step": 18440 + }, + { + "epoch": 50.247956403269754, + "grad_norm": 9.72242259979248, + "learning_rate": 1.040539516162453e-05, + "loss": 0.1978, + "step": 18441 + }, + { + "epoch": 50.25068119891008, + "grad_norm": 7.685892581939697, + "learning_rate": 1.0404513390878526e-05, + "loss": 0.1966, + "step": 18442 + }, + { + "epoch": 50.253405994550405, + "grad_norm": 23.41997718811035, + "learning_rate": 1.0403631616982181e-05, + "loss": 0.2018, + "step": 18443 + }, + { + "epoch": 50.25613079019074, + "grad_norm": 18.337629318237305, + "learning_rate": 1.040274983994237e-05, + "loss": 0.1876, + "step": 18444 + }, + { + "epoch": 50.258855585831064, + "grad_norm": 6.652121543884277, + "learning_rate": 1.0401868059765952e-05, + "loss": 0.1405, + "step": 18445 + }, + { + "epoch": 50.26158038147139, + "grad_norm": 6.964537143707275, + "learning_rate": 1.04009862764598e-05, + "loss": 0.25, + "step": 18446 + }, + { + "epoch": 50.264305177111716, + "grad_norm": 7.468809604644775, + "learning_rate": 1.0400104490030781e-05, + "loss": 0.311, + "step": 18447 + }, + { + "epoch": 50.26702997275204, + "grad_norm": 8.93313217163086, + "learning_rate": 1.039922270048576e-05, + "loss": 0.1644, + "step": 18448 + }, + { + "epoch": 50.26975476839237, + "grad_norm": 5.838148593902588, + "learning_rate": 1.0398340907831603e-05, + "loss": 0.1412, + "step": 18449 + }, + { + "epoch": 50.2724795640327, + "grad_norm": 15.795492172241211, + "learning_rate": 1.0397459112075186e-05, + "loss": 0.1476, + "step": 18450 + }, + { + "epoch": 50.275204359673026, + "grad_norm": 7.08922815322876, + "learning_rate": 1.0396577313223367e-05, + "loss": 0.1622, + "step": 18451 + }, + { + "epoch": 50.27792915531335, + "grad_norm": 6.640037536621094, + "learning_rate": 1.0395695511283015e-05, + "loss": 0.1612, + "step": 18452 + }, + { + "epoch": 50.28065395095368, + "grad_norm": 6.648226261138916, + "learning_rate": 1.0394813706261e-05, + "loss": 0.0946, + "step": 18453 + }, + { + "epoch": 50.283378746594, + "grad_norm": 5.4601593017578125, + "learning_rate": 1.0393931898164191e-05, + "loss": 0.1922, + "step": 18454 + }, + { + "epoch": 50.28610354223433, + "grad_norm": 16.282859802246094, + "learning_rate": 1.039305008699945e-05, + "loss": 0.1048, + "step": 18455 + }, + { + "epoch": 50.28882833787466, + "grad_norm": 7.032933235168457, + "learning_rate": 1.0392168272773651e-05, + "loss": 0.1855, + "step": 18456 + }, + { + "epoch": 50.29155313351499, + "grad_norm": 7.576723575592041, + "learning_rate": 1.0391286455493655e-05, + "loss": 0.2885, + "step": 18457 + }, + { + "epoch": 50.294277929155314, + "grad_norm": 6.466182708740234, + "learning_rate": 1.0390404635166331e-05, + "loss": 0.1541, + "step": 18458 + }, + { + "epoch": 50.29700272479564, + "grad_norm": 5.537355422973633, + "learning_rate": 1.0389522811798551e-05, + "loss": 0.1611, + "step": 18459 + }, + { + "epoch": 50.299727520435965, + "grad_norm": 7.105430603027344, + "learning_rate": 1.038864098539718e-05, + "loss": 0.134, + "step": 18460 + }, + { + "epoch": 50.30245231607629, + "grad_norm": 5.081597328186035, + "learning_rate": 1.0387759155969085e-05, + "loss": 0.2542, + "step": 18461 + }, + { + "epoch": 50.305177111716624, + "grad_norm": 5.218195915222168, + "learning_rate": 1.0386877323521137e-05, + "loss": 0.1787, + "step": 18462 + }, + { + "epoch": 50.30790190735695, + "grad_norm": 6.520836353302002, + "learning_rate": 1.0385995488060196e-05, + "loss": 0.1189, + "step": 18463 + }, + { + "epoch": 50.310626702997276, + "grad_norm": 5.77503776550293, + "learning_rate": 1.0385113649593137e-05, + "loss": 0.2085, + "step": 18464 + }, + { + "epoch": 50.3133514986376, + "grad_norm": 4.978865146636963, + "learning_rate": 1.0384231808126826e-05, + "loss": 0.3342, + "step": 18465 + }, + { + "epoch": 50.31607629427793, + "grad_norm": 5.38184928894043, + "learning_rate": 1.038334996366813e-05, + "loss": 0.1617, + "step": 18466 + }, + { + "epoch": 50.31880108991825, + "grad_norm": 5.251583099365234, + "learning_rate": 1.0382468116223912e-05, + "loss": 0.243, + "step": 18467 + }, + { + "epoch": 50.321525885558586, + "grad_norm": 5.05536413192749, + "learning_rate": 1.0381586265801049e-05, + "loss": 0.302, + "step": 18468 + }, + { + "epoch": 50.32425068119891, + "grad_norm": 4.584299564361572, + "learning_rate": 1.0380704412406405e-05, + "loss": 0.109, + "step": 18469 + }, + { + "epoch": 50.32697547683924, + "grad_norm": 4.566288471221924, + "learning_rate": 1.0379822556046845e-05, + "loss": 0.2359, + "step": 18470 + }, + { + "epoch": 50.32970027247956, + "grad_norm": 5.151820659637451, + "learning_rate": 1.037894069672924e-05, + "loss": 0.2084, + "step": 18471 + }, + { + "epoch": 50.33242506811989, + "grad_norm": 6.798867225646973, + "learning_rate": 1.037805883446046e-05, + "loss": 0.1276, + "step": 18472 + }, + { + "epoch": 50.335149863760215, + "grad_norm": 4.876811981201172, + "learning_rate": 1.0377176969247366e-05, + "loss": 0.1242, + "step": 18473 + }, + { + "epoch": 50.33787465940055, + "grad_norm": 5.204194068908691, + "learning_rate": 1.0376295101096834e-05, + "loss": 0.1834, + "step": 18474 + }, + { + "epoch": 50.34059945504087, + "grad_norm": 7.647690773010254, + "learning_rate": 1.037541323001572e-05, + "loss": 0.1279, + "step": 18475 + }, + { + "epoch": 50.3433242506812, + "grad_norm": 6.199369430541992, + "learning_rate": 1.0374531356010909e-05, + "loss": 0.1893, + "step": 18476 + }, + { + "epoch": 50.346049046321525, + "grad_norm": 4.2011189460754395, + "learning_rate": 1.0373649479089254e-05, + "loss": 0.1199, + "step": 18477 + }, + { + "epoch": 50.34877384196185, + "grad_norm": 7.538383483886719, + "learning_rate": 1.0372767599257631e-05, + "loss": 0.1437, + "step": 18478 + }, + { + "epoch": 50.35149863760218, + "grad_norm": 4.226534843444824, + "learning_rate": 1.0371885716522904e-05, + "loss": 0.1227, + "step": 18479 + }, + { + "epoch": 50.35422343324251, + "grad_norm": 5.861737251281738, + "learning_rate": 1.0371003830891948e-05, + "loss": 0.1451, + "step": 18480 + }, + { + "epoch": 50.356948228882835, + "grad_norm": 7.6636762619018555, + "learning_rate": 1.0370121942371623e-05, + "loss": 0.1809, + "step": 18481 + }, + { + "epoch": 50.35967302452316, + "grad_norm": 6.123965263366699, + "learning_rate": 1.0369240050968802e-05, + "loss": 0.1501, + "step": 18482 + }, + { + "epoch": 50.36239782016349, + "grad_norm": 5.685791015625, + "learning_rate": 1.0368358156690345e-05, + "loss": 0.1547, + "step": 18483 + }, + { + "epoch": 50.36512261580381, + "grad_norm": 5.073871612548828, + "learning_rate": 1.0367476259543133e-05, + "loss": 0.1027, + "step": 18484 + }, + { + "epoch": 50.36784741144414, + "grad_norm": 7.540602684020996, + "learning_rate": 1.0366594359534024e-05, + "loss": 0.1327, + "step": 18485 + }, + { + "epoch": 50.37057220708447, + "grad_norm": 5.798464298248291, + "learning_rate": 1.0365712456669891e-05, + "loss": 0.145, + "step": 18486 + }, + { + "epoch": 50.3732970027248, + "grad_norm": 4.602923393249512, + "learning_rate": 1.0364830550957603e-05, + "loss": 0.1547, + "step": 18487 + }, + { + "epoch": 50.37602179836512, + "grad_norm": 7.460385322570801, + "learning_rate": 1.0363948642404025e-05, + "loss": 0.1556, + "step": 18488 + }, + { + "epoch": 50.37874659400545, + "grad_norm": 5.966169834136963, + "learning_rate": 1.0363066731016026e-05, + "loss": 0.3613, + "step": 18489 + }, + { + "epoch": 50.381471389645775, + "grad_norm": 6.093320369720459, + "learning_rate": 1.0362184816800478e-05, + "loss": 0.1202, + "step": 18490 + }, + { + "epoch": 50.3841961852861, + "grad_norm": 5.022852420806885, + "learning_rate": 1.0361302899764242e-05, + "loss": 0.199, + "step": 18491 + }, + { + "epoch": 50.38692098092643, + "grad_norm": 6.382558822631836, + "learning_rate": 1.0360420979914192e-05, + "loss": 0.1699, + "step": 18492 + }, + { + "epoch": 50.38964577656676, + "grad_norm": 4.964744567871094, + "learning_rate": 1.0359539057257196e-05, + "loss": 0.283, + "step": 18493 + }, + { + "epoch": 50.392370572207085, + "grad_norm": 7.423490047454834, + "learning_rate": 1.0358657131800123e-05, + "loss": 0.1443, + "step": 18494 + }, + { + "epoch": 50.39509536784741, + "grad_norm": 4.478601932525635, + "learning_rate": 1.0357775203549836e-05, + "loss": 0.2648, + "step": 18495 + }, + { + "epoch": 50.39782016348774, + "grad_norm": 5.2288818359375, + "learning_rate": 1.0356893272513211e-05, + "loss": 0.1324, + "step": 18496 + }, + { + "epoch": 50.40054495912806, + "grad_norm": 3.6058640480041504, + "learning_rate": 1.0356011338697109e-05, + "loss": 0.0967, + "step": 18497 + }, + { + "epoch": 50.403269754768395, + "grad_norm": 6.091643810272217, + "learning_rate": 1.0355129402108407e-05, + "loss": 0.1614, + "step": 18498 + }, + { + "epoch": 50.40599455040872, + "grad_norm": 5.402215003967285, + "learning_rate": 1.0354247462753964e-05, + "loss": 0.1089, + "step": 18499 + }, + { + "epoch": 50.40871934604905, + "grad_norm": 5.242166996002197, + "learning_rate": 1.0353365520640657e-05, + "loss": 0.1504, + "step": 18500 + }, + { + "epoch": 50.41144414168937, + "grad_norm": 6.618157386779785, + "learning_rate": 1.0352483575775345e-05, + "loss": 0.0943, + "step": 18501 + }, + { + "epoch": 50.4141689373297, + "grad_norm": 6.022257328033447, + "learning_rate": 1.0351601628164906e-05, + "loss": 0.1216, + "step": 18502 + }, + { + "epoch": 50.416893732970024, + "grad_norm": 5.579530239105225, + "learning_rate": 1.0350719677816206e-05, + "loss": 0.091, + "step": 18503 + }, + { + "epoch": 50.41961852861036, + "grad_norm": 5.442110061645508, + "learning_rate": 1.0349837724736111e-05, + "loss": 0.2021, + "step": 18504 + }, + { + "epoch": 50.42234332425068, + "grad_norm": 6.488962173461914, + "learning_rate": 1.034895576893149e-05, + "loss": 0.1867, + "step": 18505 + }, + { + "epoch": 50.42506811989101, + "grad_norm": 13.680377960205078, + "learning_rate": 1.0348073810409216e-05, + "loss": 0.2782, + "step": 18506 + }, + { + "epoch": 50.427792915531334, + "grad_norm": 3.9911866188049316, + "learning_rate": 1.0347191849176151e-05, + "loss": 0.0757, + "step": 18507 + }, + { + "epoch": 50.43051771117166, + "grad_norm": 5.4325714111328125, + "learning_rate": 1.034630988523917e-05, + "loss": 0.1251, + "step": 18508 + }, + { + "epoch": 50.433242506811986, + "grad_norm": 4.3573384284973145, + "learning_rate": 1.0345427918605136e-05, + "loss": 0.0782, + "step": 18509 + }, + { + "epoch": 50.43596730245232, + "grad_norm": 3.7895023822784424, + "learning_rate": 1.034454594928092e-05, + "loss": 0.0818, + "step": 18510 + }, + { + "epoch": 50.438692098092645, + "grad_norm": 5.045506954193115, + "learning_rate": 1.0343663977273393e-05, + "loss": 0.0791, + "step": 18511 + }, + { + "epoch": 50.44141689373297, + "grad_norm": 5.500280857086182, + "learning_rate": 1.0342782002589421e-05, + "loss": 0.2222, + "step": 18512 + }, + { + "epoch": 50.444141689373296, + "grad_norm": 4.472443103790283, + "learning_rate": 1.0341900025235876e-05, + "loss": 0.1824, + "step": 18513 + }, + { + "epoch": 50.44686648501362, + "grad_norm": 5.784664630889893, + "learning_rate": 1.0341018045219624e-05, + "loss": 0.1524, + "step": 18514 + }, + { + "epoch": 50.44959128065395, + "grad_norm": 5.076463222503662, + "learning_rate": 1.0340136062547531e-05, + "loss": 0.2144, + "step": 18515 + }, + { + "epoch": 50.45231607629428, + "grad_norm": 5.553852081298828, + "learning_rate": 1.0339254077226474e-05, + "loss": 0.2322, + "step": 18516 + }, + { + "epoch": 50.45504087193461, + "grad_norm": 5.4261698722839355, + "learning_rate": 1.0338372089263316e-05, + "loss": 0.2037, + "step": 18517 + }, + { + "epoch": 50.45776566757493, + "grad_norm": 20.90692901611328, + "learning_rate": 1.0337490098664923e-05, + "loss": 0.1938, + "step": 18518 + }, + { + "epoch": 50.46049046321526, + "grad_norm": 7.544172763824463, + "learning_rate": 1.0336608105438172e-05, + "loss": 0.2766, + "step": 18519 + }, + { + "epoch": 50.463215258855584, + "grad_norm": 4.8083977699279785, + "learning_rate": 1.0335726109589927e-05, + "loss": 0.1645, + "step": 18520 + }, + { + "epoch": 50.46594005449591, + "grad_norm": 5.119318008422852, + "learning_rate": 1.0334844111127058e-05, + "loss": 0.1378, + "step": 18521 + }, + { + "epoch": 50.46866485013624, + "grad_norm": 13.963621139526367, + "learning_rate": 1.0333962110056435e-05, + "loss": 0.1564, + "step": 18522 + }, + { + "epoch": 50.47138964577657, + "grad_norm": 5.176802635192871, + "learning_rate": 1.0333080106384922e-05, + "loss": 0.1489, + "step": 18523 + }, + { + "epoch": 50.474114441416894, + "grad_norm": 6.25013542175293, + "learning_rate": 1.0332198100119398e-05, + "loss": 0.1352, + "step": 18524 + }, + { + "epoch": 50.47683923705722, + "grad_norm": 4.3459320068359375, + "learning_rate": 1.033131609126672e-05, + "loss": 0.1453, + "step": 18525 + }, + { + "epoch": 50.479564032697546, + "grad_norm": 5.281796455383301, + "learning_rate": 1.0330434079833767e-05, + "loss": 0.2247, + "step": 18526 + }, + { + "epoch": 50.48228882833787, + "grad_norm": 5.650903224945068, + "learning_rate": 1.0329552065827402e-05, + "loss": 0.1086, + "step": 18527 + }, + { + "epoch": 50.485013623978205, + "grad_norm": 5.897468090057373, + "learning_rate": 1.0328670049254494e-05, + "loss": 0.1713, + "step": 18528 + }, + { + "epoch": 50.48773841961853, + "grad_norm": 5.536411285400391, + "learning_rate": 1.032778803012192e-05, + "loss": 0.1332, + "step": 18529 + }, + { + "epoch": 50.490463215258856, + "grad_norm": 4.596107482910156, + "learning_rate": 1.0326906008436537e-05, + "loss": 0.1164, + "step": 18530 + }, + { + "epoch": 50.49318801089918, + "grad_norm": 12.462303161621094, + "learning_rate": 1.0326023984205224e-05, + "loss": 0.2555, + "step": 18531 + }, + { + "epoch": 50.49591280653951, + "grad_norm": 4.766989707946777, + "learning_rate": 1.0325141957434848e-05, + "loss": 0.103, + "step": 18532 + }, + { + "epoch": 50.49863760217983, + "grad_norm": 5.915868759155273, + "learning_rate": 1.0324259928132273e-05, + "loss": 0.2964, + "step": 18533 + }, + { + "epoch": 50.50136239782017, + "grad_norm": 4.585247993469238, + "learning_rate": 1.0323377896304377e-05, + "loss": 0.1374, + "step": 18534 + }, + { + "epoch": 50.50408719346049, + "grad_norm": 6.821434497833252, + "learning_rate": 1.032249586195802e-05, + "loss": 0.2504, + "step": 18535 + }, + { + "epoch": 50.50681198910082, + "grad_norm": 4.72754430770874, + "learning_rate": 1.0321613825100076e-05, + "loss": 0.1451, + "step": 18536 + }, + { + "epoch": 50.509536784741144, + "grad_norm": 4.41359806060791, + "learning_rate": 1.0320731785737417e-05, + "loss": 0.2929, + "step": 18537 + }, + { + "epoch": 50.51226158038147, + "grad_norm": 5.099160671234131, + "learning_rate": 1.0319849743876904e-05, + "loss": 0.1279, + "step": 18538 + }, + { + "epoch": 50.514986376021795, + "grad_norm": 4.279083728790283, + "learning_rate": 1.0318967699525418e-05, + "loss": 0.0831, + "step": 18539 + }, + { + "epoch": 50.51771117166213, + "grad_norm": 3.7065377235412598, + "learning_rate": 1.0318085652689817e-05, + "loss": 0.2047, + "step": 18540 + }, + { + "epoch": 50.520435967302454, + "grad_norm": 5.958557605743408, + "learning_rate": 1.0317203603376978e-05, + "loss": 0.1109, + "step": 18541 + }, + { + "epoch": 50.52316076294278, + "grad_norm": 5.407521724700928, + "learning_rate": 1.0316321551593765e-05, + "loss": 0.1997, + "step": 18542 + }, + { + "epoch": 50.525885558583106, + "grad_norm": 4.932890892028809, + "learning_rate": 1.0315439497347053e-05, + "loss": 0.092, + "step": 18543 + }, + { + "epoch": 50.52861035422343, + "grad_norm": 5.787096977233887, + "learning_rate": 1.0314557440643704e-05, + "loss": 0.2025, + "step": 18544 + }, + { + "epoch": 50.53133514986376, + "grad_norm": 5.552667617797852, + "learning_rate": 1.0313675381490596e-05, + "loss": 0.2368, + "step": 18545 + }, + { + "epoch": 50.53405994550409, + "grad_norm": 4.171079158782959, + "learning_rate": 1.031279331989459e-05, + "loss": 0.1034, + "step": 18546 + }, + { + "epoch": 50.536784741144416, + "grad_norm": 4.297781467437744, + "learning_rate": 1.0311911255862563e-05, + "loss": 0.0874, + "step": 18547 + }, + { + "epoch": 50.53950953678474, + "grad_norm": 6.7232441902160645, + "learning_rate": 1.0311029189401381e-05, + "loss": 0.2101, + "step": 18548 + }, + { + "epoch": 50.54223433242507, + "grad_norm": 4.8784589767456055, + "learning_rate": 1.0310147120517914e-05, + "loss": 0.3153, + "step": 18549 + }, + { + "epoch": 50.54495912806539, + "grad_norm": 6.15592622756958, + "learning_rate": 1.030926504921903e-05, + "loss": 0.2002, + "step": 18550 + }, + { + "epoch": 50.54768392370572, + "grad_norm": 15.851859092712402, + "learning_rate": 1.0308382975511601e-05, + "loss": 0.1726, + "step": 18551 + }, + { + "epoch": 50.55040871934605, + "grad_norm": 7.502651691436768, + "learning_rate": 1.0307500899402493e-05, + "loss": 0.364, + "step": 18552 + }, + { + "epoch": 50.55313351498638, + "grad_norm": 4.7100396156311035, + "learning_rate": 1.0306618820898579e-05, + "loss": 0.1076, + "step": 18553 + }, + { + "epoch": 50.555858310626704, + "grad_norm": 6.022217750549316, + "learning_rate": 1.0305736740006726e-05, + "loss": 0.1563, + "step": 18554 + }, + { + "epoch": 50.55858310626703, + "grad_norm": 8.388520240783691, + "learning_rate": 1.0304854656733808e-05, + "loss": 0.1141, + "step": 18555 + }, + { + "epoch": 50.561307901907355, + "grad_norm": 5.04994535446167, + "learning_rate": 1.0303972571086691e-05, + "loss": 0.1208, + "step": 18556 + }, + { + "epoch": 50.56403269754768, + "grad_norm": 6.984668254852295, + "learning_rate": 1.0303090483072247e-05, + "loss": 0.1762, + "step": 18557 + }, + { + "epoch": 50.566757493188014, + "grad_norm": 4.813941955566406, + "learning_rate": 1.0302208392697339e-05, + "loss": 0.0937, + "step": 18558 + }, + { + "epoch": 50.56948228882834, + "grad_norm": 5.3015875816345215, + "learning_rate": 1.0301326299968848e-05, + "loss": 0.1246, + "step": 18559 + }, + { + "epoch": 50.572207084468666, + "grad_norm": 7.070939064025879, + "learning_rate": 1.0300444204893634e-05, + "loss": 0.2059, + "step": 18560 + }, + { + "epoch": 50.57493188010899, + "grad_norm": 4.208089351654053, + "learning_rate": 1.0299562107478569e-05, + "loss": 0.0784, + "step": 18561 + }, + { + "epoch": 50.57765667574932, + "grad_norm": 5.170956134796143, + "learning_rate": 1.0298680007730525e-05, + "loss": 0.2942, + "step": 18562 + }, + { + "epoch": 50.58038147138964, + "grad_norm": 4.3384575843811035, + "learning_rate": 1.029779790565637e-05, + "loss": 0.2176, + "step": 18563 + }, + { + "epoch": 50.583106267029976, + "grad_norm": 4.105449199676514, + "learning_rate": 1.0296915801262977e-05, + "loss": 0.0632, + "step": 18564 + }, + { + "epoch": 50.5858310626703, + "grad_norm": 5.115097999572754, + "learning_rate": 1.0296033694557213e-05, + "loss": 0.1507, + "step": 18565 + }, + { + "epoch": 50.58855585831063, + "grad_norm": 5.516662120819092, + "learning_rate": 1.0295151585545947e-05, + "loss": 0.1112, + "step": 18566 + }, + { + "epoch": 50.59128065395095, + "grad_norm": 4.84885311126709, + "learning_rate": 1.029426947423605e-05, + "loss": 0.1101, + "step": 18567 + }, + { + "epoch": 50.59400544959128, + "grad_norm": 4.946444988250732, + "learning_rate": 1.029338736063439e-05, + "loss": 0.0787, + "step": 18568 + }, + { + "epoch": 50.596730245231605, + "grad_norm": 4.045813083648682, + "learning_rate": 1.0292505244747843e-05, + "loss": 0.1009, + "step": 18569 + }, + { + "epoch": 50.59945504087194, + "grad_norm": 6.580115795135498, + "learning_rate": 1.0291623126583268e-05, + "loss": 0.1581, + "step": 18570 + }, + { + "epoch": 50.60217983651226, + "grad_norm": 4.543004512786865, + "learning_rate": 1.0290741006147548e-05, + "loss": 0.0934, + "step": 18571 + }, + { + "epoch": 50.60490463215259, + "grad_norm": 5.4109368324279785, + "learning_rate": 1.0289858883447544e-05, + "loss": 0.2124, + "step": 18572 + }, + { + "epoch": 50.607629427792915, + "grad_norm": 10.45888900756836, + "learning_rate": 1.0288976758490129e-05, + "loss": 0.1781, + "step": 18573 + }, + { + "epoch": 50.61035422343324, + "grad_norm": 5.362655162811279, + "learning_rate": 1.028809463128217e-05, + "loss": 0.1545, + "step": 18574 + }, + { + "epoch": 50.61307901907357, + "grad_norm": 7.316466331481934, + "learning_rate": 1.0287212501830543e-05, + "loss": 0.2022, + "step": 18575 + }, + { + "epoch": 50.6158038147139, + "grad_norm": 3.898688316345215, + "learning_rate": 1.0286330370142111e-05, + "loss": 0.0998, + "step": 18576 + }, + { + "epoch": 50.618528610354225, + "grad_norm": 3.980304479598999, + "learning_rate": 1.028544823622375e-05, + "loss": 0.1586, + "step": 18577 + }, + { + "epoch": 50.62125340599455, + "grad_norm": 4.505300998687744, + "learning_rate": 1.0284566100082323e-05, + "loss": 0.2628, + "step": 18578 + }, + { + "epoch": 50.62397820163488, + "grad_norm": 5.694802284240723, + "learning_rate": 1.0283683961724708e-05, + "loss": 0.1341, + "step": 18579 + }, + { + "epoch": 50.6267029972752, + "grad_norm": 3.978081464767456, + "learning_rate": 1.0282801821157768e-05, + "loss": 0.154, + "step": 18580 + }, + { + "epoch": 50.62942779291553, + "grad_norm": 4.474717617034912, + "learning_rate": 1.0281919678388382e-05, + "loss": 0.2082, + "step": 18581 + }, + { + "epoch": 50.63215258855586, + "grad_norm": 8.891847610473633, + "learning_rate": 1.028103753342341e-05, + "loss": 0.1251, + "step": 18582 + }, + { + "epoch": 50.63487738419619, + "grad_norm": 7.032039165496826, + "learning_rate": 1.028015538626973e-05, + "loss": 0.2065, + "step": 18583 + }, + { + "epoch": 50.63760217983651, + "grad_norm": 9.012201309204102, + "learning_rate": 1.0279273236934207e-05, + "loss": 0.1921, + "step": 18584 + }, + { + "epoch": 50.64032697547684, + "grad_norm": 4.566155433654785, + "learning_rate": 1.0278391085423715e-05, + "loss": 0.1126, + "step": 18585 + }, + { + "epoch": 50.643051771117165, + "grad_norm": 5.303219795227051, + "learning_rate": 1.0277508931745119e-05, + "loss": 0.2254, + "step": 18586 + }, + { + "epoch": 50.64577656675749, + "grad_norm": 4.0097832679748535, + "learning_rate": 1.0276626775905294e-05, + "loss": 0.2024, + "step": 18587 + }, + { + "epoch": 50.64850136239782, + "grad_norm": 4.792849540710449, + "learning_rate": 1.0275744617911107e-05, + "loss": 0.2083, + "step": 18588 + }, + { + "epoch": 50.65122615803815, + "grad_norm": 4.081125259399414, + "learning_rate": 1.0274862457769432e-05, + "loss": 0.1437, + "step": 18589 + }, + { + "epoch": 50.653950953678475, + "grad_norm": 5.231274127960205, + "learning_rate": 1.0273980295487136e-05, + "loss": 0.1261, + "step": 18590 + }, + { + "epoch": 50.6566757493188, + "grad_norm": 5.771617412567139, + "learning_rate": 1.027309813107109e-05, + "loss": 0.1846, + "step": 18591 + }, + { + "epoch": 50.65940054495913, + "grad_norm": 5.414749622344971, + "learning_rate": 1.0272215964528168e-05, + "loss": 0.1033, + "step": 18592 + }, + { + "epoch": 50.66212534059945, + "grad_norm": 5.166776180267334, + "learning_rate": 1.0271333795865233e-05, + "loss": 0.1527, + "step": 18593 + }, + { + "epoch": 50.664850136239785, + "grad_norm": 5.49155330657959, + "learning_rate": 1.027045162508916e-05, + "loss": 0.1975, + "step": 18594 + }, + { + "epoch": 50.66757493188011, + "grad_norm": 4.783842086791992, + "learning_rate": 1.026956945220682e-05, + "loss": 0.1186, + "step": 18595 + }, + { + "epoch": 50.67029972752044, + "grad_norm": 8.354765892028809, + "learning_rate": 1.026868727722508e-05, + "loss": 0.1232, + "step": 18596 + }, + { + "epoch": 50.67302452316076, + "grad_norm": 5.419940948486328, + "learning_rate": 1.0267805100150811e-05, + "loss": 0.2251, + "step": 18597 + }, + { + "epoch": 50.67574931880109, + "grad_norm": 3.7597742080688477, + "learning_rate": 1.0266922920990885e-05, + "loss": 0.0977, + "step": 18598 + }, + { + "epoch": 50.678474114441414, + "grad_norm": 5.967283248901367, + "learning_rate": 1.0266040739752175e-05, + "loss": 0.2887, + "step": 18599 + }, + { + "epoch": 50.68119891008175, + "grad_norm": 5.507992744445801, + "learning_rate": 1.0265158556441543e-05, + "loss": 0.1203, + "step": 18600 + }, + { + "epoch": 50.68392370572207, + "grad_norm": 7.205935955047607, + "learning_rate": 1.0264276371065871e-05, + "loss": 0.1477, + "step": 18601 + }, + { + "epoch": 50.6866485013624, + "grad_norm": 6.18890380859375, + "learning_rate": 1.026339418363202e-05, + "loss": 0.1459, + "step": 18602 + }, + { + "epoch": 50.689373297002724, + "grad_norm": 7.717989444732666, + "learning_rate": 1.0262511994146862e-05, + "loss": 0.1926, + "step": 18603 + }, + { + "epoch": 50.69209809264305, + "grad_norm": 5.477873802185059, + "learning_rate": 1.026162980261727e-05, + "loss": 0.2208, + "step": 18604 + }, + { + "epoch": 50.694822888283376, + "grad_norm": 5.5274271965026855, + "learning_rate": 1.0260747609050115e-05, + "loss": 0.0972, + "step": 18605 + }, + { + "epoch": 50.69754768392371, + "grad_norm": 5.3758673667907715, + "learning_rate": 1.0259865413452266e-05, + "loss": 0.1111, + "step": 18606 + }, + { + "epoch": 50.700272479564035, + "grad_norm": 5.199080467224121, + "learning_rate": 1.0258983215830591e-05, + "loss": 0.189, + "step": 18607 + }, + { + "epoch": 50.70299727520436, + "grad_norm": 7.787143230438232, + "learning_rate": 1.0258101016191963e-05, + "loss": 0.3012, + "step": 18608 + }, + { + "epoch": 50.705722070844686, + "grad_norm": 4.525249004364014, + "learning_rate": 1.0257218814543257e-05, + "loss": 0.1977, + "step": 18609 + }, + { + "epoch": 50.70844686648501, + "grad_norm": 4.9005913734436035, + "learning_rate": 1.0256336610891336e-05, + "loss": 0.0966, + "step": 18610 + }, + { + "epoch": 50.71117166212534, + "grad_norm": 4.556335926055908, + "learning_rate": 1.0255454405243076e-05, + "loss": 0.1, + "step": 18611 + }, + { + "epoch": 50.71389645776567, + "grad_norm": 7.69804048538208, + "learning_rate": 1.0254572197605341e-05, + "loss": 0.1512, + "step": 18612 + }, + { + "epoch": 50.716621253406, + "grad_norm": 8.30517578125, + "learning_rate": 1.0253689987985008e-05, + "loss": 0.0957, + "step": 18613 + }, + { + "epoch": 50.71934604904632, + "grad_norm": 6.534460067749023, + "learning_rate": 1.0252807776388946e-05, + "loss": 0.1291, + "step": 18614 + }, + { + "epoch": 50.72207084468665, + "grad_norm": 5.42502498626709, + "learning_rate": 1.0251925562824026e-05, + "loss": 0.1425, + "step": 18615 + }, + { + "epoch": 50.724795640326974, + "grad_norm": 4.998002052307129, + "learning_rate": 1.0251043347297118e-05, + "loss": 0.0969, + "step": 18616 + }, + { + "epoch": 50.7275204359673, + "grad_norm": 9.392294883728027, + "learning_rate": 1.0250161129815091e-05, + "loss": 0.1188, + "step": 18617 + }, + { + "epoch": 50.73024523160763, + "grad_norm": 6.346102714538574, + "learning_rate": 1.0249278910384817e-05, + "loss": 0.213, + "step": 18618 + }, + { + "epoch": 50.73297002724796, + "grad_norm": 4.94590950012207, + "learning_rate": 1.0248396689013166e-05, + "loss": 0.1149, + "step": 18619 + }, + { + "epoch": 50.735694822888284, + "grad_norm": 5.284358501434326, + "learning_rate": 1.0247514465707012e-05, + "loss": 0.0735, + "step": 18620 + }, + { + "epoch": 50.73841961852861, + "grad_norm": 11.247912406921387, + "learning_rate": 1.024663224047322e-05, + "loss": 0.1569, + "step": 18621 + }, + { + "epoch": 50.741144414168936, + "grad_norm": 5.320253849029541, + "learning_rate": 1.0245750013318669e-05, + "loss": 0.1623, + "step": 18622 + }, + { + "epoch": 50.74386920980926, + "grad_norm": 6.120570659637451, + "learning_rate": 1.024486778425022e-05, + "loss": 0.2398, + "step": 18623 + }, + { + "epoch": 50.746594005449595, + "grad_norm": 5.824092388153076, + "learning_rate": 1.0243985553274753e-05, + "loss": 0.1296, + "step": 18624 + }, + { + "epoch": 50.74931880108992, + "grad_norm": 6.964953422546387, + "learning_rate": 1.024310332039913e-05, + "loss": 0.1353, + "step": 18625 + }, + { + "epoch": 50.752043596730246, + "grad_norm": 7.604491710662842, + "learning_rate": 1.024222108563023e-05, + "loss": 0.1786, + "step": 18626 + }, + { + "epoch": 50.75476839237057, + "grad_norm": 6.910664081573486, + "learning_rate": 1.0241338848974918e-05, + "loss": 0.2086, + "step": 18627 + }, + { + "epoch": 50.7574931880109, + "grad_norm": 5.907593727111816, + "learning_rate": 1.0240456610440068e-05, + "loss": 0.3074, + "step": 18628 + }, + { + "epoch": 50.76021798365122, + "grad_norm": 5.974182605743408, + "learning_rate": 1.0239574370032548e-05, + "loss": 0.1979, + "step": 18629 + }, + { + "epoch": 50.762942779291556, + "grad_norm": 5.4504289627075195, + "learning_rate": 1.0238692127759232e-05, + "loss": 0.1797, + "step": 18630 + }, + { + "epoch": 50.76566757493188, + "grad_norm": 14.588968276977539, + "learning_rate": 1.0237809883626986e-05, + "loss": 0.149, + "step": 18631 + }, + { + "epoch": 50.76839237057221, + "grad_norm": 15.98033332824707, + "learning_rate": 1.0236927637642688e-05, + "loss": 0.238, + "step": 18632 + }, + { + "epoch": 50.771117166212534, + "grad_norm": 4.419747829437256, + "learning_rate": 1.0236045389813203e-05, + "loss": 0.2188, + "step": 18633 + }, + { + "epoch": 50.77384196185286, + "grad_norm": 6.706301689147949, + "learning_rate": 1.0235163140145408e-05, + "loss": 0.3224, + "step": 18634 + }, + { + "epoch": 50.776566757493185, + "grad_norm": 6.188803672790527, + "learning_rate": 1.0234280888646166e-05, + "loss": 0.0994, + "step": 18635 + }, + { + "epoch": 50.77929155313352, + "grad_norm": 7.780112266540527, + "learning_rate": 1.0233398635322353e-05, + "loss": 0.1531, + "step": 18636 + }, + { + "epoch": 50.782016348773844, + "grad_norm": 5.561610698699951, + "learning_rate": 1.023251638018084e-05, + "loss": 0.1296, + "step": 18637 + }, + { + "epoch": 50.78474114441417, + "grad_norm": 4.837251663208008, + "learning_rate": 1.0231634123228498e-05, + "loss": 0.0933, + "step": 18638 + }, + { + "epoch": 50.787465940054496, + "grad_norm": 3.9444570541381836, + "learning_rate": 1.023075186447219e-05, + "loss": 0.1079, + "step": 18639 + }, + { + "epoch": 50.79019073569482, + "grad_norm": 6.445371627807617, + "learning_rate": 1.0229869603918801e-05, + "loss": 0.2153, + "step": 18640 + }, + { + "epoch": 50.79291553133515, + "grad_norm": 6.34771203994751, + "learning_rate": 1.0228987341575192e-05, + "loss": 0.1475, + "step": 18641 + }, + { + "epoch": 50.79564032697548, + "grad_norm": 8.866080284118652, + "learning_rate": 1.0228105077448239e-05, + "loss": 0.1518, + "step": 18642 + }, + { + "epoch": 50.798365122615806, + "grad_norm": 5.695035457611084, + "learning_rate": 1.0227222811544807e-05, + "loss": 0.1191, + "step": 18643 + }, + { + "epoch": 50.80108991825613, + "grad_norm": 5.830082416534424, + "learning_rate": 1.0226340543871778e-05, + "loss": 0.2573, + "step": 18644 + }, + { + "epoch": 50.80381471389646, + "grad_norm": 4.047380447387695, + "learning_rate": 1.0225458274436011e-05, + "loss": 0.1415, + "step": 18645 + }, + { + "epoch": 50.80653950953678, + "grad_norm": 7.31242561340332, + "learning_rate": 1.0224576003244385e-05, + "loss": 0.2494, + "step": 18646 + }, + { + "epoch": 50.80926430517711, + "grad_norm": 4.944585800170898, + "learning_rate": 1.0223693730303761e-05, + "loss": 0.2513, + "step": 18647 + }, + { + "epoch": 50.81198910081744, + "grad_norm": 4.9357733726501465, + "learning_rate": 1.0222811455621025e-05, + "loss": 0.392, + "step": 18648 + }, + { + "epoch": 50.81471389645777, + "grad_norm": 6.6110029220581055, + "learning_rate": 1.0221929179203038e-05, + "loss": 0.1249, + "step": 18649 + }, + { + "epoch": 50.817438692098094, + "grad_norm": 6.397737979888916, + "learning_rate": 1.0221046901056675e-05, + "loss": 0.1245, + "step": 18650 + }, + { + "epoch": 50.82016348773842, + "grad_norm": 5.183709144592285, + "learning_rate": 1.0220164621188804e-05, + "loss": 0.1974, + "step": 18651 + }, + { + "epoch": 50.822888283378745, + "grad_norm": 5.553018569946289, + "learning_rate": 1.02192823396063e-05, + "loss": 0.2481, + "step": 18652 + }, + { + "epoch": 50.82561307901907, + "grad_norm": 4.401885986328125, + "learning_rate": 1.0218400056316031e-05, + "loss": 0.1696, + "step": 18653 + }, + { + "epoch": 50.828337874659404, + "grad_norm": 3.9832563400268555, + "learning_rate": 1.0217517771324871e-05, + "loss": 0.3923, + "step": 18654 + }, + { + "epoch": 50.83106267029973, + "grad_norm": 4.639732837677002, + "learning_rate": 1.0216635484639688e-05, + "loss": 0.177, + "step": 18655 + }, + { + "epoch": 50.833787465940055, + "grad_norm": 4.781457901000977, + "learning_rate": 1.0215753196267352e-05, + "loss": 0.1861, + "step": 18656 + }, + { + "epoch": 50.83651226158038, + "grad_norm": 4.005565643310547, + "learning_rate": 1.021487090621474e-05, + "loss": 0.0803, + "step": 18657 + }, + { + "epoch": 50.83923705722071, + "grad_norm": 5.11945915222168, + "learning_rate": 1.0213988614488721e-05, + "loss": 0.1536, + "step": 18658 + }, + { + "epoch": 50.84196185286103, + "grad_norm": 4.560452938079834, + "learning_rate": 1.0213106321096164e-05, + "loss": 0.2326, + "step": 18659 + }, + { + "epoch": 50.844686648501366, + "grad_norm": 6.021965026855469, + "learning_rate": 1.0212224026043945e-05, + "loss": 0.1181, + "step": 18660 + }, + { + "epoch": 50.84741144414169, + "grad_norm": 3.8789072036743164, + "learning_rate": 1.0211341729338928e-05, + "loss": 0.1204, + "step": 18661 + }, + { + "epoch": 50.85013623978202, + "grad_norm": 5.305844783782959, + "learning_rate": 1.0210459430987993e-05, + "loss": 0.1091, + "step": 18662 + }, + { + "epoch": 50.85286103542234, + "grad_norm": 4.129421234130859, + "learning_rate": 1.0209577130998002e-05, + "loss": 0.1939, + "step": 18663 + }, + { + "epoch": 50.85558583106267, + "grad_norm": 5.56313943862915, + "learning_rate": 1.0208694829375834e-05, + "loss": 0.1791, + "step": 18664 + }, + { + "epoch": 50.858310626702995, + "grad_norm": 4.692027568817139, + "learning_rate": 1.0207812526128356e-05, + "loss": 0.1208, + "step": 18665 + }, + { + "epoch": 50.86103542234333, + "grad_norm": 5.1737961769104, + "learning_rate": 1.020693022126244e-05, + "loss": 0.1212, + "step": 18666 + }, + { + "epoch": 50.86376021798365, + "grad_norm": 6.0052361488342285, + "learning_rate": 1.020604791478496e-05, + "loss": 0.2019, + "step": 18667 + }, + { + "epoch": 50.86648501362398, + "grad_norm": 5.494925498962402, + "learning_rate": 1.0205165606702784e-05, + "loss": 0.2635, + "step": 18668 + }, + { + "epoch": 50.869209809264305, + "grad_norm": 7.216293811798096, + "learning_rate": 1.0204283297022786e-05, + "loss": 0.1622, + "step": 18669 + }, + { + "epoch": 50.87193460490463, + "grad_norm": 5.883440017700195, + "learning_rate": 1.0203400985751838e-05, + "loss": 0.292, + "step": 18670 + }, + { + "epoch": 50.87465940054496, + "grad_norm": 5.328831195831299, + "learning_rate": 1.0202518672896806e-05, + "loss": 0.1097, + "step": 18671 + }, + { + "epoch": 50.87738419618529, + "grad_norm": 5.100024223327637, + "learning_rate": 1.0201636358464568e-05, + "loss": 0.276, + "step": 18672 + }, + { + "epoch": 50.880108991825615, + "grad_norm": 3.971789598464966, + "learning_rate": 1.0200754042461988e-05, + "loss": 0.1783, + "step": 18673 + }, + { + "epoch": 50.88283378746594, + "grad_norm": 4.622824668884277, + "learning_rate": 1.0199871724895947e-05, + "loss": 0.153, + "step": 18674 + }, + { + "epoch": 50.88555858310627, + "grad_norm": 24.071992874145508, + "learning_rate": 1.0198989405773307e-05, + "loss": 0.1639, + "step": 18675 + }, + { + "epoch": 50.88828337874659, + "grad_norm": 5.242025375366211, + "learning_rate": 1.019810708510095e-05, + "loss": 0.1633, + "step": 18676 + }, + { + "epoch": 50.89100817438692, + "grad_norm": 4.857852935791016, + "learning_rate": 1.0197224762885735e-05, + "loss": 0.1911, + "step": 18677 + }, + { + "epoch": 50.89373297002725, + "grad_norm": 5.67581844329834, + "learning_rate": 1.0196342439134546e-05, + "loss": 0.3513, + "step": 18678 + }, + { + "epoch": 50.89645776566758, + "grad_norm": 6.3713274002075195, + "learning_rate": 1.0195460113854243e-05, + "loss": 0.1237, + "step": 18679 + }, + { + "epoch": 50.8991825613079, + "grad_norm": 5.207911491394043, + "learning_rate": 1.0194577787051708e-05, + "loss": 0.1406, + "step": 18680 + }, + { + "epoch": 50.90190735694823, + "grad_norm": 8.377357482910156, + "learning_rate": 1.0193695458733803e-05, + "loss": 0.1182, + "step": 18681 + }, + { + "epoch": 50.904632152588555, + "grad_norm": 4.9795708656311035, + "learning_rate": 1.0192813128907404e-05, + "loss": 0.3101, + "step": 18682 + }, + { + "epoch": 50.90735694822888, + "grad_norm": 6.144087314605713, + "learning_rate": 1.0191930797579386e-05, + "loss": 0.148, + "step": 18683 + }, + { + "epoch": 50.91008174386921, + "grad_norm": 5.1268439292907715, + "learning_rate": 1.0191048464756615e-05, + "loss": 0.1114, + "step": 18684 + }, + { + "epoch": 50.91280653950954, + "grad_norm": 4.573668479919434, + "learning_rate": 1.0190166130445964e-05, + "loss": 0.0848, + "step": 18685 + }, + { + "epoch": 50.915531335149865, + "grad_norm": 4.333711624145508, + "learning_rate": 1.0189283794654308e-05, + "loss": 0.1864, + "step": 18686 + }, + { + "epoch": 50.91825613079019, + "grad_norm": 6.886716842651367, + "learning_rate": 1.0188401457388513e-05, + "loss": 0.1345, + "step": 18687 + }, + { + "epoch": 50.920980926430516, + "grad_norm": 4.428810119628906, + "learning_rate": 1.0187519118655456e-05, + "loss": 0.1554, + "step": 18688 + }, + { + "epoch": 50.92370572207084, + "grad_norm": 4.6712141036987305, + "learning_rate": 1.0186636778462002e-05, + "loss": 0.0946, + "step": 18689 + }, + { + "epoch": 50.926430517711175, + "grad_norm": 5.9868035316467285, + "learning_rate": 1.0185754436815029e-05, + "loss": 0.135, + "step": 18690 + }, + { + "epoch": 50.9291553133515, + "grad_norm": 5.404600620269775, + "learning_rate": 1.018487209372141e-05, + "loss": 0.2366, + "step": 18691 + }, + { + "epoch": 50.93188010899183, + "grad_norm": 8.686942100524902, + "learning_rate": 1.0183989749188009e-05, + "loss": 0.1878, + "step": 18692 + }, + { + "epoch": 50.93460490463215, + "grad_norm": 9.665703773498535, + "learning_rate": 1.0183107403221703e-05, + "loss": 0.151, + "step": 18693 + }, + { + "epoch": 50.93732970027248, + "grad_norm": 5.4269890785217285, + "learning_rate": 1.0182225055829362e-05, + "loss": 0.2427, + "step": 18694 + }, + { + "epoch": 50.940054495912804, + "grad_norm": 52.33797073364258, + "learning_rate": 1.0181342707017859e-05, + "loss": 0.0847, + "step": 18695 + }, + { + "epoch": 50.94277929155314, + "grad_norm": 6.4972310066223145, + "learning_rate": 1.0180460356794065e-05, + "loss": 0.2136, + "step": 18696 + }, + { + "epoch": 50.94550408719346, + "grad_norm": 9.618993759155273, + "learning_rate": 1.017957800516485e-05, + "loss": 0.2531, + "step": 18697 + }, + { + "epoch": 50.94822888283379, + "grad_norm": 8.187857627868652, + "learning_rate": 1.0178695652137088e-05, + "loss": 0.2706, + "step": 18698 + }, + { + "epoch": 50.950953678474114, + "grad_norm": 6.918089866638184, + "learning_rate": 1.0177813297717649e-05, + "loss": 0.1428, + "step": 18699 + }, + { + "epoch": 50.95367847411444, + "grad_norm": 6.106166839599609, + "learning_rate": 1.0176930941913405e-05, + "loss": 0.2265, + "step": 18700 + }, + { + "epoch": 50.956403269754766, + "grad_norm": 5.025012016296387, + "learning_rate": 1.0176048584731233e-05, + "loss": 0.1294, + "step": 18701 + }, + { + "epoch": 50.95912806539509, + "grad_norm": 5.337967395782471, + "learning_rate": 1.0175166226177998e-05, + "loss": 0.1372, + "step": 18702 + }, + { + "epoch": 50.961852861035425, + "grad_norm": 4.797581195831299, + "learning_rate": 1.0174283866260575e-05, + "loss": 0.1651, + "step": 18703 + }, + { + "epoch": 50.96457765667575, + "grad_norm": 5.887904167175293, + "learning_rate": 1.0173401504985831e-05, + "loss": 0.2833, + "step": 18704 + }, + { + "epoch": 50.967302452316076, + "grad_norm": 6.55267333984375, + "learning_rate": 1.0172519142360646e-05, + "loss": 0.1519, + "step": 18705 + }, + { + "epoch": 50.9700272479564, + "grad_norm": 6.467425346374512, + "learning_rate": 1.0171636778391885e-05, + "loss": 0.1798, + "step": 18706 + }, + { + "epoch": 50.97275204359673, + "grad_norm": 5.7684526443481445, + "learning_rate": 1.0170754413086422e-05, + "loss": 0.1561, + "step": 18707 + }, + { + "epoch": 50.97547683923706, + "grad_norm": 11.755709648132324, + "learning_rate": 1.016987204645113e-05, + "loss": 0.2787, + "step": 18708 + }, + { + "epoch": 50.97820163487739, + "grad_norm": 5.804837703704834, + "learning_rate": 1.016898967849288e-05, + "loss": 0.1966, + "step": 18709 + }, + { + "epoch": 50.98092643051771, + "grad_norm": 4.074558258056641, + "learning_rate": 1.0168107309218545e-05, + "loss": 0.1037, + "step": 18710 + }, + { + "epoch": 50.98365122615804, + "grad_norm": 6.014253616333008, + "learning_rate": 1.0167224938634994e-05, + "loss": 0.22, + "step": 18711 + }, + { + "epoch": 50.986376021798364, + "grad_norm": 5.788711071014404, + "learning_rate": 1.01663425667491e-05, + "loss": 0.2037, + "step": 18712 + }, + { + "epoch": 50.98910081743869, + "grad_norm": 5.540937900543213, + "learning_rate": 1.016546019356774e-05, + "loss": 0.1178, + "step": 18713 + }, + { + "epoch": 50.991825613079016, + "grad_norm": 6.734719753265381, + "learning_rate": 1.0164577819097777e-05, + "loss": 0.2364, + "step": 18714 + }, + { + "epoch": 50.99455040871935, + "grad_norm": 7.610739231109619, + "learning_rate": 1.016369544334609e-05, + "loss": 0.1228, + "step": 18715 + }, + { + "epoch": 50.997275204359674, + "grad_norm": 5.655003070831299, + "learning_rate": 1.0162813066319542e-05, + "loss": 0.1497, + "step": 18716 + }, + { + "epoch": 51.0, + "grad_norm": 5.585046768188477, + "learning_rate": 1.0161930688025018e-05, + "loss": 0.1662, + "step": 18717 + }, + { + "epoch": 51.002724795640326, + "grad_norm": 11.332860946655273, + "learning_rate": 1.0161048308469378e-05, + "loss": 0.2005, + "step": 18718 + }, + { + "epoch": 51.00544959128065, + "grad_norm": 17.428442001342773, + "learning_rate": 1.0160165927659502e-05, + "loss": 0.1392, + "step": 18719 + }, + { + "epoch": 51.00817438692098, + "grad_norm": 5.3399658203125, + "learning_rate": 1.015928354560226e-05, + "loss": 0.2174, + "step": 18720 + }, + { + "epoch": 51.01089918256131, + "grad_norm": 4.200045585632324, + "learning_rate": 1.0158401162304522e-05, + "loss": 0.3348, + "step": 18721 + }, + { + "epoch": 51.013623978201636, + "grad_norm": 4.7197675704956055, + "learning_rate": 1.0157518777773159e-05, + "loss": 0.0845, + "step": 18722 + }, + { + "epoch": 51.01634877384196, + "grad_norm": 5.308382511138916, + "learning_rate": 1.0156636392015046e-05, + "loss": 0.2566, + "step": 18723 + }, + { + "epoch": 51.01907356948229, + "grad_norm": 4.911110877990723, + "learning_rate": 1.0155754005037054e-05, + "loss": 0.1306, + "step": 18724 + }, + { + "epoch": 51.02179836512261, + "grad_norm": 6.263029098510742, + "learning_rate": 1.015487161684605e-05, + "loss": 0.2966, + "step": 18725 + }, + { + "epoch": 51.02452316076294, + "grad_norm": 4.92348051071167, + "learning_rate": 1.0153989227448917e-05, + "loss": 0.1635, + "step": 18726 + }, + { + "epoch": 51.02724795640327, + "grad_norm": 5.831380844116211, + "learning_rate": 1.015310683685252e-05, + "loss": 0.0931, + "step": 18727 + }, + { + "epoch": 51.0299727520436, + "grad_norm": 12.072651863098145, + "learning_rate": 1.015222444506373e-05, + "loss": 0.1893, + "step": 18728 + }, + { + "epoch": 51.032697547683924, + "grad_norm": 11.225703239440918, + "learning_rate": 1.0151342052089423e-05, + "loss": 0.2093, + "step": 18729 + }, + { + "epoch": 51.03542234332425, + "grad_norm": 7.203643798828125, + "learning_rate": 1.0150459657936469e-05, + "loss": 0.1521, + "step": 18730 + }, + { + "epoch": 51.038147138964575, + "grad_norm": 5.221952438354492, + "learning_rate": 1.0149577262611739e-05, + "loss": 0.117, + "step": 18731 + }, + { + "epoch": 51.0408719346049, + "grad_norm": 4.445789337158203, + "learning_rate": 1.0148694866122107e-05, + "loss": 0.1751, + "step": 18732 + }, + { + "epoch": 51.043596730245234, + "grad_norm": 6.010112285614014, + "learning_rate": 1.014781246847444e-05, + "loss": 0.1888, + "step": 18733 + }, + { + "epoch": 51.04632152588556, + "grad_norm": 4.826539039611816, + "learning_rate": 1.0146930069675617e-05, + "loss": 0.0933, + "step": 18734 + }, + { + "epoch": 51.049046321525886, + "grad_norm": 4.85269021987915, + "learning_rate": 1.014604766973251e-05, + "loss": 0.0985, + "step": 18735 + }, + { + "epoch": 51.05177111716621, + "grad_norm": 6.659588813781738, + "learning_rate": 1.0145165268651985e-05, + "loss": 0.1496, + "step": 18736 + }, + { + "epoch": 51.05449591280654, + "grad_norm": 4.729734420776367, + "learning_rate": 1.014428286644092e-05, + "loss": 0.1488, + "step": 18737 + }, + { + "epoch": 51.05722070844686, + "grad_norm": 5.822243690490723, + "learning_rate": 1.0143400463106184e-05, + "loss": 0.1028, + "step": 18738 + }, + { + "epoch": 51.059945504087196, + "grad_norm": 5.308828830718994, + "learning_rate": 1.0142518058654649e-05, + "loss": 0.0896, + "step": 18739 + }, + { + "epoch": 51.06267029972752, + "grad_norm": 5.010536193847656, + "learning_rate": 1.0141635653093187e-05, + "loss": 0.1237, + "step": 18740 + }, + { + "epoch": 51.06539509536785, + "grad_norm": 5.888706684112549, + "learning_rate": 1.0140753246428674e-05, + "loss": 0.1296, + "step": 18741 + }, + { + "epoch": 51.06811989100817, + "grad_norm": 40.01289749145508, + "learning_rate": 1.0139870838667976e-05, + "loss": 0.2059, + "step": 18742 + }, + { + "epoch": 51.0708446866485, + "grad_norm": 4.776760578155518, + "learning_rate": 1.0138988429817971e-05, + "loss": 0.1722, + "step": 18743 + }, + { + "epoch": 51.073569482288825, + "grad_norm": 9.24162483215332, + "learning_rate": 1.0138106019885525e-05, + "loss": 0.185, + "step": 18744 + }, + { + "epoch": 51.07629427792916, + "grad_norm": 4.977770805358887, + "learning_rate": 1.0137223608877518e-05, + "loss": 0.2341, + "step": 18745 + }, + { + "epoch": 51.079019073569484, + "grad_norm": 6.066573619842529, + "learning_rate": 1.0136341196800816e-05, + "loss": 0.1852, + "step": 18746 + }, + { + "epoch": 51.08174386920981, + "grad_norm": 5.879281997680664, + "learning_rate": 1.0135458783662296e-05, + "loss": 0.143, + "step": 18747 + }, + { + "epoch": 51.084468664850135, + "grad_norm": 4.567464828491211, + "learning_rate": 1.0134576369468823e-05, + "loss": 0.0869, + "step": 18748 + }, + { + "epoch": 51.08719346049046, + "grad_norm": 7.318799018859863, + "learning_rate": 1.0133693954227278e-05, + "loss": 0.1819, + "step": 18749 + }, + { + "epoch": 51.08991825613079, + "grad_norm": 9.434854507446289, + "learning_rate": 1.0132811537944522e-05, + "loss": 0.1568, + "step": 18750 + }, + { + "epoch": 51.09264305177112, + "grad_norm": 4.460082054138184, + "learning_rate": 1.0131929120627439e-05, + "loss": 0.1595, + "step": 18751 + }, + { + "epoch": 51.095367847411445, + "grad_norm": 4.987976551055908, + "learning_rate": 1.0131046702282893e-05, + "loss": 0.086, + "step": 18752 + }, + { + "epoch": 51.09809264305177, + "grad_norm": 4.004764556884766, + "learning_rate": 1.0130164282917764e-05, + "loss": 0.2204, + "step": 18753 + }, + { + "epoch": 51.1008174386921, + "grad_norm": 5.967334747314453, + "learning_rate": 1.0129281862538918e-05, + "loss": 0.2305, + "step": 18754 + }, + { + "epoch": 51.10354223433242, + "grad_norm": 4.764896392822266, + "learning_rate": 1.012839944115323e-05, + "loss": 0.129, + "step": 18755 + }, + { + "epoch": 51.10626702997275, + "grad_norm": 7.496785640716553, + "learning_rate": 1.0127517018767569e-05, + "loss": 0.0907, + "step": 18756 + }, + { + "epoch": 51.10899182561308, + "grad_norm": 3.6667022705078125, + "learning_rate": 1.0126634595388812e-05, + "loss": 0.1383, + "step": 18757 + }, + { + "epoch": 51.11171662125341, + "grad_norm": 10.265843391418457, + "learning_rate": 1.0125752171023825e-05, + "loss": 0.2072, + "step": 18758 + }, + { + "epoch": 51.11444141689373, + "grad_norm": 5.989264011383057, + "learning_rate": 1.0124869745679486e-05, + "loss": 0.1543, + "step": 18759 + }, + { + "epoch": 51.11716621253406, + "grad_norm": 8.33877944946289, + "learning_rate": 1.0123987319362668e-05, + "loss": 0.1829, + "step": 18760 + }, + { + "epoch": 51.119891008174385, + "grad_norm": 5.455020427703857, + "learning_rate": 1.0123104892080237e-05, + "loss": 0.1301, + "step": 18761 + }, + { + "epoch": 51.12261580381471, + "grad_norm": 4.6251726150512695, + "learning_rate": 1.012222246383907e-05, + "loss": 0.1591, + "step": 18762 + }, + { + "epoch": 51.12534059945504, + "grad_norm": 5.778083324432373, + "learning_rate": 1.0121340034646041e-05, + "loss": 0.1534, + "step": 18763 + }, + { + "epoch": 51.12806539509537, + "grad_norm": 6.038066864013672, + "learning_rate": 1.0120457604508019e-05, + "loss": 0.1822, + "step": 18764 + }, + { + "epoch": 51.130790190735695, + "grad_norm": 6.604792594909668, + "learning_rate": 1.0119575173431877e-05, + "loss": 0.1728, + "step": 18765 + }, + { + "epoch": 51.13351498637602, + "grad_norm": 6.406408309936523, + "learning_rate": 1.0118692741424485e-05, + "loss": 0.1196, + "step": 18766 + }, + { + "epoch": 51.13623978201635, + "grad_norm": 6.284243583679199, + "learning_rate": 1.0117810308492719e-05, + "loss": 0.2791, + "step": 18767 + }, + { + "epoch": 51.13896457765667, + "grad_norm": 5.192579746246338, + "learning_rate": 1.011692787464345e-05, + "loss": 0.0937, + "step": 18768 + }, + { + "epoch": 51.141689373297005, + "grad_norm": 5.316946029663086, + "learning_rate": 1.011604543988355e-05, + "loss": 0.0972, + "step": 18769 + }, + { + "epoch": 51.14441416893733, + "grad_norm": 4.363719940185547, + "learning_rate": 1.0115163004219894e-05, + "loss": 0.166, + "step": 18770 + }, + { + "epoch": 51.14713896457766, + "grad_norm": 5.205626010894775, + "learning_rate": 1.011428056765935e-05, + "loss": 0.1089, + "step": 18771 + }, + { + "epoch": 51.14986376021798, + "grad_norm": 6.125519275665283, + "learning_rate": 1.0113398130208791e-05, + "loss": 0.1815, + "step": 18772 + }, + { + "epoch": 51.15258855585831, + "grad_norm": 6.656401634216309, + "learning_rate": 1.0112515691875095e-05, + "loss": 0.1347, + "step": 18773 + }, + { + "epoch": 51.155313351498634, + "grad_norm": 5.416975021362305, + "learning_rate": 1.0111633252665129e-05, + "loss": 0.2934, + "step": 18774 + }, + { + "epoch": 51.15803814713897, + "grad_norm": 79.0899658203125, + "learning_rate": 1.0110750812585767e-05, + "loss": 0.2813, + "step": 18775 + }, + { + "epoch": 51.16076294277929, + "grad_norm": 5.5814642906188965, + "learning_rate": 1.010986837164388e-05, + "loss": 0.2162, + "step": 18776 + }, + { + "epoch": 51.16348773841962, + "grad_norm": 9.727604866027832, + "learning_rate": 1.0108985929846342e-05, + "loss": 0.1799, + "step": 18777 + }, + { + "epoch": 51.166212534059945, + "grad_norm": 6.37643575668335, + "learning_rate": 1.0108103487200028e-05, + "loss": 0.1972, + "step": 18778 + }, + { + "epoch": 51.16893732970027, + "grad_norm": 5.157503604888916, + "learning_rate": 1.0107221043711804e-05, + "loss": 0.1791, + "step": 18779 + }, + { + "epoch": 51.171662125340596, + "grad_norm": 5.511967658996582, + "learning_rate": 1.0106338599388548e-05, + "loss": 0.2906, + "step": 18780 + }, + { + "epoch": 51.17438692098093, + "grad_norm": 5.359907150268555, + "learning_rate": 1.010545615423713e-05, + "loss": 0.2688, + "step": 18781 + }, + { + "epoch": 51.177111716621255, + "grad_norm": 8.087959289550781, + "learning_rate": 1.010457370826442e-05, + "loss": 0.18, + "step": 18782 + }, + { + "epoch": 51.17983651226158, + "grad_norm": 5.236056804656982, + "learning_rate": 1.0103691261477297e-05, + "loss": 0.1554, + "step": 18783 + }, + { + "epoch": 51.182561307901906, + "grad_norm": 7.0774993896484375, + "learning_rate": 1.0102808813882627e-05, + "loss": 0.1399, + "step": 18784 + }, + { + "epoch": 51.18528610354223, + "grad_norm": 5.047219753265381, + "learning_rate": 1.0101926365487287e-05, + "loss": 0.1951, + "step": 18785 + }, + { + "epoch": 51.18801089918256, + "grad_norm": 19.370012283325195, + "learning_rate": 1.0101043916298148e-05, + "loss": 0.1911, + "step": 18786 + }, + { + "epoch": 51.19073569482289, + "grad_norm": 7.3546271324157715, + "learning_rate": 1.0100161466322082e-05, + "loss": 0.1905, + "step": 18787 + }, + { + "epoch": 51.19346049046322, + "grad_norm": 5.489282608032227, + "learning_rate": 1.0099279015565961e-05, + "loss": 0.161, + "step": 18788 + }, + { + "epoch": 51.19618528610354, + "grad_norm": 5.209650993347168, + "learning_rate": 1.0098396564036658e-05, + "loss": 0.1584, + "step": 18789 + }, + { + "epoch": 51.19891008174387, + "grad_norm": 6.183939456939697, + "learning_rate": 1.0097514111741048e-05, + "loss": 0.1404, + "step": 18790 + }, + { + "epoch": 51.201634877384194, + "grad_norm": 7.37171745300293, + "learning_rate": 1.0096631658686e-05, + "loss": 0.2906, + "step": 18791 + }, + { + "epoch": 51.20435967302452, + "grad_norm": 7.757916450500488, + "learning_rate": 1.009574920487839e-05, + "loss": 0.2218, + "step": 18792 + }, + { + "epoch": 51.20708446866485, + "grad_norm": 5.5463175773620605, + "learning_rate": 1.009486675032508e-05, + "loss": 0.1096, + "step": 18793 + }, + { + "epoch": 51.20980926430518, + "grad_norm": 6.708303928375244, + "learning_rate": 1.009398429503296e-05, + "loss": 0.1681, + "step": 18794 + }, + { + "epoch": 51.212534059945504, + "grad_norm": 9.129183769226074, + "learning_rate": 1.0093101839008888e-05, + "loss": 0.2122, + "step": 18795 + }, + { + "epoch": 51.21525885558583, + "grad_norm": 4.936119079589844, + "learning_rate": 1.0092219382259745e-05, + "loss": 0.2291, + "step": 18796 + }, + { + "epoch": 51.217983651226156, + "grad_norm": 6.745718479156494, + "learning_rate": 1.00913369247924e-05, + "loss": 0.1609, + "step": 18797 + }, + { + "epoch": 51.22070844686648, + "grad_norm": 8.815296173095703, + "learning_rate": 1.0090454466613724e-05, + "loss": 0.127, + "step": 18798 + }, + { + "epoch": 51.223433242506815, + "grad_norm": 5.680782318115234, + "learning_rate": 1.0089572007730593e-05, + "loss": 0.3213, + "step": 18799 + }, + { + "epoch": 51.22615803814714, + "grad_norm": 6.469271183013916, + "learning_rate": 1.0088689548149878e-05, + "loss": 0.1957, + "step": 18800 + }, + { + "epoch": 51.228882833787466, + "grad_norm": 6.46415901184082, + "learning_rate": 1.008780708787845e-05, + "loss": 0.1899, + "step": 18801 + }, + { + "epoch": 51.23160762942779, + "grad_norm": 6.101480484008789, + "learning_rate": 1.0086924626923185e-05, + "loss": 0.187, + "step": 18802 + }, + { + "epoch": 51.23433242506812, + "grad_norm": 4.842905044555664, + "learning_rate": 1.0086042165290952e-05, + "loss": 0.1832, + "step": 18803 + }, + { + "epoch": 51.237057220708444, + "grad_norm": 4.603719711303711, + "learning_rate": 1.0085159702988627e-05, + "loss": 0.2, + "step": 18804 + }, + { + "epoch": 51.23978201634878, + "grad_norm": 4.809569358825684, + "learning_rate": 1.0084277240023082e-05, + "loss": 0.1505, + "step": 18805 + }, + { + "epoch": 51.2425068119891, + "grad_norm": 4.232131004333496, + "learning_rate": 1.0083394776401188e-05, + "loss": 0.1742, + "step": 18806 + }, + { + "epoch": 51.24523160762943, + "grad_norm": 4.67697811126709, + "learning_rate": 1.0082512312129815e-05, + "loss": 0.2456, + "step": 18807 + }, + { + "epoch": 51.247956403269754, + "grad_norm": 4.75968599319458, + "learning_rate": 1.0081629847215843e-05, + "loss": 0.0844, + "step": 18808 + }, + { + "epoch": 51.25068119891008, + "grad_norm": 4.272505760192871, + "learning_rate": 1.0080747381666138e-05, + "loss": 0.1488, + "step": 18809 + }, + { + "epoch": 51.253405994550405, + "grad_norm": 5.496559143066406, + "learning_rate": 1.0079864915487576e-05, + "loss": 0.1714, + "step": 18810 + }, + { + "epoch": 51.25613079019074, + "grad_norm": 4.785799026489258, + "learning_rate": 1.0078982448687027e-05, + "loss": 0.1613, + "step": 18811 + }, + { + "epoch": 51.258855585831064, + "grad_norm": 6.205319881439209, + "learning_rate": 1.0078099981271367e-05, + "loss": 0.3415, + "step": 18812 + }, + { + "epoch": 51.26158038147139, + "grad_norm": 8.09691333770752, + "learning_rate": 1.0077217513247465e-05, + "loss": 0.1214, + "step": 18813 + }, + { + "epoch": 51.264305177111716, + "grad_norm": 5.109775543212891, + "learning_rate": 1.0076335044622198e-05, + "loss": 0.1111, + "step": 18814 + }, + { + "epoch": 51.26702997275204, + "grad_norm": 7.009300708770752, + "learning_rate": 1.0075452575402433e-05, + "loss": 0.1186, + "step": 18815 + }, + { + "epoch": 51.26975476839237, + "grad_norm": 6.143910884857178, + "learning_rate": 1.007457010559505e-05, + "loss": 0.1601, + "step": 18816 + }, + { + "epoch": 51.2724795640327, + "grad_norm": 10.16909408569336, + "learning_rate": 1.0073687635206915e-05, + "loss": 0.2043, + "step": 18817 + }, + { + "epoch": 51.275204359673026, + "grad_norm": 4.602548122406006, + "learning_rate": 1.0072805164244903e-05, + "loss": 0.1435, + "step": 18818 + }, + { + "epoch": 51.27792915531335, + "grad_norm": 8.02277660369873, + "learning_rate": 1.0071922692715885e-05, + "loss": 0.1631, + "step": 18819 + }, + { + "epoch": 51.28065395095368, + "grad_norm": 5.542445182800293, + "learning_rate": 1.0071040220626738e-05, + "loss": 0.1126, + "step": 18820 + }, + { + "epoch": 51.283378746594, + "grad_norm": 51.237945556640625, + "learning_rate": 1.0070157747984331e-05, + "loss": 0.2363, + "step": 18821 + }, + { + "epoch": 51.28610354223433, + "grad_norm": 4.691830158233643, + "learning_rate": 1.006927527479554e-05, + "loss": 0.2623, + "step": 18822 + }, + { + "epoch": 51.28882833787466, + "grad_norm": 5.037574291229248, + "learning_rate": 1.0068392801067232e-05, + "loss": 0.1498, + "step": 18823 + }, + { + "epoch": 51.29155313351499, + "grad_norm": 7.60037088394165, + "learning_rate": 1.0067510326806284e-05, + "loss": 0.2092, + "step": 18824 + }, + { + "epoch": 51.294277929155314, + "grad_norm": 4.125919818878174, + "learning_rate": 1.0066627852019567e-05, + "loss": 0.2363, + "step": 18825 + }, + { + "epoch": 51.29700272479564, + "grad_norm": 4.860090255737305, + "learning_rate": 1.0065745376713958e-05, + "loss": 0.1537, + "step": 18826 + }, + { + "epoch": 51.299727520435965, + "grad_norm": 6.538519859313965, + "learning_rate": 1.0064862900896323e-05, + "loss": 0.153, + "step": 18827 + }, + { + "epoch": 51.30245231607629, + "grad_norm": 6.630890369415283, + "learning_rate": 1.0063980424573538e-05, + "loss": 0.1448, + "step": 18828 + }, + { + "epoch": 51.305177111716624, + "grad_norm": 4.957268238067627, + "learning_rate": 1.0063097947752477e-05, + "loss": 0.1503, + "step": 18829 + }, + { + "epoch": 51.30790190735695, + "grad_norm": 5.636377334594727, + "learning_rate": 1.0062215470440011e-05, + "loss": 0.1475, + "step": 18830 + }, + { + "epoch": 51.310626702997276, + "grad_norm": 7.311302185058594, + "learning_rate": 1.006133299264301e-05, + "loss": 0.1904, + "step": 18831 + }, + { + "epoch": 51.3133514986376, + "grad_norm": 10.37523365020752, + "learning_rate": 1.0060450514368355e-05, + "loss": 0.11, + "step": 18832 + }, + { + "epoch": 51.31607629427793, + "grad_norm": 4.774973392486572, + "learning_rate": 1.005956803562291e-05, + "loss": 0.1609, + "step": 18833 + }, + { + "epoch": 51.31880108991825, + "grad_norm": 5.141545295715332, + "learning_rate": 1.005868555641355e-05, + "loss": 0.1307, + "step": 18834 + }, + { + "epoch": 51.321525885558586, + "grad_norm": 5.759461402893066, + "learning_rate": 1.005780307674715e-05, + "loss": 0.4502, + "step": 18835 + }, + { + "epoch": 51.32425068119891, + "grad_norm": 5.119438648223877, + "learning_rate": 1.0056920596630582e-05, + "loss": 0.1453, + "step": 18836 + }, + { + "epoch": 51.32697547683924, + "grad_norm": 6.693476676940918, + "learning_rate": 1.0056038116070716e-05, + "loss": 0.1693, + "step": 18837 + }, + { + "epoch": 51.32970027247956, + "grad_norm": 6.895663261413574, + "learning_rate": 1.005515563507443e-05, + "loss": 0.1509, + "step": 18838 + }, + { + "epoch": 51.33242506811989, + "grad_norm": 11.935626983642578, + "learning_rate": 1.0054273153648591e-05, + "loss": 0.1915, + "step": 18839 + }, + { + "epoch": 51.335149863760215, + "grad_norm": 5.337900638580322, + "learning_rate": 1.005339067180008e-05, + "loss": 0.178, + "step": 18840 + }, + { + "epoch": 51.33787465940055, + "grad_norm": 5.646678447723389, + "learning_rate": 1.0052508189535758e-05, + "loss": 0.1078, + "step": 18841 + }, + { + "epoch": 51.34059945504087, + "grad_norm": 5.215188980102539, + "learning_rate": 1.0051625706862507e-05, + "loss": 0.101, + "step": 18842 + }, + { + "epoch": 51.3433242506812, + "grad_norm": 4.767889976501465, + "learning_rate": 1.0050743223787193e-05, + "loss": 0.1725, + "step": 18843 + }, + { + "epoch": 51.346049046321525, + "grad_norm": 6.254324436187744, + "learning_rate": 1.0049860740316697e-05, + "loss": 0.1405, + "step": 18844 + }, + { + "epoch": 51.34877384196185, + "grad_norm": 5.112353801727295, + "learning_rate": 1.0048978256457885e-05, + "loss": 0.1337, + "step": 18845 + }, + { + "epoch": 51.35149863760218, + "grad_norm": 4.851981163024902, + "learning_rate": 1.004809577221763e-05, + "loss": 0.1956, + "step": 18846 + }, + { + "epoch": 51.35422343324251, + "grad_norm": 4.096112251281738, + "learning_rate": 1.0047213287602809e-05, + "loss": 0.0883, + "step": 18847 + }, + { + "epoch": 51.356948228882835, + "grad_norm": 5.8044586181640625, + "learning_rate": 1.0046330802620292e-05, + "loss": 0.093, + "step": 18848 + }, + { + "epoch": 51.35967302452316, + "grad_norm": 5.176109790802002, + "learning_rate": 1.0045448317276951e-05, + "loss": 0.1221, + "step": 18849 + }, + { + "epoch": 51.36239782016349, + "grad_norm": 5.2995781898498535, + "learning_rate": 1.0044565831579664e-05, + "loss": 0.1443, + "step": 18850 + }, + { + "epoch": 51.36512261580381, + "grad_norm": 6.7969536781311035, + "learning_rate": 1.0043683345535295e-05, + "loss": 0.0691, + "step": 18851 + }, + { + "epoch": 51.36784741144414, + "grad_norm": 4.332256317138672, + "learning_rate": 1.0042800859150726e-05, + "loss": 0.1539, + "step": 18852 + }, + { + "epoch": 51.37057220708447, + "grad_norm": 4.30204963684082, + "learning_rate": 1.0041918372432822e-05, + "loss": 0.1867, + "step": 18853 + }, + { + "epoch": 51.3732970027248, + "grad_norm": 5.851512432098389, + "learning_rate": 1.004103588538846e-05, + "loss": 0.2439, + "step": 18854 + }, + { + "epoch": 51.37602179836512, + "grad_norm": 5.3317084312438965, + "learning_rate": 1.0040153398024513e-05, + "loss": 0.1674, + "step": 18855 + }, + { + "epoch": 51.37874659400545, + "grad_norm": 4.1724534034729, + "learning_rate": 1.0039270910347849e-05, + "loss": 0.1919, + "step": 18856 + }, + { + "epoch": 51.381471389645775, + "grad_norm": 6.053035259246826, + "learning_rate": 1.0038388422365348e-05, + "loss": 0.107, + "step": 18857 + }, + { + "epoch": 51.3841961852861, + "grad_norm": 5.427990913391113, + "learning_rate": 1.0037505934083877e-05, + "loss": 0.1115, + "step": 18858 + }, + { + "epoch": 51.38692098092643, + "grad_norm": 6.375370025634766, + "learning_rate": 1.0036623445510312e-05, + "loss": 0.1364, + "step": 18859 + }, + { + "epoch": 51.38964577656676, + "grad_norm": 4.085097789764404, + "learning_rate": 1.0035740956651527e-05, + "loss": 0.2076, + "step": 18860 + }, + { + "epoch": 51.392370572207085, + "grad_norm": 7.361934661865234, + "learning_rate": 1.0034858467514388e-05, + "loss": 0.167, + "step": 18861 + }, + { + "epoch": 51.39509536784741, + "grad_norm": 5.714624881744385, + "learning_rate": 1.0033975978105774e-05, + "loss": 0.1235, + "step": 18862 + }, + { + "epoch": 51.39782016348774, + "grad_norm": 4.752364635467529, + "learning_rate": 1.003309348843256e-05, + "loss": 0.1219, + "step": 18863 + }, + { + "epoch": 51.40054495912806, + "grad_norm": 5.669373035430908, + "learning_rate": 1.0032210998501611e-05, + "loss": 0.1629, + "step": 18864 + }, + { + "epoch": 51.403269754768395, + "grad_norm": 9.528609275817871, + "learning_rate": 1.0031328508319805e-05, + "loss": 0.1717, + "step": 18865 + }, + { + "epoch": 51.40599455040872, + "grad_norm": 4.603137969970703, + "learning_rate": 1.0030446017894014e-05, + "loss": 0.078, + "step": 18866 + }, + { + "epoch": 51.40871934604905, + "grad_norm": 5.248652458190918, + "learning_rate": 1.002956352723111e-05, + "loss": 0.2607, + "step": 18867 + }, + { + "epoch": 51.41144414168937, + "grad_norm": 5.387473106384277, + "learning_rate": 1.0028681036337963e-05, + "loss": 0.1365, + "step": 18868 + }, + { + "epoch": 51.4141689373297, + "grad_norm": 4.097549915313721, + "learning_rate": 1.0027798545221453e-05, + "loss": 0.1656, + "step": 18869 + }, + { + "epoch": 51.416893732970024, + "grad_norm": 4.61376953125, + "learning_rate": 1.0026916053888449e-05, + "loss": 0.1086, + "step": 18870 + }, + { + "epoch": 51.41961852861036, + "grad_norm": 4.5222930908203125, + "learning_rate": 1.0026033562345821e-05, + "loss": 0.1723, + "step": 18871 + }, + { + "epoch": 51.42234332425068, + "grad_norm": 5.318976402282715, + "learning_rate": 1.0025151070600445e-05, + "loss": 0.1462, + "step": 18872 + }, + { + "epoch": 51.42506811989101, + "grad_norm": 4.539977073669434, + "learning_rate": 1.0024268578659195e-05, + "loss": 0.0965, + "step": 18873 + }, + { + "epoch": 51.427792915531334, + "grad_norm": 4.928645610809326, + "learning_rate": 1.0023386086528942e-05, + "loss": 0.1979, + "step": 18874 + }, + { + "epoch": 51.43051771117166, + "grad_norm": 5.497778415679932, + "learning_rate": 1.0022503594216558e-05, + "loss": 0.1126, + "step": 18875 + }, + { + "epoch": 51.433242506811986, + "grad_norm": 7.102056503295898, + "learning_rate": 1.0021621101728916e-05, + "loss": 0.2033, + "step": 18876 + }, + { + "epoch": 51.43596730245232, + "grad_norm": 5.455347537994385, + "learning_rate": 1.002073860907289e-05, + "loss": 0.1587, + "step": 18877 + }, + { + "epoch": 51.438692098092645, + "grad_norm": 5.075624465942383, + "learning_rate": 1.0019856116255353e-05, + "loss": 0.1917, + "step": 18878 + }, + { + "epoch": 51.44141689373297, + "grad_norm": 7.048523902893066, + "learning_rate": 1.0018973623283177e-05, + "loss": 0.1951, + "step": 18879 + }, + { + "epoch": 51.444141689373296, + "grad_norm": 4.175597667694092, + "learning_rate": 1.0018091130163235e-05, + "loss": 0.16, + "step": 18880 + }, + { + "epoch": 51.44686648501362, + "grad_norm": 4.40514612197876, + "learning_rate": 1.0017208636902401e-05, + "loss": 0.0847, + "step": 18881 + }, + { + "epoch": 51.44959128065395, + "grad_norm": 6.212416648864746, + "learning_rate": 1.0016326143507544e-05, + "loss": 0.288, + "step": 18882 + }, + { + "epoch": 51.45231607629428, + "grad_norm": 5.558211803436279, + "learning_rate": 1.0015443649985542e-05, + "loss": 0.131, + "step": 18883 + }, + { + "epoch": 51.45504087193461, + "grad_norm": 4.054054260253906, + "learning_rate": 1.0014561156343263e-05, + "loss": 0.1175, + "step": 18884 + }, + { + "epoch": 51.45776566757493, + "grad_norm": 5.712672710418701, + "learning_rate": 1.0013678662587584e-05, + "loss": 0.1595, + "step": 18885 + }, + { + "epoch": 51.46049046321526, + "grad_norm": 5.684453964233398, + "learning_rate": 1.0012796168725376e-05, + "loss": 0.2425, + "step": 18886 + }, + { + "epoch": 51.463215258855584, + "grad_norm": 4.908958911895752, + "learning_rate": 1.0011913674763514e-05, + "loss": 0.1607, + "step": 18887 + }, + { + "epoch": 51.46594005449591, + "grad_norm": 5.546113967895508, + "learning_rate": 1.0011031180708861e-05, + "loss": 0.1102, + "step": 18888 + }, + { + "epoch": 51.46866485013624, + "grad_norm": 4.123659133911133, + "learning_rate": 1.0010148686568304e-05, + "loss": 0.0927, + "step": 18889 + }, + { + "epoch": 51.47138964577657, + "grad_norm": 5.6722540855407715, + "learning_rate": 1.0009266192348708e-05, + "loss": 0.2096, + "step": 18890 + }, + { + "epoch": 51.474114441416894, + "grad_norm": 4.974035739898682, + "learning_rate": 1.0008383698056949e-05, + "loss": 0.1766, + "step": 18891 + }, + { + "epoch": 51.47683923705722, + "grad_norm": 5.52852201461792, + "learning_rate": 1.0007501203699894e-05, + "loss": 0.1583, + "step": 18892 + }, + { + "epoch": 51.479564032697546, + "grad_norm": 5.028327465057373, + "learning_rate": 1.0006618709284424e-05, + "loss": 0.1769, + "step": 18893 + }, + { + "epoch": 51.48228882833787, + "grad_norm": 4.124752044677734, + "learning_rate": 1.0005736214817405e-05, + "loss": 0.1034, + "step": 18894 + }, + { + "epoch": 51.485013623978205, + "grad_norm": 5.628269672393799, + "learning_rate": 1.0004853720305717e-05, + "loss": 0.1655, + "step": 18895 + }, + { + "epoch": 51.48773841961853, + "grad_norm": 5.227619171142578, + "learning_rate": 1.0003971225756222e-05, + "loss": 0.1572, + "step": 18896 + }, + { + "epoch": 51.490463215258856, + "grad_norm": 4.5399909019470215, + "learning_rate": 1.00030887311758e-05, + "loss": 0.107, + "step": 18897 + }, + { + "epoch": 51.49318801089918, + "grad_norm": 4.212165832519531, + "learning_rate": 1.0002206236571325e-05, + "loss": 0.1536, + "step": 18898 + }, + { + "epoch": 51.49591280653951, + "grad_norm": 4.753115177154541, + "learning_rate": 1.0001323741949669e-05, + "loss": 0.1167, + "step": 18899 + }, + { + "epoch": 51.49863760217983, + "grad_norm": 4.665989875793457, + "learning_rate": 1.0000441247317702e-05, + "loss": 0.1029, + "step": 18900 + }, + { + "epoch": 51.50136239782017, + "grad_norm": 4.497897624969482, + "learning_rate": 9.9995587526823e-06, + "loss": 0.0884, + "step": 18901 + }, + { + "epoch": 51.50408719346049, + "grad_norm": 5.178405284881592, + "learning_rate": 9.998676258050331e-06, + "loss": 0.0727, + "step": 18902 + }, + { + "epoch": 51.50681198910082, + "grad_norm": 5.843135833740234, + "learning_rate": 9.997793763428676e-06, + "loss": 0.2678, + "step": 18903 + }, + { + "epoch": 51.509536784741144, + "grad_norm": 4.736177444458008, + "learning_rate": 9.9969112688242e-06, + "loss": 0.1993, + "step": 18904 + }, + { + "epoch": 51.51226158038147, + "grad_norm": 5.294179916381836, + "learning_rate": 9.996028774243781e-06, + "loss": 0.1534, + "step": 18905 + }, + { + "epoch": 51.514986376021795, + "grad_norm": 4.487862586975098, + "learning_rate": 9.995146279694288e-06, + "loss": 0.2374, + "step": 18906 + }, + { + "epoch": 51.51771117166213, + "grad_norm": 4.244534015655518, + "learning_rate": 9.994263785182597e-06, + "loss": 0.127, + "step": 18907 + }, + { + "epoch": 51.520435967302454, + "grad_norm": 4.889786243438721, + "learning_rate": 9.993381290715578e-06, + "loss": 0.1465, + "step": 18908 + }, + { + "epoch": 51.52316076294278, + "grad_norm": 5.3072662353515625, + "learning_rate": 9.992498796300108e-06, + "loss": 0.1057, + "step": 18909 + }, + { + "epoch": 51.525885558583106, + "grad_norm": 6.529801368713379, + "learning_rate": 9.991616301943054e-06, + "loss": 0.221, + "step": 18910 + }, + { + "epoch": 51.52861035422343, + "grad_norm": 3.673734426498413, + "learning_rate": 9.990733807651295e-06, + "loss": 0.0801, + "step": 18911 + }, + { + "epoch": 51.53133514986376, + "grad_norm": 6.3138203620910645, + "learning_rate": 9.989851313431698e-06, + "loss": 0.2169, + "step": 18912 + }, + { + "epoch": 51.53405994550409, + "grad_norm": 3.917548179626465, + "learning_rate": 9.98896881929114e-06, + "loss": 0.1764, + "step": 18913 + }, + { + "epoch": 51.536784741144416, + "grad_norm": 5.814704418182373, + "learning_rate": 9.988086325236493e-06, + "loss": 0.1834, + "step": 18914 + }, + { + "epoch": 51.53950953678474, + "grad_norm": 4.445235252380371, + "learning_rate": 9.987203831274629e-06, + "loss": 0.2559, + "step": 18915 + }, + { + "epoch": 51.54223433242507, + "grad_norm": 4.93685245513916, + "learning_rate": 9.98632133741242e-06, + "loss": 0.2249, + "step": 18916 + }, + { + "epoch": 51.54495912806539, + "grad_norm": 4.567865371704102, + "learning_rate": 9.985438843656742e-06, + "loss": 0.0841, + "step": 18917 + }, + { + "epoch": 51.54768392370572, + "grad_norm": 4.291372776031494, + "learning_rate": 9.98455635001446e-06, + "loss": 0.2191, + "step": 18918 + }, + { + "epoch": 51.55040871934605, + "grad_norm": 5.775290012359619, + "learning_rate": 9.983673856492457e-06, + "loss": 0.2156, + "step": 18919 + }, + { + "epoch": 51.55313351498638, + "grad_norm": 4.890861511230469, + "learning_rate": 9.982791363097602e-06, + "loss": 0.2356, + "step": 18920 + }, + { + "epoch": 51.555858310626704, + "grad_norm": 4.549856662750244, + "learning_rate": 9.981908869836767e-06, + "loss": 0.1903, + "step": 18921 + }, + { + "epoch": 51.55858310626703, + "grad_norm": 4.9609246253967285, + "learning_rate": 9.981026376716823e-06, + "loss": 0.2612, + "step": 18922 + }, + { + "epoch": 51.561307901907355, + "grad_norm": 4.6248393058776855, + "learning_rate": 9.98014388374465e-06, + "loss": 0.2277, + "step": 18923 + }, + { + "epoch": 51.56403269754768, + "grad_norm": 5.297659397125244, + "learning_rate": 9.97926139092711e-06, + "loss": 0.2539, + "step": 18924 + }, + { + "epoch": 51.566757493188014, + "grad_norm": 4.408740520477295, + "learning_rate": 9.978378898271087e-06, + "loss": 0.112, + "step": 18925 + }, + { + "epoch": 51.56948228882834, + "grad_norm": 5.680944442749023, + "learning_rate": 9.977496405783444e-06, + "loss": 0.1101, + "step": 18926 + }, + { + "epoch": 51.572207084468666, + "grad_norm": 4.534115314483643, + "learning_rate": 9.976613913471063e-06, + "loss": 0.2115, + "step": 18927 + }, + { + "epoch": 51.57493188010899, + "grad_norm": 4.632035732269287, + "learning_rate": 9.975731421340807e-06, + "loss": 0.1009, + "step": 18928 + }, + { + "epoch": 51.57765667574932, + "grad_norm": 3.959153175354004, + "learning_rate": 9.974848929399557e-06, + "loss": 0.3635, + "step": 18929 + }, + { + "epoch": 51.58038147138964, + "grad_norm": 4.5949177742004395, + "learning_rate": 9.973966437654182e-06, + "loss": 0.12, + "step": 18930 + }, + { + "epoch": 51.583106267029976, + "grad_norm": 4.820900917053223, + "learning_rate": 9.973083946111556e-06, + "loss": 0.2106, + "step": 18931 + }, + { + "epoch": 51.5858310626703, + "grad_norm": 4.429122447967529, + "learning_rate": 9.97220145477855e-06, + "loss": 0.1239, + "step": 18932 + }, + { + "epoch": 51.58855585831063, + "grad_norm": 4.48766565322876, + "learning_rate": 9.971318963662042e-06, + "loss": 0.1423, + "step": 18933 + }, + { + "epoch": 51.59128065395095, + "grad_norm": 4.9005126953125, + "learning_rate": 9.970436472768895e-06, + "loss": 0.1009, + "step": 18934 + }, + { + "epoch": 51.59400544959128, + "grad_norm": 3.8744966983795166, + "learning_rate": 9.969553982105988e-06, + "loss": 0.2056, + "step": 18935 + }, + { + "epoch": 51.596730245231605, + "grad_norm": 4.15589714050293, + "learning_rate": 9.968671491680197e-06, + "loss": 0.0911, + "step": 18936 + }, + { + "epoch": 51.59945504087194, + "grad_norm": 3.719292640686035, + "learning_rate": 9.96778900149839e-06, + "loss": 0.1378, + "step": 18937 + }, + { + "epoch": 51.60217983651226, + "grad_norm": 4.779216289520264, + "learning_rate": 9.966906511567443e-06, + "loss": 0.2018, + "step": 18938 + }, + { + "epoch": 51.60490463215259, + "grad_norm": 5.980700969696045, + "learning_rate": 9.966024021894226e-06, + "loss": 0.1083, + "step": 18939 + }, + { + "epoch": 51.607629427792915, + "grad_norm": 5.108234882354736, + "learning_rate": 9.965141532485613e-06, + "loss": 0.1925, + "step": 18940 + }, + { + "epoch": 51.61035422343324, + "grad_norm": 4.135683536529541, + "learning_rate": 9.964259043348476e-06, + "loss": 0.1219, + "step": 18941 + }, + { + "epoch": 51.61307901907357, + "grad_norm": 3.197345495223999, + "learning_rate": 9.963376554489691e-06, + "loss": 0.0701, + "step": 18942 + }, + { + "epoch": 51.6158038147139, + "grad_norm": 4.442191123962402, + "learning_rate": 9.962494065916124e-06, + "loss": 0.1184, + "step": 18943 + }, + { + "epoch": 51.618528610354225, + "grad_norm": 3.397578239440918, + "learning_rate": 9.961611577634655e-06, + "loss": 0.0821, + "step": 18944 + }, + { + "epoch": 51.62125340599455, + "grad_norm": 5.611720085144043, + "learning_rate": 9.960729089652153e-06, + "loss": 0.1397, + "step": 18945 + }, + { + "epoch": 51.62397820163488, + "grad_norm": 5.228200912475586, + "learning_rate": 9.95984660197549e-06, + "loss": 0.1119, + "step": 18946 + }, + { + "epoch": 51.6267029972752, + "grad_norm": 4.0746660232543945, + "learning_rate": 9.958964114611544e-06, + "loss": 0.3339, + "step": 18947 + }, + { + "epoch": 51.62942779291553, + "grad_norm": 4.019106388092041, + "learning_rate": 9.958081627567182e-06, + "loss": 0.0726, + "step": 18948 + }, + { + "epoch": 51.63215258855586, + "grad_norm": 5.064167022705078, + "learning_rate": 9.95719914084928e-06, + "loss": 0.0893, + "step": 18949 + }, + { + "epoch": 51.63487738419619, + "grad_norm": 5.4382805824279785, + "learning_rate": 9.956316654464706e-06, + "loss": 0.0875, + "step": 18950 + }, + { + "epoch": 51.63760217983651, + "grad_norm": 5.484139442443848, + "learning_rate": 9.95543416842034e-06, + "loss": 0.2185, + "step": 18951 + }, + { + "epoch": 51.64032697547684, + "grad_norm": 6.450892925262451, + "learning_rate": 9.95455168272305e-06, + "loss": 0.3215, + "step": 18952 + }, + { + "epoch": 51.643051771117165, + "grad_norm": 4.3288421630859375, + "learning_rate": 9.953669197379708e-06, + "loss": 0.1527, + "step": 18953 + }, + { + "epoch": 51.64577656675749, + "grad_norm": 4.621757507324219, + "learning_rate": 9.952786712397191e-06, + "loss": 0.1524, + "step": 18954 + }, + { + "epoch": 51.64850136239782, + "grad_norm": 5.470773220062256, + "learning_rate": 9.95190422778237e-06, + "loss": 0.1019, + "step": 18955 + }, + { + "epoch": 51.65122615803815, + "grad_norm": 4.634878635406494, + "learning_rate": 9.951021743542119e-06, + "loss": 0.1514, + "step": 18956 + }, + { + "epoch": 51.653950953678475, + "grad_norm": 4.923651218414307, + "learning_rate": 9.950139259683305e-06, + "loss": 0.2577, + "step": 18957 + }, + { + "epoch": 51.6566757493188, + "grad_norm": 4.08267879486084, + "learning_rate": 9.949256776212808e-06, + "loss": 0.1605, + "step": 18958 + }, + { + "epoch": 51.65940054495913, + "grad_norm": 6.271906852722168, + "learning_rate": 9.948374293137496e-06, + "loss": 0.152, + "step": 18959 + }, + { + "epoch": 51.66212534059945, + "grad_norm": 4.404917240142822, + "learning_rate": 9.947491810464246e-06, + "loss": 0.2029, + "step": 18960 + }, + { + "epoch": 51.664850136239785, + "grad_norm": 4.689579963684082, + "learning_rate": 9.946609328199926e-06, + "loss": 0.092, + "step": 18961 + }, + { + "epoch": 51.66757493188011, + "grad_norm": 5.952474594116211, + "learning_rate": 9.94572684635141e-06, + "loss": 0.1792, + "step": 18962 + }, + { + "epoch": 51.67029972752044, + "grad_norm": 5.2045722007751465, + "learning_rate": 9.944844364925574e-06, + "loss": 0.295, + "step": 18963 + }, + { + "epoch": 51.67302452316076, + "grad_norm": 6.426792144775391, + "learning_rate": 9.943961883929287e-06, + "loss": 0.2517, + "step": 18964 + }, + { + "epoch": 51.67574931880109, + "grad_norm": 4.43955135345459, + "learning_rate": 9.943079403369423e-06, + "loss": 0.1677, + "step": 18965 + }, + { + "epoch": 51.678474114441414, + "grad_norm": 4.113171577453613, + "learning_rate": 9.942196923252855e-06, + "loss": 0.1186, + "step": 18966 + }, + { + "epoch": 51.68119891008175, + "grad_norm": 3.726844549179077, + "learning_rate": 9.941314443586454e-06, + "loss": 0.1156, + "step": 18967 + }, + { + "epoch": 51.68392370572207, + "grad_norm": 4.087982654571533, + "learning_rate": 9.940431964377094e-06, + "loss": 0.1668, + "step": 18968 + }, + { + "epoch": 51.6866485013624, + "grad_norm": 5.609523773193359, + "learning_rate": 9.93954948563165e-06, + "loss": 0.1342, + "step": 18969 + }, + { + "epoch": 51.689373297002724, + "grad_norm": 4.390143871307373, + "learning_rate": 9.938667007356991e-06, + "loss": 0.1868, + "step": 18970 + }, + { + "epoch": 51.69209809264305, + "grad_norm": 8.819103240966797, + "learning_rate": 9.93778452955999e-06, + "loss": 0.1333, + "step": 18971 + }, + { + "epoch": 51.694822888283376, + "grad_norm": 4.704899311065674, + "learning_rate": 9.936902052247525e-06, + "loss": 0.0866, + "step": 18972 + }, + { + "epoch": 51.69754768392371, + "grad_norm": 2.8743555545806885, + "learning_rate": 9.936019575426462e-06, + "loss": 0.0636, + "step": 18973 + }, + { + "epoch": 51.700272479564035, + "grad_norm": 6.211526393890381, + "learning_rate": 9.935137099103678e-06, + "loss": 0.2033, + "step": 18974 + }, + { + "epoch": 51.70299727520436, + "grad_norm": 4.9399871826171875, + "learning_rate": 9.934254623286043e-06, + "loss": 0.1494, + "step": 18975 + }, + { + "epoch": 51.705722070844686, + "grad_norm": 4.001533031463623, + "learning_rate": 9.933372147980434e-06, + "loss": 0.2128, + "step": 18976 + }, + { + "epoch": 51.70844686648501, + "grad_norm": 4.183261871337891, + "learning_rate": 9.932489673193718e-06, + "loss": 0.1497, + "step": 18977 + }, + { + "epoch": 51.71117166212534, + "grad_norm": 4.518909454345703, + "learning_rate": 9.931607198932771e-06, + "loss": 0.1536, + "step": 18978 + }, + { + "epoch": 51.71389645776567, + "grad_norm": 4.9194488525390625, + "learning_rate": 9.930724725204463e-06, + "loss": 0.1351, + "step": 18979 + }, + { + "epoch": 51.716621253406, + "grad_norm": 4.825377941131592, + "learning_rate": 9.929842252015672e-06, + "loss": 0.1188, + "step": 18980 + }, + { + "epoch": 51.71934604904632, + "grad_norm": 6.563079833984375, + "learning_rate": 9.928959779373265e-06, + "loss": 0.1064, + "step": 18981 + }, + { + "epoch": 51.72207084468665, + "grad_norm": 4.544953346252441, + "learning_rate": 9.928077307284118e-06, + "loss": 0.2616, + "step": 18982 + }, + { + "epoch": 51.724795640326974, + "grad_norm": 4.771892547607422, + "learning_rate": 9.9271948357551e-06, + "loss": 0.1276, + "step": 18983 + }, + { + "epoch": 51.7275204359673, + "grad_norm": 6.476113319396973, + "learning_rate": 9.92631236479309e-06, + "loss": 0.2689, + "step": 18984 + }, + { + "epoch": 51.73024523160763, + "grad_norm": 5.970198154449463, + "learning_rate": 9.925429894404955e-06, + "loss": 0.285, + "step": 18985 + }, + { + "epoch": 51.73297002724796, + "grad_norm": 4.367156505584717, + "learning_rate": 9.92454742459757e-06, + "loss": 0.1528, + "step": 18986 + }, + { + "epoch": 51.735694822888284, + "grad_norm": 5.05354118347168, + "learning_rate": 9.923664955377802e-06, + "loss": 0.1256, + "step": 18987 + }, + { + "epoch": 51.73841961852861, + "grad_norm": 4.834817886352539, + "learning_rate": 9.922782486752537e-06, + "loss": 0.1377, + "step": 18988 + }, + { + "epoch": 51.741144414168936, + "grad_norm": 3.8790314197540283, + "learning_rate": 9.921900018728634e-06, + "loss": 0.2363, + "step": 18989 + }, + { + "epoch": 51.74386920980926, + "grad_norm": 4.6017560958862305, + "learning_rate": 9.921017551312975e-06, + "loss": 0.213, + "step": 18990 + }, + { + "epoch": 51.746594005449595, + "grad_norm": 11.591754913330078, + "learning_rate": 9.920135084512425e-06, + "loss": 0.1818, + "step": 18991 + }, + { + "epoch": 51.74931880108992, + "grad_norm": 6.721871376037598, + "learning_rate": 9.919252618333864e-06, + "loss": 0.1454, + "step": 18992 + }, + { + "epoch": 51.752043596730246, + "grad_norm": 5.192331314086914, + "learning_rate": 9.918370152784158e-06, + "loss": 0.113, + "step": 18993 + }, + { + "epoch": 51.75476839237057, + "grad_norm": 4.748659610748291, + "learning_rate": 9.917487687870187e-06, + "loss": 0.1944, + "step": 18994 + }, + { + "epoch": 51.7574931880109, + "grad_norm": 5.543908596038818, + "learning_rate": 9.916605223598815e-06, + "loss": 0.1583, + "step": 18995 + }, + { + "epoch": 51.76021798365122, + "grad_norm": 4.537134170532227, + "learning_rate": 9.915722759976923e-06, + "loss": 0.1149, + "step": 18996 + }, + { + "epoch": 51.762942779291556, + "grad_norm": 5.6749677658081055, + "learning_rate": 9.914840297011376e-06, + "loss": 0.1267, + "step": 18997 + }, + { + "epoch": 51.76566757493188, + "grad_norm": 4.887343406677246, + "learning_rate": 9.913957834709051e-06, + "loss": 0.2384, + "step": 18998 + }, + { + "epoch": 51.76839237057221, + "grad_norm": 4.104245662689209, + "learning_rate": 9.913075373076819e-06, + "loss": 0.1162, + "step": 18999 + }, + { + "epoch": 51.771117166212534, + "grad_norm": 4.365303039550781, + "learning_rate": 9.912192912121554e-06, + "loss": 0.1506, + "step": 19000 + }, + { + "epoch": 51.77384196185286, + "grad_norm": 3.8478541374206543, + "learning_rate": 9.911310451850127e-06, + "loss": 0.0982, + "step": 19001 + }, + { + "epoch": 51.776566757493185, + "grad_norm": 5.014444828033447, + "learning_rate": 9.910427992269414e-06, + "loss": 0.2771, + "step": 19002 + }, + { + "epoch": 51.77929155313352, + "grad_norm": 4.454366683959961, + "learning_rate": 9.909545533386281e-06, + "loss": 0.2987, + "step": 19003 + }, + { + "epoch": 51.782016348773844, + "grad_norm": 3.6813745498657227, + "learning_rate": 9.908663075207602e-06, + "loss": 0.1858, + "step": 19004 + }, + { + "epoch": 51.78474114441417, + "grad_norm": 7.667509078979492, + "learning_rate": 9.907780617740258e-06, + "loss": 0.1968, + "step": 19005 + }, + { + "epoch": 51.787465940054496, + "grad_norm": 4.544261932373047, + "learning_rate": 9.906898160991113e-06, + "loss": 0.1412, + "step": 19006 + }, + { + "epoch": 51.79019073569482, + "grad_norm": 4.070530414581299, + "learning_rate": 9.906015704967044e-06, + "loss": 0.1038, + "step": 19007 + }, + { + "epoch": 51.79291553133515, + "grad_norm": 4.835860729217529, + "learning_rate": 9.90513324967492e-06, + "loss": 0.2113, + "step": 19008 + }, + { + "epoch": 51.79564032697548, + "grad_norm": 7.1134033203125, + "learning_rate": 9.904250795121614e-06, + "loss": 0.3214, + "step": 19009 + }, + { + "epoch": 51.798365122615806, + "grad_norm": 5.900073051452637, + "learning_rate": 9.903368341314003e-06, + "loss": 0.11, + "step": 19010 + }, + { + "epoch": 51.80108991825613, + "grad_norm": 5.206643104553223, + "learning_rate": 9.902485888258953e-06, + "loss": 0.1453, + "step": 19011 + }, + { + "epoch": 51.80381471389646, + "grad_norm": 5.340708255767822, + "learning_rate": 9.901603435963343e-06, + "loss": 0.0987, + "step": 19012 + }, + { + "epoch": 51.80653950953678, + "grad_norm": 5.448592662811279, + "learning_rate": 9.90072098443404e-06, + "loss": 0.1181, + "step": 19013 + }, + { + "epoch": 51.80926430517711, + "grad_norm": 5.2505011558532715, + "learning_rate": 9.899838533677922e-06, + "loss": 0.0873, + "step": 19014 + }, + { + "epoch": 51.81198910081744, + "grad_norm": 4.6900739669799805, + "learning_rate": 9.898956083701854e-06, + "loss": 0.1025, + "step": 19015 + }, + { + "epoch": 51.81471389645777, + "grad_norm": 7.396714687347412, + "learning_rate": 9.898073634512717e-06, + "loss": 0.0938, + "step": 19016 + }, + { + "epoch": 51.817438692098094, + "grad_norm": 4.672626972198486, + "learning_rate": 9.897191186117375e-06, + "loss": 0.2453, + "step": 19017 + }, + { + "epoch": 51.82016348773842, + "grad_norm": 4.7493720054626465, + "learning_rate": 9.896308738522708e-06, + "loss": 0.1075, + "step": 19018 + }, + { + "epoch": 51.822888283378745, + "grad_norm": 4.544273853302002, + "learning_rate": 9.895426291735582e-06, + "loss": 0.3212, + "step": 19019 + }, + { + "epoch": 51.82561307901907, + "grad_norm": 4.8066792488098145, + "learning_rate": 9.894543845762876e-06, + "loss": 0.158, + "step": 19020 + }, + { + "epoch": 51.828337874659404, + "grad_norm": 4.690978527069092, + "learning_rate": 9.893661400611456e-06, + "loss": 0.1431, + "step": 19021 + }, + { + "epoch": 51.83106267029973, + "grad_norm": 5.638887882232666, + "learning_rate": 9.892778956288198e-06, + "loss": 0.1434, + "step": 19022 + }, + { + "epoch": 51.833787465940055, + "grad_norm": 5.1739068031311035, + "learning_rate": 9.891896512799975e-06, + "loss": 0.2879, + "step": 19023 + }, + { + "epoch": 51.83651226158038, + "grad_norm": 7.537215232849121, + "learning_rate": 9.891014070153658e-06, + "loss": 0.1211, + "step": 19024 + }, + { + "epoch": 51.83923705722071, + "grad_norm": 6.0180535316467285, + "learning_rate": 9.890131628356122e-06, + "loss": 0.1376, + "step": 19025 + }, + { + "epoch": 51.84196185286103, + "grad_norm": 4.283379077911377, + "learning_rate": 9.889249187414235e-06, + "loss": 0.0915, + "step": 19026 + }, + { + "epoch": 51.844686648501366, + "grad_norm": 5.555041790008545, + "learning_rate": 9.888366747334873e-06, + "loss": 0.1199, + "step": 19027 + }, + { + "epoch": 51.84741144414169, + "grad_norm": 4.932379722595215, + "learning_rate": 9.887484308124907e-06, + "loss": 0.1198, + "step": 19028 + }, + { + "epoch": 51.85013623978202, + "grad_norm": 4.495264530181885, + "learning_rate": 9.88660186979121e-06, + "loss": 0.188, + "step": 19029 + }, + { + "epoch": 51.85286103542234, + "grad_norm": 6.212512493133545, + "learning_rate": 9.885719432340652e-06, + "loss": 0.2284, + "step": 19030 + }, + { + "epoch": 51.85558583106267, + "grad_norm": 4.427855491638184, + "learning_rate": 9.884836995780109e-06, + "loss": 0.2725, + "step": 19031 + }, + { + "epoch": 51.858310626702995, + "grad_norm": 4.954310417175293, + "learning_rate": 9.883954560116452e-06, + "loss": 0.1135, + "step": 19032 + }, + { + "epoch": 51.86103542234333, + "grad_norm": 4.122082233428955, + "learning_rate": 9.883072125356552e-06, + "loss": 0.0942, + "step": 19033 + }, + { + "epoch": 51.86376021798365, + "grad_norm": 3.8311758041381836, + "learning_rate": 9.882189691507285e-06, + "loss": 0.1667, + "step": 19034 + }, + { + "epoch": 51.86648501362398, + "grad_norm": 5.232621669769287, + "learning_rate": 9.881307258575519e-06, + "loss": 0.1082, + "step": 19035 + }, + { + "epoch": 51.869209809264305, + "grad_norm": 5.181174278259277, + "learning_rate": 9.880424826568128e-06, + "loss": 0.1105, + "step": 19036 + }, + { + "epoch": 51.87193460490463, + "grad_norm": 6.016700267791748, + "learning_rate": 9.879542395491984e-06, + "loss": 0.1191, + "step": 19037 + }, + { + "epoch": 51.87465940054496, + "grad_norm": 5.201912879943848, + "learning_rate": 9.878659965353964e-06, + "loss": 0.1178, + "step": 19038 + }, + { + "epoch": 51.87738419618529, + "grad_norm": 6.831856727600098, + "learning_rate": 9.87777753616093e-06, + "loss": 0.1596, + "step": 19039 + }, + { + "epoch": 51.880108991825615, + "grad_norm": 4.478147029876709, + "learning_rate": 9.876895107919761e-06, + "loss": 0.1235, + "step": 19040 + }, + { + "epoch": 51.88283378746594, + "grad_norm": 5.386390686035156, + "learning_rate": 9.876012680637334e-06, + "loss": 0.14, + "step": 19041 + }, + { + "epoch": 51.88555858310627, + "grad_norm": 6.98453426361084, + "learning_rate": 9.875130254320513e-06, + "loss": 0.1128, + "step": 19042 + }, + { + "epoch": 51.88828337874659, + "grad_norm": 13.316817283630371, + "learning_rate": 9.874247828976176e-06, + "loss": 0.2634, + "step": 19043 + }, + { + "epoch": 51.89100817438692, + "grad_norm": 4.4534759521484375, + "learning_rate": 9.87336540461119e-06, + "loss": 0.2525, + "step": 19044 + }, + { + "epoch": 51.89373297002725, + "grad_norm": 4.711284160614014, + "learning_rate": 9.872482981232434e-06, + "loss": 0.1092, + "step": 19045 + }, + { + "epoch": 51.89645776566758, + "grad_norm": 4.004992961883545, + "learning_rate": 9.871600558846772e-06, + "loss": 0.2462, + "step": 19046 + }, + { + "epoch": 51.8991825613079, + "grad_norm": 6.234788417816162, + "learning_rate": 9.870718137461085e-06, + "loss": 0.1602, + "step": 19047 + }, + { + "epoch": 51.90190735694823, + "grad_norm": 4.16002893447876, + "learning_rate": 9.869835717082237e-06, + "loss": 0.1424, + "step": 19048 + }, + { + "epoch": 51.904632152588555, + "grad_norm": 5.75315523147583, + "learning_rate": 9.868953297717108e-06, + "loss": 0.1034, + "step": 19049 + }, + { + "epoch": 51.90735694822888, + "grad_norm": 5.9653239250183105, + "learning_rate": 9.868070879372563e-06, + "loss": 0.1137, + "step": 19050 + }, + { + "epoch": 51.91008174386921, + "grad_norm": 4.411348819732666, + "learning_rate": 9.867188462055482e-06, + "loss": 0.1898, + "step": 19051 + }, + { + "epoch": 51.91280653950954, + "grad_norm": 5.087191104888916, + "learning_rate": 9.86630604577273e-06, + "loss": 0.1411, + "step": 19052 + }, + { + "epoch": 51.915531335149865, + "grad_norm": 7.6265788078308105, + "learning_rate": 9.865423630531182e-06, + "loss": 0.0907, + "step": 19053 + }, + { + "epoch": 51.91825613079019, + "grad_norm": 4.868733882904053, + "learning_rate": 9.86454121633771e-06, + "loss": 0.1693, + "step": 19054 + }, + { + "epoch": 51.920980926430516, + "grad_norm": 4.471322536468506, + "learning_rate": 9.863658803199187e-06, + "loss": 0.1086, + "step": 19055 + }, + { + "epoch": 51.92370572207084, + "grad_norm": 3.931206226348877, + "learning_rate": 9.862776391122482e-06, + "loss": 0.1117, + "step": 19056 + }, + { + "epoch": 51.926430517711175, + "grad_norm": 4.475884914398193, + "learning_rate": 9.861893980114475e-06, + "loss": 0.0922, + "step": 19057 + }, + { + "epoch": 51.9291553133515, + "grad_norm": 5.323555946350098, + "learning_rate": 9.86101157018203e-06, + "loss": 0.1027, + "step": 19058 + }, + { + "epoch": 51.93188010899183, + "grad_norm": 4.618867874145508, + "learning_rate": 9.860129161332026e-06, + "loss": 0.2802, + "step": 19059 + }, + { + "epoch": 51.93460490463215, + "grad_norm": 5.137905597686768, + "learning_rate": 9.859246753571328e-06, + "loss": 0.1069, + "step": 19060 + }, + { + "epoch": 51.93732970027248, + "grad_norm": 5.134658336639404, + "learning_rate": 9.858364346906814e-06, + "loss": 0.1496, + "step": 19061 + }, + { + "epoch": 51.940054495912804, + "grad_norm": 5.088315010070801, + "learning_rate": 9.857481941345354e-06, + "loss": 0.1792, + "step": 19062 + }, + { + "epoch": 51.94277929155314, + "grad_norm": 4.330304145812988, + "learning_rate": 9.856599536893821e-06, + "loss": 0.1337, + "step": 19063 + }, + { + "epoch": 51.94550408719346, + "grad_norm": 4.265829563140869, + "learning_rate": 9.855717133559082e-06, + "loss": 0.3549, + "step": 19064 + }, + { + "epoch": 51.94822888283379, + "grad_norm": 5.327817440032959, + "learning_rate": 9.854834731348017e-06, + "loss": 0.1134, + "step": 19065 + }, + { + "epoch": 51.950953678474114, + "grad_norm": 4.612740993499756, + "learning_rate": 9.853952330267494e-06, + "loss": 0.1141, + "step": 19066 + }, + { + "epoch": 51.95367847411444, + "grad_norm": 5.05368709564209, + "learning_rate": 9.853069930324386e-06, + "loss": 0.1647, + "step": 19067 + }, + { + "epoch": 51.956403269754766, + "grad_norm": 8.820033073425293, + "learning_rate": 9.852187531525563e-06, + "loss": 0.2022, + "step": 19068 + }, + { + "epoch": 51.95912806539509, + "grad_norm": 7.538532733917236, + "learning_rate": 9.8513051338779e-06, + "loss": 0.1246, + "step": 19069 + }, + { + "epoch": 51.961852861035425, + "grad_norm": 9.275288581848145, + "learning_rate": 9.850422737388266e-06, + "loss": 0.1403, + "step": 19070 + }, + { + "epoch": 51.96457765667575, + "grad_norm": 4.492852210998535, + "learning_rate": 9.849540342063538e-06, + "loss": 0.0984, + "step": 19071 + }, + { + "epoch": 51.967302452316076, + "grad_norm": 5.652397632598877, + "learning_rate": 9.848657947910582e-06, + "loss": 0.2101, + "step": 19072 + }, + { + "epoch": 51.9700272479564, + "grad_norm": 4.326151371002197, + "learning_rate": 9.84777555493627e-06, + "loss": 0.3379, + "step": 19073 + }, + { + "epoch": 51.97275204359673, + "grad_norm": 7.145446300506592, + "learning_rate": 9.84689316314748e-06, + "loss": 0.1147, + "step": 19074 + }, + { + "epoch": 51.97547683923706, + "grad_norm": 5.152425765991211, + "learning_rate": 9.846010772551083e-06, + "loss": 0.1434, + "step": 19075 + }, + { + "epoch": 51.97820163487739, + "grad_norm": 4.132455825805664, + "learning_rate": 9.845128383153948e-06, + "loss": 0.1292, + "step": 19076 + }, + { + "epoch": 51.98092643051771, + "grad_norm": 5.042201995849609, + "learning_rate": 9.84424599496295e-06, + "loss": 0.2215, + "step": 19077 + }, + { + "epoch": 51.98365122615804, + "grad_norm": 4.171875476837158, + "learning_rate": 9.843363607984957e-06, + "loss": 0.1582, + "step": 19078 + }, + { + "epoch": 51.986376021798364, + "grad_norm": 5.28590726852417, + "learning_rate": 9.842481222226845e-06, + "loss": 0.1508, + "step": 19079 + }, + { + "epoch": 51.98910081743869, + "grad_norm": 5.6133198738098145, + "learning_rate": 9.841598837695482e-06, + "loss": 0.1724, + "step": 19080 + }, + { + "epoch": 51.991825613079016, + "grad_norm": 4.963491439819336, + "learning_rate": 9.840716454397746e-06, + "loss": 0.1653, + "step": 19081 + }, + { + "epoch": 51.99455040871935, + "grad_norm": 5.135807991027832, + "learning_rate": 9.8398340723405e-06, + "loss": 0.1413, + "step": 19082 + }, + { + "epoch": 51.997275204359674, + "grad_norm": 5.180513858795166, + "learning_rate": 9.838951691530625e-06, + "loss": 0.1247, + "step": 19083 + }, + { + "epoch": 52.0, + "grad_norm": 3.206604242324829, + "learning_rate": 9.838069311974986e-06, + "loss": 0.0588, + "step": 19084 + }, + { + "epoch": 52.002724795640326, + "grad_norm": 5.357468605041504, + "learning_rate": 9.837186933680462e-06, + "loss": 0.1203, + "step": 19085 + }, + { + "epoch": 52.00544959128065, + "grad_norm": 4.185212135314941, + "learning_rate": 9.836304556653916e-06, + "loss": 0.1916, + "step": 19086 + }, + { + "epoch": 52.00817438692098, + "grad_norm": 5.570226192474365, + "learning_rate": 9.835422180902228e-06, + "loss": 0.1843, + "step": 19087 + }, + { + "epoch": 52.01089918256131, + "grad_norm": 4.808948040008545, + "learning_rate": 9.834539806432267e-06, + "loss": 0.1085, + "step": 19088 + }, + { + "epoch": 52.013623978201636, + "grad_norm": 4.601601600646973, + "learning_rate": 9.833657433250904e-06, + "loss": 0.1868, + "step": 19089 + }, + { + "epoch": 52.01634877384196, + "grad_norm": 7.2745361328125, + "learning_rate": 9.832775061365008e-06, + "loss": 0.0949, + "step": 19090 + }, + { + "epoch": 52.01907356948229, + "grad_norm": 4.245944976806641, + "learning_rate": 9.831892690781457e-06, + "loss": 0.1617, + "step": 19091 + }, + { + "epoch": 52.02179836512261, + "grad_norm": 3.1831865310668945, + "learning_rate": 9.831010321507122e-06, + "loss": 0.1959, + "step": 19092 + }, + { + "epoch": 52.02452316076294, + "grad_norm": 4.060930252075195, + "learning_rate": 9.830127953548872e-06, + "loss": 0.0862, + "step": 19093 + }, + { + "epoch": 52.02724795640327, + "grad_norm": 4.801197528839111, + "learning_rate": 9.82924558691358e-06, + "loss": 0.1185, + "step": 19094 + }, + { + "epoch": 52.0299727520436, + "grad_norm": 6.656748294830322, + "learning_rate": 9.828363221608118e-06, + "loss": 0.0909, + "step": 19095 + }, + { + "epoch": 52.032697547683924, + "grad_norm": 6.821707725524902, + "learning_rate": 9.827480857639357e-06, + "loss": 0.161, + "step": 19096 + }, + { + "epoch": 52.03542234332425, + "grad_norm": 3.8699491024017334, + "learning_rate": 9.826598495014172e-06, + "loss": 0.1075, + "step": 19097 + }, + { + "epoch": 52.038147138964575, + "grad_norm": 3.5079822540283203, + "learning_rate": 9.82571613373943e-06, + "loss": 0.1131, + "step": 19098 + }, + { + "epoch": 52.0408719346049, + "grad_norm": 3.8385355472564697, + "learning_rate": 9.824833773822006e-06, + "loss": 0.2495, + "step": 19099 + }, + { + "epoch": 52.043596730245234, + "grad_norm": 6.233022212982178, + "learning_rate": 9.82395141526877e-06, + "loss": 0.1038, + "step": 19100 + }, + { + "epoch": 52.04632152588556, + "grad_norm": 5.880666255950928, + "learning_rate": 9.823069058086597e-06, + "loss": 0.1858, + "step": 19101 + }, + { + "epoch": 52.049046321525886, + "grad_norm": 5.460610389709473, + "learning_rate": 9.822186702282354e-06, + "loss": 0.2856, + "step": 19102 + }, + { + "epoch": 52.05177111716621, + "grad_norm": 4.017082214355469, + "learning_rate": 9.821304347862917e-06, + "loss": 0.1405, + "step": 19103 + }, + { + "epoch": 52.05449591280654, + "grad_norm": 7.076798915863037, + "learning_rate": 9.820421994835154e-06, + "loss": 0.2079, + "step": 19104 + }, + { + "epoch": 52.05722070844686, + "grad_norm": 4.44091272354126, + "learning_rate": 9.81953964320594e-06, + "loss": 0.0803, + "step": 19105 + }, + { + "epoch": 52.059945504087196, + "grad_norm": 5.3109564781188965, + "learning_rate": 9.818657292982146e-06, + "loss": 0.1039, + "step": 19106 + }, + { + "epoch": 52.06267029972752, + "grad_norm": 4.658829689025879, + "learning_rate": 9.817774944170638e-06, + "loss": 0.1626, + "step": 19107 + }, + { + "epoch": 52.06539509536785, + "grad_norm": 4.813467502593994, + "learning_rate": 9.816892596778299e-06, + "loss": 0.1605, + "step": 19108 + }, + { + "epoch": 52.06811989100817, + "grad_norm": 4.176400184631348, + "learning_rate": 9.816010250811993e-06, + "loss": 0.2054, + "step": 19109 + }, + { + "epoch": 52.0708446866485, + "grad_norm": 8.531670570373535, + "learning_rate": 9.815127906278595e-06, + "loss": 0.2266, + "step": 19110 + }, + { + "epoch": 52.073569482288825, + "grad_norm": 4.211588382720947, + "learning_rate": 9.814245563184971e-06, + "loss": 0.2232, + "step": 19111 + }, + { + "epoch": 52.07629427792916, + "grad_norm": 4.5949387550354, + "learning_rate": 9.813363221538e-06, + "loss": 0.1642, + "step": 19112 + }, + { + "epoch": 52.079019073569484, + "grad_norm": 4.175572872161865, + "learning_rate": 9.812480881344548e-06, + "loss": 0.1366, + "step": 19113 + }, + { + "epoch": 52.08174386920981, + "grad_norm": 3.458845615386963, + "learning_rate": 9.811598542611492e-06, + "loss": 0.1829, + "step": 19114 + }, + { + "epoch": 52.084468664850135, + "grad_norm": 4.565491676330566, + "learning_rate": 9.810716205345695e-06, + "loss": 0.2216, + "step": 19115 + }, + { + "epoch": 52.08719346049046, + "grad_norm": 4.427910804748535, + "learning_rate": 9.80983386955404e-06, + "loss": 0.1551, + "step": 19116 + }, + { + "epoch": 52.08991825613079, + "grad_norm": 4.134413719177246, + "learning_rate": 9.808951535243389e-06, + "loss": 0.2118, + "step": 19117 + }, + { + "epoch": 52.09264305177112, + "grad_norm": 4.23202657699585, + "learning_rate": 9.808069202420617e-06, + "loss": 0.1259, + "step": 19118 + }, + { + "epoch": 52.095367847411445, + "grad_norm": 3.89436936378479, + "learning_rate": 9.8071868710926e-06, + "loss": 0.2316, + "step": 19119 + }, + { + "epoch": 52.09809264305177, + "grad_norm": 5.763807773590088, + "learning_rate": 9.8063045412662e-06, + "loss": 0.1645, + "step": 19120 + }, + { + "epoch": 52.1008174386921, + "grad_norm": 4.004239082336426, + "learning_rate": 9.805422212948297e-06, + "loss": 0.0766, + "step": 19121 + }, + { + "epoch": 52.10354223433242, + "grad_norm": 3.9072365760803223, + "learning_rate": 9.80453988614576e-06, + "loss": 0.1027, + "step": 19122 + }, + { + "epoch": 52.10626702997275, + "grad_norm": 4.546239852905273, + "learning_rate": 9.80365756086546e-06, + "loss": 0.2511, + "step": 19123 + }, + { + "epoch": 52.10899182561308, + "grad_norm": 3.611271858215332, + "learning_rate": 9.802775237114267e-06, + "loss": 0.0702, + "step": 19124 + }, + { + "epoch": 52.11171662125341, + "grad_norm": 4.813879489898682, + "learning_rate": 9.801892914899051e-06, + "loss": 0.1756, + "step": 19125 + }, + { + "epoch": 52.11444141689373, + "grad_norm": 3.95748233795166, + "learning_rate": 9.801010594226691e-06, + "loss": 0.1067, + "step": 19126 + }, + { + "epoch": 52.11716621253406, + "grad_norm": 3.612278461456299, + "learning_rate": 9.800128275104054e-06, + "loss": 0.0726, + "step": 19127 + }, + { + "epoch": 52.119891008174385, + "grad_norm": 3.7307493686676025, + "learning_rate": 9.799245957538013e-06, + "loss": 0.0693, + "step": 19128 + }, + { + "epoch": 52.12261580381471, + "grad_norm": 4.682528972625732, + "learning_rate": 9.798363641535434e-06, + "loss": 0.1538, + "step": 19129 + }, + { + "epoch": 52.12534059945504, + "grad_norm": 4.460844039916992, + "learning_rate": 9.797481327103196e-06, + "loss": 0.1456, + "step": 19130 + }, + { + "epoch": 52.12806539509537, + "grad_norm": 4.052233695983887, + "learning_rate": 9.796599014248164e-06, + "loss": 0.0777, + "step": 19131 + }, + { + "epoch": 52.130790190735695, + "grad_norm": 6.026838779449463, + "learning_rate": 9.795716702977216e-06, + "loss": 0.0797, + "step": 19132 + }, + { + "epoch": 52.13351498637602, + "grad_norm": 4.016129016876221, + "learning_rate": 9.794834393297217e-06, + "loss": 0.1709, + "step": 19133 + }, + { + "epoch": 52.13623978201635, + "grad_norm": 3.1839075088500977, + "learning_rate": 9.793952085215043e-06, + "loss": 0.0997, + "step": 19134 + }, + { + "epoch": 52.13896457765667, + "grad_norm": 5.489106178283691, + "learning_rate": 9.793069778737561e-06, + "loss": 0.2695, + "step": 19135 + }, + { + "epoch": 52.141689373297005, + "grad_norm": 4.77548885345459, + "learning_rate": 9.792187473871648e-06, + "loss": 0.3013, + "step": 19136 + }, + { + "epoch": 52.14441416893733, + "grad_norm": 4.23523473739624, + "learning_rate": 9.79130517062417e-06, + "loss": 0.1891, + "step": 19137 + }, + { + "epoch": 52.14713896457766, + "grad_norm": 4.312173366546631, + "learning_rate": 9.790422869002003e-06, + "loss": 0.1265, + "step": 19138 + }, + { + "epoch": 52.14986376021798, + "grad_norm": 5.366184711456299, + "learning_rate": 9.789540569012012e-06, + "loss": 0.0827, + "step": 19139 + }, + { + "epoch": 52.15258855585831, + "grad_norm": 6.901341915130615, + "learning_rate": 9.788658270661076e-06, + "loss": 0.1, + "step": 19140 + }, + { + "epoch": 52.155313351498634, + "grad_norm": 4.667526721954346, + "learning_rate": 9.78777597395606e-06, + "loss": 0.1889, + "step": 19141 + }, + { + "epoch": 52.15803814713897, + "grad_norm": 5.528557777404785, + "learning_rate": 9.786893678903835e-06, + "loss": 0.1324, + "step": 19142 + }, + { + "epoch": 52.16076294277929, + "grad_norm": 3.8147330284118652, + "learning_rate": 9.786011385511279e-06, + "loss": 0.0893, + "step": 19143 + }, + { + "epoch": 52.16348773841962, + "grad_norm": 3.9426429271698, + "learning_rate": 9.78512909378526e-06, + "loss": 0.0894, + "step": 19144 + }, + { + "epoch": 52.166212534059945, + "grad_norm": 4.193362236022949, + "learning_rate": 9.784246803732648e-06, + "loss": 0.1798, + "step": 19145 + }, + { + "epoch": 52.16893732970027, + "grad_norm": 3.5375497341156006, + "learning_rate": 9.783364515360315e-06, + "loss": 0.1651, + "step": 19146 + }, + { + "epoch": 52.171662125340596, + "grad_norm": 10.843406677246094, + "learning_rate": 9.782482228675132e-06, + "loss": 0.3171, + "step": 19147 + }, + { + "epoch": 52.17438692098093, + "grad_norm": 4.114462852478027, + "learning_rate": 9.781599943683972e-06, + "loss": 0.1131, + "step": 19148 + }, + { + "epoch": 52.177111716621255, + "grad_norm": 4.447324752807617, + "learning_rate": 9.780717660393702e-06, + "loss": 0.2078, + "step": 19149 + }, + { + "epoch": 52.17983651226158, + "grad_norm": 15.412213325500488, + "learning_rate": 9.7798353788112e-06, + "loss": 0.1368, + "step": 19150 + }, + { + "epoch": 52.182561307901906, + "grad_norm": 4.740209102630615, + "learning_rate": 9.778953098943329e-06, + "loss": 0.164, + "step": 19151 + }, + { + "epoch": 52.18528610354223, + "grad_norm": 4.917448997497559, + "learning_rate": 9.778070820796966e-06, + "loss": 0.1054, + "step": 19152 + }, + { + "epoch": 52.18801089918256, + "grad_norm": 4.078722953796387, + "learning_rate": 9.777188544378979e-06, + "loss": 0.2942, + "step": 19153 + }, + { + "epoch": 52.19073569482289, + "grad_norm": 7.165360927581787, + "learning_rate": 9.77630626969624e-06, + "loss": 0.1162, + "step": 19154 + }, + { + "epoch": 52.19346049046322, + "grad_norm": 6.1595258712768555, + "learning_rate": 9.775423996755622e-06, + "loss": 0.1511, + "step": 19155 + }, + { + "epoch": 52.19618528610354, + "grad_norm": 4.429165363311768, + "learning_rate": 9.774541725563996e-06, + "loss": 0.0787, + "step": 19156 + }, + { + "epoch": 52.19891008174387, + "grad_norm": 4.14840841293335, + "learning_rate": 9.773659456128229e-06, + "loss": 0.1928, + "step": 19157 + }, + { + "epoch": 52.201634877384194, + "grad_norm": 4.104926109313965, + "learning_rate": 9.772777188455196e-06, + "loss": 0.0826, + "step": 19158 + }, + { + "epoch": 52.20435967302452, + "grad_norm": 6.021915435791016, + "learning_rate": 9.771894922551763e-06, + "loss": 0.2946, + "step": 19159 + }, + { + "epoch": 52.20708446866485, + "grad_norm": 3.799884557723999, + "learning_rate": 9.771012658424808e-06, + "loss": 0.0798, + "step": 19160 + }, + { + "epoch": 52.20980926430518, + "grad_norm": 3.756002187728882, + "learning_rate": 9.7701303960812e-06, + "loss": 0.1701, + "step": 19161 + }, + { + "epoch": 52.212534059945504, + "grad_norm": 4.617569923400879, + "learning_rate": 9.76924813552781e-06, + "loss": 0.1818, + "step": 19162 + }, + { + "epoch": 52.21525885558583, + "grad_norm": 4.105844497680664, + "learning_rate": 9.768365876771505e-06, + "loss": 0.1153, + "step": 19163 + }, + { + "epoch": 52.217983651226156, + "grad_norm": 4.216437816619873, + "learning_rate": 9.767483619819164e-06, + "loss": 0.1544, + "step": 19164 + }, + { + "epoch": 52.22070844686648, + "grad_norm": 5.39052152633667, + "learning_rate": 9.766601364677648e-06, + "loss": 0.1662, + "step": 19165 + }, + { + "epoch": 52.223433242506815, + "grad_norm": 4.8423895835876465, + "learning_rate": 9.765719111353837e-06, + "loss": 0.3015, + "step": 19166 + }, + { + "epoch": 52.22615803814714, + "grad_norm": 4.74192476272583, + "learning_rate": 9.764836859854595e-06, + "loss": 0.2087, + "step": 19167 + }, + { + "epoch": 52.228882833787466, + "grad_norm": 5.739588260650635, + "learning_rate": 9.763954610186798e-06, + "loss": 0.104, + "step": 19168 + }, + { + "epoch": 52.23160762942779, + "grad_norm": 6.070648670196533, + "learning_rate": 9.763072362357315e-06, + "loss": 0.1366, + "step": 19169 + }, + { + "epoch": 52.23433242506812, + "grad_norm": 4.204780101776123, + "learning_rate": 9.762190116373017e-06, + "loss": 0.2565, + "step": 19170 + }, + { + "epoch": 52.237057220708444, + "grad_norm": 4.189395427703857, + "learning_rate": 9.761307872240773e-06, + "loss": 0.1398, + "step": 19171 + }, + { + "epoch": 52.23978201634878, + "grad_norm": 3.492771625518799, + "learning_rate": 9.760425629967457e-06, + "loss": 0.1139, + "step": 19172 + }, + { + "epoch": 52.2425068119891, + "grad_norm": 4.4667840003967285, + "learning_rate": 9.759543389559937e-06, + "loss": 0.0829, + "step": 19173 + }, + { + "epoch": 52.24523160762943, + "grad_norm": 4.1979522705078125, + "learning_rate": 9.758661151025087e-06, + "loss": 0.0752, + "step": 19174 + }, + { + "epoch": 52.247956403269754, + "grad_norm": 4.452780246734619, + "learning_rate": 9.757778914369774e-06, + "loss": 0.092, + "step": 19175 + }, + { + "epoch": 52.25068119891008, + "grad_norm": 5.760451793670654, + "learning_rate": 9.75689667960087e-06, + "loss": 0.1678, + "step": 19176 + }, + { + "epoch": 52.253405994550405, + "grad_norm": 4.483896255493164, + "learning_rate": 9.75601444672525e-06, + "loss": 0.1453, + "step": 19177 + }, + { + "epoch": 52.25613079019074, + "grad_norm": 4.075677394866943, + "learning_rate": 9.75513221574978e-06, + "loss": 0.1116, + "step": 19178 + }, + { + "epoch": 52.258855585831064, + "grad_norm": 3.575446367263794, + "learning_rate": 9.754249986681334e-06, + "loss": 0.065, + "step": 19179 + }, + { + "epoch": 52.26158038147139, + "grad_norm": 4.823285102844238, + "learning_rate": 9.75336775952678e-06, + "loss": 0.164, + "step": 19180 + }, + { + "epoch": 52.264305177111716, + "grad_norm": 4.425245761871338, + "learning_rate": 9.752485534292992e-06, + "loss": 0.0766, + "step": 19181 + }, + { + "epoch": 52.26702997275204, + "grad_norm": 5.054012298583984, + "learning_rate": 9.751603310986835e-06, + "loss": 0.1827, + "step": 19182 + }, + { + "epoch": 52.26975476839237, + "grad_norm": 3.997870922088623, + "learning_rate": 9.750721089615185e-06, + "loss": 0.0808, + "step": 19183 + }, + { + "epoch": 52.2724795640327, + "grad_norm": 3.9631030559539795, + "learning_rate": 9.749838870184914e-06, + "loss": 0.1113, + "step": 19184 + }, + { + "epoch": 52.275204359673026, + "grad_norm": 4.400388240814209, + "learning_rate": 9.748956652702885e-06, + "loss": 0.1463, + "step": 19185 + }, + { + "epoch": 52.27792915531335, + "grad_norm": 4.180642127990723, + "learning_rate": 9.748074437175979e-06, + "loss": 0.3338, + "step": 19186 + }, + { + "epoch": 52.28065395095368, + "grad_norm": 3.2455155849456787, + "learning_rate": 9.747192223611055e-06, + "loss": 0.1908, + "step": 19187 + }, + { + "epoch": 52.283378746594, + "grad_norm": 6.889337062835693, + "learning_rate": 9.746310012014996e-06, + "loss": 0.1829, + "step": 19188 + }, + { + "epoch": 52.28610354223433, + "grad_norm": 4.764960289001465, + "learning_rate": 9.745427802394662e-06, + "loss": 0.2042, + "step": 19189 + }, + { + "epoch": 52.28882833787466, + "grad_norm": 3.8126718997955322, + "learning_rate": 9.74454559475693e-06, + "loss": 0.0861, + "step": 19190 + }, + { + "epoch": 52.29155313351499, + "grad_norm": 3.9455277919769287, + "learning_rate": 9.743663389108667e-06, + "loss": 0.093, + "step": 19191 + }, + { + "epoch": 52.294277929155314, + "grad_norm": 4.232730388641357, + "learning_rate": 9.742781185456748e-06, + "loss": 0.2172, + "step": 19192 + }, + { + "epoch": 52.29700272479564, + "grad_norm": 11.808323860168457, + "learning_rate": 9.74189898380804e-06, + "loss": 0.0975, + "step": 19193 + }, + { + "epoch": 52.299727520435965, + "grad_norm": 4.863210201263428, + "learning_rate": 9.741016784169409e-06, + "loss": 0.1337, + "step": 19194 + }, + { + "epoch": 52.30245231607629, + "grad_norm": 4.657174587249756, + "learning_rate": 9.740134586547737e-06, + "loss": 0.1553, + "step": 19195 + }, + { + "epoch": 52.305177111716624, + "grad_norm": 2.96730899810791, + "learning_rate": 9.739252390949887e-06, + "loss": 0.2061, + "step": 19196 + }, + { + "epoch": 52.30790190735695, + "grad_norm": 4.627375602722168, + "learning_rate": 9.738370197382732e-06, + "loss": 0.1023, + "step": 19197 + }, + { + "epoch": 52.310626702997276, + "grad_norm": 3.875765562057495, + "learning_rate": 9.73748800585314e-06, + "loss": 0.0961, + "step": 19198 + }, + { + "epoch": 52.3133514986376, + "grad_norm": 4.1032915115356445, + "learning_rate": 9.736605816367984e-06, + "loss": 0.1447, + "step": 19199 + }, + { + "epoch": 52.31607629427793, + "grad_norm": 4.122752666473389, + "learning_rate": 9.735723628934132e-06, + "loss": 0.0795, + "step": 19200 + }, + { + "epoch": 52.31880108991825, + "grad_norm": 4.321817874908447, + "learning_rate": 9.73484144355846e-06, + "loss": 0.332, + "step": 19201 + }, + { + "epoch": 52.321525885558586, + "grad_norm": 4.540710926055908, + "learning_rate": 9.733959260247829e-06, + "loss": 0.1718, + "step": 19202 + }, + { + "epoch": 52.32425068119891, + "grad_norm": 4.2653937339782715, + "learning_rate": 9.733077079009118e-06, + "loss": 0.1837, + "step": 19203 + }, + { + "epoch": 52.32697547683924, + "grad_norm": 3.323207378387451, + "learning_rate": 9.732194899849192e-06, + "loss": 0.1834, + "step": 19204 + }, + { + "epoch": 52.32970027247956, + "grad_norm": 3.735625982284546, + "learning_rate": 9.731312722774924e-06, + "loss": 0.1162, + "step": 19205 + }, + { + "epoch": 52.33242506811989, + "grad_norm": 9.254440307617188, + "learning_rate": 9.730430547793186e-06, + "loss": 0.1432, + "step": 19206 + }, + { + "epoch": 52.335149863760215, + "grad_norm": 4.414444923400879, + "learning_rate": 9.729548374910843e-06, + "loss": 0.2507, + "step": 19207 + }, + { + "epoch": 52.33787465940055, + "grad_norm": 4.62446403503418, + "learning_rate": 9.728666204134772e-06, + "loss": 0.1977, + "step": 19208 + }, + { + "epoch": 52.34059945504087, + "grad_norm": 4.216208457946777, + "learning_rate": 9.727784035471837e-06, + "loss": 0.1967, + "step": 19209 + }, + { + "epoch": 52.3433242506812, + "grad_norm": 3.2713513374328613, + "learning_rate": 9.726901868928913e-06, + "loss": 0.1025, + "step": 19210 + }, + { + "epoch": 52.346049046321525, + "grad_norm": 3.672574281692505, + "learning_rate": 9.726019704512864e-06, + "loss": 0.0612, + "step": 19211 + }, + { + "epoch": 52.34877384196185, + "grad_norm": 4.518486976623535, + "learning_rate": 9.725137542230568e-06, + "loss": 0.2087, + "step": 19212 + }, + { + "epoch": 52.35149863760218, + "grad_norm": 4.896111011505127, + "learning_rate": 9.724255382088895e-06, + "loss": 0.2777, + "step": 19213 + }, + { + "epoch": 52.35422343324251, + "grad_norm": 4.063868999481201, + "learning_rate": 9.723373224094708e-06, + "loss": 0.1814, + "step": 19214 + }, + { + "epoch": 52.356948228882835, + "grad_norm": 4.255677223205566, + "learning_rate": 9.722491068254883e-06, + "loss": 0.1455, + "step": 19215 + }, + { + "epoch": 52.35967302452316, + "grad_norm": 4.90528678894043, + "learning_rate": 9.721608914576288e-06, + "loss": 0.102, + "step": 19216 + }, + { + "epoch": 52.36239782016349, + "grad_norm": 4.571956157684326, + "learning_rate": 9.720726763065795e-06, + "loss": 0.2026, + "step": 19217 + }, + { + "epoch": 52.36512261580381, + "grad_norm": 4.2854108810424805, + "learning_rate": 9.719844613730273e-06, + "loss": 0.16, + "step": 19218 + }, + { + "epoch": 52.36784741144414, + "grad_norm": 3.9086852073669434, + "learning_rate": 9.718962466576592e-06, + "loss": 0.1718, + "step": 19219 + }, + { + "epoch": 52.37057220708447, + "grad_norm": 5.214824199676514, + "learning_rate": 9.71808032161162e-06, + "loss": 0.1705, + "step": 19220 + }, + { + "epoch": 52.3732970027248, + "grad_norm": 3.797212839126587, + "learning_rate": 9.717198178842234e-06, + "loss": 0.2025, + "step": 19221 + }, + { + "epoch": 52.37602179836512, + "grad_norm": 4.190108776092529, + "learning_rate": 9.716316038275295e-06, + "loss": 0.082, + "step": 19222 + }, + { + "epoch": 52.37874659400545, + "grad_norm": 4.681421279907227, + "learning_rate": 9.715433899917682e-06, + "loss": 0.2673, + "step": 19223 + }, + { + "epoch": 52.381471389645775, + "grad_norm": 5.3838324546813965, + "learning_rate": 9.714551763776255e-06, + "loss": 0.1939, + "step": 19224 + }, + { + "epoch": 52.3841961852861, + "grad_norm": 4.088294506072998, + "learning_rate": 9.713669629857894e-06, + "loss": 0.1051, + "step": 19225 + }, + { + "epoch": 52.38692098092643, + "grad_norm": 3.0899713039398193, + "learning_rate": 9.712787498169462e-06, + "loss": 0.0621, + "step": 19226 + }, + { + "epoch": 52.38964577656676, + "grad_norm": 4.062369346618652, + "learning_rate": 9.711905368717834e-06, + "loss": 0.1527, + "step": 19227 + }, + { + "epoch": 52.392370572207085, + "grad_norm": 4.366440773010254, + "learning_rate": 9.711023241509873e-06, + "loss": 0.0976, + "step": 19228 + }, + { + "epoch": 52.39509536784741, + "grad_norm": 5.699102401733398, + "learning_rate": 9.710141116552458e-06, + "loss": 0.1762, + "step": 19229 + }, + { + "epoch": 52.39782016348774, + "grad_norm": 6.592490196228027, + "learning_rate": 9.709258993852453e-06, + "loss": 0.1911, + "step": 19230 + }, + { + "epoch": 52.40054495912806, + "grad_norm": 5.691075801849365, + "learning_rate": 9.708376873416732e-06, + "loss": 0.1322, + "step": 19231 + }, + { + "epoch": 52.403269754768395, + "grad_norm": 5.219867706298828, + "learning_rate": 9.70749475525216e-06, + "loss": 0.169, + "step": 19232 + }, + { + "epoch": 52.40599455040872, + "grad_norm": 4.067953586578369, + "learning_rate": 9.706612639365613e-06, + "loss": 0.164, + "step": 19233 + }, + { + "epoch": 52.40871934604905, + "grad_norm": 3.9165313243865967, + "learning_rate": 9.705730525763951e-06, + "loss": 0.1286, + "step": 19234 + }, + { + "epoch": 52.41144414168937, + "grad_norm": 3.8384532928466797, + "learning_rate": 9.704848414454057e-06, + "loss": 0.1876, + "step": 19235 + }, + { + "epoch": 52.4141689373297, + "grad_norm": 3.8974759578704834, + "learning_rate": 9.70396630544279e-06, + "loss": 0.1039, + "step": 19236 + }, + { + "epoch": 52.416893732970024, + "grad_norm": 4.8549580574035645, + "learning_rate": 9.703084198737028e-06, + "loss": 0.1575, + "step": 19237 + }, + { + "epoch": 52.41961852861036, + "grad_norm": 4.355259418487549, + "learning_rate": 9.702202094343631e-06, + "loss": 0.1488, + "step": 19238 + }, + { + "epoch": 52.42234332425068, + "grad_norm": 3.9184348583221436, + "learning_rate": 9.701319992269479e-06, + "loss": 0.0948, + "step": 19239 + }, + { + "epoch": 52.42506811989101, + "grad_norm": 4.7135725021362305, + "learning_rate": 9.700437892521434e-06, + "loss": 0.236, + "step": 19240 + }, + { + "epoch": 52.427792915531334, + "grad_norm": 3.2412667274475098, + "learning_rate": 9.699555795106373e-06, + "loss": 0.0877, + "step": 19241 + }, + { + "epoch": 52.43051771117166, + "grad_norm": 4.784268379211426, + "learning_rate": 9.698673700031159e-06, + "loss": 0.0706, + "step": 19242 + }, + { + "epoch": 52.433242506811986, + "grad_norm": 4.160239219665527, + "learning_rate": 9.697791607302665e-06, + "loss": 0.0824, + "step": 19243 + }, + { + "epoch": 52.43596730245232, + "grad_norm": 4.861740589141846, + "learning_rate": 9.69690951692776e-06, + "loss": 0.179, + "step": 19244 + }, + { + "epoch": 52.438692098092645, + "grad_norm": 5.323450565338135, + "learning_rate": 9.69602742891331e-06, + "loss": 0.1943, + "step": 19245 + }, + { + "epoch": 52.44141689373297, + "grad_norm": 5.598095417022705, + "learning_rate": 9.695145343266195e-06, + "loss": 0.146, + "step": 19246 + }, + { + "epoch": 52.444141689373296, + "grad_norm": 4.833616256713867, + "learning_rate": 9.694263259993274e-06, + "loss": 0.0836, + "step": 19247 + }, + { + "epoch": 52.44686648501362, + "grad_norm": 3.781280517578125, + "learning_rate": 9.693381179101423e-06, + "loss": 0.0723, + "step": 19248 + }, + { + "epoch": 52.44959128065395, + "grad_norm": 9.509787559509277, + "learning_rate": 9.69249910059751e-06, + "loss": 0.1396, + "step": 19249 + }, + { + "epoch": 52.45231607629428, + "grad_norm": 4.508984565734863, + "learning_rate": 9.691617024488402e-06, + "loss": 0.073, + "step": 19250 + }, + { + "epoch": 52.45504087193461, + "grad_norm": 5.343342304229736, + "learning_rate": 9.690734950780973e-06, + "loss": 0.1266, + "step": 19251 + }, + { + "epoch": 52.45776566757493, + "grad_norm": 4.149517059326172, + "learning_rate": 9.689852879482089e-06, + "loss": 0.0921, + "step": 19252 + }, + { + "epoch": 52.46049046321526, + "grad_norm": 5.513681888580322, + "learning_rate": 9.688970810598622e-06, + "loss": 0.1791, + "step": 19253 + }, + { + "epoch": 52.463215258855584, + "grad_norm": 3.3647594451904297, + "learning_rate": 9.688088744137438e-06, + "loss": 0.1007, + "step": 19254 + }, + { + "epoch": 52.46594005449591, + "grad_norm": 3.7131452560424805, + "learning_rate": 9.687206680105412e-06, + "loss": 0.0605, + "step": 19255 + }, + { + "epoch": 52.46866485013624, + "grad_norm": 4.058668613433838, + "learning_rate": 9.686324618509409e-06, + "loss": 0.0623, + "step": 19256 + }, + { + "epoch": 52.47138964577657, + "grad_norm": 5.368107795715332, + "learning_rate": 9.6854425593563e-06, + "loss": 0.0909, + "step": 19257 + }, + { + "epoch": 52.474114441416894, + "grad_norm": 4.719025611877441, + "learning_rate": 9.684560502652952e-06, + "loss": 0.1163, + "step": 19258 + }, + { + "epoch": 52.47683923705722, + "grad_norm": 3.9193098545074463, + "learning_rate": 9.68367844840624e-06, + "loss": 0.157, + "step": 19259 + }, + { + "epoch": 52.479564032697546, + "grad_norm": 4.803292751312256, + "learning_rate": 9.682796396623027e-06, + "loss": 0.1858, + "step": 19260 + }, + { + "epoch": 52.48228882833787, + "grad_norm": 3.553367853164673, + "learning_rate": 9.681914347310188e-06, + "loss": 0.0781, + "step": 19261 + }, + { + "epoch": 52.485013623978205, + "grad_norm": 6.250884532928467, + "learning_rate": 9.681032300474586e-06, + "loss": 0.1178, + "step": 19262 + }, + { + "epoch": 52.48773841961853, + "grad_norm": 4.706630229949951, + "learning_rate": 9.680150256123096e-06, + "loss": 0.1932, + "step": 19263 + }, + { + "epoch": 52.490463215258856, + "grad_norm": 5.85382080078125, + "learning_rate": 9.679268214262588e-06, + "loss": 0.1317, + "step": 19264 + }, + { + "epoch": 52.49318801089918, + "grad_norm": 5.139765739440918, + "learning_rate": 9.678386174899925e-06, + "loss": 0.1764, + "step": 19265 + }, + { + "epoch": 52.49591280653951, + "grad_norm": 4.154210567474365, + "learning_rate": 9.677504138041984e-06, + "loss": 0.0861, + "step": 19266 + }, + { + "epoch": 52.49863760217983, + "grad_norm": 4.736916542053223, + "learning_rate": 9.676622103695628e-06, + "loss": 0.1052, + "step": 19267 + }, + { + "epoch": 52.50136239782017, + "grad_norm": 3.8731517791748047, + "learning_rate": 9.675740071867729e-06, + "loss": 0.2096, + "step": 19268 + }, + { + "epoch": 52.50408719346049, + "grad_norm": 5.190960884094238, + "learning_rate": 9.674858042565157e-06, + "loss": 0.1572, + "step": 19269 + }, + { + "epoch": 52.50681198910082, + "grad_norm": 5.408673286437988, + "learning_rate": 9.673976015794778e-06, + "loss": 0.1133, + "step": 19270 + }, + { + "epoch": 52.509536784741144, + "grad_norm": 4.685727596282959, + "learning_rate": 9.673093991563466e-06, + "loss": 0.1489, + "step": 19271 + }, + { + "epoch": 52.51226158038147, + "grad_norm": 5.208731651306152, + "learning_rate": 9.672211969878085e-06, + "loss": 0.2998, + "step": 19272 + }, + { + "epoch": 52.514986376021795, + "grad_norm": 4.553671360015869, + "learning_rate": 9.671329950745509e-06, + "loss": 0.3697, + "step": 19273 + }, + { + "epoch": 52.51771117166213, + "grad_norm": 5.830882549285889, + "learning_rate": 9.670447934172602e-06, + "loss": 0.1832, + "step": 19274 + }, + { + "epoch": 52.520435967302454, + "grad_norm": 4.45698356628418, + "learning_rate": 9.669565920166238e-06, + "loss": 0.1636, + "step": 19275 + }, + { + "epoch": 52.52316076294278, + "grad_norm": 4.683032989501953, + "learning_rate": 9.668683908733283e-06, + "loss": 0.1836, + "step": 19276 + }, + { + "epoch": 52.525885558583106, + "grad_norm": 6.098485946655273, + "learning_rate": 9.667801899880609e-06, + "loss": 0.1793, + "step": 19277 + }, + { + "epoch": 52.52861035422343, + "grad_norm": 3.737724781036377, + "learning_rate": 9.66691989361508e-06, + "loss": 0.1247, + "step": 19278 + }, + { + "epoch": 52.53133514986376, + "grad_norm": 3.9942116737365723, + "learning_rate": 9.66603788994357e-06, + "loss": 0.1259, + "step": 19279 + }, + { + "epoch": 52.53405994550409, + "grad_norm": 4.8618035316467285, + "learning_rate": 9.665155888872943e-06, + "loss": 0.1133, + "step": 19280 + }, + { + "epoch": 52.536784741144416, + "grad_norm": 4.010344982147217, + "learning_rate": 9.664273890410073e-06, + "loss": 0.1095, + "step": 19281 + }, + { + "epoch": 52.53950953678474, + "grad_norm": 4.521393775939941, + "learning_rate": 9.66339189456183e-06, + "loss": 0.1318, + "step": 19282 + }, + { + "epoch": 52.54223433242507, + "grad_norm": 5.568043231964111, + "learning_rate": 9.662509901335077e-06, + "loss": 0.1339, + "step": 19283 + }, + { + "epoch": 52.54495912806539, + "grad_norm": 7.71300745010376, + "learning_rate": 9.661627910736689e-06, + "loss": 0.1413, + "step": 19284 + }, + { + "epoch": 52.54768392370572, + "grad_norm": 4.08627986907959, + "learning_rate": 9.660745922773529e-06, + "loss": 0.0931, + "step": 19285 + }, + { + "epoch": 52.55040871934605, + "grad_norm": 4.967341423034668, + "learning_rate": 9.65986393745247e-06, + "loss": 0.1998, + "step": 19286 + }, + { + "epoch": 52.55313351498638, + "grad_norm": 4.925725936889648, + "learning_rate": 9.65898195478038e-06, + "loss": 0.1094, + "step": 19287 + }, + { + "epoch": 52.555858310626704, + "grad_norm": 4.59002685546875, + "learning_rate": 9.658099974764129e-06, + "loss": 0.085, + "step": 19288 + }, + { + "epoch": 52.55858310626703, + "grad_norm": 5.515731334686279, + "learning_rate": 9.65721799741058e-06, + "loss": 0.2105, + "step": 19289 + }, + { + "epoch": 52.561307901907355, + "grad_norm": 4.188617706298828, + "learning_rate": 9.656336022726612e-06, + "loss": 0.076, + "step": 19290 + }, + { + "epoch": 52.56403269754768, + "grad_norm": 4.015984535217285, + "learning_rate": 9.655454050719081e-06, + "loss": 0.14, + "step": 19291 + }, + { + "epoch": 52.566757493188014, + "grad_norm": 3.490887403488159, + "learning_rate": 9.654572081394868e-06, + "loss": 0.068, + "step": 19292 + }, + { + "epoch": 52.56948228882834, + "grad_norm": 4.456308364868164, + "learning_rate": 9.653690114760835e-06, + "loss": 0.0687, + "step": 19293 + }, + { + "epoch": 52.572207084468666, + "grad_norm": 5.373715400695801, + "learning_rate": 9.65280815082385e-06, + "loss": 0.2611, + "step": 19294 + }, + { + "epoch": 52.57493188010899, + "grad_norm": 4.22686767578125, + "learning_rate": 9.65192618959079e-06, + "loss": 0.2667, + "step": 19295 + }, + { + "epoch": 52.57765667574932, + "grad_norm": 4.848435401916504, + "learning_rate": 9.651044231068513e-06, + "loss": 0.116, + "step": 19296 + }, + { + "epoch": 52.58038147138964, + "grad_norm": 5.875431537628174, + "learning_rate": 9.650162275263889e-06, + "loss": 0.2575, + "step": 19297 + }, + { + "epoch": 52.583106267029976, + "grad_norm": 5.266987323760986, + "learning_rate": 9.649280322183796e-06, + "loss": 0.099, + "step": 19298 + }, + { + "epoch": 52.5858310626703, + "grad_norm": 3.639037609100342, + "learning_rate": 9.648398371835094e-06, + "loss": 0.1616, + "step": 19299 + }, + { + "epoch": 52.58855585831063, + "grad_norm": 4.050128936767578, + "learning_rate": 9.647516424224655e-06, + "loss": 0.3132, + "step": 19300 + }, + { + "epoch": 52.59128065395095, + "grad_norm": 3.4647326469421387, + "learning_rate": 9.646634479359346e-06, + "loss": 0.0794, + "step": 19301 + }, + { + "epoch": 52.59400544959128, + "grad_norm": 5.349648952484131, + "learning_rate": 9.645752537246038e-06, + "loss": 0.1169, + "step": 19302 + }, + { + "epoch": 52.596730245231605, + "grad_norm": 5.098369121551514, + "learning_rate": 9.644870597891597e-06, + "loss": 0.1406, + "step": 19303 + }, + { + "epoch": 52.59945504087194, + "grad_norm": 3.8686046600341797, + "learning_rate": 9.643988661302893e-06, + "loss": 0.2649, + "step": 19304 + }, + { + "epoch": 52.60217983651226, + "grad_norm": 4.619300365447998, + "learning_rate": 9.643106727486792e-06, + "loss": 0.1186, + "step": 19305 + }, + { + "epoch": 52.60490463215259, + "grad_norm": 4.731567859649658, + "learning_rate": 9.642224796450165e-06, + "loss": 0.2956, + "step": 19306 + }, + { + "epoch": 52.607629427792915, + "grad_norm": 4.745423316955566, + "learning_rate": 9.64134286819988e-06, + "loss": 0.1265, + "step": 19307 + }, + { + "epoch": 52.61035422343324, + "grad_norm": 4.2086381912231445, + "learning_rate": 9.640460942742806e-06, + "loss": 0.0755, + "step": 19308 + }, + { + "epoch": 52.61307901907357, + "grad_norm": 5.149787425994873, + "learning_rate": 9.63957902008581e-06, + "loss": 0.1888, + "step": 19309 + }, + { + "epoch": 52.6158038147139, + "grad_norm": 3.8726794719696045, + "learning_rate": 9.638697100235763e-06, + "loss": 0.1378, + "step": 19310 + }, + { + "epoch": 52.618528610354225, + "grad_norm": 3.5131676197052, + "learning_rate": 9.637815183199527e-06, + "loss": 0.0739, + "step": 19311 + }, + { + "epoch": 52.62125340599455, + "grad_norm": 4.361724376678467, + "learning_rate": 9.636933268983979e-06, + "loss": 0.1274, + "step": 19312 + }, + { + "epoch": 52.62397820163488, + "grad_norm": 4.908632278442383, + "learning_rate": 9.636051357595979e-06, + "loss": 0.0928, + "step": 19313 + }, + { + "epoch": 52.6267029972752, + "grad_norm": 3.4299521446228027, + "learning_rate": 9.635169449042398e-06, + "loss": 0.1616, + "step": 19314 + }, + { + "epoch": 52.62942779291553, + "grad_norm": 5.611042022705078, + "learning_rate": 9.634287543330109e-06, + "loss": 0.1075, + "step": 19315 + }, + { + "epoch": 52.63215258855586, + "grad_norm": 5.181185722351074, + "learning_rate": 9.633405640465977e-06, + "loss": 0.1499, + "step": 19316 + }, + { + "epoch": 52.63487738419619, + "grad_norm": 3.2112326622009277, + "learning_rate": 9.632523740456869e-06, + "loss": 0.1762, + "step": 19317 + }, + { + "epoch": 52.63760217983651, + "grad_norm": 4.11383581161499, + "learning_rate": 9.631641843309656e-06, + "loss": 0.082, + "step": 19318 + }, + { + "epoch": 52.64032697547684, + "grad_norm": 4.444210529327393, + "learning_rate": 9.630759949031203e-06, + "loss": 0.1227, + "step": 19319 + }, + { + "epoch": 52.643051771117165, + "grad_norm": 3.353123664855957, + "learning_rate": 9.629878057628382e-06, + "loss": 0.1317, + "step": 19320 + }, + { + "epoch": 52.64577656675749, + "grad_norm": 4.4403486251831055, + "learning_rate": 9.628996169108056e-06, + "loss": 0.1149, + "step": 19321 + }, + { + "epoch": 52.64850136239782, + "grad_norm": 2.984766960144043, + "learning_rate": 9.628114283477098e-06, + "loss": 0.0698, + "step": 19322 + }, + { + "epoch": 52.65122615803815, + "grad_norm": 3.924394130706787, + "learning_rate": 9.62723240074237e-06, + "loss": 0.1254, + "step": 19323 + }, + { + "epoch": 52.653950953678475, + "grad_norm": 4.6532087326049805, + "learning_rate": 9.62635052091075e-06, + "loss": 0.0829, + "step": 19324 + }, + { + "epoch": 52.6566757493188, + "grad_norm": 3.568769693374634, + "learning_rate": 9.625468643989096e-06, + "loss": 0.1329, + "step": 19325 + }, + { + "epoch": 52.65940054495913, + "grad_norm": 4.401582717895508, + "learning_rate": 9.624586769984282e-06, + "loss": 0.1092, + "step": 19326 + }, + { + "epoch": 52.66212534059945, + "grad_norm": 4.047064781188965, + "learning_rate": 9.623704898903173e-06, + "loss": 0.0823, + "step": 19327 + }, + { + "epoch": 52.664850136239785, + "grad_norm": 6.713965892791748, + "learning_rate": 9.622823030752639e-06, + "loss": 0.1693, + "step": 19328 + }, + { + "epoch": 52.66757493188011, + "grad_norm": 4.513161659240723, + "learning_rate": 9.621941165539546e-06, + "loss": 0.1448, + "step": 19329 + }, + { + "epoch": 52.67029972752044, + "grad_norm": 4.816930294036865, + "learning_rate": 9.621059303270765e-06, + "loss": 0.113, + "step": 19330 + }, + { + "epoch": 52.67302452316076, + "grad_norm": 4.622618675231934, + "learning_rate": 9.620177443953156e-06, + "loss": 0.0817, + "step": 19331 + }, + { + "epoch": 52.67574931880109, + "grad_norm": 3.708385944366455, + "learning_rate": 9.619295587593597e-06, + "loss": 0.1095, + "step": 19332 + }, + { + "epoch": 52.678474114441414, + "grad_norm": 3.9158594608306885, + "learning_rate": 9.61841373419895e-06, + "loss": 0.0974, + "step": 19333 + }, + { + "epoch": 52.68119891008175, + "grad_norm": 5.615607261657715, + "learning_rate": 9.617531883776088e-06, + "loss": 0.2291, + "step": 19334 + }, + { + "epoch": 52.68392370572207, + "grad_norm": 5.181751251220703, + "learning_rate": 9.616650036331874e-06, + "loss": 0.2695, + "step": 19335 + }, + { + "epoch": 52.6866485013624, + "grad_norm": 4.0438151359558105, + "learning_rate": 9.615768191873179e-06, + "loss": 0.2152, + "step": 19336 + }, + { + "epoch": 52.689373297002724, + "grad_norm": 3.4214389324188232, + "learning_rate": 9.614886350406865e-06, + "loss": 0.0804, + "step": 19337 + }, + { + "epoch": 52.69209809264305, + "grad_norm": 3.4087636470794678, + "learning_rate": 9.614004511939807e-06, + "loss": 0.0582, + "step": 19338 + }, + { + "epoch": 52.694822888283376, + "grad_norm": 4.2999043464660645, + "learning_rate": 9.613122676478868e-06, + "loss": 0.1115, + "step": 19339 + }, + { + "epoch": 52.69754768392371, + "grad_norm": 4.865885257720947, + "learning_rate": 9.612240844030917e-06, + "loss": 0.135, + "step": 19340 + }, + { + "epoch": 52.700272479564035, + "grad_norm": 4.982079982757568, + "learning_rate": 9.611359014602823e-06, + "loss": 0.1326, + "step": 19341 + }, + { + "epoch": 52.70299727520436, + "grad_norm": 4.406929016113281, + "learning_rate": 9.610477188201452e-06, + "loss": 0.1047, + "step": 19342 + }, + { + "epoch": 52.705722070844686, + "grad_norm": 4.624931335449219, + "learning_rate": 9.609595364833672e-06, + "loss": 0.2232, + "step": 19343 + }, + { + "epoch": 52.70844686648501, + "grad_norm": 4.764208793640137, + "learning_rate": 9.60871354450635e-06, + "loss": 0.0927, + "step": 19344 + }, + { + "epoch": 52.71117166212534, + "grad_norm": 4.3923540115356445, + "learning_rate": 9.607831727226355e-06, + "loss": 0.1221, + "step": 19345 + }, + { + "epoch": 52.71389645776567, + "grad_norm": 3.9085776805877686, + "learning_rate": 9.606949913000554e-06, + "loss": 0.2829, + "step": 19346 + }, + { + "epoch": 52.716621253406, + "grad_norm": 4.042550563812256, + "learning_rate": 9.606068101835815e-06, + "loss": 0.1434, + "step": 19347 + }, + { + "epoch": 52.71934604904632, + "grad_norm": 3.807206392288208, + "learning_rate": 9.605186293739e-06, + "loss": 0.0913, + "step": 19348 + }, + { + "epoch": 52.72207084468665, + "grad_norm": 3.671191692352295, + "learning_rate": 9.604304488716987e-06, + "loss": 0.123, + "step": 19349 + }, + { + "epoch": 52.724795640326974, + "grad_norm": 4.420248031616211, + "learning_rate": 9.603422686776635e-06, + "loss": 0.1785, + "step": 19350 + }, + { + "epoch": 52.7275204359673, + "grad_norm": 4.048986434936523, + "learning_rate": 9.602540887924819e-06, + "loss": 0.1077, + "step": 19351 + }, + { + "epoch": 52.73024523160763, + "grad_norm": 3.655841588973999, + "learning_rate": 9.601659092168395e-06, + "loss": 0.0767, + "step": 19352 + }, + { + "epoch": 52.73297002724796, + "grad_norm": 4.169539928436279, + "learning_rate": 9.600777299514243e-06, + "loss": 0.204, + "step": 19353 + }, + { + "epoch": 52.735694822888284, + "grad_norm": 4.01200008392334, + "learning_rate": 9.59989550996922e-06, + "loss": 0.0708, + "step": 19354 + }, + { + "epoch": 52.73841961852861, + "grad_norm": 3.724123001098633, + "learning_rate": 9.599013723540204e-06, + "loss": 0.0999, + "step": 19355 + }, + { + "epoch": 52.741144414168936, + "grad_norm": 4.897405624389648, + "learning_rate": 9.598131940234051e-06, + "loss": 0.2238, + "step": 19356 + }, + { + "epoch": 52.74386920980926, + "grad_norm": 4.107428550720215, + "learning_rate": 9.597250160057635e-06, + "loss": 0.0983, + "step": 19357 + }, + { + "epoch": 52.746594005449595, + "grad_norm": 4.829750061035156, + "learning_rate": 9.596368383017822e-06, + "loss": 0.0737, + "step": 19358 + }, + { + "epoch": 52.74931880108992, + "grad_norm": 4.205144882202148, + "learning_rate": 9.595486609121477e-06, + "loss": 0.3055, + "step": 19359 + }, + { + "epoch": 52.752043596730246, + "grad_norm": 5.4464826583862305, + "learning_rate": 9.594604838375473e-06, + "loss": 0.1822, + "step": 19360 + }, + { + "epoch": 52.75476839237057, + "grad_norm": 3.527435779571533, + "learning_rate": 9.593723070786671e-06, + "loss": 0.0826, + "step": 19361 + }, + { + "epoch": 52.7574931880109, + "grad_norm": 4.032792568206787, + "learning_rate": 9.592841306361942e-06, + "loss": 0.1613, + "step": 19362 + }, + { + "epoch": 52.76021798365122, + "grad_norm": 4.165923118591309, + "learning_rate": 9.59195954510815e-06, + "loss": 0.1055, + "step": 19363 + }, + { + "epoch": 52.762942779291556, + "grad_norm": 5.197146892547607, + "learning_rate": 9.591077787032166e-06, + "loss": 0.1861, + "step": 19364 + }, + { + "epoch": 52.76566757493188, + "grad_norm": 6.287145614624023, + "learning_rate": 9.590196032140852e-06, + "loss": 0.0796, + "step": 19365 + }, + { + "epoch": 52.76839237057221, + "grad_norm": 5.605803966522217, + "learning_rate": 9.589314280441077e-06, + "loss": 0.1606, + "step": 19366 + }, + { + "epoch": 52.771117166212534, + "grad_norm": 3.812502145767212, + "learning_rate": 9.588432531939714e-06, + "loss": 0.0775, + "step": 19367 + }, + { + "epoch": 52.77384196185286, + "grad_norm": 5.06690788269043, + "learning_rate": 9.587550786643623e-06, + "loss": 0.1423, + "step": 19368 + }, + { + "epoch": 52.776566757493185, + "grad_norm": 4.095958709716797, + "learning_rate": 9.586669044559674e-06, + "loss": 0.212, + "step": 19369 + }, + { + "epoch": 52.77929155313352, + "grad_norm": 5.3416666984558105, + "learning_rate": 9.585787305694733e-06, + "loss": 0.314, + "step": 19370 + }, + { + "epoch": 52.782016348773844, + "grad_norm": 4.653022289276123, + "learning_rate": 9.584905570055668e-06, + "loss": 0.1592, + "step": 19371 + }, + { + "epoch": 52.78474114441417, + "grad_norm": 8.40907096862793, + "learning_rate": 9.584023837649343e-06, + "loss": 0.08, + "step": 19372 + }, + { + "epoch": 52.787465940054496, + "grad_norm": 6.979483604431152, + "learning_rate": 9.58314210848263e-06, + "loss": 0.1268, + "step": 19373 + }, + { + "epoch": 52.79019073569482, + "grad_norm": 4.940918922424316, + "learning_rate": 9.582260382562389e-06, + "loss": 0.0934, + "step": 19374 + }, + { + "epoch": 52.79291553133515, + "grad_norm": 4.029472827911377, + "learning_rate": 9.581378659895494e-06, + "loss": 0.0955, + "step": 19375 + }, + { + "epoch": 52.79564032697548, + "grad_norm": 3.5107131004333496, + "learning_rate": 9.580496940488806e-06, + "loss": 0.1079, + "step": 19376 + }, + { + "epoch": 52.798365122615806, + "grad_norm": 7.501389503479004, + "learning_rate": 9.579615224349195e-06, + "loss": 0.2101, + "step": 19377 + }, + { + "epoch": 52.80108991825613, + "grad_norm": 3.9385881423950195, + "learning_rate": 9.578733511483527e-06, + "loss": 0.0731, + "step": 19378 + }, + { + "epoch": 52.80381471389646, + "grad_norm": 4.246493339538574, + "learning_rate": 9.577851801898669e-06, + "loss": 0.1004, + "step": 19379 + }, + { + "epoch": 52.80653950953678, + "grad_norm": 4.60960578918457, + "learning_rate": 9.57697009560149e-06, + "loss": 0.2342, + "step": 19380 + }, + { + "epoch": 52.80926430517711, + "grad_norm": 3.791977643966675, + "learning_rate": 9.57608839259885e-06, + "loss": 0.2611, + "step": 19381 + }, + { + "epoch": 52.81198910081744, + "grad_norm": 4.869720935821533, + "learning_rate": 9.575206692897624e-06, + "loss": 0.2234, + "step": 19382 + }, + { + "epoch": 52.81471389645777, + "grad_norm": 4.54078483581543, + "learning_rate": 9.574324996504669e-06, + "loss": 0.1507, + "step": 19383 + }, + { + "epoch": 52.817438692098094, + "grad_norm": 4.842339038848877, + "learning_rate": 9.573443303426861e-06, + "loss": 0.1372, + "step": 19384 + }, + { + "epoch": 52.82016348773842, + "grad_norm": 5.749547481536865, + "learning_rate": 9.572561613671063e-06, + "loss": 0.1336, + "step": 19385 + }, + { + "epoch": 52.822888283378745, + "grad_norm": 4.521557807922363, + "learning_rate": 9.571679927244141e-06, + "loss": 0.305, + "step": 19386 + }, + { + "epoch": 52.82561307901907, + "grad_norm": 4.607681751251221, + "learning_rate": 9.570798244152962e-06, + "loss": 0.1954, + "step": 19387 + }, + { + "epoch": 52.828337874659404, + "grad_norm": 4.482492446899414, + "learning_rate": 9.569916564404392e-06, + "loss": 0.0844, + "step": 19388 + }, + { + "epoch": 52.83106267029973, + "grad_norm": 3.874396324157715, + "learning_rate": 9.5690348880053e-06, + "loss": 0.1349, + "step": 19389 + }, + { + "epoch": 52.833787465940055, + "grad_norm": 3.666623592376709, + "learning_rate": 9.568153214962548e-06, + "loss": 0.0805, + "step": 19390 + }, + { + "epoch": 52.83651226158038, + "grad_norm": 4.0994553565979, + "learning_rate": 9.567271545283008e-06, + "loss": 0.1871, + "step": 19391 + }, + { + "epoch": 52.83923705722071, + "grad_norm": 3.9918689727783203, + "learning_rate": 9.566389878973539e-06, + "loss": 0.0865, + "step": 19392 + }, + { + "epoch": 52.84196185286103, + "grad_norm": 5.492431640625, + "learning_rate": 9.565508216041015e-06, + "loss": 0.1218, + "step": 19393 + }, + { + "epoch": 52.844686648501366, + "grad_norm": 5.203312397003174, + "learning_rate": 9.564626556492297e-06, + "loss": 0.0878, + "step": 19394 + }, + { + "epoch": 52.84741144414169, + "grad_norm": 3.5612733364105225, + "learning_rate": 9.563744900334256e-06, + "loss": 0.1608, + "step": 19395 + }, + { + "epoch": 52.85013623978202, + "grad_norm": 5.559460163116455, + "learning_rate": 9.562863247573753e-06, + "loss": 0.0751, + "step": 19396 + }, + { + "epoch": 52.85286103542234, + "grad_norm": 3.9738035202026367, + "learning_rate": 9.561981598217658e-06, + "loss": 0.245, + "step": 19397 + }, + { + "epoch": 52.85558583106267, + "grad_norm": 3.7084290981292725, + "learning_rate": 9.561099952272835e-06, + "loss": 0.0937, + "step": 19398 + }, + { + "epoch": 52.858310626702995, + "grad_norm": 5.085404396057129, + "learning_rate": 9.560218309746154e-06, + "loss": 0.1895, + "step": 19399 + }, + { + "epoch": 52.86103542234333, + "grad_norm": 3.99646258354187, + "learning_rate": 9.559336670644472e-06, + "loss": 0.1783, + "step": 19400 + }, + { + "epoch": 52.86376021798365, + "grad_norm": 5.141168117523193, + "learning_rate": 9.558455034974667e-06, + "loss": 0.118, + "step": 19401 + }, + { + "epoch": 52.86648501362398, + "grad_norm": 3.759382486343384, + "learning_rate": 9.5575734027436e-06, + "loss": 0.1975, + "step": 19402 + }, + { + "epoch": 52.869209809264305, + "grad_norm": 4.657748222351074, + "learning_rate": 9.556691773958137e-06, + "loss": 0.0998, + "step": 19403 + }, + { + "epoch": 52.87193460490463, + "grad_norm": 4.618873119354248, + "learning_rate": 9.555810148625144e-06, + "loss": 0.2024, + "step": 19404 + }, + { + "epoch": 52.87465940054496, + "grad_norm": 4.090301513671875, + "learning_rate": 9.55492852675149e-06, + "loss": 0.1703, + "step": 19405 + }, + { + "epoch": 52.87738419618529, + "grad_norm": 5.711353778839111, + "learning_rate": 9.554046908344034e-06, + "loss": 0.0974, + "step": 19406 + }, + { + "epoch": 52.880108991825615, + "grad_norm": 5.343455791473389, + "learning_rate": 9.55316529340965e-06, + "loss": 0.1682, + "step": 19407 + }, + { + "epoch": 52.88283378746594, + "grad_norm": 4.769092082977295, + "learning_rate": 9.552283681955196e-06, + "loss": 0.1935, + "step": 19408 + }, + { + "epoch": 52.88555858310627, + "grad_norm": 3.6172735691070557, + "learning_rate": 9.551402073987547e-06, + "loss": 0.1412, + "step": 19409 + }, + { + "epoch": 52.88828337874659, + "grad_norm": 4.08225154876709, + "learning_rate": 9.55052046951356e-06, + "loss": 0.1674, + "step": 19410 + }, + { + "epoch": 52.89100817438692, + "grad_norm": 6.741689205169678, + "learning_rate": 9.549638868540108e-06, + "loss": 0.1482, + "step": 19411 + }, + { + "epoch": 52.89373297002725, + "grad_norm": 4.846926212310791, + "learning_rate": 9.548757271074053e-06, + "loss": 0.1357, + "step": 19412 + }, + { + "epoch": 52.89645776566758, + "grad_norm": 6.184783458709717, + "learning_rate": 9.547875677122262e-06, + "loss": 0.1598, + "step": 19413 + }, + { + "epoch": 52.8991825613079, + "grad_norm": 5.16526460647583, + "learning_rate": 9.5469940866916e-06, + "loss": 0.1519, + "step": 19414 + }, + { + "epoch": 52.90190735694823, + "grad_norm": 3.609684467315674, + "learning_rate": 9.546112499788935e-06, + "loss": 0.0773, + "step": 19415 + }, + { + "epoch": 52.904632152588555, + "grad_norm": 5.692165851593018, + "learning_rate": 9.545230916421129e-06, + "loss": 0.1726, + "step": 19416 + }, + { + "epoch": 52.90735694822888, + "grad_norm": 4.304907321929932, + "learning_rate": 9.544349336595049e-06, + "loss": 0.1301, + "step": 19417 + }, + { + "epoch": 52.91008174386921, + "grad_norm": 5.129548072814941, + "learning_rate": 9.543467760317565e-06, + "loss": 0.1788, + "step": 19418 + }, + { + "epoch": 52.91280653950954, + "grad_norm": 3.5996346473693848, + "learning_rate": 9.542586187595537e-06, + "loss": 0.127, + "step": 19419 + }, + { + "epoch": 52.915531335149865, + "grad_norm": 5.412356376647949, + "learning_rate": 9.541704618435834e-06, + "loss": 0.2205, + "step": 19420 + }, + { + "epoch": 52.91825613079019, + "grad_norm": 3.9680113792419434, + "learning_rate": 9.540823052845323e-06, + "loss": 0.1297, + "step": 19421 + }, + { + "epoch": 52.920980926430516, + "grad_norm": 3.8879904747009277, + "learning_rate": 9.539941490830863e-06, + "loss": 0.2313, + "step": 19422 + }, + { + "epoch": 52.92370572207084, + "grad_norm": 3.4496006965637207, + "learning_rate": 9.539059932399328e-06, + "loss": 0.1018, + "step": 19423 + }, + { + "epoch": 52.926430517711175, + "grad_norm": 3.728367328643799, + "learning_rate": 9.538178377557577e-06, + "loss": 0.195, + "step": 19424 + }, + { + "epoch": 52.9291553133515, + "grad_norm": 4.723453044891357, + "learning_rate": 9.53729682631248e-06, + "loss": 0.105, + "step": 19425 + }, + { + "epoch": 52.93188010899183, + "grad_norm": 4.525905609130859, + "learning_rate": 9.536415278670897e-06, + "loss": 0.0872, + "step": 19426 + }, + { + "epoch": 52.93460490463215, + "grad_norm": 4.863429546356201, + "learning_rate": 9.5355337346397e-06, + "loss": 0.2055, + "step": 19427 + }, + { + "epoch": 52.93732970027248, + "grad_norm": 4.197471618652344, + "learning_rate": 9.53465219422575e-06, + "loss": 0.2584, + "step": 19428 + }, + { + "epoch": 52.940054495912804, + "grad_norm": 4.145512580871582, + "learning_rate": 9.533770657435914e-06, + "loss": 0.0946, + "step": 19429 + }, + { + "epoch": 52.94277929155314, + "grad_norm": 4.528237342834473, + "learning_rate": 9.532889124277057e-06, + "loss": 0.2962, + "step": 19430 + }, + { + "epoch": 52.94550408719346, + "grad_norm": 4.709898948669434, + "learning_rate": 9.532007594756046e-06, + "loss": 0.1474, + "step": 19431 + }, + { + "epoch": 52.94822888283379, + "grad_norm": 5.081605911254883, + "learning_rate": 9.531126068879742e-06, + "loss": 0.1412, + "step": 19432 + }, + { + "epoch": 52.950953678474114, + "grad_norm": 8.18087387084961, + "learning_rate": 9.530244546655016e-06, + "loss": 0.2135, + "step": 19433 + }, + { + "epoch": 52.95367847411444, + "grad_norm": 3.8935437202453613, + "learning_rate": 9.529363028088725e-06, + "loss": 0.0655, + "step": 19434 + }, + { + "epoch": 52.956403269754766, + "grad_norm": 4.755772113800049, + "learning_rate": 9.528481513187744e-06, + "loss": 0.127, + "step": 19435 + }, + { + "epoch": 52.95912806539509, + "grad_norm": 4.46189546585083, + "learning_rate": 9.527600001958933e-06, + "loss": 0.1729, + "step": 19436 + }, + { + "epoch": 52.961852861035425, + "grad_norm": 8.863527297973633, + "learning_rate": 9.526718494409158e-06, + "loss": 0.158, + "step": 19437 + }, + { + "epoch": 52.96457765667575, + "grad_norm": 3.593932867050171, + "learning_rate": 9.525836990545283e-06, + "loss": 0.0814, + "step": 19438 + }, + { + "epoch": 52.967302452316076, + "grad_norm": 6.234457492828369, + "learning_rate": 9.524955490374176e-06, + "loss": 0.1996, + "step": 19439 + }, + { + "epoch": 52.9700272479564, + "grad_norm": 3.7607927322387695, + "learning_rate": 9.5240739939027e-06, + "loss": 0.1373, + "step": 19440 + }, + { + "epoch": 52.97275204359673, + "grad_norm": 3.821132183074951, + "learning_rate": 9.52319250113772e-06, + "loss": 0.1124, + "step": 19441 + }, + { + "epoch": 52.97547683923706, + "grad_norm": 4.514087200164795, + "learning_rate": 9.522311012086103e-06, + "loss": 0.121, + "step": 19442 + }, + { + "epoch": 52.97820163487739, + "grad_norm": 7.508065700531006, + "learning_rate": 9.52142952675471e-06, + "loss": 0.1596, + "step": 19443 + }, + { + "epoch": 52.98092643051771, + "grad_norm": 4.979015350341797, + "learning_rate": 9.52054804515041e-06, + "loss": 0.2283, + "step": 19444 + }, + { + "epoch": 52.98365122615804, + "grad_norm": 4.485701084136963, + "learning_rate": 9.519666567280067e-06, + "loss": 0.1493, + "step": 19445 + }, + { + "epoch": 52.986376021798364, + "grad_norm": 3.7773795127868652, + "learning_rate": 9.518785093150543e-06, + "loss": 0.0965, + "step": 19446 + }, + { + "epoch": 52.98910081743869, + "grad_norm": 3.1339917182922363, + "learning_rate": 9.517903622768707e-06, + "loss": 0.1167, + "step": 19447 + }, + { + "epoch": 52.991825613079016, + "grad_norm": 4.603447914123535, + "learning_rate": 9.51702215614142e-06, + "loss": 0.0751, + "step": 19448 + }, + { + "epoch": 52.99455040871935, + "grad_norm": 4.457182884216309, + "learning_rate": 9.516140693275554e-06, + "loss": 0.1444, + "step": 19449 + }, + { + "epoch": 52.997275204359674, + "grad_norm": 5.096701145172119, + "learning_rate": 9.515259234177964e-06, + "loss": 0.1583, + "step": 19450 + }, + { + "epoch": 53.0, + "grad_norm": 4.649552345275879, + "learning_rate": 9.514377778855521e-06, + "loss": 0.2083, + "step": 19451 + }, + { + "epoch": 53.002724795640326, + "grad_norm": 4.393429279327393, + "learning_rate": 9.513496327315085e-06, + "loss": 0.0915, + "step": 19452 + }, + { + "epoch": 53.00544959128065, + "grad_norm": 3.946039915084839, + "learning_rate": 9.512614879563525e-06, + "loss": 0.0755, + "step": 19453 + }, + { + "epoch": 53.00817438692098, + "grad_norm": 4.5312113761901855, + "learning_rate": 9.511733435607709e-06, + "loss": 0.2359, + "step": 19454 + }, + { + "epoch": 53.01089918256131, + "grad_norm": 4.726602554321289, + "learning_rate": 9.510851995454494e-06, + "loss": 0.2065, + "step": 19455 + }, + { + "epoch": 53.013623978201636, + "grad_norm": 4.218317985534668, + "learning_rate": 9.50997055911075e-06, + "loss": 0.0797, + "step": 19456 + }, + { + "epoch": 53.01634877384196, + "grad_norm": 4.34600305557251, + "learning_rate": 9.509089126583336e-06, + "loss": 0.1123, + "step": 19457 + }, + { + "epoch": 53.01907356948229, + "grad_norm": 4.702160835266113, + "learning_rate": 9.508207697879123e-06, + "loss": 0.0871, + "step": 19458 + }, + { + "epoch": 53.02179836512261, + "grad_norm": 3.6047987937927246, + "learning_rate": 9.507326273004972e-06, + "loss": 0.0744, + "step": 19459 + }, + { + "epoch": 53.02452316076294, + "grad_norm": 4.602707386016846, + "learning_rate": 9.50644485196775e-06, + "loss": 0.1927, + "step": 19460 + }, + { + "epoch": 53.02724795640327, + "grad_norm": 5.076196670532227, + "learning_rate": 9.505563434774317e-06, + "loss": 0.1479, + "step": 19461 + }, + { + "epoch": 53.0299727520436, + "grad_norm": 8.3142671585083, + "learning_rate": 9.504682021431541e-06, + "loss": 0.1404, + "step": 19462 + }, + { + "epoch": 53.032697547683924, + "grad_norm": 4.3612751960754395, + "learning_rate": 9.503800611946285e-06, + "loss": 0.0814, + "step": 19463 + }, + { + "epoch": 53.03542234332425, + "grad_norm": 3.6033620834350586, + "learning_rate": 9.502919206325415e-06, + "loss": 0.2357, + "step": 19464 + }, + { + "epoch": 53.038147138964575, + "grad_norm": 4.380779266357422, + "learning_rate": 9.502037804575793e-06, + "loss": 0.1751, + "step": 19465 + }, + { + "epoch": 53.0408719346049, + "grad_norm": 4.791330814361572, + "learning_rate": 9.501156406704284e-06, + "loss": 0.2727, + "step": 19466 + }, + { + "epoch": 53.043596730245234, + "grad_norm": 4.086306571960449, + "learning_rate": 9.500275012717754e-06, + "loss": 0.1402, + "step": 19467 + }, + { + "epoch": 53.04632152588556, + "grad_norm": 3.57738995552063, + "learning_rate": 9.499393622623064e-06, + "loss": 0.2562, + "step": 19468 + }, + { + "epoch": 53.049046321525886, + "grad_norm": 4.554544925689697, + "learning_rate": 9.49851223642708e-06, + "loss": 0.2626, + "step": 19469 + }, + { + "epoch": 53.05177111716621, + "grad_norm": 5.000865936279297, + "learning_rate": 9.49763085413667e-06, + "loss": 0.2058, + "step": 19470 + }, + { + "epoch": 53.05449591280654, + "grad_norm": 6.769252300262451, + "learning_rate": 9.496749475758692e-06, + "loss": 0.1646, + "step": 19471 + }, + { + "epoch": 53.05722070844686, + "grad_norm": 4.432536602020264, + "learning_rate": 9.495868101300015e-06, + "loss": 0.1401, + "step": 19472 + }, + { + "epoch": 53.059945504087196, + "grad_norm": 10.35960865020752, + "learning_rate": 9.4949867307675e-06, + "loss": 0.182, + "step": 19473 + }, + { + "epoch": 53.06267029972752, + "grad_norm": 3.592966318130493, + "learning_rate": 9.494105364168014e-06, + "loss": 0.2652, + "step": 19474 + }, + { + "epoch": 53.06539509536785, + "grad_norm": 4.498920440673828, + "learning_rate": 9.493224001508416e-06, + "loss": 0.1544, + "step": 19475 + }, + { + "epoch": 53.06811989100817, + "grad_norm": 4.001643657684326, + "learning_rate": 9.492342642795576e-06, + "loss": 0.061, + "step": 19476 + }, + { + "epoch": 53.0708446866485, + "grad_norm": 4.065978050231934, + "learning_rate": 9.491461288036353e-06, + "loss": 0.1452, + "step": 19477 + }, + { + "epoch": 53.073569482288825, + "grad_norm": 3.848238468170166, + "learning_rate": 9.490579937237615e-06, + "loss": 0.2558, + "step": 19478 + }, + { + "epoch": 53.07629427792916, + "grad_norm": 4.34864616394043, + "learning_rate": 9.489698590406223e-06, + "loss": 0.2458, + "step": 19479 + }, + { + "epoch": 53.079019073569484, + "grad_norm": 3.9366304874420166, + "learning_rate": 9.488817247549043e-06, + "loss": 0.0556, + "step": 19480 + }, + { + "epoch": 53.08174386920981, + "grad_norm": 3.9686615467071533, + "learning_rate": 9.487935908672936e-06, + "loss": 0.1271, + "step": 19481 + }, + { + "epoch": 53.084468664850135, + "grad_norm": 4.87516975402832, + "learning_rate": 9.487054573784769e-06, + "loss": 0.2584, + "step": 19482 + }, + { + "epoch": 53.08719346049046, + "grad_norm": 3.477492332458496, + "learning_rate": 9.486173242891404e-06, + "loss": 0.128, + "step": 19483 + }, + { + "epoch": 53.08991825613079, + "grad_norm": 3.921304225921631, + "learning_rate": 9.485291915999706e-06, + "loss": 0.0912, + "step": 19484 + }, + { + "epoch": 53.09264305177112, + "grad_norm": 4.01481294631958, + "learning_rate": 9.484410593116536e-06, + "loss": 0.1633, + "step": 19485 + }, + { + "epoch": 53.095367847411445, + "grad_norm": 5.032939910888672, + "learning_rate": 9.483529274248758e-06, + "loss": 0.167, + "step": 19486 + }, + { + "epoch": 53.09809264305177, + "grad_norm": 3.700946807861328, + "learning_rate": 9.48264795940324e-06, + "loss": 0.0914, + "step": 19487 + }, + { + "epoch": 53.1008174386921, + "grad_norm": 4.320295810699463, + "learning_rate": 9.481766648586844e-06, + "loss": 0.2146, + "step": 19488 + }, + { + "epoch": 53.10354223433242, + "grad_norm": 4.7659783363342285, + "learning_rate": 9.48088534180643e-06, + "loss": 0.1247, + "step": 19489 + }, + { + "epoch": 53.10626702997275, + "grad_norm": 3.985541343688965, + "learning_rate": 9.480004039068868e-06, + "loss": 0.1365, + "step": 19490 + }, + { + "epoch": 53.10899182561308, + "grad_norm": 3.8085134029388428, + "learning_rate": 9.479122740381015e-06, + "loss": 0.1226, + "step": 19491 + }, + { + "epoch": 53.11171662125341, + "grad_norm": 4.460117816925049, + "learning_rate": 9.478241445749739e-06, + "loss": 0.11, + "step": 19492 + }, + { + "epoch": 53.11444141689373, + "grad_norm": 4.521548748016357, + "learning_rate": 9.477360155181902e-06, + "loss": 0.2341, + "step": 19493 + }, + { + "epoch": 53.11716621253406, + "grad_norm": 4.03731632232666, + "learning_rate": 9.476478868684366e-06, + "loss": 0.1513, + "step": 19494 + }, + { + "epoch": 53.119891008174385, + "grad_norm": 4.526203155517578, + "learning_rate": 9.475597586263996e-06, + "loss": 0.155, + "step": 19495 + }, + { + "epoch": 53.12261580381471, + "grad_norm": 14.319269180297852, + "learning_rate": 9.474716307927657e-06, + "loss": 0.0924, + "step": 19496 + }, + { + "epoch": 53.12534059945504, + "grad_norm": 4.00183629989624, + "learning_rate": 9.473835033682209e-06, + "loss": 0.1389, + "step": 19497 + }, + { + "epoch": 53.12806539509537, + "grad_norm": 3.2636046409606934, + "learning_rate": 9.472953763534517e-06, + "loss": 0.067, + "step": 19498 + }, + { + "epoch": 53.130790190735695, + "grad_norm": 3.163428783416748, + "learning_rate": 9.472072497491443e-06, + "loss": 0.0709, + "step": 19499 + }, + { + "epoch": 53.13351498637602, + "grad_norm": 4.80781364440918, + "learning_rate": 9.471191235559853e-06, + "loss": 0.1009, + "step": 19500 + }, + { + "epoch": 53.13623978201635, + "grad_norm": 5.041027069091797, + "learning_rate": 9.470309977746607e-06, + "loss": 0.1678, + "step": 19501 + }, + { + "epoch": 53.13896457765667, + "grad_norm": 5.947676181793213, + "learning_rate": 9.46942872405857e-06, + "loss": 0.219, + "step": 19502 + }, + { + "epoch": 53.141689373297005, + "grad_norm": 4.79503059387207, + "learning_rate": 9.468547474502603e-06, + "loss": 0.1351, + "step": 19503 + }, + { + "epoch": 53.14441416893733, + "grad_norm": 3.2360799312591553, + "learning_rate": 9.467666229085574e-06, + "loss": 0.1247, + "step": 19504 + }, + { + "epoch": 53.14713896457766, + "grad_norm": 4.616093635559082, + "learning_rate": 9.466784987814345e-06, + "loss": 0.1742, + "step": 19505 + }, + { + "epoch": 53.14986376021798, + "grad_norm": 3.4572880268096924, + "learning_rate": 9.465903750695774e-06, + "loss": 0.0791, + "step": 19506 + }, + { + "epoch": 53.15258855585831, + "grad_norm": 5.055361270904541, + "learning_rate": 9.465022517736728e-06, + "loss": 0.1116, + "step": 19507 + }, + { + "epoch": 53.155313351498634, + "grad_norm": 4.294522762298584, + "learning_rate": 9.464141288944072e-06, + "loss": 0.1808, + "step": 19508 + }, + { + "epoch": 53.15803814713897, + "grad_norm": 3.945244550704956, + "learning_rate": 9.463260064324663e-06, + "loss": 0.12, + "step": 19509 + }, + { + "epoch": 53.16076294277929, + "grad_norm": 5.410464763641357, + "learning_rate": 9.46237884388537e-06, + "loss": 0.0788, + "step": 19510 + }, + { + "epoch": 53.16348773841962, + "grad_norm": 8.153961181640625, + "learning_rate": 9.461497627633051e-06, + "loss": 0.1865, + "step": 19511 + }, + { + "epoch": 53.166212534059945, + "grad_norm": 4.335062026977539, + "learning_rate": 9.460616415574575e-06, + "loss": 0.2073, + "step": 19512 + }, + { + "epoch": 53.16893732970027, + "grad_norm": 4.389134407043457, + "learning_rate": 9.459735207716796e-06, + "loss": 0.0822, + "step": 19513 + }, + { + "epoch": 53.171662125340596, + "grad_norm": 3.9332547187805176, + "learning_rate": 9.458854004066586e-06, + "loss": 0.0663, + "step": 19514 + }, + { + "epoch": 53.17438692098093, + "grad_norm": 4.0098676681518555, + "learning_rate": 9.457972804630801e-06, + "loss": 0.0951, + "step": 19515 + }, + { + "epoch": 53.177111716621255, + "grad_norm": 3.5633816719055176, + "learning_rate": 9.457091609416309e-06, + "loss": 0.0736, + "step": 19516 + }, + { + "epoch": 53.17983651226158, + "grad_norm": 4.113879203796387, + "learning_rate": 9.456210418429968e-06, + "loss": 0.1804, + "step": 19517 + }, + { + "epoch": 53.182561307901906, + "grad_norm": 4.0399861335754395, + "learning_rate": 9.455329231678644e-06, + "loss": 0.2328, + "step": 19518 + }, + { + "epoch": 53.18528610354223, + "grad_norm": 4.422402381896973, + "learning_rate": 9.454448049169195e-06, + "loss": 0.2042, + "step": 19519 + }, + { + "epoch": 53.18801089918256, + "grad_norm": 3.637037754058838, + "learning_rate": 9.453566870908488e-06, + "loss": 0.2312, + "step": 19520 + }, + { + "epoch": 53.19073569482289, + "grad_norm": 5.453971862792969, + "learning_rate": 9.452685696903387e-06, + "loss": 0.1949, + "step": 19521 + }, + { + "epoch": 53.19346049046322, + "grad_norm": 3.9778435230255127, + "learning_rate": 9.45180452716075e-06, + "loss": 0.1529, + "step": 19522 + }, + { + "epoch": 53.19618528610354, + "grad_norm": 6.233001708984375, + "learning_rate": 9.450923361687443e-06, + "loss": 0.1263, + "step": 19523 + }, + { + "epoch": 53.19891008174387, + "grad_norm": 4.244566917419434, + "learning_rate": 9.450042200490328e-06, + "loss": 0.2222, + "step": 19524 + }, + { + "epoch": 53.201634877384194, + "grad_norm": 4.423482894897461, + "learning_rate": 9.449161043576266e-06, + "loss": 0.2106, + "step": 19525 + }, + { + "epoch": 53.20435967302452, + "grad_norm": 4.039098262786865, + "learning_rate": 9.44827989095212e-06, + "loss": 0.2248, + "step": 19526 + }, + { + "epoch": 53.20708446866485, + "grad_norm": 2.4821112155914307, + "learning_rate": 9.447398742624754e-06, + "loss": 0.0965, + "step": 19527 + }, + { + "epoch": 53.20980926430518, + "grad_norm": 3.9655888080596924, + "learning_rate": 9.446517598601026e-06, + "loss": 0.1632, + "step": 19528 + }, + { + "epoch": 53.212534059945504, + "grad_norm": 3.9284117221832275, + "learning_rate": 9.445636458887804e-06, + "loss": 0.1691, + "step": 19529 + }, + { + "epoch": 53.21525885558583, + "grad_norm": 6.506946086883545, + "learning_rate": 9.444755323491944e-06, + "loss": 0.1877, + "step": 19530 + }, + { + "epoch": 53.217983651226156, + "grad_norm": 3.3470606803894043, + "learning_rate": 9.443874192420312e-06, + "loss": 0.1937, + "step": 19531 + }, + { + "epoch": 53.22070844686648, + "grad_norm": 4.093039035797119, + "learning_rate": 9.442993065679773e-06, + "loss": 0.0557, + "step": 19532 + }, + { + "epoch": 53.223433242506815, + "grad_norm": 3.836261034011841, + "learning_rate": 9.442111943277183e-06, + "loss": 0.1796, + "step": 19533 + }, + { + "epoch": 53.22615803814714, + "grad_norm": 4.765162944793701, + "learning_rate": 9.44123082521941e-06, + "loss": 0.122, + "step": 19534 + }, + { + "epoch": 53.228882833787466, + "grad_norm": 4.036040782928467, + "learning_rate": 9.440349711513311e-06, + "loss": 0.0643, + "step": 19535 + }, + { + "epoch": 53.23160762942779, + "grad_norm": 5.566751480102539, + "learning_rate": 9.439468602165752e-06, + "loss": 0.1608, + "step": 19536 + }, + { + "epoch": 53.23433242506812, + "grad_norm": 3.435711622238159, + "learning_rate": 9.438587497183592e-06, + "loss": 0.1056, + "step": 19537 + }, + { + "epoch": 53.237057220708444, + "grad_norm": 4.683530807495117, + "learning_rate": 9.437706396573693e-06, + "loss": 0.1333, + "step": 19538 + }, + { + "epoch": 53.23978201634878, + "grad_norm": 3.80041766166687, + "learning_rate": 9.43682530034292e-06, + "loss": 0.24, + "step": 19539 + }, + { + "epoch": 53.2425068119891, + "grad_norm": 4.056492805480957, + "learning_rate": 9.435944208498135e-06, + "loss": 0.2451, + "step": 19540 + }, + { + "epoch": 53.24523160762943, + "grad_norm": 3.077631711959839, + "learning_rate": 9.435063121046198e-06, + "loss": 0.1398, + "step": 19541 + }, + { + "epoch": 53.247956403269754, + "grad_norm": 5.0171990394592285, + "learning_rate": 9.43418203799397e-06, + "loss": 0.0593, + "step": 19542 + }, + { + "epoch": 53.25068119891008, + "grad_norm": 3.7705698013305664, + "learning_rate": 9.433300959348317e-06, + "loss": 0.1593, + "step": 19543 + }, + { + "epoch": 53.253405994550405, + "grad_norm": 17.04795265197754, + "learning_rate": 9.432419885116094e-06, + "loss": 0.1384, + "step": 19544 + }, + { + "epoch": 53.25613079019074, + "grad_norm": 3.9089910984039307, + "learning_rate": 9.43153881530417e-06, + "loss": 0.0772, + "step": 19545 + }, + { + "epoch": 53.258855585831064, + "grad_norm": 4.638715744018555, + "learning_rate": 9.4306577499194e-06, + "loss": 0.1451, + "step": 19546 + }, + { + "epoch": 53.26158038147139, + "grad_norm": 3.2247910499572754, + "learning_rate": 9.429776688968654e-06, + "loss": 0.0847, + "step": 19547 + }, + { + "epoch": 53.264305177111716, + "grad_norm": 3.8689346313476562, + "learning_rate": 9.428895632458785e-06, + "loss": 0.171, + "step": 19548 + }, + { + "epoch": 53.26702997275204, + "grad_norm": 4.553506851196289, + "learning_rate": 9.428014580396659e-06, + "loss": 0.1897, + "step": 19549 + }, + { + "epoch": 53.26975476839237, + "grad_norm": 4.09987211227417, + "learning_rate": 9.427133532789137e-06, + "loss": 0.1578, + "step": 19550 + }, + { + "epoch": 53.2724795640327, + "grad_norm": 3.6810247898101807, + "learning_rate": 9.426252489643082e-06, + "loss": 0.1001, + "step": 19551 + }, + { + "epoch": 53.275204359673026, + "grad_norm": 4.582121849060059, + "learning_rate": 9.425371450965352e-06, + "loss": 0.1994, + "step": 19552 + }, + { + "epoch": 53.27792915531335, + "grad_norm": 2.8743526935577393, + "learning_rate": 9.424490416762811e-06, + "loss": 0.0879, + "step": 19553 + }, + { + "epoch": 53.28065395095368, + "grad_norm": 4.316268444061279, + "learning_rate": 9.423609387042322e-06, + "loss": 0.1325, + "step": 19554 + }, + { + "epoch": 53.283378746594, + "grad_norm": 5.627859115600586, + "learning_rate": 9.42272836181074e-06, + "loss": 0.2588, + "step": 19555 + }, + { + "epoch": 53.28610354223433, + "grad_norm": 5.127203464508057, + "learning_rate": 9.421847341074933e-06, + "loss": 0.2171, + "step": 19556 + }, + { + "epoch": 53.28882833787466, + "grad_norm": 4.550676345825195, + "learning_rate": 9.420966324841762e-06, + "loss": 0.1611, + "step": 19557 + }, + { + "epoch": 53.29155313351499, + "grad_norm": 3.104943037033081, + "learning_rate": 9.420085313118086e-06, + "loss": 0.0543, + "step": 19558 + }, + { + "epoch": 53.294277929155314, + "grad_norm": 3.6725471019744873, + "learning_rate": 9.419204305910769e-06, + "loss": 0.2162, + "step": 19559 + }, + { + "epoch": 53.29700272479564, + "grad_norm": 3.9303996562957764, + "learning_rate": 9.418323303226667e-06, + "loss": 0.0666, + "step": 19560 + }, + { + "epoch": 53.299727520435965, + "grad_norm": 4.273158550262451, + "learning_rate": 9.417442305072647e-06, + "loss": 0.0828, + "step": 19561 + }, + { + "epoch": 53.30245231607629, + "grad_norm": 4.918844699859619, + "learning_rate": 9.416561311455565e-06, + "loss": 0.0793, + "step": 19562 + }, + { + "epoch": 53.305177111716624, + "grad_norm": 6.09805154800415, + "learning_rate": 9.415680322382289e-06, + "loss": 0.123, + "step": 19563 + }, + { + "epoch": 53.30790190735695, + "grad_norm": 4.17274284362793, + "learning_rate": 9.41479933785967e-06, + "loss": 0.0983, + "step": 19564 + }, + { + "epoch": 53.310626702997276, + "grad_norm": 4.336362838745117, + "learning_rate": 9.413918357894579e-06, + "loss": 0.0565, + "step": 19565 + }, + { + "epoch": 53.3133514986376, + "grad_norm": 5.13599967956543, + "learning_rate": 9.41303738249387e-06, + "loss": 0.3572, + "step": 19566 + }, + { + "epoch": 53.31607629427793, + "grad_norm": 3.890084743499756, + "learning_rate": 9.41215641166441e-06, + "loss": 0.167, + "step": 19567 + }, + { + "epoch": 53.31880108991825, + "grad_norm": 3.838386297225952, + "learning_rate": 9.411275445413055e-06, + "loss": 0.2074, + "step": 19568 + }, + { + "epoch": 53.321525885558586, + "grad_norm": 3.0424602031707764, + "learning_rate": 9.41039448374667e-06, + "loss": 0.0788, + "step": 19569 + }, + { + "epoch": 53.32425068119891, + "grad_norm": 3.4019460678100586, + "learning_rate": 9.409513526672111e-06, + "loss": 0.0977, + "step": 19570 + }, + { + "epoch": 53.32697547683924, + "grad_norm": 4.269498825073242, + "learning_rate": 9.408632574196245e-06, + "loss": 0.2103, + "step": 19571 + }, + { + "epoch": 53.32970027247956, + "grad_norm": 6.106554985046387, + "learning_rate": 9.407751626325922e-06, + "loss": 0.1869, + "step": 19572 + }, + { + "epoch": 53.33242506811989, + "grad_norm": 5.24274206161499, + "learning_rate": 9.406870683068017e-06, + "loss": 0.1613, + "step": 19573 + }, + { + "epoch": 53.335149863760215, + "grad_norm": 3.7461729049682617, + "learning_rate": 9.40598974442938e-06, + "loss": 0.086, + "step": 19574 + }, + { + "epoch": 53.33787465940055, + "grad_norm": 5.346202850341797, + "learning_rate": 9.405108810416881e-06, + "loss": 0.0685, + "step": 19575 + }, + { + "epoch": 53.34059945504087, + "grad_norm": 5.928539276123047, + "learning_rate": 9.404227881037372e-06, + "loss": 0.1774, + "step": 19576 + }, + { + "epoch": 53.3433242506812, + "grad_norm": 4.118345737457275, + "learning_rate": 9.40334695629772e-06, + "loss": 0.1966, + "step": 19577 + }, + { + "epoch": 53.346049046321525, + "grad_norm": 4.071616172790527, + "learning_rate": 9.402466036204779e-06, + "loss": 0.0869, + "step": 19578 + }, + { + "epoch": 53.34877384196185, + "grad_norm": 4.851202011108398, + "learning_rate": 9.401585120765416e-06, + "loss": 0.0747, + "step": 19579 + }, + { + "epoch": 53.35149863760218, + "grad_norm": 5.652044773101807, + "learning_rate": 9.400704209986488e-06, + "loss": 0.1734, + "step": 19580 + }, + { + "epoch": 53.35422343324251, + "grad_norm": 4.022444248199463, + "learning_rate": 9.399823303874856e-06, + "loss": 0.0729, + "step": 19581 + }, + { + "epoch": 53.356948228882835, + "grad_norm": 3.748548746109009, + "learning_rate": 9.398942402437382e-06, + "loss": 0.212, + "step": 19582 + }, + { + "epoch": 53.35967302452316, + "grad_norm": 3.7141458988189697, + "learning_rate": 9.398061505680925e-06, + "loss": 0.0992, + "step": 19583 + }, + { + "epoch": 53.36239782016349, + "grad_norm": 3.743070125579834, + "learning_rate": 9.397180613612343e-06, + "loss": 0.0816, + "step": 19584 + }, + { + "epoch": 53.36512261580381, + "grad_norm": 3.78251314163208, + "learning_rate": 9.396299726238501e-06, + "loss": 0.0992, + "step": 19585 + }, + { + "epoch": 53.36784741144414, + "grad_norm": 3.9803833961486816, + "learning_rate": 9.395418843566257e-06, + "loss": 0.126, + "step": 19586 + }, + { + "epoch": 53.37057220708447, + "grad_norm": 4.991311550140381, + "learning_rate": 9.394537965602473e-06, + "loss": 0.0616, + "step": 19587 + }, + { + "epoch": 53.3732970027248, + "grad_norm": 4.265721321105957, + "learning_rate": 9.393657092354005e-06, + "loss": 0.1159, + "step": 19588 + }, + { + "epoch": 53.37602179836512, + "grad_norm": 4.968245029449463, + "learning_rate": 9.392776223827715e-06, + "loss": 0.1558, + "step": 19589 + }, + { + "epoch": 53.37874659400545, + "grad_norm": 4.296175479888916, + "learning_rate": 9.391895360030467e-06, + "loss": 0.1086, + "step": 19590 + }, + { + "epoch": 53.381471389645775, + "grad_norm": 5.016697883605957, + "learning_rate": 9.391014500969118e-06, + "loss": 0.136, + "step": 19591 + }, + { + "epoch": 53.3841961852861, + "grad_norm": 4.269606113433838, + "learning_rate": 9.39013364665053e-06, + "loss": 0.2055, + "step": 19592 + }, + { + "epoch": 53.38692098092643, + "grad_norm": 5.176723003387451, + "learning_rate": 9.389252797081558e-06, + "loss": 0.0906, + "step": 19593 + }, + { + "epoch": 53.38964577656676, + "grad_norm": 3.5410618782043457, + "learning_rate": 9.388371952269068e-06, + "loss": 0.1775, + "step": 19594 + }, + { + "epoch": 53.392370572207085, + "grad_norm": 11.931692123413086, + "learning_rate": 9.387491112219917e-06, + "loss": 0.1672, + "step": 19595 + }, + { + "epoch": 53.39509536784741, + "grad_norm": 4.841396331787109, + "learning_rate": 9.386610276940966e-06, + "loss": 0.1384, + "step": 19596 + }, + { + "epoch": 53.39782016348774, + "grad_norm": 3.4168834686279297, + "learning_rate": 9.385729446439074e-06, + "loss": 0.1335, + "step": 19597 + }, + { + "epoch": 53.40054495912806, + "grad_norm": 4.518017768859863, + "learning_rate": 9.384848620721102e-06, + "loss": 0.0872, + "step": 19598 + }, + { + "epoch": 53.403269754768395, + "grad_norm": 3.9464101791381836, + "learning_rate": 9.38396779979391e-06, + "loss": 0.226, + "step": 19599 + }, + { + "epoch": 53.40599455040872, + "grad_norm": 3.6357007026672363, + "learning_rate": 9.383086983664354e-06, + "loss": 0.1953, + "step": 19600 + }, + { + "epoch": 53.40871934604905, + "grad_norm": 3.898745059967041, + "learning_rate": 9.3822061723393e-06, + "loss": 0.1117, + "step": 19601 + }, + { + "epoch": 53.41144414168937, + "grad_norm": 5.000555038452148, + "learning_rate": 9.381325365825601e-06, + "loss": 0.086, + "step": 19602 + }, + { + "epoch": 53.4141689373297, + "grad_norm": 4.185770034790039, + "learning_rate": 9.380444564130124e-06, + "loss": 0.2016, + "step": 19603 + }, + { + "epoch": 53.416893732970024, + "grad_norm": 4.505792140960693, + "learning_rate": 9.379563767259721e-06, + "loss": 0.1441, + "step": 19604 + }, + { + "epoch": 53.41961852861036, + "grad_norm": 5.0290632247924805, + "learning_rate": 9.378682975221258e-06, + "loss": 0.1137, + "step": 19605 + }, + { + "epoch": 53.42234332425068, + "grad_norm": 6.182051181793213, + "learning_rate": 9.37780218802159e-06, + "loss": 0.1923, + "step": 19606 + }, + { + "epoch": 53.42506811989101, + "grad_norm": 4.861679553985596, + "learning_rate": 9.376921405667576e-06, + "loss": 0.1379, + "step": 19607 + }, + { + "epoch": 53.427792915531334, + "grad_norm": 9.390670776367188, + "learning_rate": 9.376040628166084e-06, + "loss": 0.0715, + "step": 19608 + }, + { + "epoch": 53.43051771117166, + "grad_norm": 3.188892364501953, + "learning_rate": 9.375159855523964e-06, + "loss": 0.0807, + "step": 19609 + }, + { + "epoch": 53.433242506811986, + "grad_norm": 4.040568828582764, + "learning_rate": 9.374279087748082e-06, + "loss": 0.1842, + "step": 19610 + }, + { + "epoch": 53.43596730245232, + "grad_norm": 4.385910987854004, + "learning_rate": 9.37339832484529e-06, + "loss": 0.1429, + "step": 19611 + }, + { + "epoch": 53.438692098092645, + "grad_norm": 5.230727672576904, + "learning_rate": 9.372517566822456e-06, + "loss": 0.1741, + "step": 19612 + }, + { + "epoch": 53.44141689373297, + "grad_norm": 3.943782091140747, + "learning_rate": 9.371636813686433e-06, + "loss": 0.1633, + "step": 19613 + }, + { + "epoch": 53.444141689373296, + "grad_norm": 4.666703224182129, + "learning_rate": 9.370756065444083e-06, + "loss": 0.2011, + "step": 19614 + }, + { + "epoch": 53.44686648501362, + "grad_norm": 3.6243550777435303, + "learning_rate": 9.369875322102262e-06, + "loss": 0.1088, + "step": 19615 + }, + { + "epoch": 53.44959128065395, + "grad_norm": 5.502617359161377, + "learning_rate": 9.368994583667835e-06, + "loss": 0.1672, + "step": 19616 + }, + { + "epoch": 53.45231607629428, + "grad_norm": 4.114571571350098, + "learning_rate": 9.368113850147655e-06, + "loss": 0.0948, + "step": 19617 + }, + { + "epoch": 53.45504087193461, + "grad_norm": 4.559849262237549, + "learning_rate": 9.367233121548585e-06, + "loss": 0.1499, + "step": 19618 + }, + { + "epoch": 53.45776566757493, + "grad_norm": 5.137974262237549, + "learning_rate": 9.366352397877485e-06, + "loss": 0.1878, + "step": 19619 + }, + { + "epoch": 53.46049046321526, + "grad_norm": 4.2125139236450195, + "learning_rate": 9.36547167914121e-06, + "loss": 0.168, + "step": 19620 + }, + { + "epoch": 53.463215258855584, + "grad_norm": 4.2992377281188965, + "learning_rate": 9.364590965346622e-06, + "loss": 0.1176, + "step": 19621 + }, + { + "epoch": 53.46594005449591, + "grad_norm": 3.483376979827881, + "learning_rate": 9.363710256500578e-06, + "loss": 0.1051, + "step": 19622 + }, + { + "epoch": 53.46866485013624, + "grad_norm": 4.003507137298584, + "learning_rate": 9.36282955260994e-06, + "loss": 0.0981, + "step": 19623 + }, + { + "epoch": 53.47138964577657, + "grad_norm": 7.440272331237793, + "learning_rate": 9.361948853681562e-06, + "loss": 0.1848, + "step": 19624 + }, + { + "epoch": 53.474114441416894, + "grad_norm": 3.835020065307617, + "learning_rate": 9.361068159722306e-06, + "loss": 0.1417, + "step": 19625 + }, + { + "epoch": 53.47683923705722, + "grad_norm": 9.260590553283691, + "learning_rate": 9.360187470739033e-06, + "loss": 0.0837, + "step": 19626 + }, + { + "epoch": 53.479564032697546, + "grad_norm": 3.928607702255249, + "learning_rate": 9.359306786738598e-06, + "loss": 0.1703, + "step": 19627 + }, + { + "epoch": 53.48228882833787, + "grad_norm": 5.6095051765441895, + "learning_rate": 9.358426107727862e-06, + "loss": 0.153, + "step": 19628 + }, + { + "epoch": 53.485013623978205, + "grad_norm": 5.017398357391357, + "learning_rate": 9.357545433713683e-06, + "loss": 0.1423, + "step": 19629 + }, + { + "epoch": 53.48773841961853, + "grad_norm": 3.781545877456665, + "learning_rate": 9.35666476470292e-06, + "loss": 0.1471, + "step": 19630 + }, + { + "epoch": 53.490463215258856, + "grad_norm": 6.276341438293457, + "learning_rate": 9.35578410070243e-06, + "loss": 0.2157, + "step": 19631 + }, + { + "epoch": 53.49318801089918, + "grad_norm": 5.679474830627441, + "learning_rate": 9.354903441719073e-06, + "loss": 0.2014, + "step": 19632 + }, + { + "epoch": 53.49591280653951, + "grad_norm": 4.954401016235352, + "learning_rate": 9.354022787759707e-06, + "loss": 0.1579, + "step": 19633 + }, + { + "epoch": 53.49863760217983, + "grad_norm": 6.598718166351318, + "learning_rate": 9.353142138831192e-06, + "loss": 0.1546, + "step": 19634 + }, + { + "epoch": 53.50136239782017, + "grad_norm": 7.953682899475098, + "learning_rate": 9.352261494940382e-06, + "loss": 0.0758, + "step": 19635 + }, + { + "epoch": 53.50408719346049, + "grad_norm": 4.217384338378906, + "learning_rate": 9.351380856094142e-06, + "loss": 0.1745, + "step": 19636 + }, + { + "epoch": 53.50681198910082, + "grad_norm": 5.816168308258057, + "learning_rate": 9.350500222299326e-06, + "loss": 0.0973, + "step": 19637 + }, + { + "epoch": 53.509536784741144, + "grad_norm": 3.9512689113616943, + "learning_rate": 9.349619593562793e-06, + "loss": 0.1299, + "step": 19638 + }, + { + "epoch": 53.51226158038147, + "grad_norm": 4.017214775085449, + "learning_rate": 9.348738969891402e-06, + "loss": 0.105, + "step": 19639 + }, + { + "epoch": 53.514986376021795, + "grad_norm": 4.038506507873535, + "learning_rate": 9.34785835129201e-06, + "loss": 0.0985, + "step": 19640 + }, + { + "epoch": 53.51771117166213, + "grad_norm": 4.767246723175049, + "learning_rate": 9.346977737771471e-06, + "loss": 0.1997, + "step": 19641 + }, + { + "epoch": 53.520435967302454, + "grad_norm": 4.974850654602051, + "learning_rate": 9.346097129336658e-06, + "loss": 0.1952, + "step": 19642 + }, + { + "epoch": 53.52316076294278, + "grad_norm": 4.244633674621582, + "learning_rate": 9.345216525994415e-06, + "loss": 0.101, + "step": 19643 + }, + { + "epoch": 53.525885558583106, + "grad_norm": 4.580294132232666, + "learning_rate": 9.344335927751606e-06, + "loss": 0.2573, + "step": 19644 + }, + { + "epoch": 53.52861035422343, + "grad_norm": 4.44301176071167, + "learning_rate": 9.343455334615085e-06, + "loss": 0.2257, + "step": 19645 + }, + { + "epoch": 53.53133514986376, + "grad_norm": 4.0705671310424805, + "learning_rate": 9.342574746591718e-06, + "loss": 0.0916, + "step": 19646 + }, + { + "epoch": 53.53405994550409, + "grad_norm": 3.968733310699463, + "learning_rate": 9.341694163688352e-06, + "loss": 0.1892, + "step": 19647 + }, + { + "epoch": 53.536784741144416, + "grad_norm": 3.490436553955078, + "learning_rate": 9.340813585911854e-06, + "loss": 0.206, + "step": 19648 + }, + { + "epoch": 53.53950953678474, + "grad_norm": 4.871994972229004, + "learning_rate": 9.339933013269076e-06, + "loss": 0.1334, + "step": 19649 + }, + { + "epoch": 53.54223433242507, + "grad_norm": 3.9973957538604736, + "learning_rate": 9.339052445766883e-06, + "loss": 0.1299, + "step": 19650 + }, + { + "epoch": 53.54495912806539, + "grad_norm": 5.820115089416504, + "learning_rate": 9.338171883412123e-06, + "loss": 0.0772, + "step": 19651 + }, + { + "epoch": 53.54768392370572, + "grad_norm": 5.841065883636475, + "learning_rate": 9.337291326211663e-06, + "loss": 0.1235, + "step": 19652 + }, + { + "epoch": 53.55040871934605, + "grad_norm": 4.874732494354248, + "learning_rate": 9.336410774172356e-06, + "loss": 0.094, + "step": 19653 + }, + { + "epoch": 53.55313351498638, + "grad_norm": 4.347428321838379, + "learning_rate": 9.33553022730106e-06, + "loss": 0.0655, + "step": 19654 + }, + { + "epoch": 53.555858310626704, + "grad_norm": 3.9326961040496826, + "learning_rate": 9.334649685604632e-06, + "loss": 0.2916, + "step": 19655 + }, + { + "epoch": 53.55858310626703, + "grad_norm": 3.449640989303589, + "learning_rate": 9.333769149089934e-06, + "loss": 0.0591, + "step": 19656 + }, + { + "epoch": 53.561307901907355, + "grad_norm": 8.750727653503418, + "learning_rate": 9.332888617763816e-06, + "loss": 0.1439, + "step": 19657 + }, + { + "epoch": 53.56403269754768, + "grad_norm": 3.458325147628784, + "learning_rate": 9.33200809163314e-06, + "loss": 0.1673, + "step": 19658 + }, + { + "epoch": 53.566757493188014, + "grad_norm": 4.965142250061035, + "learning_rate": 9.331127570704765e-06, + "loss": 0.121, + "step": 19659 + }, + { + "epoch": 53.56948228882834, + "grad_norm": 3.2240495681762695, + "learning_rate": 9.330247054985548e-06, + "loss": 0.0541, + "step": 19660 + }, + { + "epoch": 53.572207084468666, + "grad_norm": 5.976936340332031, + "learning_rate": 9.329366544482346e-06, + "loss": 0.1824, + "step": 19661 + }, + { + "epoch": 53.57493188010899, + "grad_norm": 5.07879114151001, + "learning_rate": 9.328486039202015e-06, + "loss": 0.1499, + "step": 19662 + }, + { + "epoch": 53.57765667574932, + "grad_norm": 4.073906421661377, + "learning_rate": 9.327605539151412e-06, + "loss": 0.1132, + "step": 19663 + }, + { + "epoch": 53.58038147138964, + "grad_norm": 5.997085094451904, + "learning_rate": 9.326725044337398e-06, + "loss": 0.1735, + "step": 19664 + }, + { + "epoch": 53.583106267029976, + "grad_norm": 4.1504011154174805, + "learning_rate": 9.325844554766826e-06, + "loss": 0.0876, + "step": 19665 + }, + { + "epoch": 53.5858310626703, + "grad_norm": 4.301466941833496, + "learning_rate": 9.324964070446556e-06, + "loss": 0.1104, + "step": 19666 + }, + { + "epoch": 53.58855585831063, + "grad_norm": 3.404266595840454, + "learning_rate": 9.324083591383441e-06, + "loss": 0.1102, + "step": 19667 + }, + { + "epoch": 53.59128065395095, + "grad_norm": 4.574977874755859, + "learning_rate": 9.323203117584345e-06, + "loss": 0.1417, + "step": 19668 + }, + { + "epoch": 53.59400544959128, + "grad_norm": 5.017419815063477, + "learning_rate": 9.322322649056118e-06, + "loss": 0.0789, + "step": 19669 + }, + { + "epoch": 53.596730245231605, + "grad_norm": 3.7074153423309326, + "learning_rate": 9.321442185805625e-06, + "loss": 0.1018, + "step": 19670 + }, + { + "epoch": 53.59945504087194, + "grad_norm": 3.648831605911255, + "learning_rate": 9.320561727839715e-06, + "loss": 0.0912, + "step": 19671 + }, + { + "epoch": 53.60217983651226, + "grad_norm": 3.8857266902923584, + "learning_rate": 9.31968127516525e-06, + "loss": 0.1843, + "step": 19672 + }, + { + "epoch": 53.60490463215259, + "grad_norm": 4.4822678565979, + "learning_rate": 9.318800827789082e-06, + "loss": 0.138, + "step": 19673 + }, + { + "epoch": 53.607629427792915, + "grad_norm": 7.120094299316406, + "learning_rate": 9.317920385718075e-06, + "loss": 0.1012, + "step": 19674 + }, + { + "epoch": 53.61035422343324, + "grad_norm": 4.695366859436035, + "learning_rate": 9.317039948959077e-06, + "loss": 0.2115, + "step": 19675 + }, + { + "epoch": 53.61307901907357, + "grad_norm": 5.063755989074707, + "learning_rate": 9.316159517518952e-06, + "loss": 0.1157, + "step": 19676 + }, + { + "epoch": 53.6158038147139, + "grad_norm": 3.6411147117614746, + "learning_rate": 9.315279091404558e-06, + "loss": 0.118, + "step": 19677 + }, + { + "epoch": 53.618528610354225, + "grad_norm": 3.6441879272460938, + "learning_rate": 9.314398670622745e-06, + "loss": 0.1094, + "step": 19678 + }, + { + "epoch": 53.62125340599455, + "grad_norm": 3.994708299636841, + "learning_rate": 9.313518255180375e-06, + "loss": 0.118, + "step": 19679 + }, + { + "epoch": 53.62397820163488, + "grad_norm": 4.216256618499756, + "learning_rate": 9.312637845084303e-06, + "loss": 0.3642, + "step": 19680 + }, + { + "epoch": 53.6267029972752, + "grad_norm": 14.634512901306152, + "learning_rate": 9.311757440341384e-06, + "loss": 0.0635, + "step": 19681 + }, + { + "epoch": 53.62942779291553, + "grad_norm": 5.584765911102295, + "learning_rate": 9.310877040958478e-06, + "loss": 0.2964, + "step": 19682 + }, + { + "epoch": 53.63215258855586, + "grad_norm": 4.533825397491455, + "learning_rate": 9.309996646942437e-06, + "loss": 0.1632, + "step": 19683 + }, + { + "epoch": 53.63487738419619, + "grad_norm": 3.7038753032684326, + "learning_rate": 9.309116258300121e-06, + "loss": 0.1072, + "step": 19684 + }, + { + "epoch": 53.63760217983651, + "grad_norm": 4.378421783447266, + "learning_rate": 9.308235875038385e-06, + "loss": 0.0795, + "step": 19685 + }, + { + "epoch": 53.64032697547684, + "grad_norm": 4.553260326385498, + "learning_rate": 9.307355497164086e-06, + "loss": 0.1498, + "step": 19686 + }, + { + "epoch": 53.643051771117165, + "grad_norm": 4.38962984085083, + "learning_rate": 9.30647512468408e-06, + "loss": 0.0908, + "step": 19687 + }, + { + "epoch": 53.64577656675749, + "grad_norm": 4.790590763092041, + "learning_rate": 9.305594757605226e-06, + "loss": 0.1962, + "step": 19688 + }, + { + "epoch": 53.64850136239782, + "grad_norm": 3.918919801712036, + "learning_rate": 9.304714395934373e-06, + "loss": 0.1113, + "step": 19689 + }, + { + "epoch": 53.65122615803815, + "grad_norm": 4.994433879852295, + "learning_rate": 9.303834039678386e-06, + "loss": 0.1298, + "step": 19690 + }, + { + "epoch": 53.653950953678475, + "grad_norm": 13.808565139770508, + "learning_rate": 9.302953688844113e-06, + "loss": 0.139, + "step": 19691 + }, + { + "epoch": 53.6566757493188, + "grad_norm": 3.9738388061523438, + "learning_rate": 9.302073343438414e-06, + "loss": 0.0788, + "step": 19692 + }, + { + "epoch": 53.65940054495913, + "grad_norm": 3.889005184173584, + "learning_rate": 9.301193003468148e-06, + "loss": 0.2035, + "step": 19693 + }, + { + "epoch": 53.66212534059945, + "grad_norm": 4.200675010681152, + "learning_rate": 9.300312668940168e-06, + "loss": 0.1692, + "step": 19694 + }, + { + "epoch": 53.664850136239785, + "grad_norm": 7.192455768585205, + "learning_rate": 9.299432339861332e-06, + "loss": 0.0972, + "step": 19695 + }, + { + "epoch": 53.66757493188011, + "grad_norm": 3.8765366077423096, + "learning_rate": 9.298552016238492e-06, + "loss": 0.1349, + "step": 19696 + }, + { + "epoch": 53.67029972752044, + "grad_norm": 3.9085135459899902, + "learning_rate": 9.297671698078508e-06, + "loss": 0.1553, + "step": 19697 + }, + { + "epoch": 53.67302452316076, + "grad_norm": 5.163697719573975, + "learning_rate": 9.296791385388233e-06, + "loss": 0.11, + "step": 19698 + }, + { + "epoch": 53.67574931880109, + "grad_norm": 5.267614364624023, + "learning_rate": 9.295911078174526e-06, + "loss": 0.0688, + "step": 19699 + }, + { + "epoch": 53.678474114441414, + "grad_norm": 3.7285704612731934, + "learning_rate": 9.295030776444239e-06, + "loss": 0.0697, + "step": 19700 + }, + { + "epoch": 53.68119891008175, + "grad_norm": 3.6111433506011963, + "learning_rate": 9.29415048020423e-06, + "loss": 0.0731, + "step": 19701 + }, + { + "epoch": 53.68392370572207, + "grad_norm": 4.5582194328308105, + "learning_rate": 9.293270189461354e-06, + "loss": 0.1186, + "step": 19702 + }, + { + "epoch": 53.6866485013624, + "grad_norm": 3.8478405475616455, + "learning_rate": 9.292389904222468e-06, + "loss": 0.1078, + "step": 19703 + }, + { + "epoch": 53.689373297002724, + "grad_norm": 3.536839246749878, + "learning_rate": 9.291509624494426e-06, + "loss": 0.1933, + "step": 19704 + }, + { + "epoch": 53.69209809264305, + "grad_norm": 5.006591796875, + "learning_rate": 9.290629350284083e-06, + "loss": 0.2957, + "step": 19705 + }, + { + "epoch": 53.694822888283376, + "grad_norm": 5.5485358238220215, + "learning_rate": 9.289749081598298e-06, + "loss": 0.1277, + "step": 19706 + }, + { + "epoch": 53.69754768392371, + "grad_norm": 5.355322360992432, + "learning_rate": 9.288868818443923e-06, + "loss": 0.099, + "step": 19707 + }, + { + "epoch": 53.700272479564035, + "grad_norm": 3.967392683029175, + "learning_rate": 9.287988560827814e-06, + "loss": 0.0798, + "step": 19708 + }, + { + "epoch": 53.70299727520436, + "grad_norm": 4.786160469055176, + "learning_rate": 9.28710830875683e-06, + "loss": 0.0903, + "step": 19709 + }, + { + "epoch": 53.705722070844686, + "grad_norm": 4.865747451782227, + "learning_rate": 9.286228062237817e-06, + "loss": 0.2441, + "step": 19710 + }, + { + "epoch": 53.70844686648501, + "grad_norm": 7.860928535461426, + "learning_rate": 9.285347821277644e-06, + "loss": 0.2467, + "step": 19711 + }, + { + "epoch": 53.71117166212534, + "grad_norm": 3.6451687812805176, + "learning_rate": 9.284467585883156e-06, + "loss": 0.1245, + "step": 19712 + }, + { + "epoch": 53.71389645776567, + "grad_norm": 3.020920753479004, + "learning_rate": 9.283587356061214e-06, + "loss": 0.0737, + "step": 19713 + }, + { + "epoch": 53.716621253406, + "grad_norm": 4.057181358337402, + "learning_rate": 9.282707131818666e-06, + "loss": 0.1006, + "step": 19714 + }, + { + "epoch": 53.71934604904632, + "grad_norm": 5.180568218231201, + "learning_rate": 9.281826913162377e-06, + "loss": 0.11, + "step": 19715 + }, + { + "epoch": 53.72207084468665, + "grad_norm": 3.8155879974365234, + "learning_rate": 9.280946700099194e-06, + "loss": 0.1056, + "step": 19716 + }, + { + "epoch": 53.724795640326974, + "grad_norm": 3.676067352294922, + "learning_rate": 9.280066492635976e-06, + "loss": 0.0866, + "step": 19717 + }, + { + "epoch": 53.7275204359673, + "grad_norm": 6.118213653564453, + "learning_rate": 9.279186290779576e-06, + "loss": 0.095, + "step": 19718 + }, + { + "epoch": 53.73024523160763, + "grad_norm": 3.4128832817077637, + "learning_rate": 9.278306094536851e-06, + "loss": 0.0771, + "step": 19719 + }, + { + "epoch": 53.73297002724796, + "grad_norm": 4.553577423095703, + "learning_rate": 9.277425903914654e-06, + "loss": 0.0841, + "step": 19720 + }, + { + "epoch": 53.735694822888284, + "grad_norm": 6.063533782958984, + "learning_rate": 9.276545718919842e-06, + "loss": 0.1039, + "step": 19721 + }, + { + "epoch": 53.73841961852861, + "grad_norm": 4.499881267547607, + "learning_rate": 9.275665539559268e-06, + "loss": 0.1192, + "step": 19722 + }, + { + "epoch": 53.741144414168936, + "grad_norm": 5.290197372436523, + "learning_rate": 9.274785365839788e-06, + "loss": 0.0744, + "step": 19723 + }, + { + "epoch": 53.74386920980926, + "grad_norm": 4.888653755187988, + "learning_rate": 9.273905197768254e-06, + "loss": 0.165, + "step": 19724 + }, + { + "epoch": 53.746594005449595, + "grad_norm": 4.740888595581055, + "learning_rate": 9.273025035351526e-06, + "loss": 0.1876, + "step": 19725 + }, + { + "epoch": 53.74931880108992, + "grad_norm": 4.391806602478027, + "learning_rate": 9.272144878596454e-06, + "loss": 0.1214, + "step": 19726 + }, + { + "epoch": 53.752043596730246, + "grad_norm": 4.5872979164123535, + "learning_rate": 9.27126472750989e-06, + "loss": 0.1286, + "step": 19727 + }, + { + "epoch": 53.75476839237057, + "grad_norm": 4.158890724182129, + "learning_rate": 9.270384582098697e-06, + "loss": 0.0627, + "step": 19728 + }, + { + "epoch": 53.7574931880109, + "grad_norm": 3.866898775100708, + "learning_rate": 9.269504442369727e-06, + "loss": 0.1161, + "step": 19729 + }, + { + "epoch": 53.76021798365122, + "grad_norm": 4.930418491363525, + "learning_rate": 9.26862430832983e-06, + "loss": 0.1342, + "step": 19730 + }, + { + "epoch": 53.762942779291556, + "grad_norm": 8.506067276000977, + "learning_rate": 9.267744179985866e-06, + "loss": 0.1787, + "step": 19731 + }, + { + "epoch": 53.76566757493188, + "grad_norm": 5.147566318511963, + "learning_rate": 9.266864057344684e-06, + "loss": 0.0604, + "step": 19732 + }, + { + "epoch": 53.76839237057221, + "grad_norm": 9.657304763793945, + "learning_rate": 9.265983940413145e-06, + "loss": 0.1791, + "step": 19733 + }, + { + "epoch": 53.771117166212534, + "grad_norm": 4.672646999359131, + "learning_rate": 9.265103829198096e-06, + "loss": 0.1003, + "step": 19734 + }, + { + "epoch": 53.77384196185286, + "grad_norm": 4.547515392303467, + "learning_rate": 9.264223723706397e-06, + "loss": 0.0902, + "step": 19735 + }, + { + "epoch": 53.776566757493185, + "grad_norm": 2.914116382598877, + "learning_rate": 9.263343623944899e-06, + "loss": 0.0588, + "step": 19736 + }, + { + "epoch": 53.77929155313352, + "grad_norm": 4.2892961502075195, + "learning_rate": 9.262463529920458e-06, + "loss": 0.166, + "step": 19737 + }, + { + "epoch": 53.782016348773844, + "grad_norm": 3.9462146759033203, + "learning_rate": 9.261583441639926e-06, + "loss": 0.1907, + "step": 19738 + }, + { + "epoch": 53.78474114441417, + "grad_norm": 4.957346439361572, + "learning_rate": 9.26070335911016e-06, + "loss": 0.1905, + "step": 19739 + }, + { + "epoch": 53.787465940054496, + "grad_norm": 3.814995288848877, + "learning_rate": 9.259823282338008e-06, + "loss": 0.1315, + "step": 19740 + }, + { + "epoch": 53.79019073569482, + "grad_norm": 3.8015565872192383, + "learning_rate": 9.258943211330334e-06, + "loss": 0.0887, + "step": 19741 + }, + { + "epoch": 53.79291553133515, + "grad_norm": 3.8807504177093506, + "learning_rate": 9.258063146093984e-06, + "loss": 0.2631, + "step": 19742 + }, + { + "epoch": 53.79564032697548, + "grad_norm": 5.895612716674805, + "learning_rate": 9.257183086635814e-06, + "loss": 0.2002, + "step": 19743 + }, + { + "epoch": 53.798365122615806, + "grad_norm": 5.0606369972229, + "learning_rate": 9.256303032962676e-06, + "loss": 0.2234, + "step": 19744 + }, + { + "epoch": 53.80108991825613, + "grad_norm": 5.166808128356934, + "learning_rate": 9.255422985081426e-06, + "loss": 0.138, + "step": 19745 + }, + { + "epoch": 53.80381471389646, + "grad_norm": 5.078512191772461, + "learning_rate": 9.254542942998921e-06, + "loss": 0.1813, + "step": 19746 + }, + { + "epoch": 53.80653950953678, + "grad_norm": 4.038086891174316, + "learning_rate": 9.253662906722013e-06, + "loss": 0.1659, + "step": 19747 + }, + { + "epoch": 53.80926430517711, + "grad_norm": 5.574167251586914, + "learning_rate": 9.25278287625755e-06, + "loss": 0.1189, + "step": 19748 + }, + { + "epoch": 53.81198910081744, + "grad_norm": 4.144851207733154, + "learning_rate": 9.251902851612394e-06, + "loss": 0.1833, + "step": 19749 + }, + { + "epoch": 53.81471389645777, + "grad_norm": 5.024191379547119, + "learning_rate": 9.251022832793392e-06, + "loss": 0.1893, + "step": 19750 + }, + { + "epoch": 53.817438692098094, + "grad_norm": 3.9611613750457764, + "learning_rate": 9.250142819807402e-06, + "loss": 0.1355, + "step": 19751 + }, + { + "epoch": 53.82016348773842, + "grad_norm": 3.462373733520508, + "learning_rate": 9.249262812661273e-06, + "loss": 0.2155, + "step": 19752 + }, + { + "epoch": 53.822888283378745, + "grad_norm": 7.335973739624023, + "learning_rate": 9.248382811361864e-06, + "loss": 0.1384, + "step": 19753 + }, + { + "epoch": 53.82561307901907, + "grad_norm": 6.353860855102539, + "learning_rate": 9.247502815916023e-06, + "loss": 0.1822, + "step": 19754 + }, + { + "epoch": 53.828337874659404, + "grad_norm": 8.818236351013184, + "learning_rate": 9.246622826330607e-06, + "loss": 0.079, + "step": 19755 + }, + { + "epoch": 53.83106267029973, + "grad_norm": 4.357721328735352, + "learning_rate": 9.245742842612467e-06, + "loss": 0.1023, + "step": 19756 + }, + { + "epoch": 53.833787465940055, + "grad_norm": 4.350984573364258, + "learning_rate": 9.24486286476846e-06, + "loss": 0.1995, + "step": 19757 + }, + { + "epoch": 53.83651226158038, + "grad_norm": 5.060369968414307, + "learning_rate": 9.243982892805434e-06, + "loss": 0.197, + "step": 19758 + }, + { + "epoch": 53.83923705722071, + "grad_norm": 4.583494186401367, + "learning_rate": 9.243102926730247e-06, + "loss": 0.0623, + "step": 19759 + }, + { + "epoch": 53.84196185286103, + "grad_norm": 5.591639518737793, + "learning_rate": 9.242222966549748e-06, + "loss": 0.1246, + "step": 19760 + }, + { + "epoch": 53.844686648501366, + "grad_norm": 6.224551200866699, + "learning_rate": 9.24134301227079e-06, + "loss": 0.1306, + "step": 19761 + }, + { + "epoch": 53.84741144414169, + "grad_norm": 4.460511207580566, + "learning_rate": 9.240463063900233e-06, + "loss": 0.1049, + "step": 19762 + }, + { + "epoch": 53.85013623978202, + "grad_norm": 4.57638692855835, + "learning_rate": 9.239583121444923e-06, + "loss": 0.0678, + "step": 19763 + }, + { + "epoch": 53.85286103542234, + "grad_norm": 3.6189639568328857, + "learning_rate": 9.238703184911717e-06, + "loss": 0.1865, + "step": 19764 + }, + { + "epoch": 53.85558583106267, + "grad_norm": 5.947134971618652, + "learning_rate": 9.237823254307464e-06, + "loss": 0.104, + "step": 19765 + }, + { + "epoch": 53.858310626702995, + "grad_norm": 23.398439407348633, + "learning_rate": 9.236943329639022e-06, + "loss": 0.2495, + "step": 19766 + }, + { + "epoch": 53.86103542234333, + "grad_norm": 4.084773063659668, + "learning_rate": 9.236063410913237e-06, + "loss": 0.1149, + "step": 19767 + }, + { + "epoch": 53.86376021798365, + "grad_norm": 10.065081596374512, + "learning_rate": 9.235183498136965e-06, + "loss": 0.134, + "step": 19768 + }, + { + "epoch": 53.86648501362398, + "grad_norm": 3.6826155185699463, + "learning_rate": 9.234303591317064e-06, + "loss": 0.0661, + "step": 19769 + }, + { + "epoch": 53.869209809264305, + "grad_norm": 8.887621879577637, + "learning_rate": 9.233423690460377e-06, + "loss": 0.1275, + "step": 19770 + }, + { + "epoch": 53.87193460490463, + "grad_norm": 4.916548252105713, + "learning_rate": 9.232543795573766e-06, + "loss": 0.0894, + "step": 19771 + }, + { + "epoch": 53.87465940054496, + "grad_norm": 4.731387138366699, + "learning_rate": 9.231663906664077e-06, + "loss": 0.1106, + "step": 19772 + }, + { + "epoch": 53.87738419618529, + "grad_norm": 4.941989421844482, + "learning_rate": 9.230784023738165e-06, + "loss": 0.2027, + "step": 19773 + }, + { + "epoch": 53.880108991825615, + "grad_norm": 7.426902770996094, + "learning_rate": 9.229904146802882e-06, + "loss": 0.1344, + "step": 19774 + }, + { + "epoch": 53.88283378746594, + "grad_norm": 4.1482253074646, + "learning_rate": 9.229024275865083e-06, + "loss": 0.126, + "step": 19775 + }, + { + "epoch": 53.88555858310627, + "grad_norm": 6.658325672149658, + "learning_rate": 9.228144410931615e-06, + "loss": 0.2323, + "step": 19776 + }, + { + "epoch": 53.88828337874659, + "grad_norm": 4.1880269050598145, + "learning_rate": 9.227264552009336e-06, + "loss": 0.2457, + "step": 19777 + }, + { + "epoch": 53.89100817438692, + "grad_norm": 4.866042613983154, + "learning_rate": 9.226384699105094e-06, + "loss": 0.0798, + "step": 19778 + }, + { + "epoch": 53.89373297002725, + "grad_norm": 5.16387414932251, + "learning_rate": 9.22550485222574e-06, + "loss": 0.1007, + "step": 19779 + }, + { + "epoch": 53.89645776566758, + "grad_norm": 4.820022106170654, + "learning_rate": 9.224625011378134e-06, + "loss": 0.1, + "step": 19780 + }, + { + "epoch": 53.8991825613079, + "grad_norm": 4.451500415802002, + "learning_rate": 9.223745176569121e-06, + "loss": 0.0887, + "step": 19781 + }, + { + "epoch": 53.90190735694823, + "grad_norm": 5.097253799438477, + "learning_rate": 9.222865347805559e-06, + "loss": 0.1678, + "step": 19782 + }, + { + "epoch": 53.904632152588555, + "grad_norm": 5.498987197875977, + "learning_rate": 9.221985525094292e-06, + "loss": 0.0875, + "step": 19783 + }, + { + "epoch": 53.90735694822888, + "grad_norm": 4.22909688949585, + "learning_rate": 9.221105708442181e-06, + "loss": 0.1011, + "step": 19784 + }, + { + "epoch": 53.91008174386921, + "grad_norm": 3.702805280685425, + "learning_rate": 9.220225897856071e-06, + "loss": 0.0752, + "step": 19785 + }, + { + "epoch": 53.91280653950954, + "grad_norm": 5.755627632141113, + "learning_rate": 9.21934609334282e-06, + "loss": 0.1776, + "step": 19786 + }, + { + "epoch": 53.915531335149865, + "grad_norm": 6.495734214782715, + "learning_rate": 9.218466294909271e-06, + "loss": 0.1526, + "step": 19787 + }, + { + "epoch": 53.91825613079019, + "grad_norm": 4.754812717437744, + "learning_rate": 9.217586502562288e-06, + "loss": 0.1241, + "step": 19788 + }, + { + "epoch": 53.920980926430516, + "grad_norm": 5.09205436706543, + "learning_rate": 9.21670671630871e-06, + "loss": 0.1111, + "step": 19789 + }, + { + "epoch": 53.92370572207084, + "grad_norm": 3.6057493686676025, + "learning_rate": 9.215826936155396e-06, + "loss": 0.1001, + "step": 19790 + }, + { + "epoch": 53.926430517711175, + "grad_norm": 5.297196865081787, + "learning_rate": 9.2149471621092e-06, + "loss": 0.1512, + "step": 19791 + }, + { + "epoch": 53.9291553133515, + "grad_norm": 4.140446662902832, + "learning_rate": 9.214067394176967e-06, + "loss": 0.234, + "step": 19792 + }, + { + "epoch": 53.93188010899183, + "grad_norm": 3.711136817932129, + "learning_rate": 9.213187632365555e-06, + "loss": 0.1779, + "step": 19793 + }, + { + "epoch": 53.93460490463215, + "grad_norm": 3.979206085205078, + "learning_rate": 9.212307876681808e-06, + "loss": 0.1441, + "step": 19794 + }, + { + "epoch": 53.93732970027248, + "grad_norm": 4.640681743621826, + "learning_rate": 9.211428127132587e-06, + "loss": 0.0766, + "step": 19795 + }, + { + "epoch": 53.940054495912804, + "grad_norm": 5.542065620422363, + "learning_rate": 9.210548383724732e-06, + "loss": 0.0915, + "step": 19796 + }, + { + "epoch": 53.94277929155314, + "grad_norm": 3.4548604488372803, + "learning_rate": 9.209668646465103e-06, + "loss": 0.1297, + "step": 19797 + }, + { + "epoch": 53.94550408719346, + "grad_norm": 6.724388599395752, + "learning_rate": 9.208788915360552e-06, + "loss": 0.1034, + "step": 19798 + }, + { + "epoch": 53.94822888283379, + "grad_norm": 4.6330718994140625, + "learning_rate": 9.207909190417924e-06, + "loss": 0.2641, + "step": 19799 + }, + { + "epoch": 53.950953678474114, + "grad_norm": 4.715029716491699, + "learning_rate": 9.207029471644077e-06, + "loss": 0.298, + "step": 19800 + }, + { + "epoch": 53.95367847411444, + "grad_norm": 5.032526016235352, + "learning_rate": 9.206149759045859e-06, + "loss": 0.0849, + "step": 19801 + }, + { + "epoch": 53.956403269754766, + "grad_norm": 5.344160556793213, + "learning_rate": 9.20527005263012e-06, + "loss": 0.1629, + "step": 19802 + }, + { + "epoch": 53.95912806539509, + "grad_norm": 4.603373050689697, + "learning_rate": 9.204390352403711e-06, + "loss": 0.1553, + "step": 19803 + }, + { + "epoch": 53.961852861035425, + "grad_norm": 6.133690357208252, + "learning_rate": 9.203510658373487e-06, + "loss": 0.1337, + "step": 19804 + }, + { + "epoch": 53.96457765667575, + "grad_norm": 5.43211030960083, + "learning_rate": 9.202630970546293e-06, + "loss": 0.0983, + "step": 19805 + }, + { + "epoch": 53.967302452316076, + "grad_norm": 4.266453742980957, + "learning_rate": 9.201751288928988e-06, + "loss": 0.0805, + "step": 19806 + }, + { + "epoch": 53.9700272479564, + "grad_norm": 4.697748184204102, + "learning_rate": 9.200871613528414e-06, + "loss": 0.166, + "step": 19807 + }, + { + "epoch": 53.97275204359673, + "grad_norm": 4.268434047698975, + "learning_rate": 9.19999194435143e-06, + "loss": 0.0804, + "step": 19808 + }, + { + "epoch": 53.97547683923706, + "grad_norm": 3.7529213428497314, + "learning_rate": 9.199112281404878e-06, + "loss": 0.1446, + "step": 19809 + }, + { + "epoch": 53.97820163487739, + "grad_norm": 4.701591968536377, + "learning_rate": 9.198232624695618e-06, + "loss": 0.1803, + "step": 19810 + }, + { + "epoch": 53.98092643051771, + "grad_norm": 5.256634712219238, + "learning_rate": 9.197352974230494e-06, + "loss": 0.2383, + "step": 19811 + }, + { + "epoch": 53.98365122615804, + "grad_norm": 5.565563201904297, + "learning_rate": 9.196473330016361e-06, + "loss": 0.1864, + "step": 19812 + }, + { + "epoch": 53.986376021798364, + "grad_norm": 3.8778679370880127, + "learning_rate": 9.195593692060062e-06, + "loss": 0.1776, + "step": 19813 + }, + { + "epoch": 53.98910081743869, + "grad_norm": 4.592710494995117, + "learning_rate": 9.194714060368458e-06, + "loss": 0.1211, + "step": 19814 + }, + { + "epoch": 53.991825613079016, + "grad_norm": 3.748595714569092, + "learning_rate": 9.193834434948396e-06, + "loss": 0.1427, + "step": 19815 + }, + { + "epoch": 53.99455040871935, + "grad_norm": 5.07763147354126, + "learning_rate": 9.192954815806724e-06, + "loss": 0.0761, + "step": 19816 + }, + { + "epoch": 53.997275204359674, + "grad_norm": 4.350992679595947, + "learning_rate": 9.192075202950297e-06, + "loss": 0.0734, + "step": 19817 + }, + { + "epoch": 54.0, + "grad_norm": 4.1938629150390625, + "learning_rate": 9.19119559638596e-06, + "loss": 0.1311, + "step": 19818 + }, + { + "epoch": 54.002724795640326, + "grad_norm": 4.72659158706665, + "learning_rate": 9.190315996120565e-06, + "loss": 0.2525, + "step": 19819 + }, + { + "epoch": 54.00544959128065, + "grad_norm": 4.600130558013916, + "learning_rate": 9.189436402160964e-06, + "loss": 0.1599, + "step": 19820 + }, + { + "epoch": 54.00817438692098, + "grad_norm": 8.822296142578125, + "learning_rate": 9.188556814514004e-06, + "loss": 0.0787, + "step": 19821 + }, + { + "epoch": 54.01089918256131, + "grad_norm": 4.7953948974609375, + "learning_rate": 9.187677233186541e-06, + "loss": 0.0769, + "step": 19822 + }, + { + "epoch": 54.013623978201636, + "grad_norm": 8.404830932617188, + "learning_rate": 9.18679765818542e-06, + "loss": 0.1116, + "step": 19823 + }, + { + "epoch": 54.01634877384196, + "grad_norm": 4.598225116729736, + "learning_rate": 9.185918089517493e-06, + "loss": 0.1221, + "step": 19824 + }, + { + "epoch": 54.01907356948229, + "grad_norm": 5.0692925453186035, + "learning_rate": 9.18503852718961e-06, + "loss": 0.0839, + "step": 19825 + }, + { + "epoch": 54.02179836512261, + "grad_norm": 3.9961633682250977, + "learning_rate": 9.18415897120862e-06, + "loss": 0.0659, + "step": 19826 + }, + { + "epoch": 54.02452316076294, + "grad_norm": 5.0505523681640625, + "learning_rate": 9.183279421581373e-06, + "loss": 0.1316, + "step": 19827 + }, + { + "epoch": 54.02724795640327, + "grad_norm": 4.773257255554199, + "learning_rate": 9.18239987831472e-06, + "loss": 0.0747, + "step": 19828 + }, + { + "epoch": 54.0299727520436, + "grad_norm": 3.473534107208252, + "learning_rate": 9.181520341415511e-06, + "loss": 0.1516, + "step": 19829 + }, + { + "epoch": 54.032697547683924, + "grad_norm": 4.486723899841309, + "learning_rate": 9.180640810890591e-06, + "loss": 0.1769, + "step": 19830 + }, + { + "epoch": 54.03542234332425, + "grad_norm": 4.74202823638916, + "learning_rate": 9.17976128674682e-06, + "loss": 0.2705, + "step": 19831 + }, + { + "epoch": 54.038147138964575, + "grad_norm": 3.2471649646759033, + "learning_rate": 9.178881768991037e-06, + "loss": 0.0736, + "step": 19832 + }, + { + "epoch": 54.0408719346049, + "grad_norm": 4.45520544052124, + "learning_rate": 9.178002257630099e-06, + "loss": 0.1435, + "step": 19833 + }, + { + "epoch": 54.043596730245234, + "grad_norm": 4.415715217590332, + "learning_rate": 9.177122752670854e-06, + "loss": 0.0706, + "step": 19834 + }, + { + "epoch": 54.04632152588556, + "grad_norm": 2.955765724182129, + "learning_rate": 9.176243254120148e-06, + "loss": 0.1999, + "step": 19835 + }, + { + "epoch": 54.049046321525886, + "grad_norm": 3.835383653640747, + "learning_rate": 9.175363761984836e-06, + "loss": 0.0649, + "step": 19836 + }, + { + "epoch": 54.05177111716621, + "grad_norm": 3.48504638671875, + "learning_rate": 9.174484276271762e-06, + "loss": 0.0753, + "step": 19837 + }, + { + "epoch": 54.05449591280654, + "grad_norm": 3.7399494647979736, + "learning_rate": 9.17360479698778e-06, + "loss": 0.1064, + "step": 19838 + }, + { + "epoch": 54.05722070844686, + "grad_norm": 6.686160564422607, + "learning_rate": 9.172725324139735e-06, + "loss": 0.2414, + "step": 19839 + }, + { + "epoch": 54.059945504087196, + "grad_norm": 3.8733770847320557, + "learning_rate": 9.17184585773448e-06, + "loss": 0.2015, + "step": 19840 + }, + { + "epoch": 54.06267029972752, + "grad_norm": 3.7958931922912598, + "learning_rate": 9.170966397778862e-06, + "loss": 0.0806, + "step": 19841 + }, + { + "epoch": 54.06539509536785, + "grad_norm": 3.566927433013916, + "learning_rate": 9.170086944279733e-06, + "loss": 0.0867, + "step": 19842 + }, + { + "epoch": 54.06811989100817, + "grad_norm": 4.660705089569092, + "learning_rate": 9.169207497243939e-06, + "loss": 0.1188, + "step": 19843 + }, + { + "epoch": 54.0708446866485, + "grad_norm": 4.133790493011475, + "learning_rate": 9.16832805667833e-06, + "loss": 0.1706, + "step": 19844 + }, + { + "epoch": 54.073569482288825, + "grad_norm": 3.4390602111816406, + "learning_rate": 9.167448622589754e-06, + "loss": 0.0875, + "step": 19845 + }, + { + "epoch": 54.07629427792916, + "grad_norm": 5.287810325622559, + "learning_rate": 9.166569194985065e-06, + "loss": 0.0862, + "step": 19846 + }, + { + "epoch": 54.079019073569484, + "grad_norm": 4.312926769256592, + "learning_rate": 9.1656897738711e-06, + "loss": 0.1721, + "step": 19847 + }, + { + "epoch": 54.08174386920981, + "grad_norm": 9.076287269592285, + "learning_rate": 9.164810359254721e-06, + "loss": 0.1, + "step": 19848 + }, + { + "epoch": 54.084468664850135, + "grad_norm": 4.432627201080322, + "learning_rate": 9.163930951142777e-06, + "loss": 0.0796, + "step": 19849 + }, + { + "epoch": 54.08719346049046, + "grad_norm": 4.057800769805908, + "learning_rate": 9.163051549542106e-06, + "loss": 0.0967, + "step": 19850 + }, + { + "epoch": 54.08991825613079, + "grad_norm": 3.83794903755188, + "learning_rate": 9.162172154459565e-06, + "loss": 0.0676, + "step": 19851 + }, + { + "epoch": 54.09264305177112, + "grad_norm": 6.806939125061035, + "learning_rate": 9.161292765901998e-06, + "loss": 0.1545, + "step": 19852 + }, + { + "epoch": 54.095367847411445, + "grad_norm": 4.117062568664551, + "learning_rate": 9.16041338387626e-06, + "loss": 0.2045, + "step": 19853 + }, + { + "epoch": 54.09809264305177, + "grad_norm": 4.125771999359131, + "learning_rate": 9.159534008389193e-06, + "loss": 0.0902, + "step": 19854 + }, + { + "epoch": 54.1008174386921, + "grad_norm": 5.100405216217041, + "learning_rate": 9.158654639447647e-06, + "loss": 0.0767, + "step": 19855 + }, + { + "epoch": 54.10354223433242, + "grad_norm": 7.159243583679199, + "learning_rate": 9.157775277058474e-06, + "loss": 0.0882, + "step": 19856 + }, + { + "epoch": 54.10626702997275, + "grad_norm": 3.345010995864868, + "learning_rate": 9.156895921228519e-06, + "loss": 0.2141, + "step": 19857 + }, + { + "epoch": 54.10899182561308, + "grad_norm": 4.689110279083252, + "learning_rate": 9.156016571964633e-06, + "loss": 0.0822, + "step": 19858 + }, + { + "epoch": 54.11171662125341, + "grad_norm": 6.687030792236328, + "learning_rate": 9.155137229273658e-06, + "loss": 0.2441, + "step": 19859 + }, + { + "epoch": 54.11444141689373, + "grad_norm": 4.554111480712891, + "learning_rate": 9.154257893162452e-06, + "loss": 0.1471, + "step": 19860 + }, + { + "epoch": 54.11716621253406, + "grad_norm": 3.487919330596924, + "learning_rate": 9.153378563637855e-06, + "loss": 0.0966, + "step": 19861 + }, + { + "epoch": 54.119891008174385, + "grad_norm": 4.792840003967285, + "learning_rate": 9.152499240706723e-06, + "loss": 0.0964, + "step": 19862 + }, + { + "epoch": 54.12261580381471, + "grad_norm": 4.359868049621582, + "learning_rate": 9.151619924375896e-06, + "loss": 0.0888, + "step": 19863 + }, + { + "epoch": 54.12534059945504, + "grad_norm": 2.9529571533203125, + "learning_rate": 9.150740614652228e-06, + "loss": 0.0573, + "step": 19864 + }, + { + "epoch": 54.12806539509537, + "grad_norm": 4.3103179931640625, + "learning_rate": 9.149861311542559e-06, + "loss": 0.1637, + "step": 19865 + }, + { + "epoch": 54.130790190735695, + "grad_norm": 4.092645645141602, + "learning_rate": 9.148982015053746e-06, + "loss": 0.1923, + "step": 19866 + }, + { + "epoch": 54.13351498637602, + "grad_norm": 4.39013671875, + "learning_rate": 9.148102725192635e-06, + "loss": 0.1765, + "step": 19867 + }, + { + "epoch": 54.13623978201635, + "grad_norm": 4.031159400939941, + "learning_rate": 9.147223441966072e-06, + "loss": 0.0968, + "step": 19868 + }, + { + "epoch": 54.13896457765667, + "grad_norm": 3.996030569076538, + "learning_rate": 9.146344165380907e-06, + "loss": 0.0598, + "step": 19869 + }, + { + "epoch": 54.141689373297005, + "grad_norm": 5.097391128540039, + "learning_rate": 9.145464895443983e-06, + "loss": 0.0893, + "step": 19870 + }, + { + "epoch": 54.14441416893733, + "grad_norm": 4.223525047302246, + "learning_rate": 9.144585632162153e-06, + "loss": 0.0692, + "step": 19871 + }, + { + "epoch": 54.14713896457766, + "grad_norm": 5.750377655029297, + "learning_rate": 9.143706375542262e-06, + "loss": 0.2223, + "step": 19872 + }, + { + "epoch": 54.14986376021798, + "grad_norm": 5.008936882019043, + "learning_rate": 9.14282712559116e-06, + "loss": 0.1911, + "step": 19873 + }, + { + "epoch": 54.15258855585831, + "grad_norm": 5.459961414337158, + "learning_rate": 9.141947882315691e-06, + "loss": 0.1305, + "step": 19874 + }, + { + "epoch": 54.155313351498634, + "grad_norm": 3.7197933197021484, + "learning_rate": 9.141068645722705e-06, + "loss": 0.116, + "step": 19875 + }, + { + "epoch": 54.15803814713897, + "grad_norm": 4.223834991455078, + "learning_rate": 9.140189415819046e-06, + "loss": 0.1871, + "step": 19876 + }, + { + "epoch": 54.16076294277929, + "grad_norm": 4.812597751617432, + "learning_rate": 9.139310192611565e-06, + "loss": 0.1956, + "step": 19877 + }, + { + "epoch": 54.16348773841962, + "grad_norm": 4.515567302703857, + "learning_rate": 9.138430976107112e-06, + "loss": 0.0794, + "step": 19878 + }, + { + "epoch": 54.166212534059945, + "grad_norm": 5.7182512283325195, + "learning_rate": 9.137551766312528e-06, + "loss": 0.1091, + "step": 19879 + }, + { + "epoch": 54.16893732970027, + "grad_norm": 3.7585790157318115, + "learning_rate": 9.136672563234665e-06, + "loss": 0.1085, + "step": 19880 + }, + { + "epoch": 54.171662125340596, + "grad_norm": 3.8244426250457764, + "learning_rate": 9.135793366880365e-06, + "loss": 0.244, + "step": 19881 + }, + { + "epoch": 54.17438692098093, + "grad_norm": 5.750347137451172, + "learning_rate": 9.134914177256477e-06, + "loss": 0.0974, + "step": 19882 + }, + { + "epoch": 54.177111716621255, + "grad_norm": 4.220276832580566, + "learning_rate": 9.134034994369855e-06, + "loss": 0.1403, + "step": 19883 + }, + { + "epoch": 54.17983651226158, + "grad_norm": 3.6598060131073, + "learning_rate": 9.133155818227338e-06, + "loss": 0.0719, + "step": 19884 + }, + { + "epoch": 54.182561307901906, + "grad_norm": 4.386716365814209, + "learning_rate": 9.132276648835777e-06, + "loss": 0.1611, + "step": 19885 + }, + { + "epoch": 54.18528610354223, + "grad_norm": 3.7580742835998535, + "learning_rate": 9.131397486202016e-06, + "loss": 0.1606, + "step": 19886 + }, + { + "epoch": 54.18801089918256, + "grad_norm": 3.9836504459381104, + "learning_rate": 9.130518330332906e-06, + "loss": 0.1178, + "step": 19887 + }, + { + "epoch": 54.19073569482289, + "grad_norm": 3.4810760021209717, + "learning_rate": 9.129639181235287e-06, + "loss": 0.1179, + "step": 19888 + }, + { + "epoch": 54.19346049046322, + "grad_norm": 4.02688455581665, + "learning_rate": 9.128760038916014e-06, + "loss": 0.183, + "step": 19889 + }, + { + "epoch": 54.19618528610354, + "grad_norm": 5.134456157684326, + "learning_rate": 9.127880903381929e-06, + "loss": 0.1452, + "step": 19890 + }, + { + "epoch": 54.19891008174387, + "grad_norm": 6.035086154937744, + "learning_rate": 9.127001774639879e-06, + "loss": 0.1872, + "step": 19891 + }, + { + "epoch": 54.201634877384194, + "grad_norm": 4.073210716247559, + "learning_rate": 9.12612265269671e-06, + "loss": 0.121, + "step": 19892 + }, + { + "epoch": 54.20435967302452, + "grad_norm": 7.078280448913574, + "learning_rate": 9.125243537559271e-06, + "loss": 0.0725, + "step": 19893 + }, + { + "epoch": 54.20708446866485, + "grad_norm": 4.349194049835205, + "learning_rate": 9.124364429234405e-06, + "loss": 0.3014, + "step": 19894 + }, + { + "epoch": 54.20980926430518, + "grad_norm": 3.871732711791992, + "learning_rate": 9.123485327728964e-06, + "loss": 0.1668, + "step": 19895 + }, + { + "epoch": 54.212534059945504, + "grad_norm": 5.040707111358643, + "learning_rate": 9.122606233049788e-06, + "loss": 0.0866, + "step": 19896 + }, + { + "epoch": 54.21525885558583, + "grad_norm": 4.670590877532959, + "learning_rate": 9.12172714520373e-06, + "loss": 0.261, + "step": 19897 + }, + { + "epoch": 54.217983651226156, + "grad_norm": 3.076552152633667, + "learning_rate": 9.120848064197629e-06, + "loss": 0.0866, + "step": 19898 + }, + { + "epoch": 54.22070844686648, + "grad_norm": 4.455347061157227, + "learning_rate": 9.119968990038333e-06, + "loss": 0.0904, + "step": 19899 + }, + { + "epoch": 54.223433242506815, + "grad_norm": 5.187293529510498, + "learning_rate": 9.119089922732692e-06, + "loss": 0.0904, + "step": 19900 + }, + { + "epoch": 54.22615803814714, + "grad_norm": 4.790494441986084, + "learning_rate": 9.118210862287554e-06, + "loss": 0.2048, + "step": 19901 + }, + { + "epoch": 54.228882833787466, + "grad_norm": 4.984821319580078, + "learning_rate": 9.117331808709758e-06, + "loss": 0.1956, + "step": 19902 + }, + { + "epoch": 54.23160762942779, + "grad_norm": 5.494422912597656, + "learning_rate": 9.116452762006156e-06, + "loss": 0.196, + "step": 19903 + }, + { + "epoch": 54.23433242506812, + "grad_norm": 4.343879699707031, + "learning_rate": 9.11557372218359e-06, + "loss": 0.1167, + "step": 19904 + }, + { + "epoch": 54.237057220708444, + "grad_norm": 5.257289886474609, + "learning_rate": 9.114694689248908e-06, + "loss": 0.2315, + "step": 19905 + }, + { + "epoch": 54.23978201634878, + "grad_norm": 4.560327529907227, + "learning_rate": 9.113815663208954e-06, + "loss": 0.1373, + "step": 19906 + }, + { + "epoch": 54.2425068119891, + "grad_norm": 4.091838836669922, + "learning_rate": 9.112936644070577e-06, + "loss": 0.2889, + "step": 19907 + }, + { + "epoch": 54.24523160762943, + "grad_norm": 5.418046474456787, + "learning_rate": 9.11205763184062e-06, + "loss": 0.0983, + "step": 19908 + }, + { + "epoch": 54.247956403269754, + "grad_norm": 4.3591766357421875, + "learning_rate": 9.11117862652593e-06, + "loss": 0.0921, + "step": 19909 + }, + { + "epoch": 54.25068119891008, + "grad_norm": 3.6707077026367188, + "learning_rate": 9.11029962813335e-06, + "loss": 0.2086, + "step": 19910 + }, + { + "epoch": 54.253405994550405, + "grad_norm": 4.765595436096191, + "learning_rate": 9.10942063666973e-06, + "loss": 0.1228, + "step": 19911 + }, + { + "epoch": 54.25613079019074, + "grad_norm": 4.567806243896484, + "learning_rate": 9.108541652141913e-06, + "loss": 0.2093, + "step": 19912 + }, + { + "epoch": 54.258855585831064, + "grad_norm": 4.311723232269287, + "learning_rate": 9.107662674556746e-06, + "loss": 0.2204, + "step": 19913 + }, + { + "epoch": 54.26158038147139, + "grad_norm": 5.522973537445068, + "learning_rate": 9.106783703921073e-06, + "loss": 0.0944, + "step": 19914 + }, + { + "epoch": 54.264305177111716, + "grad_norm": 4.553855895996094, + "learning_rate": 9.10590474024174e-06, + "loss": 0.1351, + "step": 19915 + }, + { + "epoch": 54.26702997275204, + "grad_norm": 4.051435470581055, + "learning_rate": 9.105025783525587e-06, + "loss": 0.1354, + "step": 19916 + }, + { + "epoch": 54.26975476839237, + "grad_norm": 4.286976337432861, + "learning_rate": 9.104146833779467e-06, + "loss": 0.141, + "step": 19917 + }, + { + "epoch": 54.2724795640327, + "grad_norm": 4.656496524810791, + "learning_rate": 9.103267891010226e-06, + "loss": 0.116, + "step": 19918 + }, + { + "epoch": 54.275204359673026, + "grad_norm": 7.833804607391357, + "learning_rate": 9.102388955224703e-06, + "loss": 0.1368, + "step": 19919 + }, + { + "epoch": 54.27792915531335, + "grad_norm": 7.952826976776123, + "learning_rate": 9.101510026429747e-06, + "loss": 0.0883, + "step": 19920 + }, + { + "epoch": 54.28065395095368, + "grad_norm": 3.5332489013671875, + "learning_rate": 9.100631104632203e-06, + "loss": 0.1683, + "step": 19921 + }, + { + "epoch": 54.283378746594, + "grad_norm": 5.567306041717529, + "learning_rate": 9.099752189838912e-06, + "loss": 0.2112, + "step": 19922 + }, + { + "epoch": 54.28610354223433, + "grad_norm": 11.213207244873047, + "learning_rate": 9.098873282056726e-06, + "loss": 0.193, + "step": 19923 + }, + { + "epoch": 54.28882833787466, + "grad_norm": 3.878872871398926, + "learning_rate": 9.097994381292483e-06, + "loss": 0.1537, + "step": 19924 + }, + { + "epoch": 54.29155313351499, + "grad_norm": 5.20438814163208, + "learning_rate": 9.097115487553033e-06, + "loss": 0.1325, + "step": 19925 + }, + { + "epoch": 54.294277929155314, + "grad_norm": 4.002889156341553, + "learning_rate": 9.096236600845214e-06, + "loss": 0.0691, + "step": 19926 + }, + { + "epoch": 54.29700272479564, + "grad_norm": 5.819010257720947, + "learning_rate": 9.095357721175881e-06, + "loss": 0.1531, + "step": 19927 + }, + { + "epoch": 54.299727520435965, + "grad_norm": 4.930531978607178, + "learning_rate": 9.09447884855187e-06, + "loss": 0.125, + "step": 19928 + }, + { + "epoch": 54.30245231607629, + "grad_norm": 3.960874557495117, + "learning_rate": 9.093599982980029e-06, + "loss": 0.0625, + "step": 19929 + }, + { + "epoch": 54.305177111716624, + "grad_norm": 4.3878326416015625, + "learning_rate": 9.092721124467202e-06, + "loss": 0.1572, + "step": 19930 + }, + { + "epoch": 54.30790190735695, + "grad_norm": 6.021203517913818, + "learning_rate": 9.091842273020233e-06, + "loss": 0.0835, + "step": 19931 + }, + { + "epoch": 54.310626702997276, + "grad_norm": 7.436844825744629, + "learning_rate": 9.090963428645968e-06, + "loss": 0.2068, + "step": 19932 + }, + { + "epoch": 54.3133514986376, + "grad_norm": 3.2498369216918945, + "learning_rate": 9.090084591351247e-06, + "loss": 0.0638, + "step": 19933 + }, + { + "epoch": 54.31607629427793, + "grad_norm": 4.580674648284912, + "learning_rate": 9.089205761142923e-06, + "loss": 0.1088, + "step": 19934 + }, + { + "epoch": 54.31880108991825, + "grad_norm": 4.306822776794434, + "learning_rate": 9.088326938027832e-06, + "loss": 0.1295, + "step": 19935 + }, + { + "epoch": 54.321525885558586, + "grad_norm": 3.0955657958984375, + "learning_rate": 9.087448122012824e-06, + "loss": 0.3952, + "step": 19936 + }, + { + "epoch": 54.32425068119891, + "grad_norm": 3.77670955657959, + "learning_rate": 9.086569313104739e-06, + "loss": 0.1043, + "step": 19937 + }, + { + "epoch": 54.32697547683924, + "grad_norm": 17.023391723632812, + "learning_rate": 9.085690511310425e-06, + "loss": 0.1318, + "step": 19938 + }, + { + "epoch": 54.32970027247956, + "grad_norm": 4.265194416046143, + "learning_rate": 9.084811716636721e-06, + "loss": 0.0826, + "step": 19939 + }, + { + "epoch": 54.33242506811989, + "grad_norm": 3.366642475128174, + "learning_rate": 9.083932929090476e-06, + "loss": 0.1127, + "step": 19940 + }, + { + "epoch": 54.335149863760215, + "grad_norm": 4.4151201248168945, + "learning_rate": 9.083054148678531e-06, + "loss": 0.1242, + "step": 19941 + }, + { + "epoch": 54.33787465940055, + "grad_norm": 4.221611022949219, + "learning_rate": 9.082175375407729e-06, + "loss": 0.1635, + "step": 19942 + }, + { + "epoch": 54.34059945504087, + "grad_norm": 4.439167499542236, + "learning_rate": 9.081296609284919e-06, + "loss": 0.1386, + "step": 19943 + }, + { + "epoch": 54.3433242506812, + "grad_norm": 4.443729400634766, + "learning_rate": 9.080417850316938e-06, + "loss": 0.1717, + "step": 19944 + }, + { + "epoch": 54.346049046321525, + "grad_norm": 4.255154132843018, + "learning_rate": 9.079539098510637e-06, + "loss": 0.1705, + "step": 19945 + }, + { + "epoch": 54.34877384196185, + "grad_norm": 4.578707218170166, + "learning_rate": 9.078660353872853e-06, + "loss": 0.1526, + "step": 19946 + }, + { + "epoch": 54.35149863760218, + "grad_norm": 3.7247154712677, + "learning_rate": 9.077781616410436e-06, + "loss": 0.0903, + "step": 19947 + }, + { + "epoch": 54.35422343324251, + "grad_norm": 3.75530743598938, + "learning_rate": 9.076902886130221e-06, + "loss": 0.1433, + "step": 19948 + }, + { + "epoch": 54.356948228882835, + "grad_norm": 3.572218894958496, + "learning_rate": 9.076024163039061e-06, + "loss": 0.1547, + "step": 19949 + }, + { + "epoch": 54.35967302452316, + "grad_norm": 4.29448938369751, + "learning_rate": 9.075145447143792e-06, + "loss": 0.1369, + "step": 19950 + }, + { + "epoch": 54.36239782016349, + "grad_norm": 4.167031764984131, + "learning_rate": 9.074266738451258e-06, + "loss": 0.1004, + "step": 19951 + }, + { + "epoch": 54.36512261580381, + "grad_norm": 4.512342929840088, + "learning_rate": 9.07338803696831e-06, + "loss": 0.1222, + "step": 19952 + }, + { + "epoch": 54.36784741144414, + "grad_norm": 4.767820835113525, + "learning_rate": 9.072509342701785e-06, + "loss": 0.0902, + "step": 19953 + }, + { + "epoch": 54.37057220708447, + "grad_norm": 3.9609055519104004, + "learning_rate": 9.071630655658528e-06, + "loss": 0.0945, + "step": 19954 + }, + { + "epoch": 54.3732970027248, + "grad_norm": 3.627892255783081, + "learning_rate": 9.070751975845378e-06, + "loss": 0.0796, + "step": 19955 + }, + { + "epoch": 54.37602179836512, + "grad_norm": 3.317429780960083, + "learning_rate": 9.069873303269187e-06, + "loss": 0.2341, + "step": 19956 + }, + { + "epoch": 54.37874659400545, + "grad_norm": 3.9465110301971436, + "learning_rate": 9.068994637936789e-06, + "loss": 0.1977, + "step": 19957 + }, + { + "epoch": 54.381471389645775, + "grad_norm": 3.863725423812866, + "learning_rate": 9.068115979855033e-06, + "loss": 0.1488, + "step": 19958 + }, + { + "epoch": 54.3841961852861, + "grad_norm": 3.8893754482269287, + "learning_rate": 9.067237329030758e-06, + "loss": 0.1253, + "step": 19959 + }, + { + "epoch": 54.38692098092643, + "grad_norm": 3.4500949382781982, + "learning_rate": 9.066358685470811e-06, + "loss": 0.0806, + "step": 19960 + }, + { + "epoch": 54.38964577656676, + "grad_norm": 4.273351669311523, + "learning_rate": 9.06548004918203e-06, + "loss": 0.1133, + "step": 19961 + }, + { + "epoch": 54.392370572207085, + "grad_norm": 4.2101335525512695, + "learning_rate": 9.064601420171262e-06, + "loss": 0.2484, + "step": 19962 + }, + { + "epoch": 54.39509536784741, + "grad_norm": 4.323520660400391, + "learning_rate": 9.063722798445346e-06, + "loss": 0.0516, + "step": 19963 + }, + { + "epoch": 54.39782016348774, + "grad_norm": 4.718120098114014, + "learning_rate": 9.062844184011128e-06, + "loss": 0.1163, + "step": 19964 + }, + { + "epoch": 54.40054495912806, + "grad_norm": 3.932974100112915, + "learning_rate": 9.06196557687545e-06, + "loss": 0.1011, + "step": 19965 + }, + { + "epoch": 54.403269754768395, + "grad_norm": 3.1335978507995605, + "learning_rate": 9.061086977045151e-06, + "loss": 0.0983, + "step": 19966 + }, + { + "epoch": 54.40599455040872, + "grad_norm": 4.015022277832031, + "learning_rate": 9.06020838452708e-06, + "loss": 0.0814, + "step": 19967 + }, + { + "epoch": 54.40871934604905, + "grad_norm": 4.136988162994385, + "learning_rate": 9.059329799328071e-06, + "loss": 0.1075, + "step": 19968 + }, + { + "epoch": 54.41144414168937, + "grad_norm": 3.6818313598632812, + "learning_rate": 9.058451221454974e-06, + "loss": 0.087, + "step": 19969 + }, + { + "epoch": 54.4141689373297, + "grad_norm": 3.534766912460327, + "learning_rate": 9.057572650914631e-06, + "loss": 0.1218, + "step": 19970 + }, + { + "epoch": 54.416893732970024, + "grad_norm": 4.100685119628906, + "learning_rate": 9.05669408771388e-06, + "loss": 0.0897, + "step": 19971 + }, + { + "epoch": 54.41961852861036, + "grad_norm": 3.8797545433044434, + "learning_rate": 9.055815531859565e-06, + "loss": 0.113, + "step": 19972 + }, + { + "epoch": 54.42234332425068, + "grad_norm": 4.971447467803955, + "learning_rate": 9.054936983358528e-06, + "loss": 0.1782, + "step": 19973 + }, + { + "epoch": 54.42506811989101, + "grad_norm": 4.314890384674072, + "learning_rate": 9.054058442217613e-06, + "loss": 0.0845, + "step": 19974 + }, + { + "epoch": 54.427792915531334, + "grad_norm": 4.110722541809082, + "learning_rate": 9.053179908443658e-06, + "loss": 0.1403, + "step": 19975 + }, + { + "epoch": 54.43051771117166, + "grad_norm": 4.262246131896973, + "learning_rate": 9.05230138204351e-06, + "loss": 0.3095, + "step": 19976 + }, + { + "epoch": 54.433242506811986, + "grad_norm": 3.933448076248169, + "learning_rate": 9.051422863024006e-06, + "loss": 0.0857, + "step": 19977 + }, + { + "epoch": 54.43596730245232, + "grad_norm": 4.248157024383545, + "learning_rate": 9.050544351391992e-06, + "loss": 0.0955, + "step": 19978 + }, + { + "epoch": 54.438692098092645, + "grad_norm": 4.22047758102417, + "learning_rate": 9.049665847154307e-06, + "loss": 0.1916, + "step": 19979 + }, + { + "epoch": 54.44141689373297, + "grad_norm": 3.7908871173858643, + "learning_rate": 9.048787350317795e-06, + "loss": 0.257, + "step": 19980 + }, + { + "epoch": 54.444141689373296, + "grad_norm": 4.60216760635376, + "learning_rate": 9.047908860889295e-06, + "loss": 0.2006, + "step": 19981 + }, + { + "epoch": 54.44686648501362, + "grad_norm": 4.825819969177246, + "learning_rate": 9.047030378875652e-06, + "loss": 0.158, + "step": 19982 + }, + { + "epoch": 54.44959128065395, + "grad_norm": 3.4831581115722656, + "learning_rate": 9.046151904283703e-06, + "loss": 0.0746, + "step": 19983 + }, + { + "epoch": 54.45231607629428, + "grad_norm": 3.586744546890259, + "learning_rate": 9.045273437120294e-06, + "loss": 0.0596, + "step": 19984 + }, + { + "epoch": 54.45504087193461, + "grad_norm": 4.446600437164307, + "learning_rate": 9.04439497739226e-06, + "loss": 0.1326, + "step": 19985 + }, + { + "epoch": 54.45776566757493, + "grad_norm": 4.078514099121094, + "learning_rate": 9.043516525106452e-06, + "loss": 0.1062, + "step": 19986 + }, + { + "epoch": 54.46049046321526, + "grad_norm": 4.9097580909729, + "learning_rate": 9.042638080269705e-06, + "loss": 0.1133, + "step": 19987 + }, + { + "epoch": 54.463215258855584, + "grad_norm": 4.0611467361450195, + "learning_rate": 9.041759642888866e-06, + "loss": 0.0827, + "step": 19988 + }, + { + "epoch": 54.46594005449591, + "grad_norm": 4.112037181854248, + "learning_rate": 9.040881212970766e-06, + "loss": 0.1292, + "step": 19989 + }, + { + "epoch": 54.46866485013624, + "grad_norm": 4.098381996154785, + "learning_rate": 9.040002790522257e-06, + "loss": 0.1187, + "step": 19990 + }, + { + "epoch": 54.47138964577657, + "grad_norm": 3.539646863937378, + "learning_rate": 9.039124375550172e-06, + "loss": 0.1378, + "step": 19991 + }, + { + "epoch": 54.474114441416894, + "grad_norm": 4.825586318969727, + "learning_rate": 9.038245968061359e-06, + "loss": 0.0962, + "step": 19992 + }, + { + "epoch": 54.47683923705722, + "grad_norm": 5.104846477508545, + "learning_rate": 9.037367568062653e-06, + "loss": 0.1234, + "step": 19993 + }, + { + "epoch": 54.479564032697546, + "grad_norm": 4.715920925140381, + "learning_rate": 9.0364891755609e-06, + "loss": 0.1236, + "step": 19994 + }, + { + "epoch": 54.48228882833787, + "grad_norm": 7.497341156005859, + "learning_rate": 9.035610790562934e-06, + "loss": 0.226, + "step": 19995 + }, + { + "epoch": 54.485013623978205, + "grad_norm": 4.018693923950195, + "learning_rate": 9.034732413075603e-06, + "loss": 0.2543, + "step": 19996 + }, + { + "epoch": 54.48773841961853, + "grad_norm": 4.353559970855713, + "learning_rate": 9.033854043105743e-06, + "loss": 0.0858, + "step": 19997 + }, + { + "epoch": 54.490463215258856, + "grad_norm": 3.7409958839416504, + "learning_rate": 9.032975680660199e-06, + "loss": 0.0805, + "step": 19998 + }, + { + "epoch": 54.49318801089918, + "grad_norm": 7.8233137130737305, + "learning_rate": 9.032097325745808e-06, + "loss": 0.0697, + "step": 19999 + }, + { + "epoch": 54.49591280653951, + "grad_norm": 4.105851173400879, + "learning_rate": 9.031218978369412e-06, + "loss": 0.1566, + "step": 20000 + }, + { + "epoch": 54.49863760217983, + "grad_norm": 3.414713144302368, + "learning_rate": 9.03034063853785e-06, + "loss": 0.0754, + "step": 20001 + }, + { + "epoch": 54.50136239782017, + "grad_norm": 4.375031471252441, + "learning_rate": 9.029462306257964e-06, + "loss": 0.1029, + "step": 20002 + }, + { + "epoch": 54.50408719346049, + "grad_norm": 4.491516590118408, + "learning_rate": 9.028583981536596e-06, + "loss": 0.1226, + "step": 20003 + }, + { + "epoch": 54.50681198910082, + "grad_norm": 7.4483137130737305, + "learning_rate": 9.027705664380584e-06, + "loss": 0.1017, + "step": 20004 + }, + { + "epoch": 54.509536784741144, + "grad_norm": 4.860036373138428, + "learning_rate": 9.02682735479677e-06, + "loss": 0.1738, + "step": 20005 + }, + { + "epoch": 54.51226158038147, + "grad_norm": 3.863717555999756, + "learning_rate": 9.025949052791991e-06, + "loss": 0.0832, + "step": 20006 + }, + { + "epoch": 54.514986376021795, + "grad_norm": 3.6477813720703125, + "learning_rate": 9.02507075837309e-06, + "loss": 0.097, + "step": 20007 + }, + { + "epoch": 54.51771117166213, + "grad_norm": 3.176609992980957, + "learning_rate": 9.024192471546908e-06, + "loss": 0.0911, + "step": 20008 + }, + { + "epoch": 54.520435967302454, + "grad_norm": 3.793543577194214, + "learning_rate": 9.023314192320283e-06, + "loss": 0.25, + "step": 20009 + }, + { + "epoch": 54.52316076294278, + "grad_norm": 3.5359690189361572, + "learning_rate": 9.022435920700056e-06, + "loss": 0.0817, + "step": 20010 + }, + { + "epoch": 54.525885558583106, + "grad_norm": 3.758002519607544, + "learning_rate": 9.021557656693066e-06, + "loss": 0.1665, + "step": 20011 + }, + { + "epoch": 54.52861035422343, + "grad_norm": 3.602189540863037, + "learning_rate": 9.020679400306156e-06, + "loss": 0.2699, + "step": 20012 + }, + { + "epoch": 54.53133514986376, + "grad_norm": 3.8625736236572266, + "learning_rate": 9.019801151546158e-06, + "loss": 0.1331, + "step": 20013 + }, + { + "epoch": 54.53405994550409, + "grad_norm": 3.1072683334350586, + "learning_rate": 9.018922910419922e-06, + "loss": 0.0707, + "step": 20014 + }, + { + "epoch": 54.536784741144416, + "grad_norm": 4.463259220123291, + "learning_rate": 9.01804467693428e-06, + "loss": 0.1598, + "step": 20015 + }, + { + "epoch": 54.53950953678474, + "grad_norm": 3.9788694381713867, + "learning_rate": 9.017166451096077e-06, + "loss": 0.0881, + "step": 20016 + }, + { + "epoch": 54.54223433242507, + "grad_norm": 14.165175437927246, + "learning_rate": 9.016288232912149e-06, + "loss": 0.3357, + "step": 20017 + }, + { + "epoch": 54.54495912806539, + "grad_norm": 4.943851470947266, + "learning_rate": 9.015410022389336e-06, + "loss": 0.1081, + "step": 20018 + }, + { + "epoch": 54.54768392370572, + "grad_norm": 3.5630993843078613, + "learning_rate": 9.014531819534476e-06, + "loss": 0.0687, + "step": 20019 + }, + { + "epoch": 54.55040871934605, + "grad_norm": 3.5773746967315674, + "learning_rate": 9.013653624354412e-06, + "loss": 0.0726, + "step": 20020 + }, + { + "epoch": 54.55313351498638, + "grad_norm": 4.466707229614258, + "learning_rate": 9.012775436855983e-06, + "loss": 0.122, + "step": 20021 + }, + { + "epoch": 54.555858310626704, + "grad_norm": 5.6644816398620605, + "learning_rate": 9.011897257046025e-06, + "loss": 0.3513, + "step": 20022 + }, + { + "epoch": 54.55858310626703, + "grad_norm": 4.832213401794434, + "learning_rate": 9.011019084931383e-06, + "loss": 0.1543, + "step": 20023 + }, + { + "epoch": 54.561307901907355, + "grad_norm": 3.8002867698669434, + "learning_rate": 9.01014092051889e-06, + "loss": 0.087, + "step": 20024 + }, + { + "epoch": 54.56403269754768, + "grad_norm": 3.9812376499176025, + "learning_rate": 9.009262763815389e-06, + "loss": 0.1795, + "step": 20025 + }, + { + "epoch": 54.566757493188014, + "grad_norm": 6.038990497589111, + "learning_rate": 9.008384614827716e-06, + "loss": 0.0586, + "step": 20026 + }, + { + "epoch": 54.56948228882834, + "grad_norm": 3.3449394702911377, + "learning_rate": 9.007506473562713e-06, + "loss": 0.0652, + "step": 20027 + }, + { + "epoch": 54.572207084468666, + "grad_norm": 4.443698406219482, + "learning_rate": 9.006628340027215e-06, + "loss": 0.2079, + "step": 20028 + }, + { + "epoch": 54.57493188010899, + "grad_norm": 4.384361743927002, + "learning_rate": 9.005750214228066e-06, + "loss": 0.128, + "step": 20029 + }, + { + "epoch": 54.57765667574932, + "grad_norm": 4.37651252746582, + "learning_rate": 9.004872096172103e-06, + "loss": 0.1511, + "step": 20030 + }, + { + "epoch": 54.58038147138964, + "grad_norm": 4.8329267501831055, + "learning_rate": 9.003993985866162e-06, + "loss": 0.0954, + "step": 20031 + }, + { + "epoch": 54.583106267029976, + "grad_norm": 7.993609428405762, + "learning_rate": 9.003115883317085e-06, + "loss": 0.236, + "step": 20032 + }, + { + "epoch": 54.5858310626703, + "grad_norm": 4.4574174880981445, + "learning_rate": 9.00223778853171e-06, + "loss": 0.144, + "step": 20033 + }, + { + "epoch": 54.58855585831063, + "grad_norm": 3.9963061809539795, + "learning_rate": 9.001359701516876e-06, + "loss": 0.1694, + "step": 20034 + }, + { + "epoch": 54.59128065395095, + "grad_norm": 4.554906368255615, + "learning_rate": 9.000481622279417e-06, + "loss": 0.0969, + "step": 20035 + }, + { + "epoch": 54.59400544959128, + "grad_norm": 4.027370929718018, + "learning_rate": 8.999603550826179e-06, + "loss": 0.1302, + "step": 20036 + }, + { + "epoch": 54.596730245231605, + "grad_norm": 4.896831035614014, + "learning_rate": 8.998725487163989e-06, + "loss": 0.0989, + "step": 20037 + }, + { + "epoch": 54.59945504087194, + "grad_norm": 4.44710111618042, + "learning_rate": 8.997847431299697e-06, + "loss": 0.1535, + "step": 20038 + }, + { + "epoch": 54.60217983651226, + "grad_norm": 5.024483680725098, + "learning_rate": 8.996969383240139e-06, + "loss": 0.2239, + "step": 20039 + }, + { + "epoch": 54.60490463215259, + "grad_norm": 2.951127529144287, + "learning_rate": 8.996091342992149e-06, + "loss": 0.1386, + "step": 20040 + }, + { + "epoch": 54.607629427792915, + "grad_norm": 6.057160377502441, + "learning_rate": 8.99521331056257e-06, + "loss": 0.0736, + "step": 20041 + }, + { + "epoch": 54.61035422343324, + "grad_norm": 5.51812219619751, + "learning_rate": 8.994335285958235e-06, + "loss": 0.1019, + "step": 20042 + }, + { + "epoch": 54.61307901907357, + "grad_norm": 4.582193374633789, + "learning_rate": 8.993457269185985e-06, + "loss": 0.239, + "step": 20043 + }, + { + "epoch": 54.6158038147139, + "grad_norm": 4.180214881896973, + "learning_rate": 8.992579260252657e-06, + "loss": 0.2014, + "step": 20044 + }, + { + "epoch": 54.618528610354225, + "grad_norm": 5.111598014831543, + "learning_rate": 8.99170125916509e-06, + "loss": 0.1955, + "step": 20045 + }, + { + "epoch": 54.62125340599455, + "grad_norm": 4.240719318389893, + "learning_rate": 8.99082326593012e-06, + "loss": 0.1793, + "step": 20046 + }, + { + "epoch": 54.62397820163488, + "grad_norm": 3.8516135215759277, + "learning_rate": 8.98994528055459e-06, + "loss": 0.2461, + "step": 20047 + }, + { + "epoch": 54.6267029972752, + "grad_norm": 8.28837776184082, + "learning_rate": 8.989067303045329e-06, + "loss": 0.2363, + "step": 20048 + }, + { + "epoch": 54.62942779291553, + "grad_norm": 6.5025858879089355, + "learning_rate": 8.988189333409181e-06, + "loss": 0.097, + "step": 20049 + }, + { + "epoch": 54.63215258855586, + "grad_norm": 5.841561317443848, + "learning_rate": 8.987311371652981e-06, + "loss": 0.1508, + "step": 20050 + }, + { + "epoch": 54.63487738419619, + "grad_norm": 4.039793491363525, + "learning_rate": 8.986433417783568e-06, + "loss": 0.1022, + "step": 20051 + }, + { + "epoch": 54.63760217983651, + "grad_norm": 4.460607051849365, + "learning_rate": 8.98555547180778e-06, + "loss": 0.0702, + "step": 20052 + }, + { + "epoch": 54.64032697547684, + "grad_norm": 5.703071594238281, + "learning_rate": 8.98467753373245e-06, + "loss": 0.0853, + "step": 20053 + }, + { + "epoch": 54.643051771117165, + "grad_norm": 3.826636552810669, + "learning_rate": 8.983799603564419e-06, + "loss": 0.0832, + "step": 20054 + }, + { + "epoch": 54.64577656675749, + "grad_norm": 4.368951797485352, + "learning_rate": 8.982921681310527e-06, + "loss": 0.1486, + "step": 20055 + }, + { + "epoch": 54.64850136239782, + "grad_norm": 3.9449362754821777, + "learning_rate": 8.982043766977606e-06, + "loss": 0.2082, + "step": 20056 + }, + { + "epoch": 54.65122615803815, + "grad_norm": 4.87952995300293, + "learning_rate": 8.981165860572498e-06, + "loss": 0.1528, + "step": 20057 + }, + { + "epoch": 54.653950953678475, + "grad_norm": 5.293972969055176, + "learning_rate": 8.980287962102035e-06, + "loss": 0.2195, + "step": 20058 + }, + { + "epoch": 54.6566757493188, + "grad_norm": 3.0508005619049072, + "learning_rate": 8.979410071573059e-06, + "loss": 0.1929, + "step": 20059 + }, + { + "epoch": 54.65940054495913, + "grad_norm": 4.53085470199585, + "learning_rate": 8.978532188992403e-06, + "loss": 0.1281, + "step": 20060 + }, + { + "epoch": 54.66212534059945, + "grad_norm": 6.887814998626709, + "learning_rate": 8.977654314366906e-06, + "loss": 0.0915, + "step": 20061 + }, + { + "epoch": 54.664850136239785, + "grad_norm": 4.136505126953125, + "learning_rate": 8.976776447703402e-06, + "loss": 0.2221, + "step": 20062 + }, + { + "epoch": 54.66757493188011, + "grad_norm": 4.612685203552246, + "learning_rate": 8.975898589008734e-06, + "loss": 0.1751, + "step": 20063 + }, + { + "epoch": 54.67029972752044, + "grad_norm": 4.009918212890625, + "learning_rate": 8.975020738289732e-06, + "loss": 0.1879, + "step": 20064 + }, + { + "epoch": 54.67302452316076, + "grad_norm": 5.834253311157227, + "learning_rate": 8.974142895553237e-06, + "loss": 0.0889, + "step": 20065 + }, + { + "epoch": 54.67574931880109, + "grad_norm": 13.993331909179688, + "learning_rate": 8.973265060806083e-06, + "loss": 0.0889, + "step": 20066 + }, + { + "epoch": 54.678474114441414, + "grad_norm": 4.5561323165893555, + "learning_rate": 8.972387234055109e-06, + "loss": 0.0818, + "step": 20067 + }, + { + "epoch": 54.68119891008175, + "grad_norm": 3.4230246543884277, + "learning_rate": 8.971509415307147e-06, + "loss": 0.1092, + "step": 20068 + }, + { + "epoch": 54.68392370572207, + "grad_norm": 4.538247585296631, + "learning_rate": 8.970631604569041e-06, + "loss": 0.2038, + "step": 20069 + }, + { + "epoch": 54.6866485013624, + "grad_norm": 5.932735443115234, + "learning_rate": 8.96975380184762e-06, + "loss": 0.0815, + "step": 20070 + }, + { + "epoch": 54.689373297002724, + "grad_norm": 3.391663074493408, + "learning_rate": 8.968876007149721e-06, + "loss": 0.2214, + "step": 20071 + }, + { + "epoch": 54.69209809264305, + "grad_norm": 4.163836479187012, + "learning_rate": 8.967998220482184e-06, + "loss": 0.1795, + "step": 20072 + }, + { + "epoch": 54.694822888283376, + "grad_norm": 3.9255266189575195, + "learning_rate": 8.967120441851846e-06, + "loss": 0.1985, + "step": 20073 + }, + { + "epoch": 54.69754768392371, + "grad_norm": 6.915604591369629, + "learning_rate": 8.966242671265539e-06, + "loss": 0.1629, + "step": 20074 + }, + { + "epoch": 54.700272479564035, + "grad_norm": 4.429693698883057, + "learning_rate": 8.965364908730103e-06, + "loss": 0.1756, + "step": 20075 + }, + { + "epoch": 54.70299727520436, + "grad_norm": 8.323269844055176, + "learning_rate": 8.96448715425237e-06, + "loss": 0.1755, + "step": 20076 + }, + { + "epoch": 54.705722070844686, + "grad_norm": 3.622795581817627, + "learning_rate": 8.96360940783918e-06, + "loss": 0.1408, + "step": 20077 + }, + { + "epoch": 54.70844686648501, + "grad_norm": 6.326815605163574, + "learning_rate": 8.962731669497364e-06, + "loss": 0.1186, + "step": 20078 + }, + { + "epoch": 54.71117166212534, + "grad_norm": 4.19735860824585, + "learning_rate": 8.96185393923376e-06, + "loss": 0.065, + "step": 20079 + }, + { + "epoch": 54.71389645776567, + "grad_norm": 3.568211793899536, + "learning_rate": 8.960976217055205e-06, + "loss": 0.1169, + "step": 20080 + }, + { + "epoch": 54.716621253406, + "grad_norm": 5.315328598022461, + "learning_rate": 8.960098502968535e-06, + "loss": 0.1154, + "step": 20081 + }, + { + "epoch": 54.71934604904632, + "grad_norm": 4.539693832397461, + "learning_rate": 8.959220796980583e-06, + "loss": 0.1923, + "step": 20082 + }, + { + "epoch": 54.72207084468665, + "grad_norm": 3.790686845779419, + "learning_rate": 8.958343099098187e-06, + "loss": 0.1331, + "step": 20083 + }, + { + "epoch": 54.724795640326974, + "grad_norm": 4.368740558624268, + "learning_rate": 8.95746540932818e-06, + "loss": 0.0937, + "step": 20084 + }, + { + "epoch": 54.7275204359673, + "grad_norm": 5.634218692779541, + "learning_rate": 8.956587727677402e-06, + "loss": 0.1788, + "step": 20085 + }, + { + "epoch": 54.73024523160763, + "grad_norm": 4.544315814971924, + "learning_rate": 8.95571005415268e-06, + "loss": 0.21, + "step": 20086 + }, + { + "epoch": 54.73297002724796, + "grad_norm": 4.4608845710754395, + "learning_rate": 8.954832388760859e-06, + "loss": 0.1745, + "step": 20087 + }, + { + "epoch": 54.735694822888284, + "grad_norm": 4.1434831619262695, + "learning_rate": 8.953954731508765e-06, + "loss": 0.0603, + "step": 20088 + }, + { + "epoch": 54.73841961852861, + "grad_norm": 4.548007488250732, + "learning_rate": 8.95307708240324e-06, + "loss": 0.1487, + "step": 20089 + }, + { + "epoch": 54.741144414168936, + "grad_norm": 3.8979296684265137, + "learning_rate": 8.95219944145112e-06, + "loss": 0.1216, + "step": 20090 + }, + { + "epoch": 54.74386920980926, + "grad_norm": 4.369950771331787, + "learning_rate": 8.951321808659232e-06, + "loss": 0.2392, + "step": 20091 + }, + { + "epoch": 54.746594005449595, + "grad_norm": 3.8677966594696045, + "learning_rate": 8.950444184034422e-06, + "loss": 0.2513, + "step": 20092 + }, + { + "epoch": 54.74931880108992, + "grad_norm": 4.533779621124268, + "learning_rate": 8.949566567583514e-06, + "loss": 0.1116, + "step": 20093 + }, + { + "epoch": 54.752043596730246, + "grad_norm": 4.238668918609619, + "learning_rate": 8.948688959313348e-06, + "loss": 0.1522, + "step": 20094 + }, + { + "epoch": 54.75476839237057, + "grad_norm": 10.364192008972168, + "learning_rate": 8.947811359230762e-06, + "loss": 0.2108, + "step": 20095 + }, + { + "epoch": 54.7574931880109, + "grad_norm": 3.525343656539917, + "learning_rate": 8.946933767342584e-06, + "loss": 0.0685, + "step": 20096 + }, + { + "epoch": 54.76021798365122, + "grad_norm": 3.2858309745788574, + "learning_rate": 8.946056183655654e-06, + "loss": 0.0597, + "step": 20097 + }, + { + "epoch": 54.762942779291556, + "grad_norm": 4.3708977699279785, + "learning_rate": 8.945178608176804e-06, + "loss": 0.0842, + "step": 20098 + }, + { + "epoch": 54.76566757493188, + "grad_norm": 4.582279682159424, + "learning_rate": 8.94430104091287e-06, + "loss": 0.1406, + "step": 20099 + }, + { + "epoch": 54.76839237057221, + "grad_norm": 4.604583740234375, + "learning_rate": 8.943423481870684e-06, + "loss": 0.1027, + "step": 20100 + }, + { + "epoch": 54.771117166212534, + "grad_norm": 3.1620655059814453, + "learning_rate": 8.942545931057083e-06, + "loss": 0.1076, + "step": 20101 + }, + { + "epoch": 54.77384196185286, + "grad_norm": 3.718745470046997, + "learning_rate": 8.941668388478898e-06, + "loss": 0.1667, + "step": 20102 + }, + { + "epoch": 54.776566757493185, + "grad_norm": 3.7406957149505615, + "learning_rate": 8.940790854142967e-06, + "loss": 0.1095, + "step": 20103 + }, + { + "epoch": 54.77929155313352, + "grad_norm": 3.9838240146636963, + "learning_rate": 8.939913328056123e-06, + "loss": 0.1433, + "step": 20104 + }, + { + "epoch": 54.782016348773844, + "grad_norm": 3.6580402851104736, + "learning_rate": 8.939035810225196e-06, + "loss": 0.0863, + "step": 20105 + }, + { + "epoch": 54.78474114441417, + "grad_norm": 3.1197941303253174, + "learning_rate": 8.93815830065703e-06, + "loss": 0.1193, + "step": 20106 + }, + { + "epoch": 54.787465940054496, + "grad_norm": 3.9491944313049316, + "learning_rate": 8.937280799358449e-06, + "loss": 0.2518, + "step": 20107 + }, + { + "epoch": 54.79019073569482, + "grad_norm": 4.503064155578613, + "learning_rate": 8.936403306336294e-06, + "loss": 0.1006, + "step": 20108 + }, + { + "epoch": 54.79291553133515, + "grad_norm": 5.052579879760742, + "learning_rate": 8.935525821597393e-06, + "loss": 0.2372, + "step": 20109 + }, + { + "epoch": 54.79564032697548, + "grad_norm": 5.94606351852417, + "learning_rate": 8.934648345148586e-06, + "loss": 0.1735, + "step": 20110 + }, + { + "epoch": 54.798365122615806, + "grad_norm": 5.028207302093506, + "learning_rate": 8.933770876996701e-06, + "loss": 0.1473, + "step": 20111 + }, + { + "epoch": 54.80108991825613, + "grad_norm": 4.2381591796875, + "learning_rate": 8.932893417148574e-06, + "loss": 0.1469, + "step": 20112 + }, + { + "epoch": 54.80381471389646, + "grad_norm": 5.26708984375, + "learning_rate": 8.932015965611039e-06, + "loss": 0.1179, + "step": 20113 + }, + { + "epoch": 54.80653950953678, + "grad_norm": 3.5204062461853027, + "learning_rate": 8.931138522390932e-06, + "loss": 0.1249, + "step": 20114 + }, + { + "epoch": 54.80926430517711, + "grad_norm": 13.216294288635254, + "learning_rate": 8.93026108749508e-06, + "loss": 0.0952, + "step": 20115 + }, + { + "epoch": 54.81198910081744, + "grad_norm": 4.192880153656006, + "learning_rate": 8.92938366093032e-06, + "loss": 0.1293, + "step": 20116 + }, + { + "epoch": 54.81471389645777, + "grad_norm": 4.845882415771484, + "learning_rate": 8.928506242703487e-06, + "loss": 0.1374, + "step": 20117 + }, + { + "epoch": 54.817438692098094, + "grad_norm": 3.507521629333496, + "learning_rate": 8.927628832821414e-06, + "loss": 0.1211, + "step": 20118 + }, + { + "epoch": 54.82016348773842, + "grad_norm": 3.631596803665161, + "learning_rate": 8.926751431290932e-06, + "loss": 0.1978, + "step": 20119 + }, + { + "epoch": 54.822888283378745, + "grad_norm": 3.468186855316162, + "learning_rate": 8.925874038118874e-06, + "loss": 0.1683, + "step": 20120 + }, + { + "epoch": 54.82561307901907, + "grad_norm": 5.478501319885254, + "learning_rate": 8.924996653312078e-06, + "loss": 0.1497, + "step": 20121 + }, + { + "epoch": 54.828337874659404, + "grad_norm": 4.084097862243652, + "learning_rate": 8.92411927687737e-06, + "loss": 0.1836, + "step": 20122 + }, + { + "epoch": 54.83106267029973, + "grad_norm": 4.4851603507995605, + "learning_rate": 8.923241908821585e-06, + "loss": 0.097, + "step": 20123 + }, + { + "epoch": 54.833787465940055, + "grad_norm": 4.094699859619141, + "learning_rate": 8.92236454915156e-06, + "loss": 0.187, + "step": 20124 + }, + { + "epoch": 54.83651226158038, + "grad_norm": 4.169244289398193, + "learning_rate": 8.921487197874125e-06, + "loss": 0.1711, + "step": 20125 + }, + { + "epoch": 54.83923705722071, + "grad_norm": 4.472836494445801, + "learning_rate": 8.920609854996114e-06, + "loss": 0.1385, + "step": 20126 + }, + { + "epoch": 54.84196185286103, + "grad_norm": 4.887625694274902, + "learning_rate": 8.919732520524358e-06, + "loss": 0.0653, + "step": 20127 + }, + { + "epoch": 54.844686648501366, + "grad_norm": 3.731388568878174, + "learning_rate": 8.918855194465692e-06, + "loss": 0.1478, + "step": 20128 + }, + { + "epoch": 54.84741144414169, + "grad_norm": 3.4862475395202637, + "learning_rate": 8.917977876826944e-06, + "loss": 0.068, + "step": 20129 + }, + { + "epoch": 54.85013623978202, + "grad_norm": 3.36405086517334, + "learning_rate": 8.917100567614953e-06, + "loss": 0.1545, + "step": 20130 + }, + { + "epoch": 54.85286103542234, + "grad_norm": 4.44132661819458, + "learning_rate": 8.916223266836545e-06, + "loss": 0.0733, + "step": 20131 + }, + { + "epoch": 54.85558583106267, + "grad_norm": 3.3464503288269043, + "learning_rate": 8.915345974498555e-06, + "loss": 0.1082, + "step": 20132 + }, + { + "epoch": 54.858310626702995, + "grad_norm": 3.916621208190918, + "learning_rate": 8.914468690607817e-06, + "loss": 0.1018, + "step": 20133 + }, + { + "epoch": 54.86103542234333, + "grad_norm": 3.7433347702026367, + "learning_rate": 8.913591415171164e-06, + "loss": 0.2159, + "step": 20134 + }, + { + "epoch": 54.86376021798365, + "grad_norm": 4.746287822723389, + "learning_rate": 8.912714148195421e-06, + "loss": 0.0847, + "step": 20135 + }, + { + "epoch": 54.86648501362398, + "grad_norm": 3.4867773056030273, + "learning_rate": 8.91183688968743e-06, + "loss": 0.1162, + "step": 20136 + }, + { + "epoch": 54.869209809264305, + "grad_norm": 4.690593719482422, + "learning_rate": 8.910959639654016e-06, + "loss": 0.1168, + "step": 20137 + }, + { + "epoch": 54.87193460490463, + "grad_norm": 5.641656875610352, + "learning_rate": 8.910082398102011e-06, + "loss": 0.1863, + "step": 20138 + }, + { + "epoch": 54.87465940054496, + "grad_norm": 3.7166199684143066, + "learning_rate": 8.909205165038254e-06, + "loss": 0.0903, + "step": 20139 + }, + { + "epoch": 54.87738419618529, + "grad_norm": 3.8179373741149902, + "learning_rate": 8.908327940469566e-06, + "loss": 0.1289, + "step": 20140 + }, + { + "epoch": 54.880108991825615, + "grad_norm": 3.5929508209228516, + "learning_rate": 8.907450724402787e-06, + "loss": 0.2132, + "step": 20141 + }, + { + "epoch": 54.88283378746594, + "grad_norm": 4.170956611633301, + "learning_rate": 8.906573516844749e-06, + "loss": 0.0654, + "step": 20142 + }, + { + "epoch": 54.88555858310627, + "grad_norm": 5.51287841796875, + "learning_rate": 8.90569631780228e-06, + "loss": 0.3354, + "step": 20143 + }, + { + "epoch": 54.88828337874659, + "grad_norm": 4.574120044708252, + "learning_rate": 8.904819127282215e-06, + "loss": 0.1151, + "step": 20144 + }, + { + "epoch": 54.89100817438692, + "grad_norm": 4.020722389221191, + "learning_rate": 8.903941945291381e-06, + "loss": 0.0802, + "step": 20145 + }, + { + "epoch": 54.89373297002725, + "grad_norm": 4.197763442993164, + "learning_rate": 8.903064771836614e-06, + "loss": 0.0967, + "step": 20146 + }, + { + "epoch": 54.89645776566758, + "grad_norm": 4.7374138832092285, + "learning_rate": 8.90218760692474e-06, + "loss": 0.104, + "step": 20147 + }, + { + "epoch": 54.8991825613079, + "grad_norm": 4.119732856750488, + "learning_rate": 8.901310450562596e-06, + "loss": 0.1324, + "step": 20148 + }, + { + "epoch": 54.90190735694823, + "grad_norm": 4.031776428222656, + "learning_rate": 8.900433302757011e-06, + "loss": 0.1899, + "step": 20149 + }, + { + "epoch": 54.904632152588555, + "grad_norm": 3.7676784992218018, + "learning_rate": 8.899556163514816e-06, + "loss": 0.0882, + "step": 20150 + }, + { + "epoch": 54.90735694822888, + "grad_norm": 3.5313427448272705, + "learning_rate": 8.898679032842841e-06, + "loss": 0.0704, + "step": 20151 + }, + { + "epoch": 54.91008174386921, + "grad_norm": 7.0860748291015625, + "learning_rate": 8.89780191074792e-06, + "loss": 0.3893, + "step": 20152 + }, + { + "epoch": 54.91280653950954, + "grad_norm": 4.015528678894043, + "learning_rate": 8.89692479723688e-06, + "loss": 0.0862, + "step": 20153 + }, + { + "epoch": 54.915531335149865, + "grad_norm": 3.9792304039001465, + "learning_rate": 8.896047692316556e-06, + "loss": 0.0752, + "step": 20154 + }, + { + "epoch": 54.91825613079019, + "grad_norm": 4.7039794921875, + "learning_rate": 8.895170595993775e-06, + "loss": 0.0793, + "step": 20155 + }, + { + "epoch": 54.920980926430516, + "grad_norm": 3.5627522468566895, + "learning_rate": 8.894293508275372e-06, + "loss": 0.0566, + "step": 20156 + }, + { + "epoch": 54.92370572207084, + "grad_norm": 3.825472831726074, + "learning_rate": 8.89341642916817e-06, + "loss": 0.0845, + "step": 20157 + }, + { + "epoch": 54.926430517711175, + "grad_norm": 6.54740047454834, + "learning_rate": 8.89253935867901e-06, + "loss": 0.1128, + "step": 20158 + }, + { + "epoch": 54.9291553133515, + "grad_norm": 3.504307985305786, + "learning_rate": 8.891662296814718e-06, + "loss": 0.0474, + "step": 20159 + }, + { + "epoch": 54.93188010899183, + "grad_norm": 3.362431049346924, + "learning_rate": 8.890785243582126e-06, + "loss": 0.0863, + "step": 20160 + }, + { + "epoch": 54.93460490463215, + "grad_norm": 4.529660701751709, + "learning_rate": 8.88990819898806e-06, + "loss": 0.1229, + "step": 20161 + }, + { + "epoch": 54.93732970027248, + "grad_norm": 4.243590354919434, + "learning_rate": 8.889031163039354e-06, + "loss": 0.1806, + "step": 20162 + }, + { + "epoch": 54.940054495912804, + "grad_norm": 4.1471052169799805, + "learning_rate": 8.888154135742837e-06, + "loss": 0.1809, + "step": 20163 + }, + { + "epoch": 54.94277929155314, + "grad_norm": 4.807526111602783, + "learning_rate": 8.887277117105342e-06, + "loss": 0.1097, + "step": 20164 + }, + { + "epoch": 54.94550408719346, + "grad_norm": 4.902317523956299, + "learning_rate": 8.886400107133693e-06, + "loss": 0.0878, + "step": 20165 + }, + { + "epoch": 54.94822888283379, + "grad_norm": 3.7905032634735107, + "learning_rate": 8.885523105834728e-06, + "loss": 0.0941, + "step": 20166 + }, + { + "epoch": 54.950953678474114, + "grad_norm": 3.9634134769439697, + "learning_rate": 8.884646113215271e-06, + "loss": 0.1036, + "step": 20167 + }, + { + "epoch": 54.95367847411444, + "grad_norm": 3.690251588821411, + "learning_rate": 8.883769129282157e-06, + "loss": 0.1237, + "step": 20168 + }, + { + "epoch": 54.956403269754766, + "grad_norm": 3.8657050132751465, + "learning_rate": 8.88289215404221e-06, + "loss": 0.0878, + "step": 20169 + }, + { + "epoch": 54.95912806539509, + "grad_norm": 3.9786417484283447, + "learning_rate": 8.882015187502266e-06, + "loss": 0.1353, + "step": 20170 + }, + { + "epoch": 54.961852861035425, + "grad_norm": 3.9551243782043457, + "learning_rate": 8.881138229669148e-06, + "loss": 0.0948, + "step": 20171 + }, + { + "epoch": 54.96457765667575, + "grad_norm": 3.3971383571624756, + "learning_rate": 8.880261280549693e-06, + "loss": 0.0944, + "step": 20172 + }, + { + "epoch": 54.967302452316076, + "grad_norm": 3.829512119293213, + "learning_rate": 8.879384340150723e-06, + "loss": 0.0624, + "step": 20173 + }, + { + "epoch": 54.9700272479564, + "grad_norm": 3.6681878566741943, + "learning_rate": 8.878507408479071e-06, + "loss": 0.1425, + "step": 20174 + }, + { + "epoch": 54.97275204359673, + "grad_norm": 5.585506439208984, + "learning_rate": 8.877630485541572e-06, + "loss": 0.1311, + "step": 20175 + }, + { + "epoch": 54.97547683923706, + "grad_norm": 3.7614965438842773, + "learning_rate": 8.876753571345047e-06, + "loss": 0.1328, + "step": 20176 + }, + { + "epoch": 54.97820163487739, + "grad_norm": 3.8820040225982666, + "learning_rate": 8.875876665896332e-06, + "loss": 0.146, + "step": 20177 + }, + { + "epoch": 54.98092643051771, + "grad_norm": 4.194509983062744, + "learning_rate": 8.874999769202252e-06, + "loss": 0.0942, + "step": 20178 + }, + { + "epoch": 54.98365122615804, + "grad_norm": 3.0866785049438477, + "learning_rate": 8.874122881269638e-06, + "loss": 0.0562, + "step": 20179 + }, + { + "epoch": 54.986376021798364, + "grad_norm": 4.456143379211426, + "learning_rate": 8.873246002105318e-06, + "loss": 0.1501, + "step": 20180 + }, + { + "epoch": 54.98910081743869, + "grad_norm": 5.2778544425964355, + "learning_rate": 8.872369131716122e-06, + "loss": 0.1049, + "step": 20181 + }, + { + "epoch": 54.991825613079016, + "grad_norm": 4.072261333465576, + "learning_rate": 8.87149227010888e-06, + "loss": 0.0715, + "step": 20182 + }, + { + "epoch": 54.99455040871935, + "grad_norm": 4.435225963592529, + "learning_rate": 8.870615417290418e-06, + "loss": 0.1282, + "step": 20183 + }, + { + "epoch": 54.997275204359674, + "grad_norm": 7.494845390319824, + "learning_rate": 8.86973857326757e-06, + "loss": 0.3999, + "step": 20184 + }, + { + "epoch": 55.0, + "grad_norm": 3.7138309478759766, + "learning_rate": 8.868861738047158e-06, + "loss": 0.3206, + "step": 20185 + }, + { + "epoch": 55.002724795640326, + "grad_norm": 2.3504903316497803, + "learning_rate": 8.867984911636018e-06, + "loss": 0.042, + "step": 20186 + }, + { + "epoch": 55.00544959128065, + "grad_norm": 4.132227420806885, + "learning_rate": 8.867108094040971e-06, + "loss": 0.1461, + "step": 20187 + }, + { + "epoch": 55.00817438692098, + "grad_norm": 5.002457141876221, + "learning_rate": 8.866231285268853e-06, + "loss": 0.085, + "step": 20188 + }, + { + "epoch": 55.01089918256131, + "grad_norm": 3.5996875762939453, + "learning_rate": 8.865354485326488e-06, + "loss": 0.1164, + "step": 20189 + }, + { + "epoch": 55.013623978201636, + "grad_norm": 3.4471304416656494, + "learning_rate": 8.864477694220707e-06, + "loss": 0.2071, + "step": 20190 + }, + { + "epoch": 55.01634877384196, + "grad_norm": 3.784421920776367, + "learning_rate": 8.863600911958332e-06, + "loss": 0.1949, + "step": 20191 + }, + { + "epoch": 55.01907356948229, + "grad_norm": 3.1663200855255127, + "learning_rate": 8.862724138546199e-06, + "loss": 0.2372, + "step": 20192 + }, + { + "epoch": 55.02179836512261, + "grad_norm": 7.027255058288574, + "learning_rate": 8.861847373991137e-06, + "loss": 0.1854, + "step": 20193 + }, + { + "epoch": 55.02452316076294, + "grad_norm": 4.086968898773193, + "learning_rate": 8.860970618299969e-06, + "loss": 0.0725, + "step": 20194 + }, + { + "epoch": 55.02724795640327, + "grad_norm": 3.4274401664733887, + "learning_rate": 8.860093871479527e-06, + "loss": 0.1138, + "step": 20195 + }, + { + "epoch": 55.0299727520436, + "grad_norm": 4.892838954925537, + "learning_rate": 8.859217133536634e-06, + "loss": 0.086, + "step": 20196 + }, + { + "epoch": 55.032697547683924, + "grad_norm": 3.099942207336426, + "learning_rate": 8.858340404478125e-06, + "loss": 0.1526, + "step": 20197 + }, + { + "epoch": 55.03542234332425, + "grad_norm": 3.834798574447632, + "learning_rate": 8.857463684310822e-06, + "loss": 0.1158, + "step": 20198 + }, + { + "epoch": 55.038147138964575, + "grad_norm": 3.4103872776031494, + "learning_rate": 8.856586973041554e-06, + "loss": 0.1156, + "step": 20199 + }, + { + "epoch": 55.0408719346049, + "grad_norm": 3.874640703201294, + "learning_rate": 8.855710270677152e-06, + "loss": 0.0671, + "step": 20200 + }, + { + "epoch": 55.043596730245234, + "grad_norm": 3.6838603019714355, + "learning_rate": 8.854833577224441e-06, + "loss": 0.0981, + "step": 20201 + }, + { + "epoch": 55.04632152588556, + "grad_norm": 3.1662166118621826, + "learning_rate": 8.853956892690247e-06, + "loss": 0.0902, + "step": 20202 + }, + { + "epoch": 55.049046321525886, + "grad_norm": 4.34156608581543, + "learning_rate": 8.8530802170814e-06, + "loss": 0.0939, + "step": 20203 + }, + { + "epoch": 55.05177111716621, + "grad_norm": 3.8500425815582275, + "learning_rate": 8.852203550404733e-06, + "loss": 0.0719, + "step": 20204 + }, + { + "epoch": 55.05449591280654, + "grad_norm": 3.3220314979553223, + "learning_rate": 8.851326892667061e-06, + "loss": 0.1083, + "step": 20205 + }, + { + "epoch": 55.05722070844686, + "grad_norm": 4.671602725982666, + "learning_rate": 8.850450243875223e-06, + "loss": 0.186, + "step": 20206 + }, + { + "epoch": 55.059945504087196, + "grad_norm": 4.377599716186523, + "learning_rate": 8.849573604036037e-06, + "loss": 0.1742, + "step": 20207 + }, + { + "epoch": 55.06267029972752, + "grad_norm": 3.458615779876709, + "learning_rate": 8.84869697315634e-06, + "loss": 0.0964, + "step": 20208 + }, + { + "epoch": 55.06539509536785, + "grad_norm": 3.8470566272735596, + "learning_rate": 8.847820351242949e-06, + "loss": 0.0632, + "step": 20209 + }, + { + "epoch": 55.06811989100817, + "grad_norm": 4.82185173034668, + "learning_rate": 8.846943738302697e-06, + "loss": 0.0863, + "step": 20210 + }, + { + "epoch": 55.0708446866485, + "grad_norm": 3.5537400245666504, + "learning_rate": 8.846067134342412e-06, + "loss": 0.0965, + "step": 20211 + }, + { + "epoch": 55.073569482288825, + "grad_norm": 7.0138726234436035, + "learning_rate": 8.845190539368918e-06, + "loss": 0.1019, + "step": 20212 + }, + { + "epoch": 55.07629427792916, + "grad_norm": 3.815699338912964, + "learning_rate": 8.844313953389043e-06, + "loss": 0.0778, + "step": 20213 + }, + { + "epoch": 55.079019073569484, + "grad_norm": 4.912858963012695, + "learning_rate": 8.843437376409614e-06, + "loss": 0.1153, + "step": 20214 + }, + { + "epoch": 55.08174386920981, + "grad_norm": 3.5321946144104004, + "learning_rate": 8.842560808437459e-06, + "loss": 0.0825, + "step": 20215 + }, + { + "epoch": 55.084468664850135, + "grad_norm": 4.460391044616699, + "learning_rate": 8.841684249479399e-06, + "loss": 0.1036, + "step": 20216 + }, + { + "epoch": 55.08719346049046, + "grad_norm": 3.628164529800415, + "learning_rate": 8.840807699542269e-06, + "loss": 0.0758, + "step": 20217 + }, + { + "epoch": 55.08991825613079, + "grad_norm": 4.200746536254883, + "learning_rate": 8.839931158632889e-06, + "loss": 0.1253, + "step": 20218 + }, + { + "epoch": 55.09264305177112, + "grad_norm": 4.804069995880127, + "learning_rate": 8.83905462675809e-06, + "loss": 0.3142, + "step": 20219 + }, + { + "epoch": 55.095367847411445, + "grad_norm": 2.774752616882324, + "learning_rate": 8.838178103924694e-06, + "loss": 0.0545, + "step": 20220 + }, + { + "epoch": 55.09809264305177, + "grad_norm": 4.986216068267822, + "learning_rate": 8.83730159013953e-06, + "loss": 0.2886, + "step": 20221 + }, + { + "epoch": 55.1008174386921, + "grad_norm": 3.9713242053985596, + "learning_rate": 8.836425085409424e-06, + "loss": 0.0606, + "step": 20222 + }, + { + "epoch": 55.10354223433242, + "grad_norm": 3.014117479324341, + "learning_rate": 8.835548589741204e-06, + "loss": 0.0635, + "step": 20223 + }, + { + "epoch": 55.10626702997275, + "grad_norm": 3.384340763092041, + "learning_rate": 8.834672103141691e-06, + "loss": 0.2183, + "step": 20224 + }, + { + "epoch": 55.10899182561308, + "grad_norm": 4.542238235473633, + "learning_rate": 8.833795625617715e-06, + "loss": 0.1492, + "step": 20225 + }, + { + "epoch": 55.11171662125341, + "grad_norm": 5.573112487792969, + "learning_rate": 8.832919157176098e-06, + "loss": 0.2511, + "step": 20226 + }, + { + "epoch": 55.11444141689373, + "grad_norm": 4.03924560546875, + "learning_rate": 8.832042697823673e-06, + "loss": 0.1052, + "step": 20227 + }, + { + "epoch": 55.11716621253406, + "grad_norm": 3.9031364917755127, + "learning_rate": 8.83116624756726e-06, + "loss": 0.092, + "step": 20228 + }, + { + "epoch": 55.119891008174385, + "grad_norm": 4.472345352172852, + "learning_rate": 8.83028980641369e-06, + "loss": 0.1997, + "step": 20229 + }, + { + "epoch": 55.12261580381471, + "grad_norm": 3.6592280864715576, + "learning_rate": 8.829413374369782e-06, + "loss": 0.0813, + "step": 20230 + }, + { + "epoch": 55.12534059945504, + "grad_norm": 3.745520830154419, + "learning_rate": 8.828536951442367e-06, + "loss": 0.0754, + "step": 20231 + }, + { + "epoch": 55.12806539509537, + "grad_norm": 3.5315065383911133, + "learning_rate": 8.827660537638267e-06, + "loss": 0.1161, + "step": 20232 + }, + { + "epoch": 55.130790190735695, + "grad_norm": 4.480501174926758, + "learning_rate": 8.826784132964313e-06, + "loss": 0.0642, + "step": 20233 + }, + { + "epoch": 55.13351498637602, + "grad_norm": 4.230098724365234, + "learning_rate": 8.825907737427321e-06, + "loss": 0.1604, + "step": 20234 + }, + { + "epoch": 55.13623978201635, + "grad_norm": 5.051258087158203, + "learning_rate": 8.825031351034125e-06, + "loss": 0.1923, + "step": 20235 + }, + { + "epoch": 55.13896457765667, + "grad_norm": 4.391542911529541, + "learning_rate": 8.824154973791545e-06, + "loss": 0.0783, + "step": 20236 + }, + { + "epoch": 55.141689373297005, + "grad_norm": 4.71673583984375, + "learning_rate": 8.823278605706412e-06, + "loss": 0.1286, + "step": 20237 + }, + { + "epoch": 55.14441416893733, + "grad_norm": 5.092132091522217, + "learning_rate": 8.822402246785542e-06, + "loss": 0.1752, + "step": 20238 + }, + { + "epoch": 55.14713896457766, + "grad_norm": 3.5076375007629395, + "learning_rate": 8.82152589703577e-06, + "loss": 0.0689, + "step": 20239 + }, + { + "epoch": 55.14986376021798, + "grad_norm": 5.270573616027832, + "learning_rate": 8.820649556463913e-06, + "loss": 0.0711, + "step": 20240 + }, + { + "epoch": 55.15258855585831, + "grad_norm": 4.217471599578857, + "learning_rate": 8.819773225076803e-06, + "loss": 0.0764, + "step": 20241 + }, + { + "epoch": 55.155313351498634, + "grad_norm": 2.447371244430542, + "learning_rate": 8.818896902881257e-06, + "loss": 0.0484, + "step": 20242 + }, + { + "epoch": 55.15803814713897, + "grad_norm": 4.374931335449219, + "learning_rate": 8.818020589884103e-06, + "loss": 0.2461, + "step": 20243 + }, + { + "epoch": 55.16076294277929, + "grad_norm": 2.9120328426361084, + "learning_rate": 8.817144286092167e-06, + "loss": 0.1152, + "step": 20244 + }, + { + "epoch": 55.16348773841962, + "grad_norm": 4.129950046539307, + "learning_rate": 8.816267991512277e-06, + "loss": 0.1396, + "step": 20245 + }, + { + "epoch": 55.166212534059945, + "grad_norm": 27.105342864990234, + "learning_rate": 8.815391706151252e-06, + "loss": 0.1394, + "step": 20246 + }, + { + "epoch": 55.16893732970027, + "grad_norm": 8.449474334716797, + "learning_rate": 8.81451543001592e-06, + "loss": 0.1023, + "step": 20247 + }, + { + "epoch": 55.171662125340596, + "grad_norm": 3.819932222366333, + "learning_rate": 8.8136391631131e-06, + "loss": 0.1099, + "step": 20248 + }, + { + "epoch": 55.17438692098093, + "grad_norm": 3.9747045040130615, + "learning_rate": 8.812762905449624e-06, + "loss": 0.1669, + "step": 20249 + }, + { + "epoch": 55.177111716621255, + "grad_norm": 3.383382797241211, + "learning_rate": 8.81188665703231e-06, + "loss": 0.1389, + "step": 20250 + }, + { + "epoch": 55.17983651226158, + "grad_norm": 4.292916774749756, + "learning_rate": 8.811010417867987e-06, + "loss": 0.0666, + "step": 20251 + }, + { + "epoch": 55.182561307901906, + "grad_norm": 4.522629737854004, + "learning_rate": 8.810134187963472e-06, + "loss": 0.1429, + "step": 20252 + }, + { + "epoch": 55.18528610354223, + "grad_norm": 5.1233015060424805, + "learning_rate": 8.809257967325598e-06, + "loss": 0.1429, + "step": 20253 + }, + { + "epoch": 55.18801089918256, + "grad_norm": 7.660608291625977, + "learning_rate": 8.808381755961183e-06, + "loss": 0.107, + "step": 20254 + }, + { + "epoch": 55.19073569482289, + "grad_norm": 5.419578552246094, + "learning_rate": 8.807505553877054e-06, + "loss": 0.2346, + "step": 20255 + }, + { + "epoch": 55.19346049046322, + "grad_norm": 4.0470757484436035, + "learning_rate": 8.80662936108003e-06, + "loss": 0.1617, + "step": 20256 + }, + { + "epoch": 55.19618528610354, + "grad_norm": 4.291471481323242, + "learning_rate": 8.805753177576942e-06, + "loss": 0.055, + "step": 20257 + }, + { + "epoch": 55.19891008174387, + "grad_norm": 3.448298454284668, + "learning_rate": 8.804877003374606e-06, + "loss": 0.0694, + "step": 20258 + }, + { + "epoch": 55.201634877384194, + "grad_norm": 3.65120005607605, + "learning_rate": 8.804000838479853e-06, + "loss": 0.1836, + "step": 20259 + }, + { + "epoch": 55.20435967302452, + "grad_norm": 3.6651101112365723, + "learning_rate": 8.803124682899498e-06, + "loss": 0.1116, + "step": 20260 + }, + { + "epoch": 55.20708446866485, + "grad_norm": 4.730973243713379, + "learning_rate": 8.802248536640371e-06, + "loss": 0.154, + "step": 20261 + }, + { + "epoch": 55.20980926430518, + "grad_norm": 3.9444150924682617, + "learning_rate": 8.801372399709297e-06, + "loss": 0.205, + "step": 20262 + }, + { + "epoch": 55.212534059945504, + "grad_norm": 4.400238037109375, + "learning_rate": 8.800496272113094e-06, + "loss": 0.1721, + "step": 20263 + }, + { + "epoch": 55.21525885558583, + "grad_norm": 4.010095596313477, + "learning_rate": 8.79962015385859e-06, + "loss": 0.1627, + "step": 20264 + }, + { + "epoch": 55.217983651226156, + "grad_norm": 5.48933219909668, + "learning_rate": 8.798744044952602e-06, + "loss": 0.1086, + "step": 20265 + }, + { + "epoch": 55.22070844686648, + "grad_norm": 5.2862548828125, + "learning_rate": 8.797867945401957e-06, + "loss": 0.1496, + "step": 20266 + }, + { + "epoch": 55.223433242506815, + "grad_norm": 4.545261383056641, + "learning_rate": 8.79699185521348e-06, + "loss": 0.084, + "step": 20267 + }, + { + "epoch": 55.22615803814714, + "grad_norm": 6.042707443237305, + "learning_rate": 8.79611577439399e-06, + "loss": 0.1042, + "step": 20268 + }, + { + "epoch": 55.228882833787466, + "grad_norm": 7.061752796173096, + "learning_rate": 8.795239702950314e-06, + "loss": 0.1304, + "step": 20269 + }, + { + "epoch": 55.23160762942779, + "grad_norm": 3.2901804447174072, + "learning_rate": 8.794363640889269e-06, + "loss": 0.2088, + "step": 20270 + }, + { + "epoch": 55.23433242506812, + "grad_norm": 8.586701393127441, + "learning_rate": 8.793487588217686e-06, + "loss": 0.127, + "step": 20271 + }, + { + "epoch": 55.237057220708444, + "grad_norm": 3.2752881050109863, + "learning_rate": 8.792611544942378e-06, + "loss": 0.2658, + "step": 20272 + }, + { + "epoch": 55.23978201634878, + "grad_norm": 3.862663984298706, + "learning_rate": 8.791735511070175e-06, + "loss": 0.0598, + "step": 20273 + }, + { + "epoch": 55.2425068119891, + "grad_norm": 4.582693576812744, + "learning_rate": 8.790859486607896e-06, + "loss": 0.1095, + "step": 20274 + }, + { + "epoch": 55.24523160762943, + "grad_norm": 4.33612060546875, + "learning_rate": 8.789983471562365e-06, + "loss": 0.1885, + "step": 20275 + }, + { + "epoch": 55.247956403269754, + "grad_norm": 4.18079137802124, + "learning_rate": 8.789107465940403e-06, + "loss": 0.0801, + "step": 20276 + }, + { + "epoch": 55.25068119891008, + "grad_norm": 3.529261589050293, + "learning_rate": 8.788231469748831e-06, + "loss": 0.3526, + "step": 20277 + }, + { + "epoch": 55.253405994550405, + "grad_norm": 4.6453657150268555, + "learning_rate": 8.787355482994477e-06, + "loss": 0.0942, + "step": 20278 + }, + { + "epoch": 55.25613079019074, + "grad_norm": 4.475424289703369, + "learning_rate": 8.786479505684157e-06, + "loss": 0.1576, + "step": 20279 + }, + { + "epoch": 55.258855585831064, + "grad_norm": 5.170428276062012, + "learning_rate": 8.785603537824699e-06, + "loss": 0.1326, + "step": 20280 + }, + { + "epoch": 55.26158038147139, + "grad_norm": 5.155692100524902, + "learning_rate": 8.784727579422918e-06, + "loss": 0.0831, + "step": 20281 + }, + { + "epoch": 55.264305177111716, + "grad_norm": 4.734813213348389, + "learning_rate": 8.783851630485642e-06, + "loss": 0.0534, + "step": 20282 + }, + { + "epoch": 55.26702997275204, + "grad_norm": 3.995192289352417, + "learning_rate": 8.782975691019689e-06, + "loss": 0.1358, + "step": 20283 + }, + { + "epoch": 55.26975476839237, + "grad_norm": 6.3889288902282715, + "learning_rate": 8.782099761031882e-06, + "loss": 0.1075, + "step": 20284 + }, + { + "epoch": 55.2724795640327, + "grad_norm": 4.618751525878906, + "learning_rate": 8.781223840529043e-06, + "loss": 0.2006, + "step": 20285 + }, + { + "epoch": 55.275204359673026, + "grad_norm": 4.445119380950928, + "learning_rate": 8.780347929517995e-06, + "loss": 0.132, + "step": 20286 + }, + { + "epoch": 55.27792915531335, + "grad_norm": 4.009746551513672, + "learning_rate": 8.779472028005555e-06, + "loss": 0.0733, + "step": 20287 + }, + { + "epoch": 55.28065395095368, + "grad_norm": 5.356363296508789, + "learning_rate": 8.778596135998551e-06, + "loss": 0.084, + "step": 20288 + }, + { + "epoch": 55.283378746594, + "grad_norm": 3.0403525829315186, + "learning_rate": 8.777720253503799e-06, + "loss": 0.1113, + "step": 20289 + }, + { + "epoch": 55.28610354223433, + "grad_norm": 4.624750137329102, + "learning_rate": 8.776844380528123e-06, + "loss": 0.157, + "step": 20290 + }, + { + "epoch": 55.28882833787466, + "grad_norm": 4.86638879776001, + "learning_rate": 8.775968517078343e-06, + "loss": 0.3833, + "step": 20291 + }, + { + "epoch": 55.29155313351499, + "grad_norm": 3.088222026824951, + "learning_rate": 8.77509266316128e-06, + "loss": 0.0966, + "step": 20292 + }, + { + "epoch": 55.294277929155314, + "grad_norm": 4.835270404815674, + "learning_rate": 8.774216818783758e-06, + "loss": 0.113, + "step": 20293 + }, + { + "epoch": 55.29700272479564, + "grad_norm": 6.672879695892334, + "learning_rate": 8.773340983952595e-06, + "loss": 0.0722, + "step": 20294 + }, + { + "epoch": 55.299727520435965, + "grad_norm": 7.032373428344727, + "learning_rate": 8.77246515867461e-06, + "loss": 0.1777, + "step": 20295 + }, + { + "epoch": 55.30245231607629, + "grad_norm": 5.144742965698242, + "learning_rate": 8.77158934295663e-06, + "loss": 0.1588, + "step": 20296 + }, + { + "epoch": 55.305177111716624, + "grad_norm": 5.2068915367126465, + "learning_rate": 8.770713536805471e-06, + "loss": 0.1146, + "step": 20297 + }, + { + "epoch": 55.30790190735695, + "grad_norm": 2.8044724464416504, + "learning_rate": 8.769837740227959e-06, + "loss": 0.0561, + "step": 20298 + }, + { + "epoch": 55.310626702997276, + "grad_norm": 5.347578525543213, + "learning_rate": 8.768961953230908e-06, + "loss": 0.0992, + "step": 20299 + }, + { + "epoch": 55.3133514986376, + "grad_norm": 4.6252970695495605, + "learning_rate": 8.768086175821145e-06, + "loss": 0.0579, + "step": 20300 + }, + { + "epoch": 55.31607629427793, + "grad_norm": 3.5642454624176025, + "learning_rate": 8.767210408005483e-06, + "loss": 0.1003, + "step": 20301 + }, + { + "epoch": 55.31880108991825, + "grad_norm": 3.8838951587677, + "learning_rate": 8.76633464979075e-06, + "loss": 0.1208, + "step": 20302 + }, + { + "epoch": 55.321525885558586, + "grad_norm": 6.521909713745117, + "learning_rate": 8.76545890118376e-06, + "loss": 0.1335, + "step": 20303 + }, + { + "epoch": 55.32425068119891, + "grad_norm": 3.353015899658203, + "learning_rate": 8.764583162191338e-06, + "loss": 0.1621, + "step": 20304 + }, + { + "epoch": 55.32697547683924, + "grad_norm": 3.9906301498413086, + "learning_rate": 8.763707432820303e-06, + "loss": 0.0857, + "step": 20305 + }, + { + "epoch": 55.32970027247956, + "grad_norm": 4.320180892944336, + "learning_rate": 8.762831713077475e-06, + "loss": 0.1162, + "step": 20306 + }, + { + "epoch": 55.33242506811989, + "grad_norm": 4.274276256561279, + "learning_rate": 8.761956002969672e-06, + "loss": 0.0848, + "step": 20307 + }, + { + "epoch": 55.335149863760215, + "grad_norm": 3.954271078109741, + "learning_rate": 8.761080302503718e-06, + "loss": 0.1116, + "step": 20308 + }, + { + "epoch": 55.33787465940055, + "grad_norm": 8.057647705078125, + "learning_rate": 8.760204611686429e-06, + "loss": 0.1377, + "step": 20309 + }, + { + "epoch": 55.34059945504087, + "grad_norm": 3.788517475128174, + "learning_rate": 8.759328930524628e-06, + "loss": 0.0685, + "step": 20310 + }, + { + "epoch": 55.3433242506812, + "grad_norm": 4.2331438064575195, + "learning_rate": 8.75845325902513e-06, + "loss": 0.0902, + "step": 20311 + }, + { + "epoch": 55.346049046321525, + "grad_norm": 5.339404582977295, + "learning_rate": 8.757577597194758e-06, + "loss": 0.1751, + "step": 20312 + }, + { + "epoch": 55.34877384196185, + "grad_norm": 5.503269672393799, + "learning_rate": 8.756701945040334e-06, + "loss": 0.1377, + "step": 20313 + }, + { + "epoch": 55.35149863760218, + "grad_norm": 4.48171329498291, + "learning_rate": 8.755826302568676e-06, + "loss": 0.1856, + "step": 20314 + }, + { + "epoch": 55.35422343324251, + "grad_norm": 3.3599138259887695, + "learning_rate": 8.754950669786602e-06, + "loss": 0.0976, + "step": 20315 + }, + { + "epoch": 55.356948228882835, + "grad_norm": 4.272397041320801, + "learning_rate": 8.754075046700934e-06, + "loss": 0.0889, + "step": 20316 + }, + { + "epoch": 55.35967302452316, + "grad_norm": 3.6690478324890137, + "learning_rate": 8.753199433318486e-06, + "loss": 0.0819, + "step": 20317 + }, + { + "epoch": 55.36239782016349, + "grad_norm": 5.556273460388184, + "learning_rate": 8.752323829646084e-06, + "loss": 0.1198, + "step": 20318 + }, + { + "epoch": 55.36512261580381, + "grad_norm": 6.00161075592041, + "learning_rate": 8.751448235690541e-06, + "loss": 0.2671, + "step": 20319 + }, + { + "epoch": 55.36784741144414, + "grad_norm": 4.806107044219971, + "learning_rate": 8.750572651458682e-06, + "loss": 0.1753, + "step": 20320 + }, + { + "epoch": 55.37057220708447, + "grad_norm": 4.758706569671631, + "learning_rate": 8.74969707695732e-06, + "loss": 0.0665, + "step": 20321 + }, + { + "epoch": 55.3732970027248, + "grad_norm": 4.076588153839111, + "learning_rate": 8.74882151219328e-06, + "loss": 0.0696, + "step": 20322 + }, + { + "epoch": 55.37602179836512, + "grad_norm": 4.132752418518066, + "learning_rate": 8.747945957173374e-06, + "loss": 0.1716, + "step": 20323 + }, + { + "epoch": 55.37874659400545, + "grad_norm": 4.330327987670898, + "learning_rate": 8.747070411904429e-06, + "loss": 0.088, + "step": 20324 + }, + { + "epoch": 55.381471389645775, + "grad_norm": 7.776508808135986, + "learning_rate": 8.746194876393255e-06, + "loss": 0.091, + "step": 20325 + }, + { + "epoch": 55.3841961852861, + "grad_norm": 3.777819871902466, + "learning_rate": 8.745319350646678e-06, + "loss": 0.1072, + "step": 20326 + }, + { + "epoch": 55.38692098092643, + "grad_norm": 4.417204856872559, + "learning_rate": 8.744443834671509e-06, + "loss": 0.1621, + "step": 20327 + }, + { + "epoch": 55.38964577656676, + "grad_norm": 4.460134983062744, + "learning_rate": 8.743568328474577e-06, + "loss": 0.0995, + "step": 20328 + }, + { + "epoch": 55.392370572207085, + "grad_norm": 2.475911855697632, + "learning_rate": 8.742692832062688e-06, + "loss": 0.0443, + "step": 20329 + }, + { + "epoch": 55.39509536784741, + "grad_norm": 4.059835433959961, + "learning_rate": 8.74181734544267e-06, + "loss": 0.0958, + "step": 20330 + }, + { + "epoch": 55.39782016348774, + "grad_norm": 6.29917049407959, + "learning_rate": 8.740941868621337e-06, + "loss": 0.1114, + "step": 20331 + }, + { + "epoch": 55.40054495912806, + "grad_norm": 4.21348237991333, + "learning_rate": 8.740066401605512e-06, + "loss": 0.1171, + "step": 20332 + }, + { + "epoch": 55.403269754768395, + "grad_norm": 4.922358512878418, + "learning_rate": 8.739190944402006e-06, + "loss": 0.2403, + "step": 20333 + }, + { + "epoch": 55.40599455040872, + "grad_norm": 4.729889869689941, + "learning_rate": 8.738315497017642e-06, + "loss": 0.128, + "step": 20334 + }, + { + "epoch": 55.40871934604905, + "grad_norm": 4.229569435119629, + "learning_rate": 8.737440059459234e-06, + "loss": 0.115, + "step": 20335 + }, + { + "epoch": 55.41144414168937, + "grad_norm": 4.083345890045166, + "learning_rate": 8.736564631733606e-06, + "loss": 0.1628, + "step": 20336 + }, + { + "epoch": 55.4141689373297, + "grad_norm": 4.032779216766357, + "learning_rate": 8.735689213847569e-06, + "loss": 0.1891, + "step": 20337 + }, + { + "epoch": 55.416893732970024, + "grad_norm": 3.4884467124938965, + "learning_rate": 8.734813805807944e-06, + "loss": 0.2137, + "step": 20338 + }, + { + "epoch": 55.41961852861036, + "grad_norm": 3.715762138366699, + "learning_rate": 8.73393840762155e-06, + "loss": 0.1797, + "step": 20339 + }, + { + "epoch": 55.42234332425068, + "grad_norm": 4.092436790466309, + "learning_rate": 8.733063019295202e-06, + "loss": 0.1081, + "step": 20340 + }, + { + "epoch": 55.42506811989101, + "grad_norm": 4.212950229644775, + "learning_rate": 8.732187640835718e-06, + "loss": 0.0681, + "step": 20341 + }, + { + "epoch": 55.427792915531334, + "grad_norm": 3.463665723800659, + "learning_rate": 8.731312272249916e-06, + "loss": 0.0773, + "step": 20342 + }, + { + "epoch": 55.43051771117166, + "grad_norm": 3.5409793853759766, + "learning_rate": 8.730436913544612e-06, + "loss": 0.1978, + "step": 20343 + }, + { + "epoch": 55.433242506811986, + "grad_norm": 4.001033782958984, + "learning_rate": 8.729561564726627e-06, + "loss": 0.1921, + "step": 20344 + }, + { + "epoch": 55.43596730245232, + "grad_norm": 4.495682239532471, + "learning_rate": 8.728686225802773e-06, + "loss": 0.1104, + "step": 20345 + }, + { + "epoch": 55.438692098092645, + "grad_norm": 5.5811967849731445, + "learning_rate": 8.727810896779869e-06, + "loss": 0.0699, + "step": 20346 + }, + { + "epoch": 55.44141689373297, + "grad_norm": 4.244899749755859, + "learning_rate": 8.726935577664737e-06, + "loss": 0.1407, + "step": 20347 + }, + { + "epoch": 55.444141689373296, + "grad_norm": 6.328291893005371, + "learning_rate": 8.726060268464186e-06, + "loss": 0.1195, + "step": 20348 + }, + { + "epoch": 55.44686648501362, + "grad_norm": 3.9155054092407227, + "learning_rate": 8.72518496918504e-06, + "loss": 0.1208, + "step": 20349 + }, + { + "epoch": 55.44959128065395, + "grad_norm": 4.084961414337158, + "learning_rate": 8.724309679834109e-06, + "loss": 0.0744, + "step": 20350 + }, + { + "epoch": 55.45231607629428, + "grad_norm": 6.089450836181641, + "learning_rate": 8.723434400418215e-06, + "loss": 0.1051, + "step": 20351 + }, + { + "epoch": 55.45504087193461, + "grad_norm": 3.64111328125, + "learning_rate": 8.722559130944173e-06, + "loss": 0.1728, + "step": 20352 + }, + { + "epoch": 55.45776566757493, + "grad_norm": 4.314663410186768, + "learning_rate": 8.721683871418797e-06, + "loss": 0.1598, + "step": 20353 + }, + { + "epoch": 55.46049046321526, + "grad_norm": 2.8920440673828125, + "learning_rate": 8.720808621848911e-06, + "loss": 0.1399, + "step": 20354 + }, + { + "epoch": 55.463215258855584, + "grad_norm": 4.880285739898682, + "learning_rate": 8.719933382241322e-06, + "loss": 0.094, + "step": 20355 + }, + { + "epoch": 55.46594005449591, + "grad_norm": 3.634341239929199, + "learning_rate": 8.719058152602853e-06, + "loss": 0.1027, + "step": 20356 + }, + { + "epoch": 55.46866485013624, + "grad_norm": 4.2444024085998535, + "learning_rate": 8.718182932940316e-06, + "loss": 0.1918, + "step": 20357 + }, + { + "epoch": 55.47138964577657, + "grad_norm": 6.068127155303955, + "learning_rate": 8.71730772326053e-06, + "loss": 0.2071, + "step": 20358 + }, + { + "epoch": 55.474114441416894, + "grad_norm": 2.986868143081665, + "learning_rate": 8.71643252357031e-06, + "loss": 0.2392, + "step": 20359 + }, + { + "epoch": 55.47683923705722, + "grad_norm": 4.797121524810791, + "learning_rate": 8.715557333876472e-06, + "loss": 0.135, + "step": 20360 + }, + { + "epoch": 55.479564032697546, + "grad_norm": 4.307587623596191, + "learning_rate": 8.714682154185831e-06, + "loss": 0.0817, + "step": 20361 + }, + { + "epoch": 55.48228882833787, + "grad_norm": 3.9596898555755615, + "learning_rate": 8.713806984505208e-06, + "loss": 0.1155, + "step": 20362 + }, + { + "epoch": 55.485013623978205, + "grad_norm": 4.114192008972168, + "learning_rate": 8.712931824841411e-06, + "loss": 0.0847, + "step": 20363 + }, + { + "epoch": 55.48773841961853, + "grad_norm": 3.0506885051727295, + "learning_rate": 8.712056675201257e-06, + "loss": 0.1047, + "step": 20364 + }, + { + "epoch": 55.490463215258856, + "grad_norm": 3.6099131107330322, + "learning_rate": 8.711181535591569e-06, + "loss": 0.0744, + "step": 20365 + }, + { + "epoch": 55.49318801089918, + "grad_norm": 4.8901591300964355, + "learning_rate": 8.710306406019155e-06, + "loss": 0.1609, + "step": 20366 + }, + { + "epoch": 55.49591280653951, + "grad_norm": 6.4215874671936035, + "learning_rate": 8.709431286490837e-06, + "loss": 0.1302, + "step": 20367 + }, + { + "epoch": 55.49863760217983, + "grad_norm": 4.286976337432861, + "learning_rate": 8.708556177013423e-06, + "loss": 0.1142, + "step": 20368 + }, + { + "epoch": 55.50136239782017, + "grad_norm": 4.187290191650391, + "learning_rate": 8.707681077593735e-06, + "loss": 0.3471, + "step": 20369 + }, + { + "epoch": 55.50408719346049, + "grad_norm": 4.669692516326904, + "learning_rate": 8.70680598823858e-06, + "loss": 0.1053, + "step": 20370 + }, + { + "epoch": 55.50681198910082, + "grad_norm": 5.98300838470459, + "learning_rate": 8.705930908954786e-06, + "loss": 0.2092, + "step": 20371 + }, + { + "epoch": 55.509536784741144, + "grad_norm": 5.066943168640137, + "learning_rate": 8.705055839749154e-06, + "loss": 0.0883, + "step": 20372 + }, + { + "epoch": 55.51226158038147, + "grad_norm": 4.160504341125488, + "learning_rate": 8.704180780628508e-06, + "loss": 0.1035, + "step": 20373 + }, + { + "epoch": 55.514986376021795, + "grad_norm": 4.330354690551758, + "learning_rate": 8.70330573159966e-06, + "loss": 0.107, + "step": 20374 + }, + { + "epoch": 55.51771117166213, + "grad_norm": 3.0367326736450195, + "learning_rate": 8.702430692669426e-06, + "loss": 0.0578, + "step": 20375 + }, + { + "epoch": 55.520435967302454, + "grad_norm": 4.381452560424805, + "learning_rate": 8.701555663844619e-06, + "loss": 0.3114, + "step": 20376 + }, + { + "epoch": 55.52316076294278, + "grad_norm": 5.92275857925415, + "learning_rate": 8.700680645132053e-06, + "loss": 0.3236, + "step": 20377 + }, + { + "epoch": 55.525885558583106, + "grad_norm": 3.6232314109802246, + "learning_rate": 8.699805636538548e-06, + "loss": 0.0894, + "step": 20378 + }, + { + "epoch": 55.52861035422343, + "grad_norm": 4.690647602081299, + "learning_rate": 8.698930638070913e-06, + "loss": 0.0753, + "step": 20379 + }, + { + "epoch": 55.53133514986376, + "grad_norm": 4.333375453948975, + "learning_rate": 8.698055649735964e-06, + "loss": 0.138, + "step": 20380 + }, + { + "epoch": 55.53405994550409, + "grad_norm": 4.587692737579346, + "learning_rate": 8.697180671540513e-06, + "loss": 0.0817, + "step": 20381 + }, + { + "epoch": 55.536784741144416, + "grad_norm": 4.031619071960449, + "learning_rate": 8.69630570349138e-06, + "loss": 0.1549, + "step": 20382 + }, + { + "epoch": 55.53950953678474, + "grad_norm": 4.475871562957764, + "learning_rate": 8.695430745595377e-06, + "loss": 0.2075, + "step": 20383 + }, + { + "epoch": 55.54223433242507, + "grad_norm": 3.520782470703125, + "learning_rate": 8.694555797859317e-06, + "loss": 0.0868, + "step": 20384 + }, + { + "epoch": 55.54495912806539, + "grad_norm": 5.136046409606934, + "learning_rate": 8.693680860290016e-06, + "loss": 0.1181, + "step": 20385 + }, + { + "epoch": 55.54768392370572, + "grad_norm": 4.102364540100098, + "learning_rate": 8.692805932894281e-06, + "loss": 0.2792, + "step": 20386 + }, + { + "epoch": 55.55040871934605, + "grad_norm": 4.081116199493408, + "learning_rate": 8.691931015678938e-06, + "loss": 0.132, + "step": 20387 + }, + { + "epoch": 55.55313351498638, + "grad_norm": 4.678136825561523, + "learning_rate": 8.69105610865079e-06, + "loss": 0.1073, + "step": 20388 + }, + { + "epoch": 55.555858310626704, + "grad_norm": 3.575960874557495, + "learning_rate": 8.690181211816657e-06, + "loss": 0.0895, + "step": 20389 + }, + { + "epoch": 55.55858310626703, + "grad_norm": 3.154576063156128, + "learning_rate": 8.689306325183348e-06, + "loss": 0.113, + "step": 20390 + }, + { + "epoch": 55.561307901907355, + "grad_norm": 3.1575584411621094, + "learning_rate": 8.688431448757682e-06, + "loss": 0.314, + "step": 20391 + }, + { + "epoch": 55.56403269754768, + "grad_norm": 3.662139892578125, + "learning_rate": 8.687556582546467e-06, + "loss": 0.1995, + "step": 20392 + }, + { + "epoch": 55.566757493188014, + "grad_norm": 4.017824172973633, + "learning_rate": 8.686681726556521e-06, + "loss": 0.2252, + "step": 20393 + }, + { + "epoch": 55.56948228882834, + "grad_norm": 5.218798637390137, + "learning_rate": 8.685806880794654e-06, + "loss": 0.1921, + "step": 20394 + }, + { + "epoch": 55.572207084468666, + "grad_norm": 4.111189365386963, + "learning_rate": 8.684932045267683e-06, + "loss": 0.1295, + "step": 20395 + }, + { + "epoch": 55.57493188010899, + "grad_norm": 3.641528367996216, + "learning_rate": 8.684057219982416e-06, + "loss": 0.0877, + "step": 20396 + }, + { + "epoch": 55.57765667574932, + "grad_norm": 5.454028129577637, + "learning_rate": 8.683182404945672e-06, + "loss": 0.1628, + "step": 20397 + }, + { + "epoch": 55.58038147138964, + "grad_norm": 3.9976165294647217, + "learning_rate": 8.682307600164255e-06, + "loss": 0.0892, + "step": 20398 + }, + { + "epoch": 55.583106267029976, + "grad_norm": 4.10651969909668, + "learning_rate": 8.68143280564499e-06, + "loss": 0.1394, + "step": 20399 + }, + { + "epoch": 55.5858310626703, + "grad_norm": 4.620141983032227, + "learning_rate": 8.68055802139468e-06, + "loss": 0.0581, + "step": 20400 + }, + { + "epoch": 55.58855585831063, + "grad_norm": 3.702589750289917, + "learning_rate": 8.679683247420146e-06, + "loss": 0.0711, + "step": 20401 + }, + { + "epoch": 55.59128065395095, + "grad_norm": 3.2625372409820557, + "learning_rate": 8.678808483728194e-06, + "loss": 0.0644, + "step": 20402 + }, + { + "epoch": 55.59400544959128, + "grad_norm": 4.552007675170898, + "learning_rate": 8.67793373032564e-06, + "loss": 0.2491, + "step": 20403 + }, + { + "epoch": 55.596730245231605, + "grad_norm": 3.1166679859161377, + "learning_rate": 8.677058987219294e-06, + "loss": 0.0956, + "step": 20404 + }, + { + "epoch": 55.59945504087194, + "grad_norm": 3.954953193664551, + "learning_rate": 8.676184254415973e-06, + "loss": 0.067, + "step": 20405 + }, + { + "epoch": 55.60217983651226, + "grad_norm": 3.1082582473754883, + "learning_rate": 8.675309531922484e-06, + "loss": 0.1931, + "step": 20406 + }, + { + "epoch": 55.60490463215259, + "grad_norm": 4.5571513175964355, + "learning_rate": 8.674434819745643e-06, + "loss": 0.1322, + "step": 20407 + }, + { + "epoch": 55.607629427792915, + "grad_norm": 5.0540571212768555, + "learning_rate": 8.67356011789226e-06, + "loss": 0.2517, + "step": 20408 + }, + { + "epoch": 55.61035422343324, + "grad_norm": 6.6033782958984375, + "learning_rate": 8.672685426369148e-06, + "loss": 0.0835, + "step": 20409 + }, + { + "epoch": 55.61307901907357, + "grad_norm": 3.401458501815796, + "learning_rate": 8.671810745183118e-06, + "loss": 0.0837, + "step": 20410 + }, + { + "epoch": 55.6158038147139, + "grad_norm": 4.99204158782959, + "learning_rate": 8.670936074340987e-06, + "loss": 0.1478, + "step": 20411 + }, + { + "epoch": 55.618528610354225, + "grad_norm": 6.409547328948975, + "learning_rate": 8.67006141384956e-06, + "loss": 0.179, + "step": 20412 + }, + { + "epoch": 55.62125340599455, + "grad_norm": 9.704611778259277, + "learning_rate": 8.669186763715654e-06, + "loss": 0.1256, + "step": 20413 + }, + { + "epoch": 55.62397820163488, + "grad_norm": 4.166541576385498, + "learning_rate": 8.668312123946076e-06, + "loss": 0.1664, + "step": 20414 + }, + { + "epoch": 55.6267029972752, + "grad_norm": 4.253971576690674, + "learning_rate": 8.667437494547637e-06, + "loss": 0.0987, + "step": 20415 + }, + { + "epoch": 55.62942779291553, + "grad_norm": 3.637429714202881, + "learning_rate": 8.666562875527158e-06, + "loss": 0.1224, + "step": 20416 + }, + { + "epoch": 55.63215258855586, + "grad_norm": 3.9984216690063477, + "learning_rate": 8.665688266891442e-06, + "loss": 0.1385, + "step": 20417 + }, + { + "epoch": 55.63487738419619, + "grad_norm": 7.363391876220703, + "learning_rate": 8.664813668647303e-06, + "loss": 0.089, + "step": 20418 + }, + { + "epoch": 55.63760217983651, + "grad_norm": 3.269890785217285, + "learning_rate": 8.663939080801555e-06, + "loss": 0.0553, + "step": 20419 + }, + { + "epoch": 55.64032697547684, + "grad_norm": 3.394165515899658, + "learning_rate": 8.663064503361003e-06, + "loss": 0.143, + "step": 20420 + }, + { + "epoch": 55.643051771117165, + "grad_norm": 4.915383338928223, + "learning_rate": 8.662189936332463e-06, + "loss": 0.1576, + "step": 20421 + }, + { + "epoch": 55.64577656675749, + "grad_norm": 4.551702499389648, + "learning_rate": 8.661315379722745e-06, + "loss": 0.1276, + "step": 20422 + }, + { + "epoch": 55.64850136239782, + "grad_norm": 6.632296085357666, + "learning_rate": 8.66044083353866e-06, + "loss": 0.1448, + "step": 20423 + }, + { + "epoch": 55.65122615803815, + "grad_norm": 3.6714444160461426, + "learning_rate": 8.659566297787016e-06, + "loss": 0.0493, + "step": 20424 + }, + { + "epoch": 55.653950953678475, + "grad_norm": 4.507234573364258, + "learning_rate": 8.658691772474632e-06, + "loss": 0.1582, + "step": 20425 + }, + { + "epoch": 55.6566757493188, + "grad_norm": 6.121192932128906, + "learning_rate": 8.657817257608308e-06, + "loss": 0.1015, + "step": 20426 + }, + { + "epoch": 55.65940054495913, + "grad_norm": 5.42222785949707, + "learning_rate": 8.656942753194863e-06, + "loss": 0.1766, + "step": 20427 + }, + { + "epoch": 55.66212534059945, + "grad_norm": 3.701658010482788, + "learning_rate": 8.656068259241102e-06, + "loss": 0.0617, + "step": 20428 + }, + { + "epoch": 55.664850136239785, + "grad_norm": 3.8383970260620117, + "learning_rate": 8.655193775753841e-06, + "loss": 0.1377, + "step": 20429 + }, + { + "epoch": 55.66757493188011, + "grad_norm": 4.109371662139893, + "learning_rate": 8.654319302739887e-06, + "loss": 0.1278, + "step": 20430 + }, + { + "epoch": 55.67029972752044, + "grad_norm": 3.5328078269958496, + "learning_rate": 8.65344484020605e-06, + "loss": 0.0901, + "step": 20431 + }, + { + "epoch": 55.67302452316076, + "grad_norm": 4.257531642913818, + "learning_rate": 8.652570388159139e-06, + "loss": 0.1675, + "step": 20432 + }, + { + "epoch": 55.67574931880109, + "grad_norm": 3.289428472518921, + "learning_rate": 8.651695946605967e-06, + "loss": 0.1157, + "step": 20433 + }, + { + "epoch": 55.678474114441414, + "grad_norm": 4.315040111541748, + "learning_rate": 8.650821515553347e-06, + "loss": 0.1814, + "step": 20434 + }, + { + "epoch": 55.68119891008175, + "grad_norm": 5.300807476043701, + "learning_rate": 8.649947095008083e-06, + "loss": 0.1745, + "step": 20435 + }, + { + "epoch": 55.68392370572207, + "grad_norm": 3.0710952281951904, + "learning_rate": 8.64907268497699e-06, + "loss": 0.1117, + "step": 20436 + }, + { + "epoch": 55.6866485013624, + "grad_norm": 3.7290239334106445, + "learning_rate": 8.648198285466874e-06, + "loss": 0.076, + "step": 20437 + }, + { + "epoch": 55.689373297002724, + "grad_norm": 4.601301193237305, + "learning_rate": 8.647323896484547e-06, + "loss": 0.2185, + "step": 20438 + }, + { + "epoch": 55.69209809264305, + "grad_norm": 4.6118550300598145, + "learning_rate": 8.646449518036817e-06, + "loss": 0.067, + "step": 20439 + }, + { + "epoch": 55.694822888283376, + "grad_norm": 4.642988204956055, + "learning_rate": 8.645575150130494e-06, + "loss": 0.1258, + "step": 20440 + }, + { + "epoch": 55.69754768392371, + "grad_norm": 4.468482494354248, + "learning_rate": 8.64470079277239e-06, + "loss": 0.2527, + "step": 20441 + }, + { + "epoch": 55.700272479564035, + "grad_norm": 4.860848903656006, + "learning_rate": 8.64382644596931e-06, + "loss": 0.0957, + "step": 20442 + }, + { + "epoch": 55.70299727520436, + "grad_norm": 4.185880184173584, + "learning_rate": 8.642952109728069e-06, + "loss": 0.0742, + "step": 20443 + }, + { + "epoch": 55.705722070844686, + "grad_norm": 4.801362037658691, + "learning_rate": 8.642077784055472e-06, + "loss": 0.1382, + "step": 20444 + }, + { + "epoch": 55.70844686648501, + "grad_norm": 4.546573162078857, + "learning_rate": 8.64120346895833e-06, + "loss": 0.2831, + "step": 20445 + }, + { + "epoch": 55.71117166212534, + "grad_norm": 4.603366851806641, + "learning_rate": 8.64032916444345e-06, + "loss": 0.1412, + "step": 20446 + }, + { + "epoch": 55.71389645776567, + "grad_norm": 4.130717754364014, + "learning_rate": 8.639454870517646e-06, + "loss": 0.1299, + "step": 20447 + }, + { + "epoch": 55.716621253406, + "grad_norm": 4.901968479156494, + "learning_rate": 8.63858058718772e-06, + "loss": 0.1439, + "step": 20448 + }, + { + "epoch": 55.71934604904632, + "grad_norm": 3.360917806625366, + "learning_rate": 8.637706314460487e-06, + "loss": 0.163, + "step": 20449 + }, + { + "epoch": 55.72207084468665, + "grad_norm": 4.054257392883301, + "learning_rate": 8.63683205234275e-06, + "loss": 0.1393, + "step": 20450 + }, + { + "epoch": 55.724795640326974, + "grad_norm": 3.5764174461364746, + "learning_rate": 8.63595780084132e-06, + "loss": 0.318, + "step": 20451 + }, + { + "epoch": 55.7275204359673, + "grad_norm": 3.5609607696533203, + "learning_rate": 8.635083559963014e-06, + "loss": 0.0677, + "step": 20452 + }, + { + "epoch": 55.73024523160763, + "grad_norm": 3.7269129753112793, + "learning_rate": 8.634209329714628e-06, + "loss": 0.0785, + "step": 20453 + }, + { + "epoch": 55.73297002724796, + "grad_norm": 4.766541004180908, + "learning_rate": 8.633335110102979e-06, + "loss": 0.1893, + "step": 20454 + }, + { + "epoch": 55.735694822888284, + "grad_norm": 4.41552209854126, + "learning_rate": 8.632460901134869e-06, + "loss": 0.1576, + "step": 20455 + }, + { + "epoch": 55.73841961852861, + "grad_norm": 5.0423479080200195, + "learning_rate": 8.631586702817111e-06, + "loss": 0.0763, + "step": 20456 + }, + { + "epoch": 55.741144414168936, + "grad_norm": 4.5149736404418945, + "learning_rate": 8.630712515156512e-06, + "loss": 0.1774, + "step": 20457 + }, + { + "epoch": 55.74386920980926, + "grad_norm": 3.756617784500122, + "learning_rate": 8.62983833815988e-06, + "loss": 0.2158, + "step": 20458 + }, + { + "epoch": 55.746594005449595, + "grad_norm": 3.6888821125030518, + "learning_rate": 8.628964171834023e-06, + "loss": 0.1418, + "step": 20459 + }, + { + "epoch": 55.74931880108992, + "grad_norm": 5.236166000366211, + "learning_rate": 8.628090016185748e-06, + "loss": 0.1648, + "step": 20460 + }, + { + "epoch": 55.752043596730246, + "grad_norm": 3.830169439315796, + "learning_rate": 8.627215871221864e-06, + "loss": 0.1081, + "step": 20461 + }, + { + "epoch": 55.75476839237057, + "grad_norm": 4.974534034729004, + "learning_rate": 8.62634173694918e-06, + "loss": 0.1028, + "step": 20462 + }, + { + "epoch": 55.7574931880109, + "grad_norm": 7.999661922454834, + "learning_rate": 8.625467613374501e-06, + "loss": 0.1679, + "step": 20463 + }, + { + "epoch": 55.76021798365122, + "grad_norm": 3.9220337867736816, + "learning_rate": 8.624593500504634e-06, + "loss": 0.1749, + "step": 20464 + }, + { + "epoch": 55.762942779291556, + "grad_norm": 4.370566368103027, + "learning_rate": 8.623719398346394e-06, + "loss": 0.2471, + "step": 20465 + }, + { + "epoch": 55.76566757493188, + "grad_norm": 4.0340728759765625, + "learning_rate": 8.622845306906577e-06, + "loss": 0.0947, + "step": 20466 + }, + { + "epoch": 55.76839237057221, + "grad_norm": 3.9111313819885254, + "learning_rate": 8.621971226191995e-06, + "loss": 0.167, + "step": 20467 + }, + { + "epoch": 55.771117166212534, + "grad_norm": 2.8047828674316406, + "learning_rate": 8.621097156209463e-06, + "loss": 0.0542, + "step": 20468 + }, + { + "epoch": 55.77384196185286, + "grad_norm": 3.8338875770568848, + "learning_rate": 8.62022309696578e-06, + "loss": 0.1348, + "step": 20469 + }, + { + "epoch": 55.776566757493185, + "grad_norm": 3.6789472103118896, + "learning_rate": 8.619349048467755e-06, + "loss": 0.1679, + "step": 20470 + }, + { + "epoch": 55.77929155313352, + "grad_norm": 3.9221291542053223, + "learning_rate": 8.618475010722194e-06, + "loss": 0.09, + "step": 20471 + }, + { + "epoch": 55.782016348773844, + "grad_norm": 4.1862592697143555, + "learning_rate": 8.617600983735908e-06, + "loss": 0.0659, + "step": 20472 + }, + { + "epoch": 55.78474114441417, + "grad_norm": 4.799045085906982, + "learning_rate": 8.6167269675157e-06, + "loss": 0.068, + "step": 20473 + }, + { + "epoch": 55.787465940054496, + "grad_norm": 3.4132657051086426, + "learning_rate": 8.615852962068377e-06, + "loss": 0.0683, + "step": 20474 + }, + { + "epoch": 55.79019073569482, + "grad_norm": 3.262223482131958, + "learning_rate": 8.614978967400747e-06, + "loss": 0.1489, + "step": 20475 + }, + { + "epoch": 55.79291553133515, + "grad_norm": 3.795609712600708, + "learning_rate": 8.614104983519617e-06, + "loss": 0.227, + "step": 20476 + }, + { + "epoch": 55.79564032697548, + "grad_norm": 3.7105584144592285, + "learning_rate": 8.61323101043179e-06, + "loss": 0.0702, + "step": 20477 + }, + { + "epoch": 55.798365122615806, + "grad_norm": 3.7257235050201416, + "learning_rate": 8.612357048144079e-06, + "loss": 0.1147, + "step": 20478 + }, + { + "epoch": 55.80108991825613, + "grad_norm": 3.381202220916748, + "learning_rate": 8.611483096663284e-06, + "loss": 0.1281, + "step": 20479 + }, + { + "epoch": 55.80381471389646, + "grad_norm": 3.040492534637451, + "learning_rate": 8.610609155996216e-06, + "loss": 0.0807, + "step": 20480 + }, + { + "epoch": 55.80653950953678, + "grad_norm": 4.473389148712158, + "learning_rate": 8.609735226149676e-06, + "loss": 0.1294, + "step": 20481 + }, + { + "epoch": 55.80926430517711, + "grad_norm": 5.4073896408081055, + "learning_rate": 8.608861307130477e-06, + "loss": 0.1582, + "step": 20482 + }, + { + "epoch": 55.81198910081744, + "grad_norm": 3.274014949798584, + "learning_rate": 8.607987398945419e-06, + "loss": 0.1768, + "step": 20483 + }, + { + "epoch": 55.81471389645777, + "grad_norm": 2.8430848121643066, + "learning_rate": 8.607113501601307e-06, + "loss": 0.1409, + "step": 20484 + }, + { + "epoch": 55.817438692098094, + "grad_norm": 4.293489456176758, + "learning_rate": 8.606239615104953e-06, + "loss": 0.0842, + "step": 20485 + }, + { + "epoch": 55.82016348773842, + "grad_norm": 4.750711917877197, + "learning_rate": 8.605365739463163e-06, + "loss": 0.1093, + "step": 20486 + }, + { + "epoch": 55.822888283378745, + "grad_norm": 4.375786304473877, + "learning_rate": 8.604491874682736e-06, + "loss": 0.1656, + "step": 20487 + }, + { + "epoch": 55.82561307901907, + "grad_norm": 4.1107611656188965, + "learning_rate": 8.603618020770486e-06, + "loss": 0.2394, + "step": 20488 + }, + { + "epoch": 55.828337874659404, + "grad_norm": 3.8165786266326904, + "learning_rate": 8.602744177733208e-06, + "loss": 0.0979, + "step": 20489 + }, + { + "epoch": 55.83106267029973, + "grad_norm": 5.442535400390625, + "learning_rate": 8.601870345577719e-06, + "loss": 0.0686, + "step": 20490 + }, + { + "epoch": 55.833787465940055, + "grad_norm": 3.9983370304107666, + "learning_rate": 8.600996524310814e-06, + "loss": 0.1364, + "step": 20491 + }, + { + "epoch": 55.83651226158038, + "grad_norm": 5.155202865600586, + "learning_rate": 8.600122713939307e-06, + "loss": 0.0956, + "step": 20492 + }, + { + "epoch": 55.83923705722071, + "grad_norm": 5.143024444580078, + "learning_rate": 8.599248914469997e-06, + "loss": 0.0867, + "step": 20493 + }, + { + "epoch": 55.84196185286103, + "grad_norm": 5.1866559982299805, + "learning_rate": 8.598375125909693e-06, + "loss": 0.1143, + "step": 20494 + }, + { + "epoch": 55.844686648501366, + "grad_norm": 3.8809587955474854, + "learning_rate": 8.597501348265197e-06, + "loss": 0.1009, + "step": 20495 + }, + { + "epoch": 55.84741144414169, + "grad_norm": 4.155538082122803, + "learning_rate": 8.596627581543317e-06, + "loss": 0.1741, + "step": 20496 + }, + { + "epoch": 55.85013623978202, + "grad_norm": 3.671724796295166, + "learning_rate": 8.595753825750853e-06, + "loss": 0.1216, + "step": 20497 + }, + { + "epoch": 55.85286103542234, + "grad_norm": 4.219904899597168, + "learning_rate": 8.594880080894616e-06, + "loss": 0.1168, + "step": 20498 + }, + { + "epoch": 55.85558583106267, + "grad_norm": 5.11779260635376, + "learning_rate": 8.594006346981406e-06, + "loss": 0.1481, + "step": 20499 + }, + { + "epoch": 55.858310626702995, + "grad_norm": 4.027957439422607, + "learning_rate": 8.59313262401803e-06, + "loss": 0.1699, + "step": 20500 + }, + { + "epoch": 55.86103542234333, + "grad_norm": 3.728930950164795, + "learning_rate": 8.59225891201129e-06, + "loss": 0.0855, + "step": 20501 + }, + { + "epoch": 55.86376021798365, + "grad_norm": 4.834834098815918, + "learning_rate": 8.591385210967993e-06, + "loss": 0.2245, + "step": 20502 + }, + { + "epoch": 55.86648501362398, + "grad_norm": 4.288930416107178, + "learning_rate": 8.590511520894946e-06, + "loss": 0.1592, + "step": 20503 + }, + { + "epoch": 55.869209809264305, + "grad_norm": 4.237362861633301, + "learning_rate": 8.589637841798945e-06, + "loss": 0.1316, + "step": 20504 + }, + { + "epoch": 55.87193460490463, + "grad_norm": 3.412639617919922, + "learning_rate": 8.5887641736868e-06, + "loss": 0.0765, + "step": 20505 + }, + { + "epoch": 55.87465940054496, + "grad_norm": 5.373528480529785, + "learning_rate": 8.587890516565319e-06, + "loss": 0.1209, + "step": 20506 + }, + { + "epoch": 55.87738419618529, + "grad_norm": 4.227440357208252, + "learning_rate": 8.587016870441297e-06, + "loss": 0.0988, + "step": 20507 + }, + { + "epoch": 55.880108991825615, + "grad_norm": 4.1393280029296875, + "learning_rate": 8.586143235321545e-06, + "loss": 0.0866, + "step": 20508 + }, + { + "epoch": 55.88283378746594, + "grad_norm": 3.8176050186157227, + "learning_rate": 8.585269611212862e-06, + "loss": 0.11, + "step": 20509 + }, + { + "epoch": 55.88555858310627, + "grad_norm": 4.862467288970947, + "learning_rate": 8.584395998122054e-06, + "loss": 0.1565, + "step": 20510 + }, + { + "epoch": 55.88828337874659, + "grad_norm": 3.5602667331695557, + "learning_rate": 8.583522396055923e-06, + "loss": 0.146, + "step": 20511 + }, + { + "epoch": 55.89100817438692, + "grad_norm": 4.005143165588379, + "learning_rate": 8.582648805021276e-06, + "loss": 0.1389, + "step": 20512 + }, + { + "epoch": 55.89373297002725, + "grad_norm": 3.108684778213501, + "learning_rate": 8.581775225024914e-06, + "loss": 0.1552, + "step": 20513 + }, + { + "epoch": 55.89645776566758, + "grad_norm": 3.6260788440704346, + "learning_rate": 8.58090165607364e-06, + "loss": 0.0751, + "step": 20514 + }, + { + "epoch": 55.8991825613079, + "grad_norm": 4.506085395812988, + "learning_rate": 8.58002809817426e-06, + "loss": 0.188, + "step": 20515 + }, + { + "epoch": 55.90190735694823, + "grad_norm": 3.595628499984741, + "learning_rate": 8.579154551333574e-06, + "loss": 0.1135, + "step": 20516 + }, + { + "epoch": 55.904632152588555, + "grad_norm": 4.162252426147461, + "learning_rate": 8.578281015558388e-06, + "loss": 0.1032, + "step": 20517 + }, + { + "epoch": 55.90735694822888, + "grad_norm": 3.3928403854370117, + "learning_rate": 8.577407490855499e-06, + "loss": 0.1577, + "step": 20518 + }, + { + "epoch": 55.91008174386921, + "grad_norm": 4.454849720001221, + "learning_rate": 8.57653397723172e-06, + "loss": 0.1331, + "step": 20519 + }, + { + "epoch": 55.91280653950954, + "grad_norm": 3.7224721908569336, + "learning_rate": 8.575660474693846e-06, + "loss": 0.0846, + "step": 20520 + }, + { + "epoch": 55.915531335149865, + "grad_norm": 3.00057315826416, + "learning_rate": 8.574786983248684e-06, + "loss": 0.1174, + "step": 20521 + }, + { + "epoch": 55.91825613079019, + "grad_norm": 3.5504508018493652, + "learning_rate": 8.573913502903034e-06, + "loss": 0.202, + "step": 20522 + }, + { + "epoch": 55.920980926430516, + "grad_norm": 4.388420104980469, + "learning_rate": 8.573040033663702e-06, + "loss": 0.0857, + "step": 20523 + }, + { + "epoch": 55.92370572207084, + "grad_norm": 3.6599771976470947, + "learning_rate": 8.572166575537484e-06, + "loss": 0.0688, + "step": 20524 + }, + { + "epoch": 55.926430517711175, + "grad_norm": 5.742560386657715, + "learning_rate": 8.571293128531191e-06, + "loss": 0.1443, + "step": 20525 + }, + { + "epoch": 55.9291553133515, + "grad_norm": 5.439338684082031, + "learning_rate": 8.57041969265162e-06, + "loss": 0.1298, + "step": 20526 + }, + { + "epoch": 55.93188010899183, + "grad_norm": 4.148625373840332, + "learning_rate": 8.569546267905571e-06, + "loss": 0.1327, + "step": 20527 + }, + { + "epoch": 55.93460490463215, + "grad_norm": 4.74026346206665, + "learning_rate": 8.568672854299856e-06, + "loss": 0.2154, + "step": 20528 + }, + { + "epoch": 55.93732970027248, + "grad_norm": 3.3893229961395264, + "learning_rate": 8.567799451841266e-06, + "loss": 0.0736, + "step": 20529 + }, + { + "epoch": 55.940054495912804, + "grad_norm": 2.7869043350219727, + "learning_rate": 8.566926060536608e-06, + "loss": 0.0547, + "step": 20530 + }, + { + "epoch": 55.94277929155314, + "grad_norm": 4.547995567321777, + "learning_rate": 8.566052680392684e-06, + "loss": 0.2509, + "step": 20531 + }, + { + "epoch": 55.94550408719346, + "grad_norm": 3.5843234062194824, + "learning_rate": 8.565179311416298e-06, + "loss": 0.1101, + "step": 20532 + }, + { + "epoch": 55.94822888283379, + "grad_norm": 4.6569414138793945, + "learning_rate": 8.564305953614246e-06, + "loss": 0.0799, + "step": 20533 + }, + { + "epoch": 55.950953678474114, + "grad_norm": 4.099673271179199, + "learning_rate": 8.563432606993337e-06, + "loss": 0.2314, + "step": 20534 + }, + { + "epoch": 55.95367847411444, + "grad_norm": 3.8664135932922363, + "learning_rate": 8.562559271560365e-06, + "loss": 0.1103, + "step": 20535 + }, + { + "epoch": 55.956403269754766, + "grad_norm": 4.16465425491333, + "learning_rate": 8.561685947322133e-06, + "loss": 0.1514, + "step": 20536 + }, + { + "epoch": 55.95912806539509, + "grad_norm": 5.871386528015137, + "learning_rate": 8.560812634285451e-06, + "loss": 0.0679, + "step": 20537 + }, + { + "epoch": 55.961852861035425, + "grad_norm": 3.923872470855713, + "learning_rate": 8.559939332457109e-06, + "loss": 0.0887, + "step": 20538 + }, + { + "epoch": 55.96457765667575, + "grad_norm": 4.287431240081787, + "learning_rate": 8.559066041843917e-06, + "loss": 0.1737, + "step": 20539 + }, + { + "epoch": 55.967302452316076, + "grad_norm": 3.428402900695801, + "learning_rate": 8.558192762452669e-06, + "loss": 0.0724, + "step": 20540 + }, + { + "epoch": 55.9700272479564, + "grad_norm": 4.2366533279418945, + "learning_rate": 8.557319494290171e-06, + "loss": 0.1356, + "step": 20541 + }, + { + "epoch": 55.97275204359673, + "grad_norm": 3.562201738357544, + "learning_rate": 8.55644623736322e-06, + "loss": 0.1089, + "step": 20542 + }, + { + "epoch": 55.97547683923706, + "grad_norm": 4.23938512802124, + "learning_rate": 8.555572991678624e-06, + "loss": 0.1206, + "step": 20543 + }, + { + "epoch": 55.97820163487739, + "grad_norm": 5.907759666442871, + "learning_rate": 8.554699757243174e-06, + "loss": 0.1504, + "step": 20544 + }, + { + "epoch": 55.98092643051771, + "grad_norm": 4.7009148597717285, + "learning_rate": 8.553826534063681e-06, + "loss": 0.147, + "step": 20545 + }, + { + "epoch": 55.98365122615804, + "grad_norm": 4.274569511413574, + "learning_rate": 8.552953322146936e-06, + "loss": 0.1461, + "step": 20546 + }, + { + "epoch": 55.986376021798364, + "grad_norm": 3.7574856281280518, + "learning_rate": 8.552080121499747e-06, + "loss": 0.0946, + "step": 20547 + }, + { + "epoch": 55.98910081743869, + "grad_norm": 3.955724000930786, + "learning_rate": 8.551206932128908e-06, + "loss": 0.1318, + "step": 20548 + }, + { + "epoch": 55.991825613079016, + "grad_norm": 3.2213187217712402, + "learning_rate": 8.550333754041227e-06, + "loss": 0.1254, + "step": 20549 + }, + { + "epoch": 55.99455040871935, + "grad_norm": 3.9226980209350586, + "learning_rate": 8.549460587243496e-06, + "loss": 0.0988, + "step": 20550 + }, + { + "epoch": 55.997275204359674, + "grad_norm": 4.1123576164245605, + "learning_rate": 8.54858743174252e-06, + "loss": 0.1186, + "step": 20551 + }, + { + "epoch": 56.0, + "grad_norm": 3.55380916595459, + "learning_rate": 8.5477142875451e-06, + "loss": 0.0511, + "step": 20552 + }, + { + "epoch": 56.002724795640326, + "grad_norm": 4.605118751525879, + "learning_rate": 8.546841154658031e-06, + "loss": 0.1745, + "step": 20553 + }, + { + "epoch": 56.00544959128065, + "grad_norm": 2.965914249420166, + "learning_rate": 8.545968033088117e-06, + "loss": 0.0537, + "step": 20554 + }, + { + "epoch": 56.00817438692098, + "grad_norm": 4.400588035583496, + "learning_rate": 8.545094922842161e-06, + "loss": 0.1819, + "step": 20555 + }, + { + "epoch": 56.01089918256131, + "grad_norm": 4.025671482086182, + "learning_rate": 8.544221823926957e-06, + "loss": 0.0813, + "step": 20556 + }, + { + "epoch": 56.013623978201636, + "grad_norm": 6.826101779937744, + "learning_rate": 8.543348736349307e-06, + "loss": 0.0879, + "step": 20557 + }, + { + "epoch": 56.01634877384196, + "grad_norm": 4.12449836730957, + "learning_rate": 8.54247566011601e-06, + "loss": 0.1038, + "step": 20558 + }, + { + "epoch": 56.01907356948229, + "grad_norm": 3.6200411319732666, + "learning_rate": 8.541602595233866e-06, + "loss": 0.0882, + "step": 20559 + }, + { + "epoch": 56.02179836512261, + "grad_norm": 3.680046319961548, + "learning_rate": 8.540729541709673e-06, + "loss": 0.0771, + "step": 20560 + }, + { + "epoch": 56.02452316076294, + "grad_norm": 5.322786808013916, + "learning_rate": 8.539856499550233e-06, + "loss": 0.088, + "step": 20561 + }, + { + "epoch": 56.02724795640327, + "grad_norm": 3.4235246181488037, + "learning_rate": 8.53898346876234e-06, + "loss": 0.1759, + "step": 20562 + }, + { + "epoch": 56.0299727520436, + "grad_norm": 3.9941909313201904, + "learning_rate": 8.5381104493528e-06, + "loss": 0.182, + "step": 20563 + }, + { + "epoch": 56.032697547683924, + "grad_norm": 3.8364150524139404, + "learning_rate": 8.537237441328409e-06, + "loss": 0.0684, + "step": 20564 + }, + { + "epoch": 56.03542234332425, + "grad_norm": 3.503875255584717, + "learning_rate": 8.536364444695967e-06, + "loss": 0.099, + "step": 20565 + }, + { + "epoch": 56.038147138964575, + "grad_norm": 9.737573623657227, + "learning_rate": 8.535491459462267e-06, + "loss": 0.1859, + "step": 20566 + }, + { + "epoch": 56.0408719346049, + "grad_norm": 3.5125746726989746, + "learning_rate": 8.534618485634115e-06, + "loss": 0.1195, + "step": 20567 + }, + { + "epoch": 56.043596730245234, + "grad_norm": 3.228148937225342, + "learning_rate": 8.533745523218307e-06, + "loss": 0.0768, + "step": 20568 + }, + { + "epoch": 56.04632152588556, + "grad_norm": 4.585299015045166, + "learning_rate": 8.532872572221642e-06, + "loss": 0.1622, + "step": 20569 + }, + { + "epoch": 56.049046321525886, + "grad_norm": 3.633225202560425, + "learning_rate": 8.531999632650912e-06, + "loss": 0.3036, + "step": 20570 + }, + { + "epoch": 56.05177111716621, + "grad_norm": 3.193605899810791, + "learning_rate": 8.531126704512928e-06, + "loss": 0.1625, + "step": 20571 + }, + { + "epoch": 56.05449591280654, + "grad_norm": 4.373520851135254, + "learning_rate": 8.53025378781448e-06, + "loss": 0.2033, + "step": 20572 + }, + { + "epoch": 56.05722070844686, + "grad_norm": 3.933464765548706, + "learning_rate": 8.529380882562371e-06, + "loss": 0.1679, + "step": 20573 + }, + { + "epoch": 56.059945504087196, + "grad_norm": 3.5256805419921875, + "learning_rate": 8.528507988763393e-06, + "loss": 0.0786, + "step": 20574 + }, + { + "epoch": 56.06267029972752, + "grad_norm": 4.1520891189575195, + "learning_rate": 8.527635106424352e-06, + "loss": 0.1364, + "step": 20575 + }, + { + "epoch": 56.06539509536785, + "grad_norm": 4.632296562194824, + "learning_rate": 8.526762235552038e-06, + "loss": 0.1718, + "step": 20576 + }, + { + "epoch": 56.06811989100817, + "grad_norm": 4.335762977600098, + "learning_rate": 8.525889376153253e-06, + "loss": 0.1075, + "step": 20577 + }, + { + "epoch": 56.0708446866485, + "grad_norm": 3.0486397743225098, + "learning_rate": 8.525016528234794e-06, + "loss": 0.078, + "step": 20578 + }, + { + "epoch": 56.073569482288825, + "grad_norm": 4.040469646453857, + "learning_rate": 8.52414369180346e-06, + "loss": 0.0702, + "step": 20579 + }, + { + "epoch": 56.07629427792916, + "grad_norm": 3.926084041595459, + "learning_rate": 8.523270866866044e-06, + "loss": 0.0851, + "step": 20580 + }, + { + "epoch": 56.079019073569484, + "grad_norm": 4.060538291931152, + "learning_rate": 8.52239805342935e-06, + "loss": 0.2353, + "step": 20581 + }, + { + "epoch": 56.08174386920981, + "grad_norm": 5.469473361968994, + "learning_rate": 8.521525251500172e-06, + "loss": 0.0915, + "step": 20582 + }, + { + "epoch": 56.084468664850135, + "grad_norm": 3.8926613330841064, + "learning_rate": 8.520652461085309e-06, + "loss": 0.1103, + "step": 20583 + }, + { + "epoch": 56.08719346049046, + "grad_norm": 3.446298360824585, + "learning_rate": 8.519779682191554e-06, + "loss": 0.0861, + "step": 20584 + }, + { + "epoch": 56.08991825613079, + "grad_norm": 3.4064533710479736, + "learning_rate": 8.518906914825709e-06, + "loss": 0.0959, + "step": 20585 + }, + { + "epoch": 56.09264305177112, + "grad_norm": 3.9588980674743652, + "learning_rate": 8.518034158994567e-06, + "loss": 0.0604, + "step": 20586 + }, + { + "epoch": 56.095367847411445, + "grad_norm": 3.596825122833252, + "learning_rate": 8.517161414704926e-06, + "loss": 0.0688, + "step": 20587 + }, + { + "epoch": 56.09809264305177, + "grad_norm": 3.5281028747558594, + "learning_rate": 8.516288681963589e-06, + "loss": 0.2004, + "step": 20588 + }, + { + "epoch": 56.1008174386921, + "grad_norm": 4.134294509887695, + "learning_rate": 8.515415960777345e-06, + "loss": 0.0913, + "step": 20589 + }, + { + "epoch": 56.10354223433242, + "grad_norm": 4.095026969909668, + "learning_rate": 8.514543251152996e-06, + "loss": 0.253, + "step": 20590 + }, + { + "epoch": 56.10626702997275, + "grad_norm": 3.5762150287628174, + "learning_rate": 8.513670553097335e-06, + "loss": 0.1701, + "step": 20591 + }, + { + "epoch": 56.10899182561308, + "grad_norm": 3.8802061080932617, + "learning_rate": 8.512797866617158e-06, + "loss": 0.1399, + "step": 20592 + }, + { + "epoch": 56.11171662125341, + "grad_norm": 4.417481899261475, + "learning_rate": 8.511925191719268e-06, + "loss": 0.187, + "step": 20593 + }, + { + "epoch": 56.11444141689373, + "grad_norm": 4.006098747253418, + "learning_rate": 8.511052528410453e-06, + "loss": 0.1473, + "step": 20594 + }, + { + "epoch": 56.11716621253406, + "grad_norm": 4.55978536605835, + "learning_rate": 8.510179876697514e-06, + "loss": 0.2118, + "step": 20595 + }, + { + "epoch": 56.119891008174385, + "grad_norm": 3.7112536430358887, + "learning_rate": 8.509307236587247e-06, + "loss": 0.1585, + "step": 20596 + }, + { + "epoch": 56.12261580381471, + "grad_norm": 2.8644304275512695, + "learning_rate": 8.508434608086448e-06, + "loss": 0.1177, + "step": 20597 + }, + { + "epoch": 56.12534059945504, + "grad_norm": 4.249670028686523, + "learning_rate": 8.507561991201908e-06, + "loss": 0.0741, + "step": 20598 + }, + { + "epoch": 56.12806539509537, + "grad_norm": 3.9912595748901367, + "learning_rate": 8.506689385940433e-06, + "loss": 0.0659, + "step": 20599 + }, + { + "epoch": 56.130790190735695, + "grad_norm": 3.794909954071045, + "learning_rate": 8.50581679230881e-06, + "loss": 0.0722, + "step": 20600 + }, + { + "epoch": 56.13351498637602, + "grad_norm": 3.5600454807281494, + "learning_rate": 8.504944210313838e-06, + "loss": 0.1109, + "step": 20601 + }, + { + "epoch": 56.13623978201635, + "grad_norm": 5.2991414070129395, + "learning_rate": 8.50407163996231e-06, + "loss": 0.0802, + "step": 20602 + }, + { + "epoch": 56.13896457765667, + "grad_norm": 7.255417346954346, + "learning_rate": 8.503199081261028e-06, + "loss": 0.1211, + "step": 20603 + }, + { + "epoch": 56.141689373297005, + "grad_norm": 3.479802370071411, + "learning_rate": 8.50232653421678e-06, + "loss": 0.0732, + "step": 20604 + }, + { + "epoch": 56.14441416893733, + "grad_norm": 3.8354055881500244, + "learning_rate": 8.501453998836364e-06, + "loss": 0.0726, + "step": 20605 + }, + { + "epoch": 56.14713896457766, + "grad_norm": 3.690303087234497, + "learning_rate": 8.50058147512658e-06, + "loss": 0.1032, + "step": 20606 + }, + { + "epoch": 56.14986376021798, + "grad_norm": 4.3305182456970215, + "learning_rate": 8.499708963094216e-06, + "loss": 0.3212, + "step": 20607 + }, + { + "epoch": 56.15258855585831, + "grad_norm": 4.2532196044921875, + "learning_rate": 8.498836462746074e-06, + "loss": 0.073, + "step": 20608 + }, + { + "epoch": 56.155313351498634, + "grad_norm": 4.8961873054504395, + "learning_rate": 8.497963974088942e-06, + "loss": 0.2046, + "step": 20609 + }, + { + "epoch": 56.15803814713897, + "grad_norm": 3.996030330657959, + "learning_rate": 8.497091497129621e-06, + "loss": 0.1031, + "step": 20610 + }, + { + "epoch": 56.16076294277929, + "grad_norm": 3.6293375492095947, + "learning_rate": 8.496219031874899e-06, + "loss": 0.1507, + "step": 20611 + }, + { + "epoch": 56.16348773841962, + "grad_norm": 4.9578633308410645, + "learning_rate": 8.49534657833158e-06, + "loss": 0.1609, + "step": 20612 + }, + { + "epoch": 56.166212534059945, + "grad_norm": 4.215757369995117, + "learning_rate": 8.49447413650645e-06, + "loss": 0.1286, + "step": 20613 + }, + { + "epoch": 56.16893732970027, + "grad_norm": 4.967205047607422, + "learning_rate": 8.493601706406305e-06, + "loss": 0.2106, + "step": 20614 + }, + { + "epoch": 56.171662125340596, + "grad_norm": 3.4942333698272705, + "learning_rate": 8.492729288037945e-06, + "loss": 0.0626, + "step": 20615 + }, + { + "epoch": 56.17438692098093, + "grad_norm": 3.1676595211029053, + "learning_rate": 8.491856881408159e-06, + "loss": 0.0788, + "step": 20616 + }, + { + "epoch": 56.177111716621255, + "grad_norm": 4.532700061798096, + "learning_rate": 8.490984486523746e-06, + "loss": 0.101, + "step": 20617 + }, + { + "epoch": 56.17983651226158, + "grad_norm": 3.0709919929504395, + "learning_rate": 8.490112103391494e-06, + "loss": 0.0716, + "step": 20618 + }, + { + "epoch": 56.182561307901906, + "grad_norm": 4.7369384765625, + "learning_rate": 8.489239732018202e-06, + "loss": 0.1132, + "step": 20619 + }, + { + "epoch": 56.18528610354223, + "grad_norm": 4.261050224304199, + "learning_rate": 8.48836737241066e-06, + "loss": 0.1538, + "step": 20620 + }, + { + "epoch": 56.18801089918256, + "grad_norm": 8.628913879394531, + "learning_rate": 8.487495024575668e-06, + "loss": 0.077, + "step": 20621 + }, + { + "epoch": 56.19073569482289, + "grad_norm": 3.7310938835144043, + "learning_rate": 8.48662268852001e-06, + "loss": 0.1542, + "step": 20622 + }, + { + "epoch": 56.19346049046322, + "grad_norm": 4.899902820587158, + "learning_rate": 8.48575036425049e-06, + "loss": 0.209, + "step": 20623 + }, + { + "epoch": 56.19618528610354, + "grad_norm": 3.526634693145752, + "learning_rate": 8.4848780517739e-06, + "loss": 0.098, + "step": 20624 + }, + { + "epoch": 56.19891008174387, + "grad_norm": 4.161648750305176, + "learning_rate": 8.484005751097026e-06, + "loss": 0.1522, + "step": 20625 + }, + { + "epoch": 56.201634877384194, + "grad_norm": 3.330474853515625, + "learning_rate": 8.483133462226671e-06, + "loss": 0.1376, + "step": 20626 + }, + { + "epoch": 56.20435967302452, + "grad_norm": 4.167783260345459, + "learning_rate": 8.48226118516962e-06, + "loss": 0.1346, + "step": 20627 + }, + { + "epoch": 56.20708446866485, + "grad_norm": 4.754262924194336, + "learning_rate": 8.481388919932672e-06, + "loss": 0.0906, + "step": 20628 + }, + { + "epoch": 56.20980926430518, + "grad_norm": 3.272594928741455, + "learning_rate": 8.480516666522616e-06, + "loss": 0.1415, + "step": 20629 + }, + { + "epoch": 56.212534059945504, + "grad_norm": 3.318922758102417, + "learning_rate": 8.479644424946251e-06, + "loss": 0.0499, + "step": 20630 + }, + { + "epoch": 56.21525885558583, + "grad_norm": 4.075006484985352, + "learning_rate": 8.478772195210365e-06, + "loss": 0.1142, + "step": 20631 + }, + { + "epoch": 56.217983651226156, + "grad_norm": 4.122602462768555, + "learning_rate": 8.477899977321752e-06, + "loss": 0.1281, + "step": 20632 + }, + { + "epoch": 56.22070844686648, + "grad_norm": 3.0714304447174072, + "learning_rate": 8.477027771287203e-06, + "loss": 0.1627, + "step": 20633 + }, + { + "epoch": 56.223433242506815, + "grad_norm": 5.425609588623047, + "learning_rate": 8.476155577113515e-06, + "loss": 0.1478, + "step": 20634 + }, + { + "epoch": 56.22615803814714, + "grad_norm": 4.0460920333862305, + "learning_rate": 8.475283394807478e-06, + "loss": 0.1296, + "step": 20635 + }, + { + "epoch": 56.228882833787466, + "grad_norm": 3.1727192401885986, + "learning_rate": 8.474411224375885e-06, + "loss": 0.206, + "step": 20636 + }, + { + "epoch": 56.23160762942779, + "grad_norm": 3.6730051040649414, + "learning_rate": 8.473539065825527e-06, + "loss": 0.1467, + "step": 20637 + }, + { + "epoch": 56.23433242506812, + "grad_norm": 3.1039352416992188, + "learning_rate": 8.472666919163198e-06, + "loss": 0.0871, + "step": 20638 + }, + { + "epoch": 56.237057220708444, + "grad_norm": 2.95245099067688, + "learning_rate": 8.471794784395687e-06, + "loss": 0.0625, + "step": 20639 + }, + { + "epoch": 56.23978201634878, + "grad_norm": 5.449034690856934, + "learning_rate": 8.470922661529792e-06, + "loss": 0.0532, + "step": 20640 + }, + { + "epoch": 56.2425068119891, + "grad_norm": 4.009894371032715, + "learning_rate": 8.470050550572302e-06, + "loss": 0.1112, + "step": 20641 + }, + { + "epoch": 56.24523160762943, + "grad_norm": 3.69368052482605, + "learning_rate": 8.46917845153001e-06, + "loss": 0.1003, + "step": 20642 + }, + { + "epoch": 56.247956403269754, + "grad_norm": 4.515437126159668, + "learning_rate": 8.468306364409704e-06, + "loss": 0.0798, + "step": 20643 + }, + { + "epoch": 56.25068119891008, + "grad_norm": 4.0363450050354, + "learning_rate": 8.467434289218184e-06, + "loss": 0.075, + "step": 20644 + }, + { + "epoch": 56.253405994550405, + "grad_norm": 4.053673267364502, + "learning_rate": 8.466562225962233e-06, + "loss": 0.1453, + "step": 20645 + }, + { + "epoch": 56.25613079019074, + "grad_norm": 3.6368520259857178, + "learning_rate": 8.465690174648648e-06, + "loss": 0.1522, + "step": 20646 + }, + { + "epoch": 56.258855585831064, + "grad_norm": 4.203634738922119, + "learning_rate": 8.464818135284214e-06, + "loss": 0.1559, + "step": 20647 + }, + { + "epoch": 56.26158038147139, + "grad_norm": 3.756179094314575, + "learning_rate": 8.463946107875732e-06, + "loss": 0.2895, + "step": 20648 + }, + { + "epoch": 56.264305177111716, + "grad_norm": 3.291050910949707, + "learning_rate": 8.463074092429986e-06, + "loss": 0.0635, + "step": 20649 + }, + { + "epoch": 56.26702997275204, + "grad_norm": 3.4768476486206055, + "learning_rate": 8.462202088953771e-06, + "loss": 0.091, + "step": 20650 + }, + { + "epoch": 56.26975476839237, + "grad_norm": 4.023835182189941, + "learning_rate": 8.461330097453875e-06, + "loss": 0.1656, + "step": 20651 + }, + { + "epoch": 56.2724795640327, + "grad_norm": 3.9702351093292236, + "learning_rate": 8.460458117937091e-06, + "loss": 0.1035, + "step": 20652 + }, + { + "epoch": 56.275204359673026, + "grad_norm": 3.135334014892578, + "learning_rate": 8.45958615041021e-06, + "loss": 0.0998, + "step": 20653 + }, + { + "epoch": 56.27792915531335, + "grad_norm": 4.371511459350586, + "learning_rate": 8.458714194880022e-06, + "loss": 0.0726, + "step": 20654 + }, + { + "epoch": 56.28065395095368, + "grad_norm": 3.310818910598755, + "learning_rate": 8.45784225135332e-06, + "loss": 0.0718, + "step": 20655 + }, + { + "epoch": 56.283378746594, + "grad_norm": 3.2568392753601074, + "learning_rate": 8.456970319836886e-06, + "loss": 0.0666, + "step": 20656 + }, + { + "epoch": 56.28610354223433, + "grad_norm": 4.366418361663818, + "learning_rate": 8.456098400337522e-06, + "loss": 0.2138, + "step": 20657 + }, + { + "epoch": 56.28882833787466, + "grad_norm": 4.223952770233154, + "learning_rate": 8.455226492862017e-06, + "loss": 0.0636, + "step": 20658 + }, + { + "epoch": 56.29155313351499, + "grad_norm": 3.9034769535064697, + "learning_rate": 8.454354597417155e-06, + "loss": 0.1913, + "step": 20659 + }, + { + "epoch": 56.294277929155314, + "grad_norm": 7.27374267578125, + "learning_rate": 8.453482714009732e-06, + "loss": 0.1548, + "step": 20660 + }, + { + "epoch": 56.29700272479564, + "grad_norm": 4.076107025146484, + "learning_rate": 8.452610842646533e-06, + "loss": 0.1189, + "step": 20661 + }, + { + "epoch": 56.299727520435965, + "grad_norm": 3.573756694793701, + "learning_rate": 8.451738983334355e-06, + "loss": 0.064, + "step": 20662 + }, + { + "epoch": 56.30245231607629, + "grad_norm": 3.9268429279327393, + "learning_rate": 8.45086713607998e-06, + "loss": 0.1564, + "step": 20663 + }, + { + "epoch": 56.305177111716624, + "grad_norm": 4.568852424621582, + "learning_rate": 8.449995300890204e-06, + "loss": 0.0923, + "step": 20664 + }, + { + "epoch": 56.30790190735695, + "grad_norm": 4.122679710388184, + "learning_rate": 8.449123477771815e-06, + "loss": 0.1715, + "step": 20665 + }, + { + "epoch": 56.310626702997276, + "grad_norm": 3.1892356872558594, + "learning_rate": 8.448251666731601e-06, + "loss": 0.0709, + "step": 20666 + }, + { + "epoch": 56.3133514986376, + "grad_norm": 3.214322328567505, + "learning_rate": 8.447379867776353e-06, + "loss": 0.0796, + "step": 20667 + }, + { + "epoch": 56.31607629427793, + "grad_norm": 4.30591344833374, + "learning_rate": 8.446508080912863e-06, + "loss": 0.1585, + "step": 20668 + }, + { + "epoch": 56.31880108991825, + "grad_norm": 3.253145217895508, + "learning_rate": 8.445636306147915e-06, + "loss": 0.0599, + "step": 20669 + }, + { + "epoch": 56.321525885558586, + "grad_norm": 3.429258108139038, + "learning_rate": 8.444764543488303e-06, + "loss": 0.0623, + "step": 20670 + }, + { + "epoch": 56.32425068119891, + "grad_norm": 3.463414192199707, + "learning_rate": 8.443892792940815e-06, + "loss": 0.0788, + "step": 20671 + }, + { + "epoch": 56.32697547683924, + "grad_norm": 4.158020496368408, + "learning_rate": 8.44302105451224e-06, + "loss": 0.1442, + "step": 20672 + }, + { + "epoch": 56.32970027247956, + "grad_norm": 4.838292598724365, + "learning_rate": 8.442149328209364e-06, + "loss": 0.1763, + "step": 20673 + }, + { + "epoch": 56.33242506811989, + "grad_norm": 3.9878294467926025, + "learning_rate": 8.44127761403898e-06, + "loss": 0.078, + "step": 20674 + }, + { + "epoch": 56.335149863760215, + "grad_norm": 2.6165270805358887, + "learning_rate": 8.440405912007879e-06, + "loss": 0.0497, + "step": 20675 + }, + { + "epoch": 56.33787465940055, + "grad_norm": 4.76611852645874, + "learning_rate": 8.439534222122843e-06, + "loss": 0.3121, + "step": 20676 + }, + { + "epoch": 56.34059945504087, + "grad_norm": 3.606412172317505, + "learning_rate": 8.438662544390666e-06, + "loss": 0.0633, + "step": 20677 + }, + { + "epoch": 56.3433242506812, + "grad_norm": 4.322358131408691, + "learning_rate": 8.437790878818135e-06, + "loss": 0.1374, + "step": 20678 + }, + { + "epoch": 56.346049046321525, + "grad_norm": 3.323930263519287, + "learning_rate": 8.436919225412038e-06, + "loss": 0.1242, + "step": 20679 + }, + { + "epoch": 56.34877384196185, + "grad_norm": 4.404124736785889, + "learning_rate": 8.436047584179163e-06, + "loss": 0.099, + "step": 20680 + }, + { + "epoch": 56.35149863760218, + "grad_norm": 5.267062664031982, + "learning_rate": 8.4351759551263e-06, + "loss": 0.1487, + "step": 20681 + }, + { + "epoch": 56.35422343324251, + "grad_norm": 3.791018486022949, + "learning_rate": 8.434304338260237e-06, + "loss": 0.1992, + "step": 20682 + }, + { + "epoch": 56.356948228882835, + "grad_norm": 3.1285722255706787, + "learning_rate": 8.433432733587758e-06, + "loss": 0.0647, + "step": 20683 + }, + { + "epoch": 56.35967302452316, + "grad_norm": 4.164439678192139, + "learning_rate": 8.43256114111566e-06, + "loss": 0.1759, + "step": 20684 + }, + { + "epoch": 56.36239782016349, + "grad_norm": 6.165648937225342, + "learning_rate": 8.43168956085072e-06, + "loss": 0.1041, + "step": 20685 + }, + { + "epoch": 56.36512261580381, + "grad_norm": 3.150517225265503, + "learning_rate": 8.430817992799735e-06, + "loss": 0.0934, + "step": 20686 + }, + { + "epoch": 56.36784741144414, + "grad_norm": 3.8604135513305664, + "learning_rate": 8.429946436969488e-06, + "loss": 0.1202, + "step": 20687 + }, + { + "epoch": 56.37057220708447, + "grad_norm": 2.8514785766601562, + "learning_rate": 8.429074893366768e-06, + "loss": 0.0547, + "step": 20688 + }, + { + "epoch": 56.3732970027248, + "grad_norm": 3.9102790355682373, + "learning_rate": 8.42820336199836e-06, + "loss": 0.0665, + "step": 20689 + }, + { + "epoch": 56.37602179836512, + "grad_norm": 3.69484281539917, + "learning_rate": 8.427331842871052e-06, + "loss": 0.0907, + "step": 20690 + }, + { + "epoch": 56.37874659400545, + "grad_norm": 6.28098201751709, + "learning_rate": 8.426460335991638e-06, + "loss": 0.0531, + "step": 20691 + }, + { + "epoch": 56.381471389645775, + "grad_norm": 3.8371851444244385, + "learning_rate": 8.425588841366896e-06, + "loss": 0.0674, + "step": 20692 + }, + { + "epoch": 56.3841961852861, + "grad_norm": 5.768299102783203, + "learning_rate": 8.424717359003621e-06, + "loss": 0.1763, + "step": 20693 + }, + { + "epoch": 56.38692098092643, + "grad_norm": 3.979182004928589, + "learning_rate": 8.423845888908595e-06, + "loss": 0.1097, + "step": 20694 + }, + { + "epoch": 56.38964577656676, + "grad_norm": 6.081275463104248, + "learning_rate": 8.422974431088607e-06, + "loss": 0.2229, + "step": 20695 + }, + { + "epoch": 56.392370572207085, + "grad_norm": 2.5754799842834473, + "learning_rate": 8.422102985550441e-06, + "loss": 0.1401, + "step": 20696 + }, + { + "epoch": 56.39509536784741, + "grad_norm": 3.954085350036621, + "learning_rate": 8.42123155230089e-06, + "loss": 0.0638, + "step": 20697 + }, + { + "epoch": 56.39782016348774, + "grad_norm": 6.7409563064575195, + "learning_rate": 8.420360131346735e-06, + "loss": 0.2512, + "step": 20698 + }, + { + "epoch": 56.40054495912806, + "grad_norm": 5.291450023651123, + "learning_rate": 8.419488722694765e-06, + "loss": 0.0859, + "step": 20699 + }, + { + "epoch": 56.403269754768395, + "grad_norm": 3.6343750953674316, + "learning_rate": 8.418617326351765e-06, + "loss": 0.1427, + "step": 20700 + }, + { + "epoch": 56.40599455040872, + "grad_norm": 4.284163951873779, + "learning_rate": 8.417745942324522e-06, + "loss": 0.1995, + "step": 20701 + }, + { + "epoch": 56.40871934604905, + "grad_norm": 4.142784595489502, + "learning_rate": 8.416874570619825e-06, + "loss": 0.1035, + "step": 20702 + }, + { + "epoch": 56.41144414168937, + "grad_norm": 3.6764538288116455, + "learning_rate": 8.416003211244454e-06, + "loss": 0.0861, + "step": 20703 + }, + { + "epoch": 56.4141689373297, + "grad_norm": 5.162350177764893, + "learning_rate": 8.415131864205204e-06, + "loss": 0.0556, + "step": 20704 + }, + { + "epoch": 56.416893732970024, + "grad_norm": 3.668029546737671, + "learning_rate": 8.414260529508851e-06, + "loss": 0.2694, + "step": 20705 + }, + { + "epoch": 56.41961852861036, + "grad_norm": 3.40997576713562, + "learning_rate": 8.41338920716219e-06, + "loss": 0.1552, + "step": 20706 + }, + { + "epoch": 56.42234332425068, + "grad_norm": 3.400639057159424, + "learning_rate": 8.412517897172001e-06, + "loss": 0.0723, + "step": 20707 + }, + { + "epoch": 56.42506811989101, + "grad_norm": 2.9111382961273193, + "learning_rate": 8.411646599545068e-06, + "loss": 0.0683, + "step": 20708 + }, + { + "epoch": 56.427792915531334, + "grad_norm": 3.2668423652648926, + "learning_rate": 8.410775314288186e-06, + "loss": 0.1265, + "step": 20709 + }, + { + "epoch": 56.43051771117166, + "grad_norm": 3.4724650382995605, + "learning_rate": 8.40990404140813e-06, + "loss": 0.1359, + "step": 20710 + }, + { + "epoch": 56.433242506811986, + "grad_norm": 3.0020253658294678, + "learning_rate": 8.409032780911695e-06, + "loss": 0.0692, + "step": 20711 + }, + { + "epoch": 56.43596730245232, + "grad_norm": 3.6473333835601807, + "learning_rate": 8.408161532805659e-06, + "loss": 0.0758, + "step": 20712 + }, + { + "epoch": 56.438692098092645, + "grad_norm": 2.9921231269836426, + "learning_rate": 8.40729029709681e-06, + "loss": 0.0782, + "step": 20713 + }, + { + "epoch": 56.44141689373297, + "grad_norm": 3.7293179035186768, + "learning_rate": 8.406419073791933e-06, + "loss": 0.094, + "step": 20714 + }, + { + "epoch": 56.444141689373296, + "grad_norm": 4.795324802398682, + "learning_rate": 8.405547862897813e-06, + "loss": 0.0817, + "step": 20715 + }, + { + "epoch": 56.44686648501362, + "grad_norm": 3.7878880500793457, + "learning_rate": 8.404676664421235e-06, + "loss": 0.0871, + "step": 20716 + }, + { + "epoch": 56.44959128065395, + "grad_norm": 4.343838691711426, + "learning_rate": 8.403805478368983e-06, + "loss": 0.2216, + "step": 20717 + }, + { + "epoch": 56.45231607629428, + "grad_norm": 3.9245493412017822, + "learning_rate": 8.402934304747843e-06, + "loss": 0.0767, + "step": 20718 + }, + { + "epoch": 56.45504087193461, + "grad_norm": 3.8246958255767822, + "learning_rate": 8.402063143564601e-06, + "loss": 0.1074, + "step": 20719 + }, + { + "epoch": 56.45776566757493, + "grad_norm": 3.887381076812744, + "learning_rate": 8.401191994826036e-06, + "loss": 0.1733, + "step": 20720 + }, + { + "epoch": 56.46049046321526, + "grad_norm": 4.081824779510498, + "learning_rate": 8.40032085853894e-06, + "loss": 0.1419, + "step": 20721 + }, + { + "epoch": 56.463215258855584, + "grad_norm": 3.5036237239837646, + "learning_rate": 8.399449734710092e-06, + "loss": 0.0743, + "step": 20722 + }, + { + "epoch": 56.46594005449591, + "grad_norm": 5.252984046936035, + "learning_rate": 8.398578623346277e-06, + "loss": 0.1331, + "step": 20723 + }, + { + "epoch": 56.46866485013624, + "grad_norm": 4.580055236816406, + "learning_rate": 8.397707524454283e-06, + "loss": 0.2314, + "step": 20724 + }, + { + "epoch": 56.47138964577657, + "grad_norm": 3.5325496196746826, + "learning_rate": 8.396836438040885e-06, + "loss": 0.0936, + "step": 20725 + }, + { + "epoch": 56.474114441416894, + "grad_norm": 3.3489267826080322, + "learning_rate": 8.395965364112877e-06, + "loss": 0.2236, + "step": 20726 + }, + { + "epoch": 56.47683923705722, + "grad_norm": 4.340264797210693, + "learning_rate": 8.395094302677041e-06, + "loss": 0.0966, + "step": 20727 + }, + { + "epoch": 56.479564032697546, + "grad_norm": 2.4337453842163086, + "learning_rate": 8.394223253740157e-06, + "loss": 0.0514, + "step": 20728 + }, + { + "epoch": 56.48228882833787, + "grad_norm": 4.0651679039001465, + "learning_rate": 8.393352217309012e-06, + "loss": 0.2055, + "step": 20729 + }, + { + "epoch": 56.485013623978205, + "grad_norm": 4.50044584274292, + "learning_rate": 8.392481193390388e-06, + "loss": 0.2629, + "step": 20730 + }, + { + "epoch": 56.48773841961853, + "grad_norm": 5.812916278839111, + "learning_rate": 8.391610181991068e-06, + "loss": 0.1296, + "step": 20731 + }, + { + "epoch": 56.490463215258856, + "grad_norm": 3.895035743713379, + "learning_rate": 8.390739183117836e-06, + "loss": 0.0793, + "step": 20732 + }, + { + "epoch": 56.49318801089918, + "grad_norm": 3.867765426635742, + "learning_rate": 8.389868196777478e-06, + "loss": 0.1574, + "step": 20733 + }, + { + "epoch": 56.49591280653951, + "grad_norm": 3.1692419052124023, + "learning_rate": 8.388997222976772e-06, + "loss": 0.0734, + "step": 20734 + }, + { + "epoch": 56.49863760217983, + "grad_norm": 4.660286903381348, + "learning_rate": 8.388126261722504e-06, + "loss": 0.2578, + "step": 20735 + }, + { + "epoch": 56.50136239782017, + "grad_norm": 3.813767910003662, + "learning_rate": 8.387255313021456e-06, + "loss": 0.0827, + "step": 20736 + }, + { + "epoch": 56.50408719346049, + "grad_norm": 3.25433087348938, + "learning_rate": 8.386384376880414e-06, + "loss": 0.1, + "step": 20737 + }, + { + "epoch": 56.50681198910082, + "grad_norm": 3.4825737476348877, + "learning_rate": 8.385513453306157e-06, + "loss": 0.0449, + "step": 20738 + }, + { + "epoch": 56.509536784741144, + "grad_norm": 4.238973617553711, + "learning_rate": 8.38464254230547e-06, + "loss": 0.1629, + "step": 20739 + }, + { + "epoch": 56.51226158038147, + "grad_norm": 3.243096113204956, + "learning_rate": 8.383771643885134e-06, + "loss": 0.0877, + "step": 20740 + }, + { + "epoch": 56.514986376021795, + "grad_norm": 3.553771495819092, + "learning_rate": 8.382900758051934e-06, + "loss": 0.2725, + "step": 20741 + }, + { + "epoch": 56.51771117166213, + "grad_norm": 5.023160457611084, + "learning_rate": 8.382029884812644e-06, + "loss": 0.2727, + "step": 20742 + }, + { + "epoch": 56.520435967302454, + "grad_norm": 4.514641284942627, + "learning_rate": 8.381159024174061e-06, + "loss": 0.1745, + "step": 20743 + }, + { + "epoch": 56.52316076294278, + "grad_norm": 3.5146920680999756, + "learning_rate": 8.380288176142957e-06, + "loss": 0.0662, + "step": 20744 + }, + { + "epoch": 56.525885558583106, + "grad_norm": 3.1947133541107178, + "learning_rate": 8.379417340726118e-06, + "loss": 0.1594, + "step": 20745 + }, + { + "epoch": 56.52861035422343, + "grad_norm": 4.743031024932861, + "learning_rate": 8.378546517930322e-06, + "loss": 0.1361, + "step": 20746 + }, + { + "epoch": 56.53133514986376, + "grad_norm": 5.257390975952148, + "learning_rate": 8.377675707762356e-06, + "loss": 0.1024, + "step": 20747 + }, + { + "epoch": 56.53405994550409, + "grad_norm": 4.6400604248046875, + "learning_rate": 8.376804910228996e-06, + "loss": 0.1175, + "step": 20748 + }, + { + "epoch": 56.536784741144416, + "grad_norm": 10.755497932434082, + "learning_rate": 8.375934125337032e-06, + "loss": 0.0668, + "step": 20749 + }, + { + "epoch": 56.53950953678474, + "grad_norm": 5.789342403411865, + "learning_rate": 8.375063353093237e-06, + "loss": 0.1429, + "step": 20750 + }, + { + "epoch": 56.54223433242507, + "grad_norm": 5.7196760177612305, + "learning_rate": 8.3741925935044e-06, + "loss": 0.1703, + "step": 20751 + }, + { + "epoch": 56.54495912806539, + "grad_norm": 5.382983684539795, + "learning_rate": 8.373321846577295e-06, + "loss": 0.1995, + "step": 20752 + }, + { + "epoch": 56.54768392370572, + "grad_norm": 3.461686134338379, + "learning_rate": 8.37245111231871e-06, + "loss": 0.0761, + "step": 20753 + }, + { + "epoch": 56.55040871934605, + "grad_norm": 4.363855838775635, + "learning_rate": 8.371580390735421e-06, + "loss": 0.13, + "step": 20754 + }, + { + "epoch": 56.55313351498638, + "grad_norm": 3.5286946296691895, + "learning_rate": 8.370709681834213e-06, + "loss": 0.0899, + "step": 20755 + }, + { + "epoch": 56.555858310626704, + "grad_norm": 4.524600505828857, + "learning_rate": 8.369838985621864e-06, + "loss": 0.0949, + "step": 20756 + }, + { + "epoch": 56.55858310626703, + "grad_norm": 6.84073543548584, + "learning_rate": 8.368968302105158e-06, + "loss": 0.0614, + "step": 20757 + }, + { + "epoch": 56.561307901907355, + "grad_norm": 3.4950039386749268, + "learning_rate": 8.368097631290873e-06, + "loss": 0.1144, + "step": 20758 + }, + { + "epoch": 56.56403269754768, + "grad_norm": 4.201791286468506, + "learning_rate": 8.367226973185789e-06, + "loss": 0.0992, + "step": 20759 + }, + { + "epoch": 56.566757493188014, + "grad_norm": 4.8018798828125, + "learning_rate": 8.366356327796693e-06, + "loss": 0.2256, + "step": 20760 + }, + { + "epoch": 56.56948228882834, + "grad_norm": 3.444166898727417, + "learning_rate": 8.36548569513036e-06, + "loss": 0.0888, + "step": 20761 + }, + { + "epoch": 56.572207084468666, + "grad_norm": 3.421161651611328, + "learning_rate": 8.364615075193572e-06, + "loss": 0.0611, + "step": 20762 + }, + { + "epoch": 56.57493188010899, + "grad_norm": 3.7761220932006836, + "learning_rate": 8.363744467993108e-06, + "loss": 0.1276, + "step": 20763 + }, + { + "epoch": 56.57765667574932, + "grad_norm": 6.344570159912109, + "learning_rate": 8.362873873535751e-06, + "loss": 0.1218, + "step": 20764 + }, + { + "epoch": 56.58038147138964, + "grad_norm": 4.360270977020264, + "learning_rate": 8.362003291828279e-06, + "loss": 0.141, + "step": 20765 + }, + { + "epoch": 56.583106267029976, + "grad_norm": 6.195434093475342, + "learning_rate": 8.361132722877471e-06, + "loss": 0.2367, + "step": 20766 + }, + { + "epoch": 56.5858310626703, + "grad_norm": 4.121311664581299, + "learning_rate": 8.360262166690112e-06, + "loss": 0.123, + "step": 20767 + }, + { + "epoch": 56.58855585831063, + "grad_norm": 4.218409538269043, + "learning_rate": 8.359391623272976e-06, + "loss": 0.0734, + "step": 20768 + }, + { + "epoch": 56.59128065395095, + "grad_norm": 4.011482238769531, + "learning_rate": 8.358521092632848e-06, + "loss": 0.1374, + "step": 20769 + }, + { + "epoch": 56.59400544959128, + "grad_norm": 7.294281005859375, + "learning_rate": 8.357650574776501e-06, + "loss": 0.1011, + "step": 20770 + }, + { + "epoch": 56.596730245231605, + "grad_norm": 3.218067169189453, + "learning_rate": 8.356780069710721e-06, + "loss": 0.1312, + "step": 20771 + }, + { + "epoch": 56.59945504087194, + "grad_norm": 6.19024658203125, + "learning_rate": 8.355909577442284e-06, + "loss": 0.2366, + "step": 20772 + }, + { + "epoch": 56.60217983651226, + "grad_norm": 4.183459281921387, + "learning_rate": 8.355039097977972e-06, + "loss": 0.2199, + "step": 20773 + }, + { + "epoch": 56.60490463215259, + "grad_norm": 5.475216388702393, + "learning_rate": 8.35416863132456e-06, + "loss": 0.2377, + "step": 20774 + }, + { + "epoch": 56.607629427792915, + "grad_norm": 3.531409978866577, + "learning_rate": 8.353298177488832e-06, + "loss": 0.0806, + "step": 20775 + }, + { + "epoch": 56.61035422343324, + "grad_norm": 5.869809627532959, + "learning_rate": 8.35242773647756e-06, + "loss": 0.0627, + "step": 20776 + }, + { + "epoch": 56.61307901907357, + "grad_norm": 6.493967056274414, + "learning_rate": 8.35155730829753e-06, + "loss": 0.1159, + "step": 20777 + }, + { + "epoch": 56.6158038147139, + "grad_norm": 2.9832074642181396, + "learning_rate": 8.350686892955522e-06, + "loss": 0.1214, + "step": 20778 + }, + { + "epoch": 56.618528610354225, + "grad_norm": 3.689751386642456, + "learning_rate": 8.349816490458307e-06, + "loss": 0.2088, + "step": 20779 + }, + { + "epoch": 56.62125340599455, + "grad_norm": 5.616393089294434, + "learning_rate": 8.348946100812672e-06, + "loss": 0.1126, + "step": 20780 + }, + { + "epoch": 56.62397820163488, + "grad_norm": 6.355755805969238, + "learning_rate": 8.34807572402539e-06, + "loss": 0.1506, + "step": 20781 + }, + { + "epoch": 56.6267029972752, + "grad_norm": 4.0162672996521, + "learning_rate": 8.347205360103243e-06, + "loss": 0.0995, + "step": 20782 + }, + { + "epoch": 56.62942779291553, + "grad_norm": 4.354006767272949, + "learning_rate": 8.346335009053004e-06, + "loss": 0.1814, + "step": 20783 + }, + { + "epoch": 56.63215258855586, + "grad_norm": 4.109909534454346, + "learning_rate": 8.345464670881458e-06, + "loss": 0.1874, + "step": 20784 + }, + { + "epoch": 56.63487738419619, + "grad_norm": 3.7556591033935547, + "learning_rate": 8.344594345595377e-06, + "loss": 0.2412, + "step": 20785 + }, + { + "epoch": 56.63760217983651, + "grad_norm": 7.884458065032959, + "learning_rate": 8.343724033201544e-06, + "loss": 0.1487, + "step": 20786 + }, + { + "epoch": 56.64032697547684, + "grad_norm": 3.905724287033081, + "learning_rate": 8.342853733706733e-06, + "loss": 0.1255, + "step": 20787 + }, + { + "epoch": 56.643051771117165, + "grad_norm": 4.148049831390381, + "learning_rate": 8.341983447117725e-06, + "loss": 0.108, + "step": 20788 + }, + { + "epoch": 56.64577656675749, + "grad_norm": 4.072840690612793, + "learning_rate": 8.341113173441298e-06, + "loss": 0.096, + "step": 20789 + }, + { + "epoch": 56.64850136239782, + "grad_norm": 3.712479829788208, + "learning_rate": 8.340242912684225e-06, + "loss": 0.0745, + "step": 20790 + }, + { + "epoch": 56.65122615803815, + "grad_norm": 4.330201625823975, + "learning_rate": 8.33937266485329e-06, + "loss": 0.1308, + "step": 20791 + }, + { + "epoch": 56.653950953678475, + "grad_norm": 4.016898155212402, + "learning_rate": 8.338502429955264e-06, + "loss": 0.0759, + "step": 20792 + }, + { + "epoch": 56.6566757493188, + "grad_norm": 3.2190215587615967, + "learning_rate": 8.337632207996932e-06, + "loss": 0.1056, + "step": 20793 + }, + { + "epoch": 56.65940054495913, + "grad_norm": 4.42525053024292, + "learning_rate": 8.336761998985059e-06, + "loss": 0.0807, + "step": 20794 + }, + { + "epoch": 56.66212534059945, + "grad_norm": 3.3427927494049072, + "learning_rate": 8.335891802926435e-06, + "loss": 0.0768, + "step": 20795 + }, + { + "epoch": 56.664850136239785, + "grad_norm": 2.8755178451538086, + "learning_rate": 8.335021619827833e-06, + "loss": 0.1892, + "step": 20796 + }, + { + "epoch": 56.66757493188011, + "grad_norm": 4.551873683929443, + "learning_rate": 8.334151449696027e-06, + "loss": 0.1809, + "step": 20797 + }, + { + "epoch": 56.67029972752044, + "grad_norm": 3.6021249294281006, + "learning_rate": 8.333281292537799e-06, + "loss": 0.1102, + "step": 20798 + }, + { + "epoch": 56.67302452316076, + "grad_norm": 3.869985342025757, + "learning_rate": 8.33241114835992e-06, + "loss": 0.155, + "step": 20799 + }, + { + "epoch": 56.67574931880109, + "grad_norm": 4.747959613800049, + "learning_rate": 8.331541017169172e-06, + "loss": 0.0875, + "step": 20800 + }, + { + "epoch": 56.678474114441414, + "grad_norm": 3.290243148803711, + "learning_rate": 8.330670898972326e-06, + "loss": 0.0621, + "step": 20801 + }, + { + "epoch": 56.68119891008175, + "grad_norm": 4.514286041259766, + "learning_rate": 8.329800793776163e-06, + "loss": 0.0868, + "step": 20802 + }, + { + "epoch": 56.68392370572207, + "grad_norm": 3.982741117477417, + "learning_rate": 8.328930701587456e-06, + "loss": 0.0877, + "step": 20803 + }, + { + "epoch": 56.6866485013624, + "grad_norm": 5.891603946685791, + "learning_rate": 8.328060622412986e-06, + "loss": 0.0628, + "step": 20804 + }, + { + "epoch": 56.689373297002724, + "grad_norm": 4.320755481719971, + "learning_rate": 8.327190556259523e-06, + "loss": 0.0843, + "step": 20805 + }, + { + "epoch": 56.69209809264305, + "grad_norm": 3.407414674758911, + "learning_rate": 8.326320503133847e-06, + "loss": 0.0976, + "step": 20806 + }, + { + "epoch": 56.694822888283376, + "grad_norm": 3.5583882331848145, + "learning_rate": 8.325450463042733e-06, + "loss": 0.1037, + "step": 20807 + }, + { + "epoch": 56.69754768392371, + "grad_norm": 4.379970073699951, + "learning_rate": 8.324580435992959e-06, + "loss": 0.0786, + "step": 20808 + }, + { + "epoch": 56.700272479564035, + "grad_norm": 5.11167049407959, + "learning_rate": 8.323710421991295e-06, + "loss": 0.4112, + "step": 20809 + }, + { + "epoch": 56.70299727520436, + "grad_norm": 4.02913236618042, + "learning_rate": 8.32284042104452e-06, + "loss": 0.2831, + "step": 20810 + }, + { + "epoch": 56.705722070844686, + "grad_norm": 4.0310845375061035, + "learning_rate": 8.321970433159409e-06, + "loss": 0.0971, + "step": 20811 + }, + { + "epoch": 56.70844686648501, + "grad_norm": 3.525644063949585, + "learning_rate": 8.321100458342742e-06, + "loss": 0.0836, + "step": 20812 + }, + { + "epoch": 56.71117166212534, + "grad_norm": 4.3504958152771, + "learning_rate": 8.32023049660129e-06, + "loss": 0.1602, + "step": 20813 + }, + { + "epoch": 56.71389645776567, + "grad_norm": 3.7884342670440674, + "learning_rate": 8.319360547941828e-06, + "loss": 0.071, + "step": 20814 + }, + { + "epoch": 56.716621253406, + "grad_norm": 14.091556549072266, + "learning_rate": 8.318490612371132e-06, + "loss": 0.0971, + "step": 20815 + }, + { + "epoch": 56.71934604904632, + "grad_norm": 2.9496817588806152, + "learning_rate": 8.317620689895979e-06, + "loss": 0.0968, + "step": 20816 + }, + { + "epoch": 56.72207084468665, + "grad_norm": 3.5632452964782715, + "learning_rate": 8.316750780523139e-06, + "loss": 0.0613, + "step": 20817 + }, + { + "epoch": 56.724795640326974, + "grad_norm": 3.4774179458618164, + "learning_rate": 8.315880884259393e-06, + "loss": 0.1866, + "step": 20818 + }, + { + "epoch": 56.7275204359673, + "grad_norm": 6.17877197265625, + "learning_rate": 8.31501100111151e-06, + "loss": 0.1622, + "step": 20819 + }, + { + "epoch": 56.73024523160763, + "grad_norm": 4.434709548950195, + "learning_rate": 8.314141131086268e-06, + "loss": 0.2256, + "step": 20820 + }, + { + "epoch": 56.73297002724796, + "grad_norm": 5.374114036560059, + "learning_rate": 8.31327127419044e-06, + "loss": 0.2084, + "step": 20821 + }, + { + "epoch": 56.735694822888284, + "grad_norm": 4.9178595542907715, + "learning_rate": 8.312401430430802e-06, + "loss": 0.2069, + "step": 20822 + }, + { + "epoch": 56.73841961852861, + "grad_norm": 3.505828380584717, + "learning_rate": 8.311531599814125e-06, + "loss": 0.0871, + "step": 20823 + }, + { + "epoch": 56.741144414168936, + "grad_norm": 4.222629547119141, + "learning_rate": 8.310661782347189e-06, + "loss": 0.1207, + "step": 20824 + }, + { + "epoch": 56.74386920980926, + "grad_norm": 3.801757574081421, + "learning_rate": 8.309791978036762e-06, + "loss": 0.067, + "step": 20825 + }, + { + "epoch": 56.746594005449595, + "grad_norm": 3.894122838973999, + "learning_rate": 8.308922186889623e-06, + "loss": 0.2891, + "step": 20826 + }, + { + "epoch": 56.74931880108992, + "grad_norm": 3.1469714641571045, + "learning_rate": 8.308052408912541e-06, + "loss": 0.0763, + "step": 20827 + }, + { + "epoch": 56.752043596730246, + "grad_norm": 5.020132541656494, + "learning_rate": 8.307182644112291e-06, + "loss": 0.0999, + "step": 20828 + }, + { + "epoch": 56.75476839237057, + "grad_norm": 3.6829075813293457, + "learning_rate": 8.306312892495648e-06, + "loss": 0.0729, + "step": 20829 + }, + { + "epoch": 56.7574931880109, + "grad_norm": 5.328718185424805, + "learning_rate": 8.30544315406939e-06, + "loss": 0.0652, + "step": 20830 + }, + { + "epoch": 56.76021798365122, + "grad_norm": 3.8909647464752197, + "learning_rate": 8.304573428840284e-06, + "loss": 0.0955, + "step": 20831 + }, + { + "epoch": 56.762942779291556, + "grad_norm": 4.502145290374756, + "learning_rate": 8.303703716815108e-06, + "loss": 0.096, + "step": 20832 + }, + { + "epoch": 56.76566757493188, + "grad_norm": 5.859290599822998, + "learning_rate": 8.302834018000628e-06, + "loss": 0.2217, + "step": 20833 + }, + { + "epoch": 56.76839237057221, + "grad_norm": 7.264393329620361, + "learning_rate": 8.301964332403627e-06, + "loss": 0.2151, + "step": 20834 + }, + { + "epoch": 56.771117166212534, + "grad_norm": 3.542628288269043, + "learning_rate": 8.301094660030869e-06, + "loss": 0.0687, + "step": 20835 + }, + { + "epoch": 56.77384196185286, + "grad_norm": 3.1421024799346924, + "learning_rate": 8.300225000889135e-06, + "loss": 0.0777, + "step": 20836 + }, + { + "epoch": 56.776566757493185, + "grad_norm": 4.3368377685546875, + "learning_rate": 8.299355354985192e-06, + "loss": 0.0837, + "step": 20837 + }, + { + "epoch": 56.77929155313352, + "grad_norm": 4.881613731384277, + "learning_rate": 8.298485722325815e-06, + "loss": 0.1662, + "step": 20838 + }, + { + "epoch": 56.782016348773844, + "grad_norm": 7.901316165924072, + "learning_rate": 8.297616102917776e-06, + "loss": 0.1904, + "step": 20839 + }, + { + "epoch": 56.78474114441417, + "grad_norm": 4.116857528686523, + "learning_rate": 8.29674649676785e-06, + "loss": 0.1002, + "step": 20840 + }, + { + "epoch": 56.787465940054496, + "grad_norm": 3.000873327255249, + "learning_rate": 8.295876903882804e-06, + "loss": 0.0516, + "step": 20841 + }, + { + "epoch": 56.79019073569482, + "grad_norm": 3.8488805294036865, + "learning_rate": 8.295007324269417e-06, + "loss": 0.0744, + "step": 20842 + }, + { + "epoch": 56.79291553133515, + "grad_norm": 4.251661777496338, + "learning_rate": 8.294137757934456e-06, + "loss": 0.1279, + "step": 20843 + }, + { + "epoch": 56.79564032697548, + "grad_norm": 3.890658378601074, + "learning_rate": 8.293268204884696e-06, + "loss": 0.0802, + "step": 20844 + }, + { + "epoch": 56.798365122615806, + "grad_norm": 4.6637163162231445, + "learning_rate": 8.292398665126906e-06, + "loss": 0.1038, + "step": 20845 + }, + { + "epoch": 56.80108991825613, + "grad_norm": 4.350137233734131, + "learning_rate": 8.291529138667862e-06, + "loss": 0.1758, + "step": 20846 + }, + { + "epoch": 56.80381471389646, + "grad_norm": 3.3026187419891357, + "learning_rate": 8.290659625514336e-06, + "loss": 0.1161, + "step": 20847 + }, + { + "epoch": 56.80653950953678, + "grad_norm": 3.4914233684539795, + "learning_rate": 8.289790125673095e-06, + "loss": 0.1193, + "step": 20848 + }, + { + "epoch": 56.80926430517711, + "grad_norm": 4.479560375213623, + "learning_rate": 8.288920639150915e-06, + "loss": 0.0678, + "step": 20849 + }, + { + "epoch": 56.81198910081744, + "grad_norm": 3.654784679412842, + "learning_rate": 8.288051165954566e-06, + "loss": 0.1295, + "step": 20850 + }, + { + "epoch": 56.81471389645777, + "grad_norm": 3.607421875, + "learning_rate": 8.28718170609082e-06, + "loss": 0.1604, + "step": 20851 + }, + { + "epoch": 56.817438692098094, + "grad_norm": 4.677554130554199, + "learning_rate": 8.286312259566445e-06, + "loss": 0.0532, + "step": 20852 + }, + { + "epoch": 56.82016348773842, + "grad_norm": 4.797582149505615, + "learning_rate": 8.285442826388217e-06, + "loss": 0.1041, + "step": 20853 + }, + { + "epoch": 56.822888283378745, + "grad_norm": 4.3747663497924805, + "learning_rate": 8.284573406562906e-06, + "loss": 0.2096, + "step": 20854 + }, + { + "epoch": 56.82561307901907, + "grad_norm": 5.039104461669922, + "learning_rate": 8.283704000097281e-06, + "loss": 0.0731, + "step": 20855 + }, + { + "epoch": 56.828337874659404, + "grad_norm": 6.823355674743652, + "learning_rate": 8.282834606998114e-06, + "loss": 0.1905, + "step": 20856 + }, + { + "epoch": 56.83106267029973, + "grad_norm": 3.110656261444092, + "learning_rate": 8.281965227272176e-06, + "loss": 0.0642, + "step": 20857 + }, + { + "epoch": 56.833787465940055, + "grad_norm": 5.17993688583374, + "learning_rate": 8.281095860926238e-06, + "loss": 0.1422, + "step": 20858 + }, + { + "epoch": 56.83651226158038, + "grad_norm": 3.290844678878784, + "learning_rate": 8.280226507967068e-06, + "loss": 0.0627, + "step": 20859 + }, + { + "epoch": 56.83923705722071, + "grad_norm": 4.022027492523193, + "learning_rate": 8.279357168401442e-06, + "loss": 0.0629, + "step": 20860 + }, + { + "epoch": 56.84196185286103, + "grad_norm": 3.564958095550537, + "learning_rate": 8.278487842236125e-06, + "loss": 0.1541, + "step": 20861 + }, + { + "epoch": 56.844686648501366, + "grad_norm": 5.737844944000244, + "learning_rate": 8.277618529477886e-06, + "loss": 0.1378, + "step": 20862 + }, + { + "epoch": 56.84741144414169, + "grad_norm": 3.8045578002929688, + "learning_rate": 8.276749230133503e-06, + "loss": 0.0741, + "step": 20863 + }, + { + "epoch": 56.85013623978202, + "grad_norm": 3.8062503337860107, + "learning_rate": 8.27587994420974e-06, + "loss": 0.2534, + "step": 20864 + }, + { + "epoch": 56.85286103542234, + "grad_norm": 4.266364574432373, + "learning_rate": 8.27501067171337e-06, + "loss": 0.0873, + "step": 20865 + }, + { + "epoch": 56.85558583106267, + "grad_norm": 3.5831804275512695, + "learning_rate": 8.27414141265116e-06, + "loss": 0.1219, + "step": 20866 + }, + { + "epoch": 56.858310626702995, + "grad_norm": 4.1305131912231445, + "learning_rate": 8.273272167029882e-06, + "loss": 0.1514, + "step": 20867 + }, + { + "epoch": 56.86103542234333, + "grad_norm": 4.11383581161499, + "learning_rate": 8.272402934856302e-06, + "loss": 0.1572, + "step": 20868 + }, + { + "epoch": 56.86376021798365, + "grad_norm": 6.590770721435547, + "learning_rate": 8.271533716137196e-06, + "loss": 0.1691, + "step": 20869 + }, + { + "epoch": 56.86648501362398, + "grad_norm": 3.7014214992523193, + "learning_rate": 8.270664510879328e-06, + "loss": 0.0933, + "step": 20870 + }, + { + "epoch": 56.869209809264305, + "grad_norm": 5.859397888183594, + "learning_rate": 8.269795319089471e-06, + "loss": 0.0823, + "step": 20871 + }, + { + "epoch": 56.87193460490463, + "grad_norm": 5.130993366241455, + "learning_rate": 8.26892614077439e-06, + "loss": 0.2859, + "step": 20872 + }, + { + "epoch": 56.87465940054496, + "grad_norm": 3.934887170791626, + "learning_rate": 8.26805697594086e-06, + "loss": 0.0851, + "step": 20873 + }, + { + "epoch": 56.87738419618529, + "grad_norm": 4.152246475219727, + "learning_rate": 8.267187824595641e-06, + "loss": 0.1747, + "step": 20874 + }, + { + "epoch": 56.880108991825615, + "grad_norm": 3.5175857543945312, + "learning_rate": 8.26631868674551e-06, + "loss": 0.0463, + "step": 20875 + }, + { + "epoch": 56.88283378746594, + "grad_norm": 3.765432357788086, + "learning_rate": 8.265449562397235e-06, + "loss": 0.0878, + "step": 20876 + }, + { + "epoch": 56.88555858310627, + "grad_norm": 4.602232933044434, + "learning_rate": 8.26458045155758e-06, + "loss": 0.0716, + "step": 20877 + }, + { + "epoch": 56.88828337874659, + "grad_norm": 4.033105373382568, + "learning_rate": 8.26371135423332e-06, + "loss": 0.1735, + "step": 20878 + }, + { + "epoch": 56.89100817438692, + "grad_norm": 3.979550838470459, + "learning_rate": 8.262842270431218e-06, + "loss": 0.0935, + "step": 20879 + }, + { + "epoch": 56.89373297002725, + "grad_norm": 4.2078938484191895, + "learning_rate": 8.26197320015804e-06, + "loss": 0.0885, + "step": 20880 + }, + { + "epoch": 56.89645776566758, + "grad_norm": 4.143012046813965, + "learning_rate": 8.261104143420566e-06, + "loss": 0.1719, + "step": 20881 + }, + { + "epoch": 56.8991825613079, + "grad_norm": 3.549680471420288, + "learning_rate": 8.260235100225553e-06, + "loss": 0.1014, + "step": 20882 + }, + { + "epoch": 56.90190735694823, + "grad_norm": 4.424400806427002, + "learning_rate": 8.259366070579775e-06, + "loss": 0.2626, + "step": 20883 + }, + { + "epoch": 56.904632152588555, + "grad_norm": 3.190826892852783, + "learning_rate": 8.258497054489998e-06, + "loss": 0.0614, + "step": 20884 + }, + { + "epoch": 56.90735694822888, + "grad_norm": 4.439691066741943, + "learning_rate": 8.25762805196299e-06, + "loss": 0.0798, + "step": 20885 + }, + { + "epoch": 56.91008174386921, + "grad_norm": 4.760251522064209, + "learning_rate": 8.256759063005517e-06, + "loss": 0.1198, + "step": 20886 + }, + { + "epoch": 56.91280653950954, + "grad_norm": 3.8580844402313232, + "learning_rate": 8.255890087624352e-06, + "loss": 0.0949, + "step": 20887 + }, + { + "epoch": 56.915531335149865, + "grad_norm": 3.825615882873535, + "learning_rate": 8.255021125826255e-06, + "loss": 0.0951, + "step": 20888 + }, + { + "epoch": 56.91825613079019, + "grad_norm": 4.554897308349609, + "learning_rate": 8.254152177618e-06, + "loss": 0.0915, + "step": 20889 + }, + { + "epoch": 56.920980926430516, + "grad_norm": 3.0845141410827637, + "learning_rate": 8.253283243006349e-06, + "loss": 0.1355, + "step": 20890 + }, + { + "epoch": 56.92370572207084, + "grad_norm": 4.7472662925720215, + "learning_rate": 8.252414321998075e-06, + "loss": 0.0902, + "step": 20891 + }, + { + "epoch": 56.926430517711175, + "grad_norm": 3.4225594997406006, + "learning_rate": 8.25154541459994e-06, + "loss": 0.0618, + "step": 20892 + }, + { + "epoch": 56.9291553133515, + "grad_norm": 4.021973609924316, + "learning_rate": 8.250676520818712e-06, + "loss": 0.1459, + "step": 20893 + }, + { + "epoch": 56.93188010899183, + "grad_norm": 4.833191394805908, + "learning_rate": 8.24980764066116e-06, + "loss": 0.2345, + "step": 20894 + }, + { + "epoch": 56.93460490463215, + "grad_norm": 4.990149974822998, + "learning_rate": 8.248938774134052e-06, + "loss": 0.123, + "step": 20895 + }, + { + "epoch": 56.93732970027248, + "grad_norm": 4.602786540985107, + "learning_rate": 8.248069921244148e-06, + "loss": 0.136, + "step": 20896 + }, + { + "epoch": 56.940054495912804, + "grad_norm": 3.887037515640259, + "learning_rate": 8.247201081998218e-06, + "loss": 0.1327, + "step": 20897 + }, + { + "epoch": 56.94277929155314, + "grad_norm": 3.8991174697875977, + "learning_rate": 8.246332256403033e-06, + "loss": 0.148, + "step": 20898 + }, + { + "epoch": 56.94550408719346, + "grad_norm": 5.6237993240356445, + "learning_rate": 8.245463444465357e-06, + "loss": 0.176, + "step": 20899 + }, + { + "epoch": 56.94822888283379, + "grad_norm": 3.590494394302368, + "learning_rate": 8.244594646191953e-06, + "loss": 0.1345, + "step": 20900 + }, + { + "epoch": 56.950953678474114, + "grad_norm": 3.9823145866394043, + "learning_rate": 8.243725861589592e-06, + "loss": 0.1468, + "step": 20901 + }, + { + "epoch": 56.95367847411444, + "grad_norm": 4.785423755645752, + "learning_rate": 8.242857090665036e-06, + "loss": 0.0687, + "step": 20902 + }, + { + "epoch": 56.956403269754766, + "grad_norm": 4.729231834411621, + "learning_rate": 8.241988333425052e-06, + "loss": 0.1528, + "step": 20903 + }, + { + "epoch": 56.95912806539509, + "grad_norm": 3.7704522609710693, + "learning_rate": 8.241119589876406e-06, + "loss": 0.1939, + "step": 20904 + }, + { + "epoch": 56.961852861035425, + "grad_norm": 4.724066734313965, + "learning_rate": 8.240250860025866e-06, + "loss": 0.0784, + "step": 20905 + }, + { + "epoch": 56.96457765667575, + "grad_norm": 3.4864683151245117, + "learning_rate": 8.239382143880195e-06, + "loss": 0.0798, + "step": 20906 + }, + { + "epoch": 56.967302452316076, + "grad_norm": 4.217945575714111, + "learning_rate": 8.238513441446158e-06, + "loss": 0.2088, + "step": 20907 + }, + { + "epoch": 56.9700272479564, + "grad_norm": 3.3189778327941895, + "learning_rate": 8.237644752730522e-06, + "loss": 0.0701, + "step": 20908 + }, + { + "epoch": 56.97275204359673, + "grad_norm": 3.262610912322998, + "learning_rate": 8.236776077740054e-06, + "loss": 0.0706, + "step": 20909 + }, + { + "epoch": 56.97547683923706, + "grad_norm": 5.687419414520264, + "learning_rate": 8.235907416481514e-06, + "loss": 0.1054, + "step": 20910 + }, + { + "epoch": 56.97820163487739, + "grad_norm": 3.3241074085235596, + "learning_rate": 8.235038768961672e-06, + "loss": 0.2147, + "step": 20911 + }, + { + "epoch": 56.98092643051771, + "grad_norm": 4.45330810546875, + "learning_rate": 8.23417013518729e-06, + "loss": 0.0628, + "step": 20912 + }, + { + "epoch": 56.98365122615804, + "grad_norm": 4.936892509460449, + "learning_rate": 8.233301515165138e-06, + "loss": 0.1097, + "step": 20913 + }, + { + "epoch": 56.986376021798364, + "grad_norm": 3.4377126693725586, + "learning_rate": 8.23243290890197e-06, + "loss": 0.0554, + "step": 20914 + }, + { + "epoch": 56.98910081743869, + "grad_norm": 4.021442413330078, + "learning_rate": 8.23156431640456e-06, + "loss": 0.1718, + "step": 20915 + }, + { + "epoch": 56.991825613079016, + "grad_norm": 5.111627101898193, + "learning_rate": 8.230695737679671e-06, + "loss": 0.0534, + "step": 20916 + }, + { + "epoch": 56.99455040871935, + "grad_norm": 4.411771297454834, + "learning_rate": 8.229827172734068e-06, + "loss": 0.303, + "step": 20917 + }, + { + "epoch": 56.997275204359674, + "grad_norm": 4.301294803619385, + "learning_rate": 8.228958621574514e-06, + "loss": 0.2108, + "step": 20918 + }, + { + "epoch": 57.0, + "grad_norm": 3.4039785861968994, + "learning_rate": 8.228090084207773e-06, + "loss": 0.0957, + "step": 20919 + }, + { + "epoch": 57.002724795640326, + "grad_norm": 4.393790245056152, + "learning_rate": 8.227221560640609e-06, + "loss": 0.1562, + "step": 20920 + }, + { + "epoch": 57.00544959128065, + "grad_norm": 3.451871395111084, + "learning_rate": 8.226353050879788e-06, + "loss": 0.0594, + "step": 20921 + }, + { + "epoch": 57.00817438692098, + "grad_norm": 3.661106586456299, + "learning_rate": 8.225484554932069e-06, + "loss": 0.0763, + "step": 20922 + }, + { + "epoch": 57.01089918256131, + "grad_norm": 5.8789167404174805, + "learning_rate": 8.224616072804223e-06, + "loss": 0.1362, + "step": 20923 + }, + { + "epoch": 57.013623978201636, + "grad_norm": 3.4945576190948486, + "learning_rate": 8.223747604503005e-06, + "loss": 0.0889, + "step": 20924 + }, + { + "epoch": 57.01634877384196, + "grad_norm": 4.172882080078125, + "learning_rate": 8.22287915003519e-06, + "loss": 0.1805, + "step": 20925 + }, + { + "epoch": 57.01907356948229, + "grad_norm": 3.1446330547332764, + "learning_rate": 8.22201070940753e-06, + "loss": 0.194, + "step": 20926 + }, + { + "epoch": 57.02179836512261, + "grad_norm": 4.150295257568359, + "learning_rate": 8.221142282626795e-06, + "loss": 0.1064, + "step": 20927 + }, + { + "epoch": 57.02452316076294, + "grad_norm": 5.671179294586182, + "learning_rate": 8.220273869699746e-06, + "loss": 0.0806, + "step": 20928 + }, + { + "epoch": 57.02724795640327, + "grad_norm": 4.209830284118652, + "learning_rate": 8.219405470633149e-06, + "loss": 0.1902, + "step": 20929 + }, + { + "epoch": 57.0299727520436, + "grad_norm": 5.202353477478027, + "learning_rate": 8.218537085433761e-06, + "loss": 0.1203, + "step": 20930 + }, + { + "epoch": 57.032697547683924, + "grad_norm": 2.7137610912323, + "learning_rate": 8.217668714108348e-06, + "loss": 0.0501, + "step": 20931 + }, + { + "epoch": 57.03542234332425, + "grad_norm": 3.73943829536438, + "learning_rate": 8.216800356663679e-06, + "loss": 0.1214, + "step": 20932 + }, + { + "epoch": 57.038147138964575, + "grad_norm": 4.07224702835083, + "learning_rate": 8.215932013106508e-06, + "loss": 0.1636, + "step": 20933 + }, + { + "epoch": 57.0408719346049, + "grad_norm": 3.760071277618408, + "learning_rate": 8.215063683443603e-06, + "loss": 0.1316, + "step": 20934 + }, + { + "epoch": 57.043596730245234, + "grad_norm": 3.020530939102173, + "learning_rate": 8.214195367681723e-06, + "loss": 0.0668, + "step": 20935 + }, + { + "epoch": 57.04632152588556, + "grad_norm": 6.602606773376465, + "learning_rate": 8.213327065827635e-06, + "loss": 0.092, + "step": 20936 + }, + { + "epoch": 57.049046321525886, + "grad_norm": 3.1322200298309326, + "learning_rate": 8.212458777888094e-06, + "loss": 0.0659, + "step": 20937 + }, + { + "epoch": 57.05177111716621, + "grad_norm": 3.437601327896118, + "learning_rate": 8.21159050386987e-06, + "loss": 0.0693, + "step": 20938 + }, + { + "epoch": 57.05449591280654, + "grad_norm": 3.798060178756714, + "learning_rate": 8.210722243779719e-06, + "loss": 0.1284, + "step": 20939 + }, + { + "epoch": 57.05722070844686, + "grad_norm": 4.102583885192871, + "learning_rate": 8.209853997624406e-06, + "loss": 0.0916, + "step": 20940 + }, + { + "epoch": 57.059945504087196, + "grad_norm": 5.362946510314941, + "learning_rate": 8.208985765410694e-06, + "loss": 0.1258, + "step": 20941 + }, + { + "epoch": 57.06267029972752, + "grad_norm": 3.262148380279541, + "learning_rate": 8.20811754714534e-06, + "loss": 0.067, + "step": 20942 + }, + { + "epoch": 57.06539509536785, + "grad_norm": 4.280355930328369, + "learning_rate": 8.207249342835114e-06, + "loss": 0.0927, + "step": 20943 + }, + { + "epoch": 57.06811989100817, + "grad_norm": 4.460330963134766, + "learning_rate": 8.206381152486769e-06, + "loss": 0.0997, + "step": 20944 + }, + { + "epoch": 57.0708446866485, + "grad_norm": 3.6226274967193604, + "learning_rate": 8.205512976107071e-06, + "loss": 0.0791, + "step": 20945 + }, + { + "epoch": 57.073569482288825, + "grad_norm": 2.9987363815307617, + "learning_rate": 8.204644813702778e-06, + "loss": 0.062, + "step": 20946 + }, + { + "epoch": 57.07629427792916, + "grad_norm": 3.7295479774475098, + "learning_rate": 8.203776665280656e-06, + "loss": 0.1054, + "step": 20947 + }, + { + "epoch": 57.079019073569484, + "grad_norm": 4.244683265686035, + "learning_rate": 8.202908530847463e-06, + "loss": 0.115, + "step": 20948 + }, + { + "epoch": 57.08174386920981, + "grad_norm": 4.423742771148682, + "learning_rate": 8.202040410409957e-06, + "loss": 0.244, + "step": 20949 + }, + { + "epoch": 57.084468664850135, + "grad_norm": 4.738261699676514, + "learning_rate": 8.201172303974907e-06, + "loss": 0.1805, + "step": 20950 + }, + { + "epoch": 57.08719346049046, + "grad_norm": 4.013214588165283, + "learning_rate": 8.200304211549066e-06, + "loss": 0.1277, + "step": 20951 + }, + { + "epoch": 57.08991825613079, + "grad_norm": 4.8289899826049805, + "learning_rate": 8.199436133139202e-06, + "loss": 0.1858, + "step": 20952 + }, + { + "epoch": 57.09264305177112, + "grad_norm": 3.8840034008026123, + "learning_rate": 8.198568068752069e-06, + "loss": 0.2074, + "step": 20953 + }, + { + "epoch": 57.095367847411445, + "grad_norm": 3.429579257965088, + "learning_rate": 8.19770001839443e-06, + "loss": 0.1578, + "step": 20954 + }, + { + "epoch": 57.09809264305177, + "grad_norm": 5.330948829650879, + "learning_rate": 8.196831982073044e-06, + "loss": 0.1479, + "step": 20955 + }, + { + "epoch": 57.1008174386921, + "grad_norm": 3.138073444366455, + "learning_rate": 8.195963959794675e-06, + "loss": 0.0659, + "step": 20956 + }, + { + "epoch": 57.10354223433242, + "grad_norm": 4.590211868286133, + "learning_rate": 8.19509595156608e-06, + "loss": 0.0611, + "step": 20957 + }, + { + "epoch": 57.10626702997275, + "grad_norm": 4.668395519256592, + "learning_rate": 8.19422795739402e-06, + "loss": 0.1441, + "step": 20958 + }, + { + "epoch": 57.10899182561308, + "grad_norm": 3.013331890106201, + "learning_rate": 8.193359977285252e-06, + "loss": 0.0626, + "step": 20959 + }, + { + "epoch": 57.11171662125341, + "grad_norm": 3.3874785900115967, + "learning_rate": 8.19249201124654e-06, + "loss": 0.1339, + "step": 20960 + }, + { + "epoch": 57.11444141689373, + "grad_norm": 4.477400779724121, + "learning_rate": 8.191624059284643e-06, + "loss": 0.2508, + "step": 20961 + }, + { + "epoch": 57.11716621253406, + "grad_norm": 3.449695348739624, + "learning_rate": 8.190756121406317e-06, + "loss": 0.0629, + "step": 20962 + }, + { + "epoch": 57.119891008174385, + "grad_norm": 3.6937551498413086, + "learning_rate": 8.189888197618326e-06, + "loss": 0.1012, + "step": 20963 + }, + { + "epoch": 57.12261580381471, + "grad_norm": 4.387967586517334, + "learning_rate": 8.189020287927428e-06, + "loss": 0.0852, + "step": 20964 + }, + { + "epoch": 57.12534059945504, + "grad_norm": 3.6131112575531006, + "learning_rate": 8.18815239234038e-06, + "loss": 0.0723, + "step": 20965 + }, + { + "epoch": 57.12806539509537, + "grad_norm": 3.1580309867858887, + "learning_rate": 8.187284510863943e-06, + "loss": 0.132, + "step": 20966 + }, + { + "epoch": 57.130790190735695, + "grad_norm": 3.4441542625427246, + "learning_rate": 8.186416643504874e-06, + "loss": 0.1683, + "step": 20967 + }, + { + "epoch": 57.13351498637602, + "grad_norm": 3.049184799194336, + "learning_rate": 8.185548790269937e-06, + "loss": 0.0765, + "step": 20968 + }, + { + "epoch": 57.13623978201635, + "grad_norm": 3.3789780139923096, + "learning_rate": 8.184680951165887e-06, + "loss": 0.0705, + "step": 20969 + }, + { + "epoch": 57.13896457765667, + "grad_norm": 3.8413381576538086, + "learning_rate": 8.183813126199485e-06, + "loss": 0.0927, + "step": 20970 + }, + { + "epoch": 57.141689373297005, + "grad_norm": 3.9096827507019043, + "learning_rate": 8.182945315377484e-06, + "loss": 0.1362, + "step": 20971 + }, + { + "epoch": 57.14441416893733, + "grad_norm": 4.063755989074707, + "learning_rate": 8.18207751870665e-06, + "loss": 0.1608, + "step": 20972 + }, + { + "epoch": 57.14713896457766, + "grad_norm": 3.655320405960083, + "learning_rate": 8.181209736193736e-06, + "loss": 0.0954, + "step": 20973 + }, + { + "epoch": 57.14986376021798, + "grad_norm": 3.309751272201538, + "learning_rate": 8.180341967845505e-06, + "loss": 0.1083, + "step": 20974 + }, + { + "epoch": 57.15258855585831, + "grad_norm": 5.1634979248046875, + "learning_rate": 8.179474213668709e-06, + "loss": 0.1171, + "step": 20975 + }, + { + "epoch": 57.155313351498634, + "grad_norm": 3.713399887084961, + "learning_rate": 8.17860647367011e-06, + "loss": 0.1329, + "step": 20976 + }, + { + "epoch": 57.15803814713897, + "grad_norm": 3.0816543102264404, + "learning_rate": 8.177738747856464e-06, + "loss": 0.069, + "step": 20977 + }, + { + "epoch": 57.16076294277929, + "grad_norm": 3.5811123847961426, + "learning_rate": 8.176871036234533e-06, + "loss": 0.0922, + "step": 20978 + }, + { + "epoch": 57.16348773841962, + "grad_norm": 3.7834033966064453, + "learning_rate": 8.176003338811069e-06, + "loss": 0.1462, + "step": 20979 + }, + { + "epoch": 57.166212534059945, + "grad_norm": 3.9214141368865967, + "learning_rate": 8.175135655592833e-06, + "loss": 0.1544, + "step": 20980 + }, + { + "epoch": 57.16893732970027, + "grad_norm": 3.1623823642730713, + "learning_rate": 8.17426798658658e-06, + "loss": 0.0527, + "step": 20981 + }, + { + "epoch": 57.171662125340596, + "grad_norm": 14.0775146484375, + "learning_rate": 8.173400331799072e-06, + "loss": 0.1046, + "step": 20982 + }, + { + "epoch": 57.17438692098093, + "grad_norm": 4.159304618835449, + "learning_rate": 8.172532691237058e-06, + "loss": 0.1219, + "step": 20983 + }, + { + "epoch": 57.177111716621255, + "grad_norm": 4.568202018737793, + "learning_rate": 8.171665064907306e-06, + "loss": 0.1168, + "step": 20984 + }, + { + "epoch": 57.17983651226158, + "grad_norm": 2.868018865585327, + "learning_rate": 8.170797452816566e-06, + "loss": 0.0655, + "step": 20985 + }, + { + "epoch": 57.182561307901906, + "grad_norm": 3.5403952598571777, + "learning_rate": 8.169929854971598e-06, + "loss": 0.1954, + "step": 20986 + }, + { + "epoch": 57.18528610354223, + "grad_norm": 7.548911094665527, + "learning_rate": 8.169062271379155e-06, + "loss": 0.201, + "step": 20987 + }, + { + "epoch": 57.18801089918256, + "grad_norm": 3.3708622455596924, + "learning_rate": 8.168194702046e-06, + "loss": 0.0669, + "step": 20988 + }, + { + "epoch": 57.19073569482289, + "grad_norm": 3.5939998626708984, + "learning_rate": 8.167327146978883e-06, + "loss": 0.0934, + "step": 20989 + }, + { + "epoch": 57.19346049046322, + "grad_norm": 3.2615737915039062, + "learning_rate": 8.166459606184565e-06, + "loss": 0.0636, + "step": 20990 + }, + { + "epoch": 57.19618528610354, + "grad_norm": 4.119452476501465, + "learning_rate": 8.165592079669798e-06, + "loss": 0.1014, + "step": 20991 + }, + { + "epoch": 57.19891008174387, + "grad_norm": 2.944352388381958, + "learning_rate": 8.164724567441343e-06, + "loss": 0.1998, + "step": 20992 + }, + { + "epoch": 57.201634877384194, + "grad_norm": 3.481367826461792, + "learning_rate": 8.163857069505952e-06, + "loss": 0.1698, + "step": 20993 + }, + { + "epoch": 57.20435967302452, + "grad_norm": 3.1614503860473633, + "learning_rate": 8.162989585870385e-06, + "loss": 0.1418, + "step": 20994 + }, + { + "epoch": 57.20708446866485, + "grad_norm": 4.005900859832764, + "learning_rate": 8.162122116541394e-06, + "loss": 0.1592, + "step": 20995 + }, + { + "epoch": 57.20980926430518, + "grad_norm": 3.480644702911377, + "learning_rate": 8.161254661525739e-06, + "loss": 0.095, + "step": 20996 + }, + { + "epoch": 57.212534059945504, + "grad_norm": 3.2617340087890625, + "learning_rate": 8.160387220830172e-06, + "loss": 0.1094, + "step": 20997 + }, + { + "epoch": 57.21525885558583, + "grad_norm": 4.810868740081787, + "learning_rate": 8.159519794461452e-06, + "loss": 0.109, + "step": 20998 + }, + { + "epoch": 57.217983651226156, + "grad_norm": 2.804990291595459, + "learning_rate": 8.158652382426328e-06, + "loss": 0.1342, + "step": 20999 + }, + { + "epoch": 57.22070844686648, + "grad_norm": 17.00299644470215, + "learning_rate": 8.157784984731561e-06, + "loss": 0.1707, + "step": 21000 + }, + { + "epoch": 57.223433242506815, + "grad_norm": 4.369019031524658, + "learning_rate": 8.156917601383909e-06, + "loss": 0.1973, + "step": 21001 + }, + { + "epoch": 57.22615803814714, + "grad_norm": 3.4167332649230957, + "learning_rate": 8.156050232390121e-06, + "loss": 0.1066, + "step": 21002 + }, + { + "epoch": 57.228882833787466, + "grad_norm": 6.498249053955078, + "learning_rate": 8.155182877756953e-06, + "loss": 0.2003, + "step": 21003 + }, + { + "epoch": 57.23160762942779, + "grad_norm": 25.307979583740234, + "learning_rate": 8.154315537491166e-06, + "loss": 0.136, + "step": 21004 + }, + { + "epoch": 57.23433242506812, + "grad_norm": 3.269639492034912, + "learning_rate": 8.153448211599506e-06, + "loss": 0.1138, + "step": 21005 + }, + { + "epoch": 57.237057220708444, + "grad_norm": 3.17785906791687, + "learning_rate": 8.152580900088735e-06, + "loss": 0.0825, + "step": 21006 + }, + { + "epoch": 57.23978201634878, + "grad_norm": 3.8047120571136475, + "learning_rate": 8.151713602965602e-06, + "loss": 0.1321, + "step": 21007 + }, + { + "epoch": 57.2425068119891, + "grad_norm": 2.9458749294281006, + "learning_rate": 8.150846320236866e-06, + "loss": 0.1597, + "step": 21008 + }, + { + "epoch": 57.24523160762943, + "grad_norm": 4.262577533721924, + "learning_rate": 8.149979051909278e-06, + "loss": 0.0785, + "step": 21009 + }, + { + "epoch": 57.247956403269754, + "grad_norm": 4.848487854003906, + "learning_rate": 8.149111797989595e-06, + "loss": 0.1172, + "step": 21010 + }, + { + "epoch": 57.25068119891008, + "grad_norm": 6.822971820831299, + "learning_rate": 8.148244558484568e-06, + "loss": 0.1364, + "step": 21011 + }, + { + "epoch": 57.253405994550405, + "grad_norm": 4.221641540527344, + "learning_rate": 8.147377333400955e-06, + "loss": 0.0943, + "step": 21012 + }, + { + "epoch": 57.25613079019074, + "grad_norm": 3.7261950969696045, + "learning_rate": 8.146510122745504e-06, + "loss": 0.1605, + "step": 21013 + }, + { + "epoch": 57.258855585831064, + "grad_norm": 4.5704345703125, + "learning_rate": 8.145642926524977e-06, + "loss": 0.0632, + "step": 21014 + }, + { + "epoch": 57.26158038147139, + "grad_norm": 4.229184150695801, + "learning_rate": 8.14477574474612e-06, + "loss": 0.0648, + "step": 21015 + }, + { + "epoch": 57.264305177111716, + "grad_norm": 3.4966213703155518, + "learning_rate": 8.143908577415691e-06, + "loss": 0.0934, + "step": 21016 + }, + { + "epoch": 57.26702997275204, + "grad_norm": 4.787452220916748, + "learning_rate": 8.14304142454044e-06, + "loss": 0.1329, + "step": 21017 + }, + { + "epoch": 57.26975476839237, + "grad_norm": 5.035547733306885, + "learning_rate": 8.142174286127123e-06, + "loss": 0.0921, + "step": 21018 + }, + { + "epoch": 57.2724795640327, + "grad_norm": 3.683725118637085, + "learning_rate": 8.141307162182496e-06, + "loss": 0.0705, + "step": 21019 + }, + { + "epoch": 57.275204359673026, + "grad_norm": 4.442389488220215, + "learning_rate": 8.140440052713307e-06, + "loss": 0.241, + "step": 21020 + }, + { + "epoch": 57.27792915531335, + "grad_norm": 3.7261180877685547, + "learning_rate": 8.139572957726312e-06, + "loss": 0.0714, + "step": 21021 + }, + { + "epoch": 57.28065395095368, + "grad_norm": 3.876488447189331, + "learning_rate": 8.138705877228262e-06, + "loss": 0.2101, + "step": 21022 + }, + { + "epoch": 57.283378746594, + "grad_norm": 5.133909702301025, + "learning_rate": 8.137838811225913e-06, + "loss": 0.116, + "step": 21023 + }, + { + "epoch": 57.28610354223433, + "grad_norm": 4.60747766494751, + "learning_rate": 8.136971759726011e-06, + "loss": 0.1487, + "step": 21024 + }, + { + "epoch": 57.28882833787466, + "grad_norm": 4.002742767333984, + "learning_rate": 8.136104722735317e-06, + "loss": 0.0709, + "step": 21025 + }, + { + "epoch": 57.29155313351499, + "grad_norm": 3.7660610675811768, + "learning_rate": 8.135237700260578e-06, + "loss": 0.0797, + "step": 21026 + }, + { + "epoch": 57.294277929155314, + "grad_norm": 4.8447465896606445, + "learning_rate": 8.134370692308547e-06, + "loss": 0.1175, + "step": 21027 + }, + { + "epoch": 57.29700272479564, + "grad_norm": 4.493288993835449, + "learning_rate": 8.133503698885978e-06, + "loss": 0.2296, + "step": 21028 + }, + { + "epoch": 57.299727520435965, + "grad_norm": 30.658430099487305, + "learning_rate": 8.132636719999622e-06, + "loss": 0.0807, + "step": 21029 + }, + { + "epoch": 57.30245231607629, + "grad_norm": 3.621741771697998, + "learning_rate": 8.131769755656231e-06, + "loss": 0.0795, + "step": 21030 + }, + { + "epoch": 57.305177111716624, + "grad_norm": 3.7663137912750244, + "learning_rate": 8.130902805862556e-06, + "loss": 0.1682, + "step": 21031 + }, + { + "epoch": 57.30790190735695, + "grad_norm": 6.516160488128662, + "learning_rate": 8.130035870625352e-06, + "loss": 0.0639, + "step": 21032 + }, + { + "epoch": 57.310626702997276, + "grad_norm": 3.108703136444092, + "learning_rate": 8.129168949951368e-06, + "loss": 0.1736, + "step": 21033 + }, + { + "epoch": 57.3133514986376, + "grad_norm": 2.8198657035827637, + "learning_rate": 8.128302043847355e-06, + "loss": 0.0448, + "step": 21034 + }, + { + "epoch": 57.31607629427793, + "grad_norm": 2.566166639328003, + "learning_rate": 8.127435152320061e-06, + "loss": 0.0431, + "step": 21035 + }, + { + "epoch": 57.31880108991825, + "grad_norm": 6.921756267547607, + "learning_rate": 8.126568275376247e-06, + "loss": 0.1104, + "step": 21036 + }, + { + "epoch": 57.321525885558586, + "grad_norm": 4.090224266052246, + "learning_rate": 8.125701413022659e-06, + "loss": 0.2506, + "step": 21037 + }, + { + "epoch": 57.32425068119891, + "grad_norm": 3.300335645675659, + "learning_rate": 8.124834565266048e-06, + "loss": 0.0638, + "step": 21038 + }, + { + "epoch": 57.32697547683924, + "grad_norm": 4.812459945678711, + "learning_rate": 8.123967732113165e-06, + "loss": 0.1904, + "step": 21039 + }, + { + "epoch": 57.32970027247956, + "grad_norm": 3.0873422622680664, + "learning_rate": 8.12310091357076e-06, + "loss": 0.0469, + "step": 21040 + }, + { + "epoch": 57.33242506811989, + "grad_norm": 3.7849323749542236, + "learning_rate": 8.122234109645586e-06, + "loss": 0.1019, + "step": 21041 + }, + { + "epoch": 57.335149863760215, + "grad_norm": 3.6425018310546875, + "learning_rate": 8.12136732034439e-06, + "loss": 0.1474, + "step": 21042 + }, + { + "epoch": 57.33787465940055, + "grad_norm": 4.636575698852539, + "learning_rate": 8.120500545673928e-06, + "loss": 0.0658, + "step": 21043 + }, + { + "epoch": 57.34059945504087, + "grad_norm": 3.2334156036376953, + "learning_rate": 8.119633785640944e-06, + "loss": 0.1799, + "step": 21044 + }, + { + "epoch": 57.3433242506812, + "grad_norm": 4.16218376159668, + "learning_rate": 8.118767040252196e-06, + "loss": 0.0955, + "step": 21045 + }, + { + "epoch": 57.346049046321525, + "grad_norm": 3.0309019088745117, + "learning_rate": 8.117900309514425e-06, + "loss": 0.0419, + "step": 21046 + }, + { + "epoch": 57.34877384196185, + "grad_norm": 3.9720096588134766, + "learning_rate": 8.117033593434389e-06, + "loss": 0.1225, + "step": 21047 + }, + { + "epoch": 57.35149863760218, + "grad_norm": 3.7392325401306152, + "learning_rate": 8.116166892018834e-06, + "loss": 0.0861, + "step": 21048 + }, + { + "epoch": 57.35422343324251, + "grad_norm": 4.26577615737915, + "learning_rate": 8.115300205274508e-06, + "loss": 0.1512, + "step": 21049 + }, + { + "epoch": 57.356948228882835, + "grad_norm": 3.7570958137512207, + "learning_rate": 8.114433533208165e-06, + "loss": 0.13, + "step": 21050 + }, + { + "epoch": 57.35967302452316, + "grad_norm": 4.121349811553955, + "learning_rate": 8.113566875826553e-06, + "loss": 0.2045, + "step": 21051 + }, + { + "epoch": 57.36239782016349, + "grad_norm": 5.072442531585693, + "learning_rate": 8.11270023313642e-06, + "loss": 0.0885, + "step": 21052 + }, + { + "epoch": 57.36512261580381, + "grad_norm": 3.1366050243377686, + "learning_rate": 8.11183360514452e-06, + "loss": 0.0985, + "step": 21053 + }, + { + "epoch": 57.36784741144414, + "grad_norm": 4.402289390563965, + "learning_rate": 8.110966991857596e-06, + "loss": 0.1637, + "step": 21054 + }, + { + "epoch": 57.37057220708447, + "grad_norm": 3.750377893447876, + "learning_rate": 8.110100393282402e-06, + "loss": 0.0972, + "step": 21055 + }, + { + "epoch": 57.3732970027248, + "grad_norm": 6.2638773918151855, + "learning_rate": 8.109233809425686e-06, + "loss": 0.127, + "step": 21056 + }, + { + "epoch": 57.37602179836512, + "grad_norm": 4.752940654754639, + "learning_rate": 8.108367240294197e-06, + "loss": 0.2132, + "step": 21057 + }, + { + "epoch": 57.37874659400545, + "grad_norm": 3.561741590499878, + "learning_rate": 8.10750068589468e-06, + "loss": 0.0837, + "step": 21058 + }, + { + "epoch": 57.381471389645775, + "grad_norm": 5.152788162231445, + "learning_rate": 8.10663414623389e-06, + "loss": 0.1005, + "step": 21059 + }, + { + "epoch": 57.3841961852861, + "grad_norm": 4.3131489753723145, + "learning_rate": 8.10576762131857e-06, + "loss": 0.2148, + "step": 21060 + }, + { + "epoch": 57.38692098092643, + "grad_norm": 3.1346771717071533, + "learning_rate": 8.104901111155472e-06, + "loss": 0.081, + "step": 21061 + }, + { + "epoch": 57.38964577656676, + "grad_norm": 3.919673442840576, + "learning_rate": 8.104034615751343e-06, + "loss": 0.1024, + "step": 21062 + }, + { + "epoch": 57.392370572207085, + "grad_norm": 3.703479051589966, + "learning_rate": 8.103168135112932e-06, + "loss": 0.1538, + "step": 21063 + }, + { + "epoch": 57.39509536784741, + "grad_norm": 4.304934024810791, + "learning_rate": 8.102301669246984e-06, + "loss": 0.2611, + "step": 21064 + }, + { + "epoch": 57.39782016348774, + "grad_norm": 5.615895748138428, + "learning_rate": 8.101435218160253e-06, + "loss": 0.0922, + "step": 21065 + }, + { + "epoch": 57.40054495912806, + "grad_norm": 5.641123294830322, + "learning_rate": 8.10056878185948e-06, + "loss": 0.1476, + "step": 21066 + }, + { + "epoch": 57.403269754768395, + "grad_norm": 4.991501808166504, + "learning_rate": 8.09970236035142e-06, + "loss": 0.0636, + "step": 21067 + }, + { + "epoch": 57.40599455040872, + "grad_norm": 7.819751262664795, + "learning_rate": 8.098835953642813e-06, + "loss": 0.18, + "step": 21068 + }, + { + "epoch": 57.40871934604905, + "grad_norm": 3.9003374576568604, + "learning_rate": 8.097969561740409e-06, + "loss": 0.0832, + "step": 21069 + }, + { + "epoch": 57.41144414168937, + "grad_norm": 3.9136853218078613, + "learning_rate": 8.097103184650959e-06, + "loss": 0.0986, + "step": 21070 + }, + { + "epoch": 57.4141689373297, + "grad_norm": 4.419578552246094, + "learning_rate": 8.09623682238121e-06, + "loss": 0.0991, + "step": 21071 + }, + { + "epoch": 57.416893732970024, + "grad_norm": 4.347434997558594, + "learning_rate": 8.095370474937904e-06, + "loss": 0.0892, + "step": 21072 + }, + { + "epoch": 57.41961852861036, + "grad_norm": 7.327247619628906, + "learning_rate": 8.094504142327796e-06, + "loss": 0.1526, + "step": 21073 + }, + { + "epoch": 57.42234332425068, + "grad_norm": 4.945771217346191, + "learning_rate": 8.093637824557625e-06, + "loss": 0.1173, + "step": 21074 + }, + { + "epoch": 57.42506811989101, + "grad_norm": 4.112789154052734, + "learning_rate": 8.092771521634143e-06, + "loss": 0.093, + "step": 21075 + }, + { + "epoch": 57.427792915531334, + "grad_norm": 2.9911928176879883, + "learning_rate": 8.091905233564095e-06, + "loss": 0.0547, + "step": 21076 + }, + { + "epoch": 57.43051771117166, + "grad_norm": 11.361251831054688, + "learning_rate": 8.091038960354227e-06, + "loss": 0.0711, + "step": 21077 + }, + { + "epoch": 57.433242506811986, + "grad_norm": 2.9650349617004395, + "learning_rate": 8.090172702011287e-06, + "loss": 0.1761, + "step": 21078 + }, + { + "epoch": 57.43596730245232, + "grad_norm": 5.548549175262451, + "learning_rate": 8.08930645854202e-06, + "loss": 0.1474, + "step": 21079 + }, + { + "epoch": 57.438692098092645, + "grad_norm": 6.829399585723877, + "learning_rate": 8.088440229953172e-06, + "loss": 0.1011, + "step": 21080 + }, + { + "epoch": 57.44141689373297, + "grad_norm": 3.559237480163574, + "learning_rate": 8.087574016251492e-06, + "loss": 0.0824, + "step": 21081 + }, + { + "epoch": 57.444141689373296, + "grad_norm": 5.038529872894287, + "learning_rate": 8.086707817443722e-06, + "loss": 0.0856, + "step": 21082 + }, + { + "epoch": 57.44686648501362, + "grad_norm": 6.732036113739014, + "learning_rate": 8.085841633536611e-06, + "loss": 0.0751, + "step": 21083 + }, + { + "epoch": 57.44959128065395, + "grad_norm": 4.63095760345459, + "learning_rate": 8.084975464536902e-06, + "loss": 0.1056, + "step": 21084 + }, + { + "epoch": 57.45231607629428, + "grad_norm": 3.8541738986968994, + "learning_rate": 8.084109310451345e-06, + "loss": 0.1154, + "step": 21085 + }, + { + "epoch": 57.45504087193461, + "grad_norm": 4.783348560333252, + "learning_rate": 8.083243171286679e-06, + "loss": 0.387, + "step": 21086 + }, + { + "epoch": 57.45776566757493, + "grad_norm": 4.016456127166748, + "learning_rate": 8.082377047049654e-06, + "loss": 0.1227, + "step": 21087 + }, + { + "epoch": 57.46049046321526, + "grad_norm": 3.026258707046509, + "learning_rate": 8.08151093774702e-06, + "loss": 0.0905, + "step": 21088 + }, + { + "epoch": 57.463215258855584, + "grad_norm": 4.230606555938721, + "learning_rate": 8.080644843385512e-06, + "loss": 0.1961, + "step": 21089 + }, + { + "epoch": 57.46594005449591, + "grad_norm": 3.694626569747925, + "learning_rate": 8.079778763971882e-06, + "loss": 0.1383, + "step": 21090 + }, + { + "epoch": 57.46866485013624, + "grad_norm": 3.6818764209747314, + "learning_rate": 8.078912699512874e-06, + "loss": 0.1239, + "step": 21091 + }, + { + "epoch": 57.47138964577657, + "grad_norm": 3.8059468269348145, + "learning_rate": 8.07804665001523e-06, + "loss": 0.1128, + "step": 21092 + }, + { + "epoch": 57.474114441416894, + "grad_norm": 4.613978385925293, + "learning_rate": 8.0771806154857e-06, + "loss": 0.2063, + "step": 21093 + }, + { + "epoch": 57.47683923705722, + "grad_norm": 2.964661121368408, + "learning_rate": 8.076314595931024e-06, + "loss": 0.0482, + "step": 21094 + }, + { + "epoch": 57.479564032697546, + "grad_norm": 4.8119049072265625, + "learning_rate": 8.075448591357948e-06, + "loss": 0.0736, + "step": 21095 + }, + { + "epoch": 57.48228882833787, + "grad_norm": 4.246369361877441, + "learning_rate": 8.074582601773215e-06, + "loss": 0.0999, + "step": 21096 + }, + { + "epoch": 57.485013623978205, + "grad_norm": 3.5195250511169434, + "learning_rate": 8.073716627183575e-06, + "loss": 0.0621, + "step": 21097 + }, + { + "epoch": 57.48773841961853, + "grad_norm": 5.680939674377441, + "learning_rate": 8.072850667595763e-06, + "loss": 0.095, + "step": 21098 + }, + { + "epoch": 57.490463215258856, + "grad_norm": 3.6644961833953857, + "learning_rate": 8.071984723016532e-06, + "loss": 0.063, + "step": 21099 + }, + { + "epoch": 57.49318801089918, + "grad_norm": 3.7200732231140137, + "learning_rate": 8.071118793452618e-06, + "loss": 0.1048, + "step": 21100 + }, + { + "epoch": 57.49591280653951, + "grad_norm": 3.758270025253296, + "learning_rate": 8.070252878910771e-06, + "loss": 0.0762, + "step": 21101 + }, + { + "epoch": 57.49863760217983, + "grad_norm": 2.9253904819488525, + "learning_rate": 8.069386979397732e-06, + "loss": 0.1048, + "step": 21102 + }, + { + "epoch": 57.50136239782017, + "grad_norm": 4.1088714599609375, + "learning_rate": 8.068521094920242e-06, + "loss": 0.0957, + "step": 21103 + }, + { + "epoch": 57.50408719346049, + "grad_norm": 5.188478469848633, + "learning_rate": 8.067655225485052e-06, + "loss": 0.1402, + "step": 21104 + }, + { + "epoch": 57.50681198910082, + "grad_norm": 8.501290321350098, + "learning_rate": 8.066789371098899e-06, + "loss": 0.1355, + "step": 21105 + }, + { + "epoch": 57.509536784741144, + "grad_norm": 3.4538586139678955, + "learning_rate": 8.065923531768529e-06, + "loss": 0.0738, + "step": 21106 + }, + { + "epoch": 57.51226158038147, + "grad_norm": 3.281200647354126, + "learning_rate": 8.065057707500684e-06, + "loss": 0.1021, + "step": 21107 + }, + { + "epoch": 57.514986376021795, + "grad_norm": 4.295124530792236, + "learning_rate": 8.064191898302109e-06, + "loss": 0.2357, + "step": 21108 + }, + { + "epoch": 57.51771117166213, + "grad_norm": 4.262333869934082, + "learning_rate": 8.063326104179542e-06, + "loss": 0.0805, + "step": 21109 + }, + { + "epoch": 57.520435967302454, + "grad_norm": 4.151923179626465, + "learning_rate": 8.062460325139731e-06, + "loss": 0.0682, + "step": 21110 + }, + { + "epoch": 57.52316076294278, + "grad_norm": 3.6162490844726562, + "learning_rate": 8.061594561189417e-06, + "loss": 0.118, + "step": 21111 + }, + { + "epoch": 57.525885558583106, + "grad_norm": 4.753512859344482, + "learning_rate": 8.06072881233534e-06, + "loss": 0.1768, + "step": 21112 + }, + { + "epoch": 57.52861035422343, + "grad_norm": 7.29217529296875, + "learning_rate": 8.059863078584245e-06, + "loss": 0.1235, + "step": 21113 + }, + { + "epoch": 57.53133514986376, + "grad_norm": 3.687530040740967, + "learning_rate": 8.058997359942875e-06, + "loss": 0.1103, + "step": 21114 + }, + { + "epoch": 57.53405994550409, + "grad_norm": 3.6048548221588135, + "learning_rate": 8.058131656417972e-06, + "loss": 0.0726, + "step": 21115 + }, + { + "epoch": 57.536784741144416, + "grad_norm": 3.727325916290283, + "learning_rate": 8.057265968016275e-06, + "loss": 0.0839, + "step": 21116 + }, + { + "epoch": 57.53950953678474, + "grad_norm": 4.673880100250244, + "learning_rate": 8.056400294744531e-06, + "loss": 0.0867, + "step": 21117 + }, + { + "epoch": 57.54223433242507, + "grad_norm": 2.8797502517700195, + "learning_rate": 8.055534636609476e-06, + "loss": 0.0489, + "step": 21118 + }, + { + "epoch": 57.54495912806539, + "grad_norm": 4.70318603515625, + "learning_rate": 8.054668993617857e-06, + "loss": 0.1014, + "step": 21119 + }, + { + "epoch": 57.54768392370572, + "grad_norm": 4.084402084350586, + "learning_rate": 8.053803365776412e-06, + "loss": 0.1301, + "step": 21120 + }, + { + "epoch": 57.55040871934605, + "grad_norm": 3.4945762157440186, + "learning_rate": 8.052937753091879e-06, + "loss": 0.2309, + "step": 21121 + }, + { + "epoch": 57.55313351498638, + "grad_norm": 3.5946857929229736, + "learning_rate": 8.05207215557101e-06, + "loss": 0.1019, + "step": 21122 + }, + { + "epoch": 57.555858310626704, + "grad_norm": 4.264369010925293, + "learning_rate": 8.05120657322054e-06, + "loss": 0.2453, + "step": 21123 + }, + { + "epoch": 57.55858310626703, + "grad_norm": 5.001492500305176, + "learning_rate": 8.050341006047209e-06, + "loss": 0.2087, + "step": 21124 + }, + { + "epoch": 57.561307901907355, + "grad_norm": 4.087818622589111, + "learning_rate": 8.04947545405776e-06, + "loss": 0.097, + "step": 21125 + }, + { + "epoch": 57.56403269754768, + "grad_norm": 6.340839385986328, + "learning_rate": 8.048609917258935e-06, + "loss": 0.1306, + "step": 21126 + }, + { + "epoch": 57.566757493188014, + "grad_norm": 4.888052463531494, + "learning_rate": 8.047744395657471e-06, + "loss": 0.0972, + "step": 21127 + }, + { + "epoch": 57.56948228882834, + "grad_norm": 3.893559217453003, + "learning_rate": 8.046878889260112e-06, + "loss": 0.0995, + "step": 21128 + }, + { + "epoch": 57.572207084468666, + "grad_norm": 4.35330867767334, + "learning_rate": 8.046013398073597e-06, + "loss": 0.2851, + "step": 21129 + }, + { + "epoch": 57.57493188010899, + "grad_norm": 3.9809250831604004, + "learning_rate": 8.045147922104668e-06, + "loss": 0.0911, + "step": 21130 + }, + { + "epoch": 57.57765667574932, + "grad_norm": 3.5093841552734375, + "learning_rate": 8.044282461360062e-06, + "loss": 0.5028, + "step": 21131 + }, + { + "epoch": 57.58038147138964, + "grad_norm": 5.057225704193115, + "learning_rate": 8.043417015846523e-06, + "loss": 0.1298, + "step": 21132 + }, + { + "epoch": 57.583106267029976, + "grad_norm": 3.862987995147705, + "learning_rate": 8.042551585570787e-06, + "loss": 0.0906, + "step": 21133 + }, + { + "epoch": 57.5858310626703, + "grad_norm": 7.200356960296631, + "learning_rate": 8.041686170539599e-06, + "loss": 0.0996, + "step": 21134 + }, + { + "epoch": 57.58855585831063, + "grad_norm": 6.5382890701293945, + "learning_rate": 8.040820770759694e-06, + "loss": 0.1129, + "step": 21135 + }, + { + "epoch": 57.59128065395095, + "grad_norm": 6.598848342895508, + "learning_rate": 8.039955386237813e-06, + "loss": 0.0697, + "step": 21136 + }, + { + "epoch": 57.59400544959128, + "grad_norm": 5.061677932739258, + "learning_rate": 8.0390900169807e-06, + "loss": 0.1203, + "step": 21137 + }, + { + "epoch": 57.596730245231605, + "grad_norm": 6.442782878875732, + "learning_rate": 8.038224662995084e-06, + "loss": 0.1633, + "step": 21138 + }, + { + "epoch": 57.59945504087194, + "grad_norm": 5.684314250946045, + "learning_rate": 8.037359324287716e-06, + "loss": 0.1409, + "step": 21139 + }, + { + "epoch": 57.60217983651226, + "grad_norm": 4.345500946044922, + "learning_rate": 8.036494000865331e-06, + "loss": 0.1985, + "step": 21140 + }, + { + "epoch": 57.60490463215259, + "grad_norm": 3.5980756282806396, + "learning_rate": 8.035628692734666e-06, + "loss": 0.0802, + "step": 21141 + }, + { + "epoch": 57.607629427792915, + "grad_norm": 3.9551618099212646, + "learning_rate": 8.034763399902462e-06, + "loss": 0.2361, + "step": 21142 + }, + { + "epoch": 57.61035422343324, + "grad_norm": 4.956972122192383, + "learning_rate": 8.033898122375458e-06, + "loss": 0.0805, + "step": 21143 + }, + { + "epoch": 57.61307901907357, + "grad_norm": 2.717604160308838, + "learning_rate": 8.033032860160394e-06, + "loss": 0.0599, + "step": 21144 + }, + { + "epoch": 57.6158038147139, + "grad_norm": 3.742825984954834, + "learning_rate": 8.032167613264002e-06, + "loss": 0.0542, + "step": 21145 + }, + { + "epoch": 57.618528610354225, + "grad_norm": 5.366011142730713, + "learning_rate": 8.03130238169303e-06, + "loss": 0.1661, + "step": 21146 + }, + { + "epoch": 57.62125340599455, + "grad_norm": 4.602841854095459, + "learning_rate": 8.030437165454208e-06, + "loss": 0.1687, + "step": 21147 + }, + { + "epoch": 57.62397820163488, + "grad_norm": 4.1078362464904785, + "learning_rate": 8.029571964554282e-06, + "loss": 0.1252, + "step": 21148 + }, + { + "epoch": 57.6267029972752, + "grad_norm": 3.8847732543945312, + "learning_rate": 8.028706778999982e-06, + "loss": 0.0739, + "step": 21149 + }, + { + "epoch": 57.62942779291553, + "grad_norm": 4.712838649749756, + "learning_rate": 8.027841608798053e-06, + "loss": 0.1337, + "step": 21150 + }, + { + "epoch": 57.63215258855586, + "grad_norm": 4.490561008453369, + "learning_rate": 8.026976453955228e-06, + "loss": 0.07, + "step": 21151 + }, + { + "epoch": 57.63487738419619, + "grad_norm": 3.750500440597534, + "learning_rate": 8.026111314478249e-06, + "loss": 0.0686, + "step": 21152 + }, + { + "epoch": 57.63760217983651, + "grad_norm": 3.8146345615386963, + "learning_rate": 8.02524619037385e-06, + "loss": 0.0689, + "step": 21153 + }, + { + "epoch": 57.64032697547684, + "grad_norm": 6.2692718505859375, + "learning_rate": 8.02438108164877e-06, + "loss": 0.0755, + "step": 21154 + }, + { + "epoch": 57.643051771117165, + "grad_norm": 3.5104455947875977, + "learning_rate": 8.023515988309742e-06, + "loss": 0.0951, + "step": 21155 + }, + { + "epoch": 57.64577656675749, + "grad_norm": 5.580707550048828, + "learning_rate": 8.022650910363516e-06, + "loss": 0.1287, + "step": 21156 + }, + { + "epoch": 57.64850136239782, + "grad_norm": 3.445660352706909, + "learning_rate": 8.021785847816816e-06, + "loss": 0.1773, + "step": 21157 + }, + { + "epoch": 57.65122615803815, + "grad_norm": 4.380588054656982, + "learning_rate": 8.020920800676387e-06, + "loss": 0.1294, + "step": 21158 + }, + { + "epoch": 57.653950953678475, + "grad_norm": 7.622682094573975, + "learning_rate": 8.020055768948963e-06, + "loss": 0.257, + "step": 21159 + }, + { + "epoch": 57.6566757493188, + "grad_norm": 4.133795261383057, + "learning_rate": 8.01919075264128e-06, + "loss": 0.1186, + "step": 21160 + }, + { + "epoch": 57.65940054495913, + "grad_norm": 10.034468650817871, + "learning_rate": 8.018325751760075e-06, + "loss": 0.2248, + "step": 21161 + }, + { + "epoch": 57.66212534059945, + "grad_norm": 4.84804630279541, + "learning_rate": 8.017460766312088e-06, + "loss": 0.2466, + "step": 21162 + }, + { + "epoch": 57.664850136239785, + "grad_norm": 3.387465000152588, + "learning_rate": 8.01659579630405e-06, + "loss": 0.0704, + "step": 21163 + }, + { + "epoch": 57.66757493188011, + "grad_norm": 4.253676891326904, + "learning_rate": 8.015730841742702e-06, + "loss": 0.1156, + "step": 21164 + }, + { + "epoch": 57.67029972752044, + "grad_norm": 5.0305657386779785, + "learning_rate": 8.014865902634774e-06, + "loss": 0.1137, + "step": 21165 + }, + { + "epoch": 57.67302452316076, + "grad_norm": 3.5951809883117676, + "learning_rate": 8.014000978987013e-06, + "loss": 0.2383, + "step": 21166 + }, + { + "epoch": 57.67574931880109, + "grad_norm": 4.939373016357422, + "learning_rate": 8.013136070806143e-06, + "loss": 0.1463, + "step": 21167 + }, + { + "epoch": 57.678474114441414, + "grad_norm": 3.7658889293670654, + "learning_rate": 8.01227117809891e-06, + "loss": 0.0886, + "step": 21168 + }, + { + "epoch": 57.68119891008175, + "grad_norm": 6.335522174835205, + "learning_rate": 8.011406300872041e-06, + "loss": 0.2037, + "step": 21169 + }, + { + "epoch": 57.68392370572207, + "grad_norm": 4.378781318664551, + "learning_rate": 8.01054143913228e-06, + "loss": 0.1036, + "step": 21170 + }, + { + "epoch": 57.6866485013624, + "grad_norm": 3.1508800983428955, + "learning_rate": 8.009676592886353e-06, + "loss": 0.133, + "step": 21171 + }, + { + "epoch": 57.689373297002724, + "grad_norm": 3.9530043601989746, + "learning_rate": 8.008811762141e-06, + "loss": 0.0892, + "step": 21172 + }, + { + "epoch": 57.69209809264305, + "grad_norm": 5.408289432525635, + "learning_rate": 8.00794694690296e-06, + "loss": 0.1036, + "step": 21173 + }, + { + "epoch": 57.694822888283376, + "grad_norm": 4.0240278244018555, + "learning_rate": 8.007082147178967e-06, + "loss": 0.0761, + "step": 21174 + }, + { + "epoch": 57.69754768392371, + "grad_norm": 4.17277717590332, + "learning_rate": 8.006217362975752e-06, + "loss": 0.0883, + "step": 21175 + }, + { + "epoch": 57.700272479564035, + "grad_norm": 3.8516342639923096, + "learning_rate": 8.005352594300052e-06, + "loss": 0.1287, + "step": 21176 + }, + { + "epoch": 57.70299727520436, + "grad_norm": 3.2691752910614014, + "learning_rate": 8.004487841158601e-06, + "loss": 0.279, + "step": 21177 + }, + { + "epoch": 57.705722070844686, + "grad_norm": 4.902161121368408, + "learning_rate": 8.003623103558137e-06, + "loss": 0.1033, + "step": 21178 + }, + { + "epoch": 57.70844686648501, + "grad_norm": 4.927868843078613, + "learning_rate": 8.002758381505389e-06, + "loss": 0.1865, + "step": 21179 + }, + { + "epoch": 57.71117166212534, + "grad_norm": 3.784280300140381, + "learning_rate": 8.001893675007098e-06, + "loss": 0.0666, + "step": 21180 + }, + { + "epoch": 57.71389645776567, + "grad_norm": 5.653964996337891, + "learning_rate": 8.001028984069991e-06, + "loss": 0.0703, + "step": 21181 + }, + { + "epoch": 57.716621253406, + "grad_norm": 3.5887389183044434, + "learning_rate": 8.00016430870081e-06, + "loss": 0.0579, + "step": 21182 + }, + { + "epoch": 57.71934604904632, + "grad_norm": 3.9548680782318115, + "learning_rate": 7.999299648906281e-06, + "loss": 0.1167, + "step": 21183 + }, + { + "epoch": 57.72207084468665, + "grad_norm": 5.61143684387207, + "learning_rate": 7.998435004693144e-06, + "loss": 0.0734, + "step": 21184 + }, + { + "epoch": 57.724795640326974, + "grad_norm": 7.683944225311279, + "learning_rate": 7.99757037606813e-06, + "loss": 0.2285, + "step": 21185 + }, + { + "epoch": 57.7275204359673, + "grad_norm": 3.710585355758667, + "learning_rate": 7.996705763037975e-06, + "loss": 0.0516, + "step": 21186 + }, + { + "epoch": 57.73024523160763, + "grad_norm": 3.7653274536132812, + "learning_rate": 7.99584116560941e-06, + "loss": 0.0953, + "step": 21187 + }, + { + "epoch": 57.73297002724796, + "grad_norm": 3.338184118270874, + "learning_rate": 7.99497658378917e-06, + "loss": 0.1255, + "step": 21188 + }, + { + "epoch": 57.735694822888284, + "grad_norm": 3.2238829135894775, + "learning_rate": 7.994112017583984e-06, + "loss": 0.057, + "step": 21189 + }, + { + "epoch": 57.73841961852861, + "grad_norm": 3.815045118331909, + "learning_rate": 7.99324746700059e-06, + "loss": 0.216, + "step": 21190 + }, + { + "epoch": 57.741144414168936, + "grad_norm": 5.742342472076416, + "learning_rate": 7.992382932045726e-06, + "loss": 0.1826, + "step": 21191 + }, + { + "epoch": 57.74386920980926, + "grad_norm": 3.9520397186279297, + "learning_rate": 7.991518412726113e-06, + "loss": 0.0978, + "step": 21192 + }, + { + "epoch": 57.746594005449595, + "grad_norm": 3.801438808441162, + "learning_rate": 7.990653909048494e-06, + "loss": 0.0702, + "step": 21193 + }, + { + "epoch": 57.74931880108992, + "grad_norm": 5.18593168258667, + "learning_rate": 7.989789421019596e-06, + "loss": 0.1799, + "step": 21194 + }, + { + "epoch": 57.752043596730246, + "grad_norm": 13.383259773254395, + "learning_rate": 7.988924948646153e-06, + "loss": 0.1071, + "step": 21195 + }, + { + "epoch": 57.75476839237057, + "grad_norm": 3.170557737350464, + "learning_rate": 7.988060491934899e-06, + "loss": 0.1505, + "step": 21196 + }, + { + "epoch": 57.7574931880109, + "grad_norm": 4.092858791351318, + "learning_rate": 7.987196050892565e-06, + "loss": 0.0949, + "step": 21197 + }, + { + "epoch": 57.76021798365122, + "grad_norm": 3.719846487045288, + "learning_rate": 7.986331625525883e-06, + "loss": 0.0713, + "step": 21198 + }, + { + "epoch": 57.762942779291556, + "grad_norm": 3.993051528930664, + "learning_rate": 7.985467215841584e-06, + "loss": 0.1295, + "step": 21199 + }, + { + "epoch": 57.76566757493188, + "grad_norm": 3.3964996337890625, + "learning_rate": 7.984602821846404e-06, + "loss": 0.1053, + "step": 21200 + }, + { + "epoch": 57.76839237057221, + "grad_norm": 3.152707576751709, + "learning_rate": 7.983738443547068e-06, + "loss": 0.0612, + "step": 21201 + }, + { + "epoch": 57.771117166212534, + "grad_norm": 4.443272590637207, + "learning_rate": 7.982874080950319e-06, + "loss": 0.0838, + "step": 21202 + }, + { + "epoch": 57.77384196185286, + "grad_norm": 4.386751174926758, + "learning_rate": 7.982009734062876e-06, + "loss": 0.2328, + "step": 21203 + }, + { + "epoch": 57.776566757493185, + "grad_norm": 3.799968719482422, + "learning_rate": 7.98114540289148e-06, + "loss": 0.0868, + "step": 21204 + }, + { + "epoch": 57.77929155313352, + "grad_norm": 3.518902540206909, + "learning_rate": 7.980281087442855e-06, + "loss": 0.1107, + "step": 21205 + }, + { + "epoch": 57.782016348773844, + "grad_norm": 3.5291759967803955, + "learning_rate": 7.97941678772374e-06, + "loss": 0.0716, + "step": 21206 + }, + { + "epoch": 57.78474114441417, + "grad_norm": 3.9906630516052246, + "learning_rate": 7.978552503740855e-06, + "loss": 0.168, + "step": 21207 + }, + { + "epoch": 57.787465940054496, + "grad_norm": 3.3229517936706543, + "learning_rate": 7.977688235500942e-06, + "loss": 0.1101, + "step": 21208 + }, + { + "epoch": 57.79019073569482, + "grad_norm": 4.04408597946167, + "learning_rate": 7.97682398301073e-06, + "loss": 0.1445, + "step": 21209 + }, + { + "epoch": 57.79291553133515, + "grad_norm": 4.9350690841674805, + "learning_rate": 7.975959746276946e-06, + "loss": 0.2702, + "step": 21210 + }, + { + "epoch": 57.79564032697548, + "grad_norm": 4.619058609008789, + "learning_rate": 7.975095525306324e-06, + "loss": 0.0929, + "step": 21211 + }, + { + "epoch": 57.798365122615806, + "grad_norm": 4.2038679122924805, + "learning_rate": 7.97423132010559e-06, + "loss": 0.0711, + "step": 21212 + }, + { + "epoch": 57.80108991825613, + "grad_norm": 3.2375524044036865, + "learning_rate": 7.97336713068148e-06, + "loss": 0.0973, + "step": 21213 + }, + { + "epoch": 57.80381471389646, + "grad_norm": 3.6754302978515625, + "learning_rate": 7.97250295704072e-06, + "loss": 0.3182, + "step": 21214 + }, + { + "epoch": 57.80653950953678, + "grad_norm": 3.4124221801757812, + "learning_rate": 7.971638799190044e-06, + "loss": 0.1551, + "step": 21215 + }, + { + "epoch": 57.80926430517711, + "grad_norm": 3.6353249549865723, + "learning_rate": 7.970774657136177e-06, + "loss": 0.203, + "step": 21216 + }, + { + "epoch": 57.81198910081744, + "grad_norm": 5.511824607849121, + "learning_rate": 7.969910530885854e-06, + "loss": 0.1322, + "step": 21217 + }, + { + "epoch": 57.81471389645777, + "grad_norm": 6.8044633865356445, + "learning_rate": 7.9690464204458e-06, + "loss": 0.1543, + "step": 21218 + }, + { + "epoch": 57.817438692098094, + "grad_norm": 4.027974605560303, + "learning_rate": 7.968182325822748e-06, + "loss": 0.1423, + "step": 21219 + }, + { + "epoch": 57.82016348773842, + "grad_norm": 3.3240561485290527, + "learning_rate": 7.967318247023427e-06, + "loss": 0.0687, + "step": 21220 + }, + { + "epoch": 57.822888283378745, + "grad_norm": 3.256725311279297, + "learning_rate": 7.966454184054566e-06, + "loss": 0.049, + "step": 21221 + }, + { + "epoch": 57.82561307901907, + "grad_norm": 6.475952625274658, + "learning_rate": 7.965590136922894e-06, + "loss": 0.0575, + "step": 21222 + }, + { + "epoch": 57.828337874659404, + "grad_norm": 6.960272312164307, + "learning_rate": 7.96472610563514e-06, + "loss": 0.0667, + "step": 21223 + }, + { + "epoch": 57.83106267029973, + "grad_norm": 4.397171974182129, + "learning_rate": 7.96386209019803e-06, + "loss": 0.1421, + "step": 21224 + }, + { + "epoch": 57.833787465940055, + "grad_norm": 4.35145378112793, + "learning_rate": 7.962998090618303e-06, + "loss": 0.1062, + "step": 21225 + }, + { + "epoch": 57.83651226158038, + "grad_norm": 6.342430114746094, + "learning_rate": 7.962134106902679e-06, + "loss": 0.1545, + "step": 21226 + }, + { + "epoch": 57.83923705722071, + "grad_norm": 4.252971172332764, + "learning_rate": 7.961270139057891e-06, + "loss": 0.0715, + "step": 21227 + }, + { + "epoch": 57.84196185286103, + "grad_norm": 3.5006935596466064, + "learning_rate": 7.960406187090661e-06, + "loss": 0.1496, + "step": 21228 + }, + { + "epoch": 57.844686648501366, + "grad_norm": 3.8766372203826904, + "learning_rate": 7.959542251007726e-06, + "loss": 0.0847, + "step": 21229 + }, + { + "epoch": 57.84741144414169, + "grad_norm": 5.189877986907959, + "learning_rate": 7.95867833081581e-06, + "loss": 0.156, + "step": 21230 + }, + { + "epoch": 57.85013623978202, + "grad_norm": 4.126110076904297, + "learning_rate": 7.95781442652164e-06, + "loss": 0.0603, + "step": 21231 + }, + { + "epoch": 57.85286103542234, + "grad_norm": 2.957515001296997, + "learning_rate": 7.956950538131946e-06, + "loss": 0.0549, + "step": 21232 + }, + { + "epoch": 57.85558583106267, + "grad_norm": 5.171656608581543, + "learning_rate": 7.956086665653456e-06, + "loss": 0.1057, + "step": 21233 + }, + { + "epoch": 57.858310626702995, + "grad_norm": 5.595894813537598, + "learning_rate": 7.955222809092895e-06, + "loss": 0.1428, + "step": 21234 + }, + { + "epoch": 57.86103542234333, + "grad_norm": 5.651068210601807, + "learning_rate": 7.954358968456997e-06, + "loss": 0.1894, + "step": 21235 + }, + { + "epoch": 57.86376021798365, + "grad_norm": 5.017315864562988, + "learning_rate": 7.953495143752481e-06, + "loss": 0.1441, + "step": 21236 + }, + { + "epoch": 57.86648501362398, + "grad_norm": 3.8824210166931152, + "learning_rate": 7.952631334986083e-06, + "loss": 0.0687, + "step": 21237 + }, + { + "epoch": 57.869209809264305, + "grad_norm": 4.548652648925781, + "learning_rate": 7.951767542164524e-06, + "loss": 0.1594, + "step": 21238 + }, + { + "epoch": 57.87193460490463, + "grad_norm": 3.957911491394043, + "learning_rate": 7.950903765294534e-06, + "loss": 0.1356, + "step": 21239 + }, + { + "epoch": 57.87465940054496, + "grad_norm": 4.3087263107299805, + "learning_rate": 7.950040004382838e-06, + "loss": 0.0463, + "step": 21240 + }, + { + "epoch": 57.87738419618529, + "grad_norm": 3.348483085632324, + "learning_rate": 7.949176259436164e-06, + "loss": 0.1183, + "step": 21241 + }, + { + "epoch": 57.880108991825615, + "grad_norm": 3.969270706176758, + "learning_rate": 7.94831253046124e-06, + "loss": 0.1048, + "step": 21242 + }, + { + "epoch": 57.88283378746594, + "grad_norm": 4.792532444000244, + "learning_rate": 7.947448817464793e-06, + "loss": 0.2866, + "step": 21243 + }, + { + "epoch": 57.88555858310627, + "grad_norm": 3.986077070236206, + "learning_rate": 7.946585120453549e-06, + "loss": 0.0796, + "step": 21244 + }, + { + "epoch": 57.88828337874659, + "grad_norm": 10.107830047607422, + "learning_rate": 7.945721439434234e-06, + "loss": 0.0846, + "step": 21245 + }, + { + "epoch": 57.89100817438692, + "grad_norm": 4.53139591217041, + "learning_rate": 7.944857774413573e-06, + "loss": 0.1073, + "step": 21246 + }, + { + "epoch": 57.89373297002725, + "grad_norm": 4.03631067276001, + "learning_rate": 7.943994125398295e-06, + "loss": 0.0719, + "step": 21247 + }, + { + "epoch": 57.89645776566758, + "grad_norm": 3.6810109615325928, + "learning_rate": 7.943130492395123e-06, + "loss": 0.1046, + "step": 21248 + }, + { + "epoch": 57.8991825613079, + "grad_norm": 5.402345180511475, + "learning_rate": 7.942266875410788e-06, + "loss": 0.1807, + "step": 21249 + }, + { + "epoch": 57.90190735694823, + "grad_norm": 5.32850456237793, + "learning_rate": 7.941403274452009e-06, + "loss": 0.0887, + "step": 21250 + }, + { + "epoch": 57.904632152588555, + "grad_norm": 5.606999397277832, + "learning_rate": 7.940539689525517e-06, + "loss": 0.0795, + "step": 21251 + }, + { + "epoch": 57.90735694822888, + "grad_norm": 3.406586170196533, + "learning_rate": 7.939676120638033e-06, + "loss": 0.0599, + "step": 21252 + }, + { + "epoch": 57.91008174386921, + "grad_norm": 3.391803741455078, + "learning_rate": 7.938812567796289e-06, + "loss": 0.17, + "step": 21253 + }, + { + "epoch": 57.91280653950954, + "grad_norm": 4.0680928230285645, + "learning_rate": 7.937949031007001e-06, + "loss": 0.1939, + "step": 21254 + }, + { + "epoch": 57.915531335149865, + "grad_norm": 3.9837732315063477, + "learning_rate": 7.937085510276904e-06, + "loss": 0.132, + "step": 21255 + }, + { + "epoch": 57.91825613079019, + "grad_norm": 3.055096387863159, + "learning_rate": 7.936222005612717e-06, + "loss": 0.0558, + "step": 21256 + }, + { + "epoch": 57.920980926430516, + "grad_norm": 4.074774265289307, + "learning_rate": 7.935358517021168e-06, + "loss": 0.1265, + "step": 21257 + }, + { + "epoch": 57.92370572207084, + "grad_norm": 3.5439140796661377, + "learning_rate": 7.934495044508976e-06, + "loss": 0.1168, + "step": 21258 + }, + { + "epoch": 57.926430517711175, + "grad_norm": 4.016378879547119, + "learning_rate": 7.933631588082872e-06, + "loss": 0.115, + "step": 21259 + }, + { + "epoch": 57.9291553133515, + "grad_norm": 3.780677318572998, + "learning_rate": 7.932768147749582e-06, + "loss": 0.0652, + "step": 21260 + }, + { + "epoch": 57.93188010899183, + "grad_norm": 4.864652156829834, + "learning_rate": 7.931904723515825e-06, + "loss": 0.2459, + "step": 21261 + }, + { + "epoch": 57.93460490463215, + "grad_norm": 6.173576831817627, + "learning_rate": 7.931041315388328e-06, + "loss": 0.1484, + "step": 21262 + }, + { + "epoch": 57.93732970027248, + "grad_norm": 3.8185551166534424, + "learning_rate": 7.930177923373814e-06, + "loss": 0.0882, + "step": 21263 + }, + { + "epoch": 57.940054495912804, + "grad_norm": 4.387790203094482, + "learning_rate": 7.929314547479007e-06, + "loss": 0.1572, + "step": 21264 + }, + { + "epoch": 57.94277929155314, + "grad_norm": 3.009045124053955, + "learning_rate": 7.928451187710632e-06, + "loss": 0.0655, + "step": 21265 + }, + { + "epoch": 57.94550408719346, + "grad_norm": 3.612657070159912, + "learning_rate": 7.927587844075413e-06, + "loss": 0.1895, + "step": 21266 + }, + { + "epoch": 57.94822888283379, + "grad_norm": 4.834962844848633, + "learning_rate": 7.926724516580076e-06, + "loss": 0.1516, + "step": 21267 + }, + { + "epoch": 57.950953678474114, + "grad_norm": 4.229416847229004, + "learning_rate": 7.925861205231336e-06, + "loss": 0.124, + "step": 21268 + }, + { + "epoch": 57.95367847411444, + "grad_norm": 4.106301307678223, + "learning_rate": 7.924997910035928e-06, + "loss": 0.0933, + "step": 21269 + }, + { + "epoch": 57.956403269754766, + "grad_norm": 4.202123165130615, + "learning_rate": 7.924134631000566e-06, + "loss": 0.1113, + "step": 21270 + }, + { + "epoch": 57.95912806539509, + "grad_norm": 4.454462051391602, + "learning_rate": 7.923271368131977e-06, + "loss": 0.1347, + "step": 21271 + }, + { + "epoch": 57.961852861035425, + "grad_norm": 4.040456295013428, + "learning_rate": 7.922408121436883e-06, + "loss": 0.0798, + "step": 21272 + }, + { + "epoch": 57.96457765667575, + "grad_norm": 3.8941664695739746, + "learning_rate": 7.921544890922011e-06, + "loss": 0.0735, + "step": 21273 + }, + { + "epoch": 57.967302452316076, + "grad_norm": 4.834648609161377, + "learning_rate": 7.920681676594077e-06, + "loss": 0.1558, + "step": 21274 + }, + { + "epoch": 57.9700272479564, + "grad_norm": 4.663985252380371, + "learning_rate": 7.919818478459805e-06, + "loss": 0.216, + "step": 21275 + }, + { + "epoch": 57.97275204359673, + "grad_norm": 5.6572465896606445, + "learning_rate": 7.918955296525925e-06, + "loss": 0.072, + "step": 21276 + }, + { + "epoch": 57.97547683923706, + "grad_norm": 2.902808427810669, + "learning_rate": 7.91809213079915e-06, + "loss": 0.0762, + "step": 21277 + }, + { + "epoch": 57.97820163487739, + "grad_norm": 3.3866100311279297, + "learning_rate": 7.917228981286212e-06, + "loss": 0.0842, + "step": 21278 + }, + { + "epoch": 57.98092643051771, + "grad_norm": 4.018303871154785, + "learning_rate": 7.916365847993823e-06, + "loss": 0.1088, + "step": 21279 + }, + { + "epoch": 57.98365122615804, + "grad_norm": 4.212928295135498, + "learning_rate": 7.915502730928713e-06, + "loss": 0.1219, + "step": 21280 + }, + { + "epoch": 57.986376021798364, + "grad_norm": 3.5765438079833984, + "learning_rate": 7.914639630097598e-06, + "loss": 0.0922, + "step": 21281 + }, + { + "epoch": 57.98910081743869, + "grad_norm": 5.174197196960449, + "learning_rate": 7.913776545507204e-06, + "loss": 0.2322, + "step": 21282 + }, + { + "epoch": 57.991825613079016, + "grad_norm": 12.848947525024414, + "learning_rate": 7.91291347716425e-06, + "loss": 0.1827, + "step": 21283 + }, + { + "epoch": 57.99455040871935, + "grad_norm": 3.7650251388549805, + "learning_rate": 7.91205042507546e-06, + "loss": 0.0621, + "step": 21284 + }, + { + "epoch": 57.997275204359674, + "grad_norm": 3.8231921195983887, + "learning_rate": 7.911187389247553e-06, + "loss": 0.0696, + "step": 21285 + }, + { + "epoch": 58.0, + "grad_norm": 3.755431652069092, + "learning_rate": 7.91032436968725e-06, + "loss": 0.167, + "step": 21286 + }, + { + "epoch": 58.002724795640326, + "grad_norm": 4.290729999542236, + "learning_rate": 7.909461366401277e-06, + "loss": 0.0838, + "step": 21287 + }, + { + "epoch": 58.00544959128065, + "grad_norm": 3.493969202041626, + "learning_rate": 7.908598379396349e-06, + "loss": 0.0639, + "step": 21288 + }, + { + "epoch": 58.00817438692098, + "grad_norm": 4.644974231719971, + "learning_rate": 7.90773540867919e-06, + "loss": 0.0932, + "step": 21289 + }, + { + "epoch": 58.01089918256131, + "grad_norm": 3.7207095623016357, + "learning_rate": 7.90687245425652e-06, + "loss": 0.0752, + "step": 21290 + }, + { + "epoch": 58.013623978201636, + "grad_norm": 5.176153659820557, + "learning_rate": 7.90600951613506e-06, + "loss": 0.1327, + "step": 21291 + }, + { + "epoch": 58.01634877384196, + "grad_norm": 4.342294216156006, + "learning_rate": 7.905146594321532e-06, + "loss": 0.0694, + "step": 21292 + }, + { + "epoch": 58.01907356948229, + "grad_norm": 7.584478855133057, + "learning_rate": 7.904283688822651e-06, + "loss": 0.0665, + "step": 21293 + }, + { + "epoch": 58.02179836512261, + "grad_norm": 4.0451459884643555, + "learning_rate": 7.903420799645145e-06, + "loss": 0.0988, + "step": 21294 + }, + { + "epoch": 58.02452316076294, + "grad_norm": 4.211483955383301, + "learning_rate": 7.90255792679573e-06, + "loss": 0.1224, + "step": 21295 + }, + { + "epoch": 58.02724795640327, + "grad_norm": 5.9595947265625, + "learning_rate": 7.901695070281126e-06, + "loss": 0.1019, + "step": 21296 + }, + { + "epoch": 58.0299727520436, + "grad_norm": 5.6954569816589355, + "learning_rate": 7.90083223010805e-06, + "loss": 0.0998, + "step": 21297 + }, + { + "epoch": 58.032697547683924, + "grad_norm": 3.059959888458252, + "learning_rate": 7.899969406283232e-06, + "loss": 0.2582, + "step": 21298 + }, + { + "epoch": 58.03542234332425, + "grad_norm": 3.3717527389526367, + "learning_rate": 7.89910659881338e-06, + "loss": 0.197, + "step": 21299 + }, + { + "epoch": 58.038147138964575, + "grad_norm": 5.451910495758057, + "learning_rate": 7.898243807705219e-06, + "loss": 0.1239, + "step": 21300 + }, + { + "epoch": 58.0408719346049, + "grad_norm": 3.5340797901153564, + "learning_rate": 7.897381032965467e-06, + "loss": 0.0729, + "step": 21301 + }, + { + "epoch": 58.043596730245234, + "grad_norm": 4.630802631378174, + "learning_rate": 7.896518274600845e-06, + "loss": 0.1574, + "step": 21302 + }, + { + "epoch": 58.04632152588556, + "grad_norm": 4.857437610626221, + "learning_rate": 7.89565553261807e-06, + "loss": 0.1973, + "step": 21303 + }, + { + "epoch": 58.049046321525886, + "grad_norm": 4.43881893157959, + "learning_rate": 7.894792807023864e-06, + "loss": 0.0897, + "step": 21304 + }, + { + "epoch": 58.05177111716621, + "grad_norm": 3.798677682876587, + "learning_rate": 7.89393009782494e-06, + "loss": 0.0626, + "step": 21305 + }, + { + "epoch": 58.05449591280654, + "grad_norm": 3.7635207176208496, + "learning_rate": 7.893067405028025e-06, + "loss": 0.1203, + "step": 21306 + }, + { + "epoch": 58.05722070844686, + "grad_norm": 3.1937971115112305, + "learning_rate": 7.89220472863983e-06, + "loss": 0.0529, + "step": 21307 + }, + { + "epoch": 58.059945504087196, + "grad_norm": 3.741414785385132, + "learning_rate": 7.891342068667079e-06, + "loss": 0.083, + "step": 21308 + }, + { + "epoch": 58.06267029972752, + "grad_norm": 3.0845866203308105, + "learning_rate": 7.890479425116484e-06, + "loss": 0.1788, + "step": 21309 + }, + { + "epoch": 58.06539509536785, + "grad_norm": 3.9257125854492188, + "learning_rate": 7.889616797994768e-06, + "loss": 0.0752, + "step": 21310 + }, + { + "epoch": 58.06811989100817, + "grad_norm": 5.93182373046875, + "learning_rate": 7.88875418730865e-06, + "loss": 0.2888, + "step": 21311 + }, + { + "epoch": 58.0708446866485, + "grad_norm": 2.8869850635528564, + "learning_rate": 7.887891593064848e-06, + "loss": 0.0445, + "step": 21312 + }, + { + "epoch": 58.073569482288825, + "grad_norm": 3.5473380088806152, + "learning_rate": 7.887029015270076e-06, + "loss": 0.0753, + "step": 21313 + }, + { + "epoch": 58.07629427792916, + "grad_norm": 5.232302665710449, + "learning_rate": 7.886166453931056e-06, + "loss": 0.1679, + "step": 21314 + }, + { + "epoch": 58.079019073569484, + "grad_norm": 3.481288433074951, + "learning_rate": 7.885303909054504e-06, + "loss": 0.0694, + "step": 21315 + }, + { + "epoch": 58.08174386920981, + "grad_norm": 4.258885860443115, + "learning_rate": 7.884441380647136e-06, + "loss": 0.0734, + "step": 21316 + }, + { + "epoch": 58.084468664850135, + "grad_norm": 3.5817365646362305, + "learning_rate": 7.88357886871567e-06, + "loss": 0.158, + "step": 21317 + }, + { + "epoch": 58.08719346049046, + "grad_norm": 4.158348560333252, + "learning_rate": 7.882716373266825e-06, + "loss": 0.1088, + "step": 21318 + }, + { + "epoch": 58.08991825613079, + "grad_norm": 4.0440802574157715, + "learning_rate": 7.881853894307316e-06, + "loss": 0.2369, + "step": 21319 + }, + { + "epoch": 58.09264305177112, + "grad_norm": 4.712680339813232, + "learning_rate": 7.880991431843861e-06, + "loss": 0.0653, + "step": 21320 + }, + { + "epoch": 58.095367847411445, + "grad_norm": 3.7499608993530273, + "learning_rate": 7.880128985883175e-06, + "loss": 0.0768, + "step": 21321 + }, + { + "epoch": 58.09809264305177, + "grad_norm": 4.3392157554626465, + "learning_rate": 7.879266556431979e-06, + "loss": 0.0587, + "step": 21322 + }, + { + "epoch": 58.1008174386921, + "grad_norm": 5.922008514404297, + "learning_rate": 7.878404143496985e-06, + "loss": 0.1057, + "step": 21323 + }, + { + "epoch": 58.10354223433242, + "grad_norm": 3.9000155925750732, + "learning_rate": 7.877541747084912e-06, + "loss": 0.0811, + "step": 21324 + }, + { + "epoch": 58.10626702997275, + "grad_norm": 3.4240224361419678, + "learning_rate": 7.876679367202474e-06, + "loss": 0.1955, + "step": 21325 + }, + { + "epoch": 58.10899182561308, + "grad_norm": 3.6861934661865234, + "learning_rate": 7.875817003856392e-06, + "loss": 0.0501, + "step": 21326 + }, + { + "epoch": 58.11171662125341, + "grad_norm": 4.137561798095703, + "learning_rate": 7.874954657053373e-06, + "loss": 0.2101, + "step": 21327 + }, + { + "epoch": 58.11444141689373, + "grad_norm": 3.0040736198425293, + "learning_rate": 7.874092326800142e-06, + "loss": 0.1097, + "step": 21328 + }, + { + "epoch": 58.11716621253406, + "grad_norm": 4.561694622039795, + "learning_rate": 7.87323001310341e-06, + "loss": 0.2594, + "step": 21329 + }, + { + "epoch": 58.119891008174385, + "grad_norm": 3.0798263549804688, + "learning_rate": 7.872367715969897e-06, + "loss": 0.0712, + "step": 21330 + }, + { + "epoch": 58.12261580381471, + "grad_norm": 3.4744293689727783, + "learning_rate": 7.871505435406315e-06, + "loss": 0.1981, + "step": 21331 + }, + { + "epoch": 58.12534059945504, + "grad_norm": 3.486356735229492, + "learning_rate": 7.870643171419382e-06, + "loss": 0.054, + "step": 21332 + }, + { + "epoch": 58.12806539509537, + "grad_norm": 3.9207701683044434, + "learning_rate": 7.869780924015807e-06, + "loss": 0.0655, + "step": 21333 + }, + { + "epoch": 58.130790190735695, + "grad_norm": 3.4613382816314697, + "learning_rate": 7.868918693202314e-06, + "loss": 0.1243, + "step": 21334 + }, + { + "epoch": 58.13351498637602, + "grad_norm": 3.66589617729187, + "learning_rate": 7.86805647898561e-06, + "loss": 0.1703, + "step": 21335 + }, + { + "epoch": 58.13623978201635, + "grad_norm": 3.6065454483032227, + "learning_rate": 7.867194281372417e-06, + "loss": 0.1415, + "step": 21336 + }, + { + "epoch": 58.13896457765667, + "grad_norm": 4.07046365737915, + "learning_rate": 7.866332100369444e-06, + "loss": 0.1409, + "step": 21337 + }, + { + "epoch": 58.141689373297005, + "grad_norm": 3.97886061668396, + "learning_rate": 7.865469935983409e-06, + "loss": 0.1356, + "step": 21338 + }, + { + "epoch": 58.14441416893733, + "grad_norm": 4.356708526611328, + "learning_rate": 7.864607788221024e-06, + "loss": 0.1442, + "step": 21339 + }, + { + "epoch": 58.14713896457766, + "grad_norm": 4.287309646606445, + "learning_rate": 7.863745657089008e-06, + "loss": 0.1436, + "step": 21340 + }, + { + "epoch": 58.14986376021798, + "grad_norm": 2.969545364379883, + "learning_rate": 7.862883542594067e-06, + "loss": 0.0489, + "step": 21341 + }, + { + "epoch": 58.15258855585831, + "grad_norm": 3.9011642932891846, + "learning_rate": 7.862021444742924e-06, + "loss": 0.103, + "step": 21342 + }, + { + "epoch": 58.155313351498634, + "grad_norm": 3.09757924079895, + "learning_rate": 7.861159363542289e-06, + "loss": 0.1337, + "step": 21343 + }, + { + "epoch": 58.15803814713897, + "grad_norm": 3.0279064178466797, + "learning_rate": 7.860297298998871e-06, + "loss": 0.0505, + "step": 21344 + }, + { + "epoch": 58.16076294277929, + "grad_norm": 3.4479753971099854, + "learning_rate": 7.859435251119394e-06, + "loss": 0.154, + "step": 21345 + }, + { + "epoch": 58.16348773841962, + "grad_norm": 3.727128744125366, + "learning_rate": 7.858573219910565e-06, + "loss": 0.1915, + "step": 21346 + }, + { + "epoch": 58.166212534059945, + "grad_norm": 5.588064670562744, + "learning_rate": 7.857711205379099e-06, + "loss": 0.1808, + "step": 21347 + }, + { + "epoch": 58.16893732970027, + "grad_norm": 5.7774128913879395, + "learning_rate": 7.85684920753171e-06, + "loss": 0.1534, + "step": 21348 + }, + { + "epoch": 58.171662125340596, + "grad_norm": 3.6232221126556396, + "learning_rate": 7.85598722637511e-06, + "loss": 0.1654, + "step": 21349 + }, + { + "epoch": 58.17438692098093, + "grad_norm": 4.164429187774658, + "learning_rate": 7.855125261916012e-06, + "loss": 0.098, + "step": 21350 + }, + { + "epoch": 58.177111716621255, + "grad_norm": 3.551900625228882, + "learning_rate": 7.854263314161128e-06, + "loss": 0.0566, + "step": 21351 + }, + { + "epoch": 58.17983651226158, + "grad_norm": 4.061517238616943, + "learning_rate": 7.853401383117176e-06, + "loss": 0.1674, + "step": 21352 + }, + { + "epoch": 58.182561307901906, + "grad_norm": 4.399727821350098, + "learning_rate": 7.85253946879086e-06, + "loss": 0.1202, + "step": 21353 + }, + { + "epoch": 58.18528610354223, + "grad_norm": 3.430011749267578, + "learning_rate": 7.851677571188903e-06, + "loss": 0.2057, + "step": 21354 + }, + { + "epoch": 58.18801089918256, + "grad_norm": 3.1353375911712646, + "learning_rate": 7.850815690318007e-06, + "loss": 0.0631, + "step": 21355 + }, + { + "epoch": 58.19073569482289, + "grad_norm": 4.898374080657959, + "learning_rate": 7.849953826184892e-06, + "loss": 0.2719, + "step": 21356 + }, + { + "epoch": 58.19346049046322, + "grad_norm": 4.685498237609863, + "learning_rate": 7.849091978796267e-06, + "loss": 0.0952, + "step": 21357 + }, + { + "epoch": 58.19618528610354, + "grad_norm": 6.148848056793213, + "learning_rate": 7.848230148158847e-06, + "loss": 0.1801, + "step": 21358 + }, + { + "epoch": 58.19891008174387, + "grad_norm": 4.193655967712402, + "learning_rate": 7.847368334279336e-06, + "loss": 0.1095, + "step": 21359 + }, + { + "epoch": 58.201634877384194, + "grad_norm": 3.1795859336853027, + "learning_rate": 7.846506537164456e-06, + "loss": 0.0984, + "step": 21360 + }, + { + "epoch": 58.20435967302452, + "grad_norm": 4.306779861450195, + "learning_rate": 7.845644756820908e-06, + "loss": 0.1707, + "step": 21361 + }, + { + "epoch": 58.20708446866485, + "grad_norm": 3.9911789894104004, + "learning_rate": 7.844782993255412e-06, + "loss": 0.0743, + "step": 21362 + }, + { + "epoch": 58.20980926430518, + "grad_norm": 4.329372406005859, + "learning_rate": 7.843921246474679e-06, + "loss": 0.1007, + "step": 21363 + }, + { + "epoch": 58.212534059945504, + "grad_norm": 2.8500869274139404, + "learning_rate": 7.843059516485415e-06, + "loss": 0.0463, + "step": 21364 + }, + { + "epoch": 58.21525885558583, + "grad_norm": 4.476006984710693, + "learning_rate": 7.842197803294337e-06, + "loss": 0.1228, + "step": 21365 + }, + { + "epoch": 58.217983651226156, + "grad_norm": 3.1800928115844727, + "learning_rate": 7.84133610690815e-06, + "loss": 0.0705, + "step": 21366 + }, + { + "epoch": 58.22070844686648, + "grad_norm": 3.367802619934082, + "learning_rate": 7.840474427333573e-06, + "loss": 0.0722, + "step": 21367 + }, + { + "epoch": 58.223433242506815, + "grad_norm": 3.4590463638305664, + "learning_rate": 7.839612764577305e-06, + "loss": 0.0742, + "step": 21368 + }, + { + "epoch": 58.22615803814714, + "grad_norm": 3.1542577743530273, + "learning_rate": 7.838751118646068e-06, + "loss": 0.0678, + "step": 21369 + }, + { + "epoch": 58.228882833787466, + "grad_norm": 3.5310192108154297, + "learning_rate": 7.837889489546566e-06, + "loss": 0.0516, + "step": 21370 + }, + { + "epoch": 58.23160762942779, + "grad_norm": 3.7076683044433594, + "learning_rate": 7.837027877285512e-06, + "loss": 0.1798, + "step": 21371 + }, + { + "epoch": 58.23433242506812, + "grad_norm": 3.785773992538452, + "learning_rate": 7.836166281869614e-06, + "loss": 0.1145, + "step": 21372 + }, + { + "epoch": 58.237057220708444, + "grad_norm": 3.829242706298828, + "learning_rate": 7.835304703305583e-06, + "loss": 0.2267, + "step": 21373 + }, + { + "epoch": 58.23978201634878, + "grad_norm": 3.6718368530273438, + "learning_rate": 7.834443141600131e-06, + "loss": 0.0481, + "step": 21374 + }, + { + "epoch": 58.2425068119891, + "grad_norm": 3.986198902130127, + "learning_rate": 7.833581596759965e-06, + "loss": 0.1318, + "step": 21375 + }, + { + "epoch": 58.24523160762943, + "grad_norm": 5.590548992156982, + "learning_rate": 7.832720068791798e-06, + "loss": 0.073, + "step": 21376 + }, + { + "epoch": 58.247956403269754, + "grad_norm": 4.912227630615234, + "learning_rate": 7.831858557702332e-06, + "loss": 0.0819, + "step": 21377 + }, + { + "epoch": 58.25068119891008, + "grad_norm": 4.700142860412598, + "learning_rate": 7.830997063498288e-06, + "loss": 0.0877, + "step": 21378 + }, + { + "epoch": 58.253405994550405, + "grad_norm": 3.449402093887329, + "learning_rate": 7.830135586186363e-06, + "loss": 0.0639, + "step": 21379 + }, + { + "epoch": 58.25613079019074, + "grad_norm": 4.228108882904053, + "learning_rate": 7.829274125773275e-06, + "loss": 0.1262, + "step": 21380 + }, + { + "epoch": 58.258855585831064, + "grad_norm": 3.4274513721466064, + "learning_rate": 7.82841268226573e-06, + "loss": 0.1647, + "step": 21381 + }, + { + "epoch": 58.26158038147139, + "grad_norm": 4.357746601104736, + "learning_rate": 7.827551255670438e-06, + "loss": 0.1457, + "step": 21382 + }, + { + "epoch": 58.264305177111716, + "grad_norm": 5.125286102294922, + "learning_rate": 7.82668984599411e-06, + "loss": 0.1067, + "step": 21383 + }, + { + "epoch": 58.26702997275204, + "grad_norm": 3.2794137001037598, + "learning_rate": 7.825828453243446e-06, + "loss": 0.0759, + "step": 21384 + }, + { + "epoch": 58.26975476839237, + "grad_norm": 6.392207145690918, + "learning_rate": 7.824967077425163e-06, + "loss": 0.074, + "step": 21385 + }, + { + "epoch": 58.2724795640327, + "grad_norm": 3.7522635459899902, + "learning_rate": 7.824105718545964e-06, + "loss": 0.0575, + "step": 21386 + }, + { + "epoch": 58.275204359673026, + "grad_norm": 3.603132486343384, + "learning_rate": 7.823244376612565e-06, + "loss": 0.0482, + "step": 21387 + }, + { + "epoch": 58.27792915531335, + "grad_norm": 4.035679340362549, + "learning_rate": 7.822383051631664e-06, + "loss": 0.058, + "step": 21388 + }, + { + "epoch": 58.28065395095368, + "grad_norm": 4.110881805419922, + "learning_rate": 7.821521743609974e-06, + "loss": 0.1739, + "step": 21389 + }, + { + "epoch": 58.283378746594, + "grad_norm": 4.31303596496582, + "learning_rate": 7.820660452554203e-06, + "loss": 0.1267, + "step": 21390 + }, + { + "epoch": 58.28610354223433, + "grad_norm": 4.4154534339904785, + "learning_rate": 7.81979917847106e-06, + "loss": 0.1102, + "step": 21391 + }, + { + "epoch": 58.28882833787466, + "grad_norm": 3.369174003601074, + "learning_rate": 7.81893792136725e-06, + "loss": 0.1161, + "step": 21392 + }, + { + "epoch": 58.29155313351499, + "grad_norm": 3.901320695877075, + "learning_rate": 7.81807668124948e-06, + "loss": 0.0618, + "step": 21393 + }, + { + "epoch": 58.294277929155314, + "grad_norm": 5.338075160980225, + "learning_rate": 7.817215458124459e-06, + "loss": 0.0779, + "step": 21394 + }, + { + "epoch": 58.29700272479564, + "grad_norm": 3.79465913772583, + "learning_rate": 7.816354251998896e-06, + "loss": 0.1361, + "step": 21395 + }, + { + "epoch": 58.299727520435965, + "grad_norm": 4.482502460479736, + "learning_rate": 7.815493062879488e-06, + "loss": 0.1486, + "step": 21396 + }, + { + "epoch": 58.30245231607629, + "grad_norm": 3.5135910511016846, + "learning_rate": 7.814631890772957e-06, + "loss": 0.1713, + "step": 21397 + }, + { + "epoch": 58.305177111716624, + "grad_norm": 4.737347602844238, + "learning_rate": 7.813770735686e-06, + "loss": 0.2697, + "step": 21398 + }, + { + "epoch": 58.30790190735695, + "grad_norm": 3.4451520442962646, + "learning_rate": 7.812909597625328e-06, + "loss": 0.1412, + "step": 21399 + }, + { + "epoch": 58.310626702997276, + "grad_norm": 4.710101127624512, + "learning_rate": 7.812048476597645e-06, + "loss": 0.0543, + "step": 21400 + }, + { + "epoch": 58.3133514986376, + "grad_norm": 4.055838108062744, + "learning_rate": 7.811187372609658e-06, + "loss": 0.0741, + "step": 21401 + }, + { + "epoch": 58.31607629427793, + "grad_norm": 4.483063220977783, + "learning_rate": 7.810326285668073e-06, + "loss": 0.1152, + "step": 21402 + }, + { + "epoch": 58.31880108991825, + "grad_norm": 3.3968918323516846, + "learning_rate": 7.809465215779596e-06, + "loss": 0.0614, + "step": 21403 + }, + { + "epoch": 58.321525885558586, + "grad_norm": 3.713894844055176, + "learning_rate": 7.808604162950934e-06, + "loss": 0.0972, + "step": 21404 + }, + { + "epoch": 58.32425068119891, + "grad_norm": 3.5638866424560547, + "learning_rate": 7.807743127188794e-06, + "loss": 0.0657, + "step": 21405 + }, + { + "epoch": 58.32697547683924, + "grad_norm": 4.74470329284668, + "learning_rate": 7.806882108499878e-06, + "loss": 0.1854, + "step": 21406 + }, + { + "epoch": 58.32970027247956, + "grad_norm": 4.56574010848999, + "learning_rate": 7.806021106890894e-06, + "loss": 0.0825, + "step": 21407 + }, + { + "epoch": 58.33242506811989, + "grad_norm": 3.5397439002990723, + "learning_rate": 7.805160122368548e-06, + "loss": 0.1053, + "step": 21408 + }, + { + "epoch": 58.335149863760215, + "grad_norm": 3.121457815170288, + "learning_rate": 7.804299154939543e-06, + "loss": 0.1497, + "step": 21409 + }, + { + "epoch": 58.33787465940055, + "grad_norm": 3.075286626815796, + "learning_rate": 7.803438204610584e-06, + "loss": 0.0687, + "step": 21410 + }, + { + "epoch": 58.34059945504087, + "grad_norm": 3.287900686264038, + "learning_rate": 7.802577271388381e-06, + "loss": 0.1355, + "step": 21411 + }, + { + "epoch": 58.3433242506812, + "grad_norm": 4.360344409942627, + "learning_rate": 7.801716355279632e-06, + "loss": 0.1377, + "step": 21412 + }, + { + "epoch": 58.346049046321525, + "grad_norm": 4.808806896209717, + "learning_rate": 7.800855456291045e-06, + "loss": 0.2072, + "step": 21413 + }, + { + "epoch": 58.34877384196185, + "grad_norm": 4.6278300285339355, + "learning_rate": 7.799994574429329e-06, + "loss": 0.1165, + "step": 21414 + }, + { + "epoch": 58.35149863760218, + "grad_norm": 2.3931100368499756, + "learning_rate": 7.79913370970118e-06, + "loss": 0.0474, + "step": 21415 + }, + { + "epoch": 58.35422343324251, + "grad_norm": 4.6696295738220215, + "learning_rate": 7.798272862113308e-06, + "loss": 0.0821, + "step": 21416 + }, + { + "epoch": 58.356948228882835, + "grad_norm": 3.7376925945281982, + "learning_rate": 7.797412031672419e-06, + "loss": 0.057, + "step": 21417 + }, + { + "epoch": 58.35967302452316, + "grad_norm": 3.901583671569824, + "learning_rate": 7.796551218385211e-06, + "loss": 0.073, + "step": 21418 + }, + { + "epoch": 58.36239782016349, + "grad_norm": 4.015518665313721, + "learning_rate": 7.795690422258394e-06, + "loss": 0.0653, + "step": 21419 + }, + { + "epoch": 58.36512261580381, + "grad_norm": 3.206453800201416, + "learning_rate": 7.794829643298667e-06, + "loss": 0.0632, + "step": 21420 + }, + { + "epoch": 58.36784741144414, + "grad_norm": 7.467257976531982, + "learning_rate": 7.793968881512737e-06, + "loss": 0.1243, + "step": 21421 + }, + { + "epoch": 58.37057220708447, + "grad_norm": 4.359302043914795, + "learning_rate": 7.793108136907306e-06, + "loss": 0.0704, + "step": 21422 + }, + { + "epoch": 58.3732970027248, + "grad_norm": 4.667004108428955, + "learning_rate": 7.79224740948908e-06, + "loss": 0.0965, + "step": 21423 + }, + { + "epoch": 58.37602179836512, + "grad_norm": 3.114868402481079, + "learning_rate": 7.791386699264756e-06, + "loss": 0.1781, + "step": 21424 + }, + { + "epoch": 58.37874659400545, + "grad_norm": 5.092816352844238, + "learning_rate": 7.790526006241044e-06, + "loss": 0.1404, + "step": 21425 + }, + { + "epoch": 58.381471389645775, + "grad_norm": 2.988006353378296, + "learning_rate": 7.789665330424643e-06, + "loss": 0.1273, + "step": 21426 + }, + { + "epoch": 58.3841961852861, + "grad_norm": 3.5393736362457275, + "learning_rate": 7.78880467182226e-06, + "loss": 0.0856, + "step": 21427 + }, + { + "epoch": 58.38692098092643, + "grad_norm": 3.369912624359131, + "learning_rate": 7.78794403044059e-06, + "loss": 0.2267, + "step": 21428 + }, + { + "epoch": 58.38964577656676, + "grad_norm": 4.061559200286865, + "learning_rate": 7.787083406286345e-06, + "loss": 0.1604, + "step": 21429 + }, + { + "epoch": 58.392370572207085, + "grad_norm": 3.5608556270599365, + "learning_rate": 7.78622279936622e-06, + "loss": 0.2598, + "step": 21430 + }, + { + "epoch": 58.39509536784741, + "grad_norm": 5.442565441131592, + "learning_rate": 7.78536220968692e-06, + "loss": 0.1797, + "step": 21431 + }, + { + "epoch": 58.39782016348774, + "grad_norm": 3.6805570125579834, + "learning_rate": 7.78450163725515e-06, + "loss": 0.0749, + "step": 21432 + }, + { + "epoch": 58.40054495912806, + "grad_norm": 3.387275218963623, + "learning_rate": 7.78364108207761e-06, + "loss": 0.0808, + "step": 21433 + }, + { + "epoch": 58.403269754768395, + "grad_norm": 4.009548664093018, + "learning_rate": 7.782780544161002e-06, + "loss": 0.1643, + "step": 21434 + }, + { + "epoch": 58.40599455040872, + "grad_norm": 6.480135917663574, + "learning_rate": 7.781920023512027e-06, + "loss": 0.2497, + "step": 21435 + }, + { + "epoch": 58.40871934604905, + "grad_norm": 4.250776290893555, + "learning_rate": 7.78105952013739e-06, + "loss": 0.1018, + "step": 21436 + }, + { + "epoch": 58.41144414168937, + "grad_norm": 3.59672212600708, + "learning_rate": 7.780199034043787e-06, + "loss": 0.1838, + "step": 21437 + }, + { + "epoch": 58.4141689373297, + "grad_norm": 4.79533576965332, + "learning_rate": 7.779338565237922e-06, + "loss": 0.251, + "step": 21438 + }, + { + "epoch": 58.416893732970024, + "grad_norm": 3.9480504989624023, + "learning_rate": 7.778478113726501e-06, + "loss": 0.1554, + "step": 21439 + }, + { + "epoch": 58.41961852861036, + "grad_norm": 4.790663719177246, + "learning_rate": 7.777617679516217e-06, + "loss": 0.2321, + "step": 21440 + }, + { + "epoch": 58.42234332425068, + "grad_norm": 4.551621437072754, + "learning_rate": 7.776757262613777e-06, + "loss": 0.0843, + "step": 21441 + }, + { + "epoch": 58.42506811989101, + "grad_norm": 4.327082633972168, + "learning_rate": 7.77589686302588e-06, + "loss": 0.0786, + "step": 21442 + }, + { + "epoch": 58.427792915531334, + "grad_norm": 3.325671434402466, + "learning_rate": 7.775036480759226e-06, + "loss": 0.0904, + "step": 21443 + }, + { + "epoch": 58.43051771117166, + "grad_norm": 4.046737194061279, + "learning_rate": 7.774176115820516e-06, + "loss": 0.0647, + "step": 21444 + }, + { + "epoch": 58.433242506811986, + "grad_norm": 2.9866275787353516, + "learning_rate": 7.773315768216452e-06, + "loss": 0.05, + "step": 21445 + }, + { + "epoch": 58.43596730245232, + "grad_norm": 4.174355506896973, + "learning_rate": 7.772455437953731e-06, + "loss": 0.0584, + "step": 21446 + }, + { + "epoch": 58.438692098092645, + "grad_norm": 3.5630075931549072, + "learning_rate": 7.771595125039053e-06, + "loss": 0.3054, + "step": 21447 + }, + { + "epoch": 58.44141689373297, + "grad_norm": 3.7853434085845947, + "learning_rate": 7.770734829479126e-06, + "loss": 0.0693, + "step": 21448 + }, + { + "epoch": 58.444141689373296, + "grad_norm": 4.610340118408203, + "learning_rate": 7.76987455128064e-06, + "loss": 0.2594, + "step": 21449 + }, + { + "epoch": 58.44686648501362, + "grad_norm": 4.337750434875488, + "learning_rate": 7.769014290450303e-06, + "loss": 0.1092, + "step": 21450 + }, + { + "epoch": 58.44959128065395, + "grad_norm": 4.147157192230225, + "learning_rate": 7.76815404699481e-06, + "loss": 0.1268, + "step": 21451 + }, + { + "epoch": 58.45231607629428, + "grad_norm": 4.715500354766846, + "learning_rate": 7.76729382092086e-06, + "loss": 0.0855, + "step": 21452 + }, + { + "epoch": 58.45504087193461, + "grad_norm": 5.13818359375, + "learning_rate": 7.766433612235154e-06, + "loss": 0.09, + "step": 21453 + }, + { + "epoch": 58.45776566757493, + "grad_norm": 3.5562307834625244, + "learning_rate": 7.765573420944394e-06, + "loss": 0.0597, + "step": 21454 + }, + { + "epoch": 58.46049046321526, + "grad_norm": 8.059571266174316, + "learning_rate": 7.764713247055273e-06, + "loss": 0.1189, + "step": 21455 + }, + { + "epoch": 58.463215258855584, + "grad_norm": 4.303390979766846, + "learning_rate": 7.763853090574495e-06, + "loss": 0.0741, + "step": 21456 + }, + { + "epoch": 58.46594005449591, + "grad_norm": 3.4709019660949707, + "learning_rate": 7.762992951508757e-06, + "loss": 0.0471, + "step": 21457 + }, + { + "epoch": 58.46866485013624, + "grad_norm": 4.330159664154053, + "learning_rate": 7.762132829864757e-06, + "loss": 0.0934, + "step": 21458 + }, + { + "epoch": 58.47138964577657, + "grad_norm": 5.4488911628723145, + "learning_rate": 7.761272725649195e-06, + "loss": 0.0801, + "step": 21459 + }, + { + "epoch": 58.474114441416894, + "grad_norm": 4.719922065734863, + "learning_rate": 7.760412638868768e-06, + "loss": 0.0891, + "step": 21460 + }, + { + "epoch": 58.47683923705722, + "grad_norm": 4.579160690307617, + "learning_rate": 7.759552569530178e-06, + "loss": 0.0819, + "step": 21461 + }, + { + "epoch": 58.479564032697546, + "grad_norm": 3.2546329498291016, + "learning_rate": 7.758692517640117e-06, + "loss": 0.1069, + "step": 21462 + }, + { + "epoch": 58.48228882833787, + "grad_norm": 2.822486162185669, + "learning_rate": 7.75783248320529e-06, + "loss": 0.0632, + "step": 21463 + }, + { + "epoch": 58.485013623978205, + "grad_norm": 4.434988498687744, + "learning_rate": 7.756972466232388e-06, + "loss": 0.0693, + "step": 21464 + }, + { + "epoch": 58.48773841961853, + "grad_norm": 3.8925631046295166, + "learning_rate": 7.756112466728111e-06, + "loss": 0.1362, + "step": 21465 + }, + { + "epoch": 58.490463215258856, + "grad_norm": 3.5528383255004883, + "learning_rate": 7.755252484699163e-06, + "loss": 0.1053, + "step": 21466 + }, + { + "epoch": 58.49318801089918, + "grad_norm": 3.9033761024475098, + "learning_rate": 7.754392520152233e-06, + "loss": 0.1055, + "step": 21467 + }, + { + "epoch": 58.49591280653951, + "grad_norm": 3.428138017654419, + "learning_rate": 7.753532573094024e-06, + "loss": 0.0671, + "step": 21468 + }, + { + "epoch": 58.49863760217983, + "grad_norm": 5.6496262550354, + "learning_rate": 7.75267264353123e-06, + "loss": 0.1115, + "step": 21469 + }, + { + "epoch": 58.50136239782017, + "grad_norm": 4.147008419036865, + "learning_rate": 7.751812731470549e-06, + "loss": 0.1251, + "step": 21470 + }, + { + "epoch": 58.50408719346049, + "grad_norm": 3.3708302974700928, + "learning_rate": 7.750952836918679e-06, + "loss": 0.0984, + "step": 21471 + }, + { + "epoch": 58.50681198910082, + "grad_norm": 4.073522567749023, + "learning_rate": 7.750092959882315e-06, + "loss": 0.1517, + "step": 21472 + }, + { + "epoch": 58.509536784741144, + "grad_norm": 13.929010391235352, + "learning_rate": 7.749233100368155e-06, + "loss": 0.0846, + "step": 21473 + }, + { + "epoch": 58.51226158038147, + "grad_norm": 3.3463056087493896, + "learning_rate": 7.748373258382896e-06, + "loss": 0.2056, + "step": 21474 + }, + { + "epoch": 58.514986376021795, + "grad_norm": 3.756589889526367, + "learning_rate": 7.747513433933231e-06, + "loss": 0.1352, + "step": 21475 + }, + { + "epoch": 58.51771117166213, + "grad_norm": 3.955935001373291, + "learning_rate": 7.746653627025861e-06, + "loss": 0.1816, + "step": 21476 + }, + { + "epoch": 58.520435967302454, + "grad_norm": 3.919924259185791, + "learning_rate": 7.745793837667479e-06, + "loss": 0.0746, + "step": 21477 + }, + { + "epoch": 58.52316076294278, + "grad_norm": 5.583837032318115, + "learning_rate": 7.744934065864785e-06, + "loss": 0.1019, + "step": 21478 + }, + { + "epoch": 58.525885558583106, + "grad_norm": 4.4430155754089355, + "learning_rate": 7.744074311624468e-06, + "loss": 0.0647, + "step": 21479 + }, + { + "epoch": 58.52861035422343, + "grad_norm": 3.9184672832489014, + "learning_rate": 7.743214574953231e-06, + "loss": 0.0539, + "step": 21480 + }, + { + "epoch": 58.53133514986376, + "grad_norm": 3.769113063812256, + "learning_rate": 7.742354855857761e-06, + "loss": 0.0516, + "step": 21481 + }, + { + "epoch": 58.53405994550409, + "grad_norm": 4.248811721801758, + "learning_rate": 7.74149515434476e-06, + "loss": 0.1288, + "step": 21482 + }, + { + "epoch": 58.536784741144416, + "grad_norm": 3.2389869689941406, + "learning_rate": 7.740635470420922e-06, + "loss": 0.1682, + "step": 21483 + }, + { + "epoch": 58.53950953678474, + "grad_norm": 3.2946629524230957, + "learning_rate": 7.739775804092947e-06, + "loss": 0.0769, + "step": 21484 + }, + { + "epoch": 58.54223433242507, + "grad_norm": 4.172604560852051, + "learning_rate": 7.738916155367522e-06, + "loss": 0.103, + "step": 21485 + }, + { + "epoch": 58.54495912806539, + "grad_norm": 3.7815375328063965, + "learning_rate": 7.738056524251347e-06, + "loss": 0.2709, + "step": 21486 + }, + { + "epoch": 58.54768392370572, + "grad_norm": 3.3296620845794678, + "learning_rate": 7.737196910751113e-06, + "loss": 0.0737, + "step": 21487 + }, + { + "epoch": 58.55040871934605, + "grad_norm": 3.880136489868164, + "learning_rate": 7.73633731487352e-06, + "loss": 0.1735, + "step": 21488 + }, + { + "epoch": 58.55313351498638, + "grad_norm": 3.3581833839416504, + "learning_rate": 7.735477736625255e-06, + "loss": 0.1288, + "step": 21489 + }, + { + "epoch": 58.555858310626704, + "grad_norm": 7.105356216430664, + "learning_rate": 7.73461817601302e-06, + "loss": 0.1674, + "step": 21490 + }, + { + "epoch": 58.55858310626703, + "grad_norm": 5.7333083152771, + "learning_rate": 7.733758633043502e-06, + "loss": 0.1656, + "step": 21491 + }, + { + "epoch": 58.561307901907355, + "grad_norm": 4.50360631942749, + "learning_rate": 7.732899107723401e-06, + "loss": 0.1094, + "step": 21492 + }, + { + "epoch": 58.56403269754768, + "grad_norm": 3.3514621257781982, + "learning_rate": 7.732039600059407e-06, + "loss": 0.1267, + "step": 21493 + }, + { + "epoch": 58.566757493188014, + "grad_norm": 5.052760601043701, + "learning_rate": 7.73118011005822e-06, + "loss": 0.049, + "step": 21494 + }, + { + "epoch": 58.56948228882834, + "grad_norm": 5.315223217010498, + "learning_rate": 7.730320637726524e-06, + "loss": 0.1214, + "step": 21495 + }, + { + "epoch": 58.572207084468666, + "grad_norm": 3.963050603866577, + "learning_rate": 7.729461183071023e-06, + "loss": 0.1245, + "step": 21496 + }, + { + "epoch": 58.57493188010899, + "grad_norm": 6.392207622528076, + "learning_rate": 7.728601746098401e-06, + "loss": 0.1709, + "step": 21497 + }, + { + "epoch": 58.57765667574932, + "grad_norm": 3.605137586593628, + "learning_rate": 7.727742326815357e-06, + "loss": 0.0681, + "step": 21498 + }, + { + "epoch": 58.58038147138964, + "grad_norm": 3.6206047534942627, + "learning_rate": 7.72688292522858e-06, + "loss": 0.073, + "step": 21499 + }, + { + "epoch": 58.583106267029976, + "grad_norm": 5.480008602142334, + "learning_rate": 7.726023541344767e-06, + "loss": 0.1793, + "step": 21500 + }, + { + "epoch": 58.5858310626703, + "grad_norm": 4.394006252288818, + "learning_rate": 7.725164175170611e-06, + "loss": 0.2018, + "step": 21501 + }, + { + "epoch": 58.58855585831063, + "grad_norm": 5.898493766784668, + "learning_rate": 7.724304826712802e-06, + "loss": 0.1331, + "step": 21502 + }, + { + "epoch": 58.59128065395095, + "grad_norm": 3.7584009170532227, + "learning_rate": 7.723445495978034e-06, + "loss": 0.0893, + "step": 21503 + }, + { + "epoch": 58.59400544959128, + "grad_norm": 3.396317481994629, + "learning_rate": 7.722586182973002e-06, + "loss": 0.0871, + "step": 21504 + }, + { + "epoch": 58.596730245231605, + "grad_norm": 4.105969429016113, + "learning_rate": 7.721726887704392e-06, + "loss": 0.0996, + "step": 21505 + }, + { + "epoch": 58.59945504087194, + "grad_norm": 3.7845029830932617, + "learning_rate": 7.720867610178902e-06, + "loss": 0.1126, + "step": 21506 + }, + { + "epoch": 58.60217983651226, + "grad_norm": 6.148295879364014, + "learning_rate": 7.72000835040322e-06, + "loss": 0.2394, + "step": 21507 + }, + { + "epoch": 58.60490463215259, + "grad_norm": 4.514403820037842, + "learning_rate": 7.719149108384042e-06, + "loss": 0.1659, + "step": 21508 + }, + { + "epoch": 58.607629427792915, + "grad_norm": 3.663196086883545, + "learning_rate": 7.718289884128054e-06, + "loss": 0.0688, + "step": 21509 + }, + { + "epoch": 58.61035422343324, + "grad_norm": 3.3898158073425293, + "learning_rate": 7.717430677641954e-06, + "loss": 0.0567, + "step": 21510 + }, + { + "epoch": 58.61307901907357, + "grad_norm": 4.63852596282959, + "learning_rate": 7.716571488932427e-06, + "loss": 0.0974, + "step": 21511 + }, + { + "epoch": 58.6158038147139, + "grad_norm": 3.5420165061950684, + "learning_rate": 7.715712318006173e-06, + "loss": 0.1034, + "step": 21512 + }, + { + "epoch": 58.618528610354225, + "grad_norm": 3.5376248359680176, + "learning_rate": 7.714853164869872e-06, + "loss": 0.0632, + "step": 21513 + }, + { + "epoch": 58.62125340599455, + "grad_norm": 3.5798234939575195, + "learning_rate": 7.713994029530224e-06, + "loss": 0.1411, + "step": 21514 + }, + { + "epoch": 58.62397820163488, + "grad_norm": 3.4283549785614014, + "learning_rate": 7.713134911993917e-06, + "loss": 0.1473, + "step": 21515 + }, + { + "epoch": 58.6267029972752, + "grad_norm": 4.478358268737793, + "learning_rate": 7.712275812267638e-06, + "loss": 0.1915, + "step": 21516 + }, + { + "epoch": 58.62942779291553, + "grad_norm": 4.1488237380981445, + "learning_rate": 7.711416730358085e-06, + "loss": 0.0788, + "step": 21517 + }, + { + "epoch": 58.63215258855586, + "grad_norm": 4.851395130157471, + "learning_rate": 7.710557666271943e-06, + "loss": 0.1862, + "step": 21518 + }, + { + "epoch": 58.63487738419619, + "grad_norm": 4.15927791595459, + "learning_rate": 7.709698620015908e-06, + "loss": 0.1268, + "step": 21519 + }, + { + "epoch": 58.63760217983651, + "grad_norm": 3.2418174743652344, + "learning_rate": 7.708839591596663e-06, + "loss": 0.121, + "step": 21520 + }, + { + "epoch": 58.64032697547684, + "grad_norm": 4.322272300720215, + "learning_rate": 7.707980581020903e-06, + "loss": 0.1349, + "step": 21521 + }, + { + "epoch": 58.643051771117165, + "grad_norm": 4.424936771392822, + "learning_rate": 7.707121588295316e-06, + "loss": 0.06, + "step": 21522 + }, + { + "epoch": 58.64577656675749, + "grad_norm": 4.182270050048828, + "learning_rate": 7.706262613426594e-06, + "loss": 0.0556, + "step": 21523 + }, + { + "epoch": 58.64850136239782, + "grad_norm": 3.3170406818389893, + "learning_rate": 7.705403656421422e-06, + "loss": 0.1684, + "step": 21524 + }, + { + "epoch": 58.65122615803815, + "grad_norm": 4.232260704040527, + "learning_rate": 7.704544717286493e-06, + "loss": 0.0699, + "step": 21525 + }, + { + "epoch": 58.653950953678475, + "grad_norm": 4.209249019622803, + "learning_rate": 7.703685796028499e-06, + "loss": 0.0765, + "step": 21526 + }, + { + "epoch": 58.6566757493188, + "grad_norm": 3.5731842517852783, + "learning_rate": 7.702826892654121e-06, + "loss": 0.0448, + "step": 21527 + }, + { + "epoch": 58.65940054495913, + "grad_norm": 3.5391786098480225, + "learning_rate": 7.701968007170057e-06, + "loss": 0.0694, + "step": 21528 + }, + { + "epoch": 58.66212534059945, + "grad_norm": 3.4241995811462402, + "learning_rate": 7.701109139582993e-06, + "loss": 0.2635, + "step": 21529 + }, + { + "epoch": 58.664850136239785, + "grad_norm": 6.018126964569092, + "learning_rate": 7.700250289899614e-06, + "loss": 0.1424, + "step": 21530 + }, + { + "epoch": 58.66757493188011, + "grad_norm": 3.708371162414551, + "learning_rate": 7.699391458126612e-06, + "loss": 0.1822, + "step": 21531 + }, + { + "epoch": 58.67029972752044, + "grad_norm": 4.279620170593262, + "learning_rate": 7.698532644270678e-06, + "loss": 0.265, + "step": 21532 + }, + { + "epoch": 58.67302452316076, + "grad_norm": 5.6820969581604, + "learning_rate": 7.697673848338495e-06, + "loss": 0.0961, + "step": 21533 + }, + { + "epoch": 58.67574931880109, + "grad_norm": 3.770305871963501, + "learning_rate": 7.696815070336752e-06, + "loss": 0.0676, + "step": 21534 + }, + { + "epoch": 58.678474114441414, + "grad_norm": 4.238286018371582, + "learning_rate": 7.695956310272143e-06, + "loss": 0.1453, + "step": 21535 + }, + { + "epoch": 58.68119891008175, + "grad_norm": 3.1553149223327637, + "learning_rate": 7.695097568151351e-06, + "loss": 0.1258, + "step": 21536 + }, + { + "epoch": 58.68392370572207, + "grad_norm": 3.0492682456970215, + "learning_rate": 7.694238843981066e-06, + "loss": 0.0873, + "step": 21537 + }, + { + "epoch": 58.6866485013624, + "grad_norm": 3.081958055496216, + "learning_rate": 7.693380137767971e-06, + "loss": 0.0869, + "step": 21538 + }, + { + "epoch": 58.689373297002724, + "grad_norm": 3.7943410873413086, + "learning_rate": 7.692521449518763e-06, + "loss": 0.0703, + "step": 21539 + }, + { + "epoch": 58.69209809264305, + "grad_norm": 4.566564083099365, + "learning_rate": 7.691662779240119e-06, + "loss": 0.1587, + "step": 21540 + }, + { + "epoch": 58.694822888283376, + "grad_norm": 4.0657572746276855, + "learning_rate": 7.690804126938733e-06, + "loss": 0.0757, + "step": 21541 + }, + { + "epoch": 58.69754768392371, + "grad_norm": 3.274008274078369, + "learning_rate": 7.68994549262129e-06, + "loss": 0.0666, + "step": 21542 + }, + { + "epoch": 58.700272479564035, + "grad_norm": 3.5570719242095947, + "learning_rate": 7.689086876294479e-06, + "loss": 0.3087, + "step": 21543 + }, + { + "epoch": 58.70299727520436, + "grad_norm": 2.881232500076294, + "learning_rate": 7.68822827796498e-06, + "loss": 0.0512, + "step": 21544 + }, + { + "epoch": 58.705722070844686, + "grad_norm": 3.1296496391296387, + "learning_rate": 7.68736969763949e-06, + "loss": 0.0736, + "step": 21545 + }, + { + "epoch": 58.70844686648501, + "grad_norm": 3.461085557937622, + "learning_rate": 7.686511135324687e-06, + "loss": 0.0604, + "step": 21546 + }, + { + "epoch": 58.71117166212534, + "grad_norm": 3.1067328453063965, + "learning_rate": 7.685652591027261e-06, + "loss": 0.1282, + "step": 21547 + }, + { + "epoch": 58.71389645776567, + "grad_norm": 2.9073550701141357, + "learning_rate": 7.6847940647539e-06, + "loss": 0.1454, + "step": 21548 + }, + { + "epoch": 58.716621253406, + "grad_norm": 3.7609846591949463, + "learning_rate": 7.683935556511287e-06, + "loss": 0.1043, + "step": 21549 + }, + { + "epoch": 58.71934604904632, + "grad_norm": 4.674740791320801, + "learning_rate": 7.68307706630611e-06, + "loss": 0.2425, + "step": 21550 + }, + { + "epoch": 58.72207084468665, + "grad_norm": 4.871628761291504, + "learning_rate": 7.682218594145052e-06, + "loss": 0.2236, + "step": 21551 + }, + { + "epoch": 58.724795640326974, + "grad_norm": 4.0654191970825195, + "learning_rate": 7.681360140034802e-06, + "loss": 0.1669, + "step": 21552 + }, + { + "epoch": 58.7275204359673, + "grad_norm": 3.182121992111206, + "learning_rate": 7.680501703982047e-06, + "loss": 0.1692, + "step": 21553 + }, + { + "epoch": 58.73024523160763, + "grad_norm": 4.811152458190918, + "learning_rate": 7.679643285993466e-06, + "loss": 0.1249, + "step": 21554 + }, + { + "epoch": 58.73297002724796, + "grad_norm": 3.7067596912384033, + "learning_rate": 7.678784886075753e-06, + "loss": 0.1163, + "step": 21555 + }, + { + "epoch": 58.735694822888284, + "grad_norm": 3.1542389392852783, + "learning_rate": 7.677926504235585e-06, + "loss": 0.0612, + "step": 21556 + }, + { + "epoch": 58.73841961852861, + "grad_norm": 3.0129261016845703, + "learning_rate": 7.677068140479654e-06, + "loss": 0.2432, + "step": 21557 + }, + { + "epoch": 58.741144414168936, + "grad_norm": 2.8790557384490967, + "learning_rate": 7.676209794814639e-06, + "loss": 0.0482, + "step": 21558 + }, + { + "epoch": 58.74386920980926, + "grad_norm": 3.94728946685791, + "learning_rate": 7.67535146724723e-06, + "loss": 0.0951, + "step": 21559 + }, + { + "epoch": 58.746594005449595, + "grad_norm": 3.058041572570801, + "learning_rate": 7.674493157784106e-06, + "loss": 0.1165, + "step": 21560 + }, + { + "epoch": 58.74931880108992, + "grad_norm": 3.3404855728149414, + "learning_rate": 7.673634866431955e-06, + "loss": 0.0721, + "step": 21561 + }, + { + "epoch": 58.752043596730246, + "grad_norm": 5.324344635009766, + "learning_rate": 7.672776593197463e-06, + "loss": 0.1768, + "step": 21562 + }, + { + "epoch": 58.75476839237057, + "grad_norm": 3.7187886238098145, + "learning_rate": 7.67191833808731e-06, + "loss": 0.0909, + "step": 21563 + }, + { + "epoch": 58.7574931880109, + "grad_norm": 5.002996444702148, + "learning_rate": 7.671060101108182e-06, + "loss": 0.0889, + "step": 21564 + }, + { + "epoch": 58.76021798365122, + "grad_norm": 3.5215115547180176, + "learning_rate": 7.670201882266764e-06, + "loss": 0.0895, + "step": 21565 + }, + { + "epoch": 58.762942779291556, + "grad_norm": 4.215787887573242, + "learning_rate": 7.669343681569737e-06, + "loss": 0.1413, + "step": 21566 + }, + { + "epoch": 58.76566757493188, + "grad_norm": 3.1859095096588135, + "learning_rate": 7.66848549902379e-06, + "loss": 0.1498, + "step": 21567 + }, + { + "epoch": 58.76839237057221, + "grad_norm": 3.565659284591675, + "learning_rate": 7.667627334635595e-06, + "loss": 0.0579, + "step": 21568 + }, + { + "epoch": 58.771117166212534, + "grad_norm": 3.4855968952178955, + "learning_rate": 7.666769188411848e-06, + "loss": 0.0735, + "step": 21569 + }, + { + "epoch": 58.77384196185286, + "grad_norm": 4.283398628234863, + "learning_rate": 7.665911060359228e-06, + "loss": 0.2532, + "step": 21570 + }, + { + "epoch": 58.776566757493185, + "grad_norm": 3.126268148422241, + "learning_rate": 7.66505295048442e-06, + "loss": 0.1428, + "step": 21571 + }, + { + "epoch": 58.77929155313352, + "grad_norm": 4.907703399658203, + "learning_rate": 7.6641948587941e-06, + "loss": 0.1766, + "step": 21572 + }, + { + "epoch": 58.782016348773844, + "grad_norm": 4.114948749542236, + "learning_rate": 7.663336785294959e-06, + "loss": 0.1095, + "step": 21573 + }, + { + "epoch": 58.78474114441417, + "grad_norm": 3.390493154525757, + "learning_rate": 7.662478729993673e-06, + "loss": 0.1895, + "step": 21574 + }, + { + "epoch": 58.787465940054496, + "grad_norm": 3.6392195224761963, + "learning_rate": 7.661620692896931e-06, + "loss": 0.114, + "step": 21575 + }, + { + "epoch": 58.79019073569482, + "grad_norm": 4.038777828216553, + "learning_rate": 7.660762674011408e-06, + "loss": 0.1706, + "step": 21576 + }, + { + "epoch": 58.79291553133515, + "grad_norm": 3.585653066635132, + "learning_rate": 7.659904673343793e-06, + "loss": 0.0877, + "step": 21577 + }, + { + "epoch": 58.79564032697548, + "grad_norm": 5.2134575843811035, + "learning_rate": 7.659046690900762e-06, + "loss": 0.1707, + "step": 21578 + }, + { + "epoch": 58.798365122615806, + "grad_norm": 3.6076905727386475, + "learning_rate": 7.658188726689003e-06, + "loss": 0.1078, + "step": 21579 + }, + { + "epoch": 58.80108991825613, + "grad_norm": 4.470366477966309, + "learning_rate": 7.657330780715193e-06, + "loss": 0.181, + "step": 21580 + }, + { + "epoch": 58.80381471389646, + "grad_norm": 3.638078451156616, + "learning_rate": 7.656472852986017e-06, + "loss": 0.1224, + "step": 21581 + }, + { + "epoch": 58.80653950953678, + "grad_norm": 3.5840208530426025, + "learning_rate": 7.655614943508153e-06, + "loss": 0.108, + "step": 21582 + }, + { + "epoch": 58.80926430517711, + "grad_norm": 6.398871421813965, + "learning_rate": 7.654757052288286e-06, + "loss": 0.0816, + "step": 21583 + }, + { + "epoch": 58.81198910081744, + "grad_norm": 3.523592472076416, + "learning_rate": 7.653899179333094e-06, + "loss": 0.1269, + "step": 21584 + }, + { + "epoch": 58.81471389645777, + "grad_norm": 4.927404403686523, + "learning_rate": 7.653041324649258e-06, + "loss": 0.066, + "step": 21585 + }, + { + "epoch": 58.817438692098094, + "grad_norm": 3.422100067138672, + "learning_rate": 7.652183488243465e-06, + "loss": 0.0608, + "step": 21586 + }, + { + "epoch": 58.82016348773842, + "grad_norm": 3.7407214641571045, + "learning_rate": 7.651325670122389e-06, + "loss": 0.0925, + "step": 21587 + }, + { + "epoch": 58.822888283378745, + "grad_norm": 3.263108968734741, + "learning_rate": 7.650467870292711e-06, + "loss": 0.0745, + "step": 21588 + }, + { + "epoch": 58.82561307901907, + "grad_norm": 4.6756815910339355, + "learning_rate": 7.649610088761117e-06, + "loss": 0.3144, + "step": 21589 + }, + { + "epoch": 58.828337874659404, + "grad_norm": 5.076279640197754, + "learning_rate": 7.648752325534283e-06, + "loss": 0.0882, + "step": 21590 + }, + { + "epoch": 58.83106267029973, + "grad_norm": 3.9108126163482666, + "learning_rate": 7.647894580618892e-06, + "loss": 0.0979, + "step": 21591 + }, + { + "epoch": 58.833787465940055, + "grad_norm": 3.7094666957855225, + "learning_rate": 7.64703685402162e-06, + "loss": 0.1617, + "step": 21592 + }, + { + "epoch": 58.83651226158038, + "grad_norm": 3.3642637729644775, + "learning_rate": 7.646179145749151e-06, + "loss": 0.0763, + "step": 21593 + }, + { + "epoch": 58.83923705722071, + "grad_norm": 4.531522750854492, + "learning_rate": 7.645321455808162e-06, + "loss": 0.1066, + "step": 21594 + }, + { + "epoch": 58.84196185286103, + "grad_norm": 3.2476766109466553, + "learning_rate": 7.644463784205335e-06, + "loss": 0.0698, + "step": 21595 + }, + { + "epoch": 58.844686648501366, + "grad_norm": 3.3269529342651367, + "learning_rate": 7.643606130947345e-06, + "loss": 0.0512, + "step": 21596 + }, + { + "epoch": 58.84741144414169, + "grad_norm": 3.5970005989074707, + "learning_rate": 7.64274849604088e-06, + "loss": 0.2536, + "step": 21597 + }, + { + "epoch": 58.85013623978202, + "grad_norm": 3.4453017711639404, + "learning_rate": 7.641890879492608e-06, + "loss": 0.0743, + "step": 21598 + }, + { + "epoch": 58.85286103542234, + "grad_norm": 4.354587554931641, + "learning_rate": 7.641033281309219e-06, + "loss": 0.1206, + "step": 21599 + }, + { + "epoch": 58.85558583106267, + "grad_norm": 3.3186676502227783, + "learning_rate": 7.640175701497383e-06, + "loss": 0.065, + "step": 21600 + }, + { + "epoch": 58.858310626702995, + "grad_norm": 4.4106950759887695, + "learning_rate": 7.639318140063785e-06, + "loss": 0.0593, + "step": 21601 + }, + { + "epoch": 58.86103542234333, + "grad_norm": 3.0654456615448, + "learning_rate": 7.638460597015097e-06, + "loss": 0.0836, + "step": 21602 + }, + { + "epoch": 58.86376021798365, + "grad_norm": 3.552016258239746, + "learning_rate": 7.637603072358004e-06, + "loss": 0.122, + "step": 21603 + }, + { + "epoch": 58.86648501362398, + "grad_norm": 6.45775032043457, + "learning_rate": 7.636745566099185e-06, + "loss": 0.1001, + "step": 21604 + }, + { + "epoch": 58.869209809264305, + "grad_norm": 3.066519260406494, + "learning_rate": 7.635888078245312e-06, + "loss": 0.1041, + "step": 21605 + }, + { + "epoch": 58.87193460490463, + "grad_norm": 3.6877498626708984, + "learning_rate": 7.635030608803072e-06, + "loss": 0.0741, + "step": 21606 + }, + { + "epoch": 58.87465940054496, + "grad_norm": 4.111044883728027, + "learning_rate": 7.634173157779133e-06, + "loss": 0.3042, + "step": 21607 + }, + { + "epoch": 58.87738419618529, + "grad_norm": 3.6182291507720947, + "learning_rate": 7.633315725180178e-06, + "loss": 0.0835, + "step": 21608 + }, + { + "epoch": 58.880108991825615, + "grad_norm": 2.8847904205322266, + "learning_rate": 7.632458311012884e-06, + "loss": 0.1888, + "step": 21609 + }, + { + "epoch": 58.88283378746594, + "grad_norm": 3.524197816848755, + "learning_rate": 7.63160091528393e-06, + "loss": 0.091, + "step": 21610 + }, + { + "epoch": 58.88555858310627, + "grad_norm": 3.9682729244232178, + "learning_rate": 7.630743537999989e-06, + "loss": 0.0787, + "step": 21611 + }, + { + "epoch": 58.88828337874659, + "grad_norm": 3.8259661197662354, + "learning_rate": 7.629886179167743e-06, + "loss": 0.1559, + "step": 21612 + }, + { + "epoch": 58.89100817438692, + "grad_norm": 3.9684224128723145, + "learning_rate": 7.629028838793867e-06, + "loss": 0.1177, + "step": 21613 + }, + { + "epoch": 58.89373297002725, + "grad_norm": 4.789135456085205, + "learning_rate": 7.6281715168850364e-06, + "loss": 0.0941, + "step": 21614 + }, + { + "epoch": 58.89645776566758, + "grad_norm": 6.84328556060791, + "learning_rate": 7.6273142134479335e-06, + "loss": 0.1571, + "step": 21615 + }, + { + "epoch": 58.8991825613079, + "grad_norm": 3.524958848953247, + "learning_rate": 7.626456928489228e-06, + "loss": 0.0701, + "step": 21616 + }, + { + "epoch": 58.90190735694823, + "grad_norm": 3.621579885482788, + "learning_rate": 7.625599662015602e-06, + "loss": 0.1075, + "step": 21617 + }, + { + "epoch": 58.904632152588555, + "grad_norm": 3.4036946296691895, + "learning_rate": 7.624742414033725e-06, + "loss": 0.1193, + "step": 21618 + }, + { + "epoch": 58.90735694822888, + "grad_norm": 5.28678560256958, + "learning_rate": 7.623885184550283e-06, + "loss": 0.1419, + "step": 21619 + }, + { + "epoch": 58.91008174386921, + "grad_norm": 4.394040107727051, + "learning_rate": 7.6230279735719415e-06, + "loss": 0.1415, + "step": 21620 + }, + { + "epoch": 58.91280653950954, + "grad_norm": 4.134680271148682, + "learning_rate": 7.622170781105382e-06, + "loss": 0.1504, + "step": 21621 + }, + { + "epoch": 58.915531335149865, + "grad_norm": 3.1160125732421875, + "learning_rate": 7.621313607157285e-06, + "loss": 0.1596, + "step": 21622 + }, + { + "epoch": 58.91825613079019, + "grad_norm": 3.513460636138916, + "learning_rate": 7.620456451734317e-06, + "loss": 0.1005, + "step": 21623 + }, + { + "epoch": 58.920980926430516, + "grad_norm": 3.427602767944336, + "learning_rate": 7.61959931484316e-06, + "loss": 0.0597, + "step": 21624 + }, + { + "epoch": 58.92370572207084, + "grad_norm": 4.323990345001221, + "learning_rate": 7.618742196490485e-06, + "loss": 0.1795, + "step": 21625 + }, + { + "epoch": 58.926430517711175, + "grad_norm": 2.7273409366607666, + "learning_rate": 7.617885096682971e-06, + "loss": 0.2101, + "step": 21626 + }, + { + "epoch": 58.9291553133515, + "grad_norm": 4.046576499938965, + "learning_rate": 7.617028015427289e-06, + "loss": 0.0985, + "step": 21627 + }, + { + "epoch": 58.93188010899183, + "grad_norm": 3.4946789741516113, + "learning_rate": 7.616170952730118e-06, + "loss": 0.1829, + "step": 21628 + }, + { + "epoch": 58.93460490463215, + "grad_norm": 5.407798767089844, + "learning_rate": 7.6153139085981296e-06, + "loss": 0.2557, + "step": 21629 + }, + { + "epoch": 58.93732970027248, + "grad_norm": 3.398526430130005, + "learning_rate": 7.614456883038001e-06, + "loss": 0.0642, + "step": 21630 + }, + { + "epoch": 58.940054495912804, + "grad_norm": 3.662095069885254, + "learning_rate": 7.613599876056404e-06, + "loss": 0.1326, + "step": 21631 + }, + { + "epoch": 58.94277929155314, + "grad_norm": 3.950141191482544, + "learning_rate": 7.612742887660016e-06, + "loss": 0.1051, + "step": 21632 + }, + { + "epoch": 58.94550408719346, + "grad_norm": 2.7301089763641357, + "learning_rate": 7.611885917855508e-06, + "loss": 0.0519, + "step": 21633 + }, + { + "epoch": 58.94822888283379, + "grad_norm": 3.6168124675750732, + "learning_rate": 7.611028966649555e-06, + "loss": 0.096, + "step": 21634 + }, + { + "epoch": 58.950953678474114, + "grad_norm": 5.342549800872803, + "learning_rate": 7.610172034048835e-06, + "loss": 0.136, + "step": 21635 + }, + { + "epoch": 58.95367847411444, + "grad_norm": 2.9107892513275146, + "learning_rate": 7.609315120060015e-06, + "loss": 0.0935, + "step": 21636 + }, + { + "epoch": 58.956403269754766, + "grad_norm": 3.528442859649658, + "learning_rate": 7.60845822468977e-06, + "loss": 0.0686, + "step": 21637 + }, + { + "epoch": 58.95912806539509, + "grad_norm": 4.349478721618652, + "learning_rate": 7.6076013479447786e-06, + "loss": 0.1161, + "step": 21638 + }, + { + "epoch": 58.961852861035425, + "grad_norm": 3.902848958969116, + "learning_rate": 7.60674448983171e-06, + "loss": 0.1102, + "step": 21639 + }, + { + "epoch": 58.96457765667575, + "grad_norm": 2.843625545501709, + "learning_rate": 7.60588765035724e-06, + "loss": 0.0689, + "step": 21640 + }, + { + "epoch": 58.967302452316076, + "grad_norm": 3.7142114639282227, + "learning_rate": 7.605030829528037e-06, + "loss": 0.1922, + "step": 21641 + }, + { + "epoch": 58.9700272479564, + "grad_norm": 2.9767210483551025, + "learning_rate": 7.60417402735078e-06, + "loss": 0.0972, + "step": 21642 + }, + { + "epoch": 58.97275204359673, + "grad_norm": 3.785778284072876, + "learning_rate": 7.603317243832137e-06, + "loss": 0.1285, + "step": 21643 + }, + { + "epoch": 58.97547683923706, + "grad_norm": 4.361304759979248, + "learning_rate": 7.6024604789787835e-06, + "loss": 0.0826, + "step": 21644 + }, + { + "epoch": 58.97820163487739, + "grad_norm": 3.8239848613739014, + "learning_rate": 7.601603732797389e-06, + "loss": 0.1777, + "step": 21645 + }, + { + "epoch": 58.98092643051771, + "grad_norm": 4.224652290344238, + "learning_rate": 7.600747005294629e-06, + "loss": 0.0697, + "step": 21646 + }, + { + "epoch": 58.98365122615804, + "grad_norm": 4.886425971984863, + "learning_rate": 7.599890296477171e-06, + "loss": 0.1468, + "step": 21647 + }, + { + "epoch": 58.986376021798364, + "grad_norm": 4.023881435394287, + "learning_rate": 7.599033606351694e-06, + "loss": 0.0609, + "step": 21648 + }, + { + "epoch": 58.98910081743869, + "grad_norm": 2.9752514362335205, + "learning_rate": 7.598176934924863e-06, + "loss": 0.1779, + "step": 21649 + }, + { + "epoch": 58.991825613079016, + "grad_norm": 5.338901042938232, + "learning_rate": 7.5973202822033554e-06, + "loss": 0.1998, + "step": 21650 + }, + { + "epoch": 58.99455040871935, + "grad_norm": 3.1338915824890137, + "learning_rate": 7.596463648193837e-06, + "loss": 0.1939, + "step": 21651 + }, + { + "epoch": 58.997275204359674, + "grad_norm": 4.405067443847656, + "learning_rate": 7.595607032902985e-06, + "loss": 0.1446, + "step": 21652 + }, + { + "epoch": 59.0, + "grad_norm": 2.0436484813690186, + "learning_rate": 7.594750436337467e-06, + "loss": 0.0406, + "step": 21653 + }, + { + "epoch": 59.002724795640326, + "grad_norm": 3.777146577835083, + "learning_rate": 7.593893858503951e-06, + "loss": 0.0633, + "step": 21654 + }, + { + "epoch": 59.00544959128065, + "grad_norm": 4.3965325355529785, + "learning_rate": 7.593037299409116e-06, + "loss": 0.0934, + "step": 21655 + }, + { + "epoch": 59.00817438692098, + "grad_norm": 4.872261047363281, + "learning_rate": 7.592180759059631e-06, + "loss": 0.0787, + "step": 21656 + }, + { + "epoch": 59.01089918256131, + "grad_norm": 2.4931423664093018, + "learning_rate": 7.591324237462162e-06, + "loss": 0.0901, + "step": 21657 + }, + { + "epoch": 59.013623978201636, + "grad_norm": 3.5393104553222656, + "learning_rate": 7.5904677346233845e-06, + "loss": 0.1323, + "step": 21658 + }, + { + "epoch": 59.01634877384196, + "grad_norm": 2.8393118381500244, + "learning_rate": 7.589611250549965e-06, + "loss": 0.0628, + "step": 21659 + }, + { + "epoch": 59.01907356948229, + "grad_norm": 3.608720541000366, + "learning_rate": 7.588754785248578e-06, + "loss": 0.1887, + "step": 21660 + }, + { + "epoch": 59.02179836512261, + "grad_norm": 2.7257919311523438, + "learning_rate": 7.587898338725887e-06, + "loss": 0.052, + "step": 21661 + }, + { + "epoch": 59.02452316076294, + "grad_norm": 5.552196979522705, + "learning_rate": 7.587041910988571e-06, + "loss": 0.0633, + "step": 21662 + }, + { + "epoch": 59.02724795640327, + "grad_norm": 3.2473134994506836, + "learning_rate": 7.586185502043291e-06, + "loss": 0.0936, + "step": 21663 + }, + { + "epoch": 59.0299727520436, + "grad_norm": 3.7006382942199707, + "learning_rate": 7.5853291118967236e-06, + "loss": 0.061, + "step": 21664 + }, + { + "epoch": 59.032697547683924, + "grad_norm": 3.480757474899292, + "learning_rate": 7.584472740555533e-06, + "loss": 0.0865, + "step": 21665 + }, + { + "epoch": 59.03542234332425, + "grad_norm": 4.306460857391357, + "learning_rate": 7.583616388026392e-06, + "loss": 0.0588, + "step": 21666 + }, + { + "epoch": 59.038147138964575, + "grad_norm": 3.5792856216430664, + "learning_rate": 7.582760054315968e-06, + "loss": 0.1445, + "step": 21667 + }, + { + "epoch": 59.0408719346049, + "grad_norm": 3.097454786300659, + "learning_rate": 7.5819037394309326e-06, + "loss": 0.121, + "step": 21668 + }, + { + "epoch": 59.043596730245234, + "grad_norm": 3.4855430126190186, + "learning_rate": 7.581047443377951e-06, + "loss": 0.0504, + "step": 21669 + }, + { + "epoch": 59.04632152588556, + "grad_norm": 3.136826753616333, + "learning_rate": 7.580191166163696e-06, + "loss": 0.1283, + "step": 21670 + }, + { + "epoch": 59.049046321525886, + "grad_norm": 3.7873098850250244, + "learning_rate": 7.5793349077948296e-06, + "loss": 0.0774, + "step": 21671 + }, + { + "epoch": 59.05177111716621, + "grad_norm": 2.9616713523864746, + "learning_rate": 7.578478668278029e-06, + "loss": 0.0621, + "step": 21672 + }, + { + "epoch": 59.05449591280654, + "grad_norm": 3.8275697231292725, + "learning_rate": 7.5776224476199585e-06, + "loss": 0.1353, + "step": 21673 + }, + { + "epoch": 59.05722070844686, + "grad_norm": 3.3241209983825684, + "learning_rate": 7.576766245827285e-06, + "loss": 0.059, + "step": 21674 + }, + { + "epoch": 59.059945504087196, + "grad_norm": 2.50747013092041, + "learning_rate": 7.5759100629066785e-06, + "loss": 0.1116, + "step": 21675 + }, + { + "epoch": 59.06267029972752, + "grad_norm": 3.2242865562438965, + "learning_rate": 7.575053898864808e-06, + "loss": 0.0873, + "step": 21676 + }, + { + "epoch": 59.06539509536785, + "grad_norm": 3.4980032444000244, + "learning_rate": 7.574197753708339e-06, + "loss": 0.1898, + "step": 21677 + }, + { + "epoch": 59.06811989100817, + "grad_norm": 4.965635776519775, + "learning_rate": 7.57334162744394e-06, + "loss": 0.1019, + "step": 21678 + }, + { + "epoch": 59.0708446866485, + "grad_norm": 3.2334609031677246, + "learning_rate": 7.572485520078277e-06, + "loss": 0.0603, + "step": 21679 + }, + { + "epoch": 59.073569482288825, + "grad_norm": 3.3962340354919434, + "learning_rate": 7.571629431618021e-06, + "loss": 0.2385, + "step": 21680 + }, + { + "epoch": 59.07629427792916, + "grad_norm": 2.7325992584228516, + "learning_rate": 7.570773362069835e-06, + "loss": 0.0608, + "step": 21681 + }, + { + "epoch": 59.079019073569484, + "grad_norm": 3.219993829727173, + "learning_rate": 7.569917311440389e-06, + "loss": 0.0719, + "step": 21682 + }, + { + "epoch": 59.08174386920981, + "grad_norm": 2.691089630126953, + "learning_rate": 7.569061279736347e-06, + "loss": 0.0976, + "step": 21683 + }, + { + "epoch": 59.084468664850135, + "grad_norm": 4.899687767028809, + "learning_rate": 7.568205266964379e-06, + "loss": 0.1574, + "step": 21684 + }, + { + "epoch": 59.08719346049046, + "grad_norm": 4.418859958648682, + "learning_rate": 7.567349273131149e-06, + "loss": 0.2519, + "step": 21685 + }, + { + "epoch": 59.08991825613079, + "grad_norm": 3.6111385822296143, + "learning_rate": 7.566493298243327e-06, + "loss": 0.0763, + "step": 21686 + }, + { + "epoch": 59.09264305177112, + "grad_norm": 2.2135980129241943, + "learning_rate": 7.565637342307574e-06, + "loss": 0.0471, + "step": 21687 + }, + { + "epoch": 59.095367847411445, + "grad_norm": 3.797297716140747, + "learning_rate": 7.5647814053305565e-06, + "loss": 0.0653, + "step": 21688 + }, + { + "epoch": 59.09809264305177, + "grad_norm": 3.493048667907715, + "learning_rate": 7.563925487318948e-06, + "loss": 0.058, + "step": 21689 + }, + { + "epoch": 59.1008174386921, + "grad_norm": 3.347757339477539, + "learning_rate": 7.563069588279407e-06, + "loss": 0.0806, + "step": 21690 + }, + { + "epoch": 59.10354223433242, + "grad_norm": 3.1683833599090576, + "learning_rate": 7.562213708218604e-06, + "loss": 0.0761, + "step": 21691 + }, + { + "epoch": 59.10626702997275, + "grad_norm": 3.5190916061401367, + "learning_rate": 7.5613578471432e-06, + "loss": 0.0521, + "step": 21692 + }, + { + "epoch": 59.10899182561308, + "grad_norm": 4.314681529998779, + "learning_rate": 7.560502005059864e-06, + "loss": 0.0595, + "step": 21693 + }, + { + "epoch": 59.11171662125341, + "grad_norm": 5.3859758377075195, + "learning_rate": 7.559646181975259e-06, + "loss": 0.2263, + "step": 21694 + }, + { + "epoch": 59.11444141689373, + "grad_norm": 3.3791892528533936, + "learning_rate": 7.558790377896052e-06, + "loss": 0.1202, + "step": 21695 + }, + { + "epoch": 59.11716621253406, + "grad_norm": 3.9917123317718506, + "learning_rate": 7.557934592828906e-06, + "loss": 0.0982, + "step": 21696 + }, + { + "epoch": 59.119891008174385, + "grad_norm": 3.4781248569488525, + "learning_rate": 7.557078826780488e-06, + "loss": 0.1791, + "step": 21697 + }, + { + "epoch": 59.12261580381471, + "grad_norm": 3.8536505699157715, + "learning_rate": 7.5562230797574585e-06, + "loss": 0.096, + "step": 21698 + }, + { + "epoch": 59.12534059945504, + "grad_norm": 4.126902103424072, + "learning_rate": 7.555367351766487e-06, + "loss": 0.0674, + "step": 21699 + }, + { + "epoch": 59.12806539509537, + "grad_norm": 4.913824558258057, + "learning_rate": 7.5545116428142375e-06, + "loss": 0.0651, + "step": 21700 + }, + { + "epoch": 59.130790190735695, + "grad_norm": 3.8185019493103027, + "learning_rate": 7.553655952907369e-06, + "loss": 0.0649, + "step": 21701 + }, + { + "epoch": 59.13351498637602, + "grad_norm": 3.033230781555176, + "learning_rate": 7.552800282052552e-06, + "loss": 0.0725, + "step": 21702 + }, + { + "epoch": 59.13623978201635, + "grad_norm": 3.427907943725586, + "learning_rate": 7.551944630256447e-06, + "loss": 0.1338, + "step": 21703 + }, + { + "epoch": 59.13896457765667, + "grad_norm": 3.5687830448150635, + "learning_rate": 7.55108899752572e-06, + "loss": 0.243, + "step": 21704 + }, + { + "epoch": 59.141689373297005, + "grad_norm": 4.709448337554932, + "learning_rate": 7.5502333838670295e-06, + "loss": 0.3231, + "step": 21705 + }, + { + "epoch": 59.14441416893733, + "grad_norm": 2.8295841217041016, + "learning_rate": 7.5493777892870416e-06, + "loss": 0.1049, + "step": 21706 + }, + { + "epoch": 59.14713896457766, + "grad_norm": 5.204916954040527, + "learning_rate": 7.548522213792424e-06, + "loss": 0.0607, + "step": 21707 + }, + { + "epoch": 59.14986376021798, + "grad_norm": 3.4823975563049316, + "learning_rate": 7.547666657389836e-06, + "loss": 0.1337, + "step": 21708 + }, + { + "epoch": 59.15258855585831, + "grad_norm": 3.985304117202759, + "learning_rate": 7.546811120085942e-06, + "loss": 0.0356, + "step": 21709 + }, + { + "epoch": 59.155313351498634, + "grad_norm": 3.720289945602417, + "learning_rate": 7.545955601887402e-06, + "loss": 0.066, + "step": 21710 + }, + { + "epoch": 59.15803814713897, + "grad_norm": 3.5102925300598145, + "learning_rate": 7.545100102800883e-06, + "loss": 0.1042, + "step": 21711 + }, + { + "epoch": 59.16076294277929, + "grad_norm": 2.699995279312134, + "learning_rate": 7.544244622833043e-06, + "loss": 0.0558, + "step": 21712 + }, + { + "epoch": 59.16348773841962, + "grad_norm": 5.10889196395874, + "learning_rate": 7.5433891619905496e-06, + "loss": 0.1035, + "step": 21713 + }, + { + "epoch": 59.166212534059945, + "grad_norm": 3.469667673110962, + "learning_rate": 7.542533720280061e-06, + "loss": 0.0737, + "step": 21714 + }, + { + "epoch": 59.16893732970027, + "grad_norm": 3.9109909534454346, + "learning_rate": 7.541678297708241e-06, + "loss": 0.1187, + "step": 21715 + }, + { + "epoch": 59.171662125340596, + "grad_norm": 6.658548355102539, + "learning_rate": 7.5408228942817495e-06, + "loss": 0.0556, + "step": 21716 + }, + { + "epoch": 59.17438692098093, + "grad_norm": 3.173408031463623, + "learning_rate": 7.539967510007253e-06, + "loss": 0.0692, + "step": 21717 + }, + { + "epoch": 59.177111716621255, + "grad_norm": 4.470581531524658, + "learning_rate": 7.5391121448914085e-06, + "loss": 0.2408, + "step": 21718 + }, + { + "epoch": 59.17983651226158, + "grad_norm": 3.0410196781158447, + "learning_rate": 7.5382567989408805e-06, + "loss": 0.1242, + "step": 21719 + }, + { + "epoch": 59.182561307901906, + "grad_norm": 3.175139904022217, + "learning_rate": 7.537401472162328e-06, + "loss": 0.0443, + "step": 21720 + }, + { + "epoch": 59.18528610354223, + "grad_norm": 4.160188674926758, + "learning_rate": 7.536546164562413e-06, + "loss": 0.0828, + "step": 21721 + }, + { + "epoch": 59.18801089918256, + "grad_norm": 3.967879056930542, + "learning_rate": 7.5356908761478e-06, + "loss": 0.147, + "step": 21722 + }, + { + "epoch": 59.19073569482289, + "grad_norm": 3.446207284927368, + "learning_rate": 7.534835606925141e-06, + "loss": 0.1565, + "step": 21723 + }, + { + "epoch": 59.19346049046322, + "grad_norm": 4.34999418258667, + "learning_rate": 7.533980356901107e-06, + "loss": 0.0983, + "step": 21724 + }, + { + "epoch": 59.19618528610354, + "grad_norm": 3.562150716781616, + "learning_rate": 7.533125126082357e-06, + "loss": 0.1047, + "step": 21725 + }, + { + "epoch": 59.19891008174387, + "grad_norm": 3.700178384780884, + "learning_rate": 7.532269914475546e-06, + "loss": 0.2572, + "step": 21726 + }, + { + "epoch": 59.201634877384194, + "grad_norm": 8.654916763305664, + "learning_rate": 7.53141472208734e-06, + "loss": 0.1077, + "step": 21727 + }, + { + "epoch": 59.20435967302452, + "grad_norm": 4.667231559753418, + "learning_rate": 7.530559548924395e-06, + "loss": 0.0829, + "step": 21728 + }, + { + "epoch": 59.20708446866485, + "grad_norm": 3.4512836933135986, + "learning_rate": 7.529704394993374e-06, + "loss": 0.0853, + "step": 21729 + }, + { + "epoch": 59.20980926430518, + "grad_norm": 3.270360231399536, + "learning_rate": 7.528849260300933e-06, + "loss": 0.057, + "step": 21730 + }, + { + "epoch": 59.212534059945504, + "grad_norm": 3.6670432090759277, + "learning_rate": 7.527994144853738e-06, + "loss": 0.2495, + "step": 21731 + }, + { + "epoch": 59.21525885558583, + "grad_norm": 3.787236213684082, + "learning_rate": 7.5271390486584416e-06, + "loss": 0.0844, + "step": 21732 + }, + { + "epoch": 59.217983651226156, + "grad_norm": 4.844411849975586, + "learning_rate": 7.526283971721711e-06, + "loss": 0.2772, + "step": 21733 + }, + { + "epoch": 59.22070844686648, + "grad_norm": 5.151246070861816, + "learning_rate": 7.5254289140501965e-06, + "loss": 0.2213, + "step": 21734 + }, + { + "epoch": 59.223433242506815, + "grad_norm": 3.862370491027832, + "learning_rate": 7.524573875650565e-06, + "loss": 0.0471, + "step": 21735 + }, + { + "epoch": 59.22615803814714, + "grad_norm": 3.706761360168457, + "learning_rate": 7.523718856529471e-06, + "loss": 0.0729, + "step": 21736 + }, + { + "epoch": 59.228882833787466, + "grad_norm": 3.490652561187744, + "learning_rate": 7.522863856693577e-06, + "loss": 0.2747, + "step": 21737 + }, + { + "epoch": 59.23160762942779, + "grad_norm": 4.000617980957031, + "learning_rate": 7.522008876149537e-06, + "loss": 0.0969, + "step": 21738 + }, + { + "epoch": 59.23433242506812, + "grad_norm": 4.829466819763184, + "learning_rate": 7.521153914904013e-06, + "loss": 0.1152, + "step": 21739 + }, + { + "epoch": 59.237057220708444, + "grad_norm": 3.3655080795288086, + "learning_rate": 7.520298972963657e-06, + "loss": 0.1643, + "step": 21740 + }, + { + "epoch": 59.23978201634878, + "grad_norm": 3.153468132019043, + "learning_rate": 7.51944405033514e-06, + "loss": 0.0683, + "step": 21741 + }, + { + "epoch": 59.2425068119891, + "grad_norm": 5.982385635375977, + "learning_rate": 7.51858914702511e-06, + "loss": 0.1112, + "step": 21742 + }, + { + "epoch": 59.24523160762943, + "grad_norm": 3.087956666946411, + "learning_rate": 7.517734263040232e-06, + "loss": 0.0805, + "step": 21743 + }, + { + "epoch": 59.247956403269754, + "grad_norm": 5.980727195739746, + "learning_rate": 7.516879398387156e-06, + "loss": 0.1112, + "step": 21744 + }, + { + "epoch": 59.25068119891008, + "grad_norm": 4.207536697387695, + "learning_rate": 7.516024553072545e-06, + "loss": 0.0576, + "step": 21745 + }, + { + "epoch": 59.253405994550405, + "grad_norm": 3.840688943862915, + "learning_rate": 7.515169727103052e-06, + "loss": 0.1398, + "step": 21746 + }, + { + "epoch": 59.25613079019074, + "grad_norm": 2.959146738052368, + "learning_rate": 7.514314920485341e-06, + "loss": 0.1536, + "step": 21747 + }, + { + "epoch": 59.258855585831064, + "grad_norm": 4.634994029998779, + "learning_rate": 7.513460133226062e-06, + "loss": 0.0914, + "step": 21748 + }, + { + "epoch": 59.26158038147139, + "grad_norm": 2.8339734077453613, + "learning_rate": 7.512605365331878e-06, + "loss": 0.1018, + "step": 21749 + }, + { + "epoch": 59.264305177111716, + "grad_norm": 2.8966667652130127, + "learning_rate": 7.511750616809443e-06, + "loss": 0.0798, + "step": 21750 + }, + { + "epoch": 59.26702997275204, + "grad_norm": 4.672469615936279, + "learning_rate": 7.510895887665413e-06, + "loss": 0.1637, + "step": 21751 + }, + { + "epoch": 59.26975476839237, + "grad_norm": 2.795789957046509, + "learning_rate": 7.510041177906446e-06, + "loss": 0.0714, + "step": 21752 + }, + { + "epoch": 59.2724795640327, + "grad_norm": 4.427687644958496, + "learning_rate": 7.5091864875392e-06, + "loss": 0.1869, + "step": 21753 + }, + { + "epoch": 59.275204359673026, + "grad_norm": 3.7736551761627197, + "learning_rate": 7.508331816570327e-06, + "loss": 0.0782, + "step": 21754 + }, + { + "epoch": 59.27792915531335, + "grad_norm": 5.1422224044799805, + "learning_rate": 7.507477165006487e-06, + "loss": 0.0795, + "step": 21755 + }, + { + "epoch": 59.28065395095368, + "grad_norm": 4.449389934539795, + "learning_rate": 7.506622532854333e-06, + "loss": 0.219, + "step": 21756 + }, + { + "epoch": 59.283378746594, + "grad_norm": 3.5036587715148926, + "learning_rate": 7.50576792012052e-06, + "loss": 0.0755, + "step": 21757 + }, + { + "epoch": 59.28610354223433, + "grad_norm": 3.461836576461792, + "learning_rate": 7.504913326811711e-06, + "loss": 0.1001, + "step": 21758 + }, + { + "epoch": 59.28882833787466, + "grad_norm": 3.3612518310546875, + "learning_rate": 7.504058752934555e-06, + "loss": 0.0488, + "step": 21759 + }, + { + "epoch": 59.29155313351499, + "grad_norm": 3.089484214782715, + "learning_rate": 7.5032041984957106e-06, + "loss": 0.0509, + "step": 21760 + }, + { + "epoch": 59.294277929155314, + "grad_norm": 3.250932455062866, + "learning_rate": 7.502349663501829e-06, + "loss": 0.0917, + "step": 21761 + }, + { + "epoch": 59.29700272479564, + "grad_norm": 3.6009373664855957, + "learning_rate": 7.5014951479595684e-06, + "loss": 0.0587, + "step": 21762 + }, + { + "epoch": 59.299727520435965, + "grad_norm": 4.550698280334473, + "learning_rate": 7.5006406518755856e-06, + "loss": 0.0628, + "step": 21763 + }, + { + "epoch": 59.30245231607629, + "grad_norm": 9.64401912689209, + "learning_rate": 7.499786175256531e-06, + "loss": 0.1326, + "step": 21764 + }, + { + "epoch": 59.305177111716624, + "grad_norm": 2.655383586883545, + "learning_rate": 7.498931718109063e-06, + "loss": 0.0938, + "step": 21765 + }, + { + "epoch": 59.30790190735695, + "grad_norm": 4.906900882720947, + "learning_rate": 7.49807728043983e-06, + "loss": 0.0627, + "step": 21766 + }, + { + "epoch": 59.310626702997276, + "grad_norm": 3.091667413711548, + "learning_rate": 7.497222862255496e-06, + "loss": 0.0704, + "step": 21767 + }, + { + "epoch": 59.3133514986376, + "grad_norm": 5.284510612487793, + "learning_rate": 7.496368463562706e-06, + "loss": 0.1104, + "step": 21768 + }, + { + "epoch": 59.31607629427793, + "grad_norm": 2.9647274017333984, + "learning_rate": 7.495514084368121e-06, + "loss": 0.0474, + "step": 21769 + }, + { + "epoch": 59.31880108991825, + "grad_norm": 3.8396527767181396, + "learning_rate": 7.494659724678388e-06, + "loss": 0.0631, + "step": 21770 + }, + { + "epoch": 59.321525885558586, + "grad_norm": 3.168015956878662, + "learning_rate": 7.493805384500168e-06, + "loss": 0.1236, + "step": 21771 + }, + { + "epoch": 59.32425068119891, + "grad_norm": 9.776162147521973, + "learning_rate": 7.492951063840109e-06, + "loss": 0.119, + "step": 21772 + }, + { + "epoch": 59.32697547683924, + "grad_norm": 5.564446449279785, + "learning_rate": 7.492096762704868e-06, + "loss": 0.2097, + "step": 21773 + }, + { + "epoch": 59.32970027247956, + "grad_norm": 3.545588254928589, + "learning_rate": 7.491242481101091e-06, + "loss": 0.0916, + "step": 21774 + }, + { + "epoch": 59.33242506811989, + "grad_norm": 3.705561876296997, + "learning_rate": 7.490388219035441e-06, + "loss": 0.1592, + "step": 21775 + }, + { + "epoch": 59.335149863760215, + "grad_norm": 4.552818298339844, + "learning_rate": 7.489533976514568e-06, + "loss": 0.0495, + "step": 21776 + }, + { + "epoch": 59.33787465940055, + "grad_norm": 4.008409023284912, + "learning_rate": 7.488679753545121e-06, + "loss": 0.0848, + "step": 21777 + }, + { + "epoch": 59.34059945504087, + "grad_norm": 4.364948749542236, + "learning_rate": 7.487825550133759e-06, + "loss": 0.0598, + "step": 21778 + }, + { + "epoch": 59.3433242506812, + "grad_norm": 3.707984209060669, + "learning_rate": 7.486971366287128e-06, + "loss": 0.1673, + "step": 21779 + }, + { + "epoch": 59.346049046321525, + "grad_norm": 3.483253002166748, + "learning_rate": 7.4861172020118844e-06, + "loss": 0.0927, + "step": 21780 + }, + { + "epoch": 59.34877384196185, + "grad_norm": 3.4793434143066406, + "learning_rate": 7.485263057314678e-06, + "loss": 0.0881, + "step": 21781 + }, + { + "epoch": 59.35149863760218, + "grad_norm": 3.1901800632476807, + "learning_rate": 7.484408932202163e-06, + "loss": 0.1949, + "step": 21782 + }, + { + "epoch": 59.35422343324251, + "grad_norm": 3.7107465267181396, + "learning_rate": 7.483554826680989e-06, + "loss": 0.1693, + "step": 21783 + }, + { + "epoch": 59.356948228882835, + "grad_norm": 4.341519355773926, + "learning_rate": 7.482700740757811e-06, + "loss": 0.1126, + "step": 21784 + }, + { + "epoch": 59.35967302452316, + "grad_norm": 3.539825201034546, + "learning_rate": 7.481846674439276e-06, + "loss": 0.0811, + "step": 21785 + }, + { + "epoch": 59.36239782016349, + "grad_norm": 2.9512150287628174, + "learning_rate": 7.480992627732038e-06, + "loss": 0.1052, + "step": 21786 + }, + { + "epoch": 59.36512261580381, + "grad_norm": 4.722318172454834, + "learning_rate": 7.4801386006427515e-06, + "loss": 0.0778, + "step": 21787 + }, + { + "epoch": 59.36784741144414, + "grad_norm": 3.9388997554779053, + "learning_rate": 7.479284593178061e-06, + "loss": 0.119, + "step": 21788 + }, + { + "epoch": 59.37057220708447, + "grad_norm": 5.726805686950684, + "learning_rate": 7.478430605344624e-06, + "loss": 0.1978, + "step": 21789 + }, + { + "epoch": 59.3732970027248, + "grad_norm": 4.962177276611328, + "learning_rate": 7.477576637149086e-06, + "loss": 0.1384, + "step": 21790 + }, + { + "epoch": 59.37602179836512, + "grad_norm": 2.873889446258545, + "learning_rate": 7.476722688598102e-06, + "loss": 0.0598, + "step": 21791 + }, + { + "epoch": 59.37874659400545, + "grad_norm": 3.9591760635375977, + "learning_rate": 7.475868759698317e-06, + "loss": 0.2101, + "step": 21792 + }, + { + "epoch": 59.381471389645775, + "grad_norm": 3.4086108207702637, + "learning_rate": 7.4750148504563855e-06, + "loss": 0.1091, + "step": 21793 + }, + { + "epoch": 59.3841961852861, + "grad_norm": 4.699950695037842, + "learning_rate": 7.47416096087896e-06, + "loss": 0.206, + "step": 21794 + }, + { + "epoch": 59.38692098092643, + "grad_norm": 2.7233259677886963, + "learning_rate": 7.473307090972685e-06, + "loss": 0.0496, + "step": 21795 + }, + { + "epoch": 59.38964577656676, + "grad_norm": 4.428097724914551, + "learning_rate": 7.4724532407442165e-06, + "loss": 0.1381, + "step": 21796 + }, + { + "epoch": 59.392370572207085, + "grad_norm": 4.300647258758545, + "learning_rate": 7.471599410200198e-06, + "loss": 0.2477, + "step": 21797 + }, + { + "epoch": 59.39509536784741, + "grad_norm": 3.2388229370117188, + "learning_rate": 7.470745599347285e-06, + "loss": 0.0697, + "step": 21798 + }, + { + "epoch": 59.39782016348774, + "grad_norm": 3.206294059753418, + "learning_rate": 7.46989180819212e-06, + "loss": 0.0859, + "step": 21799 + }, + { + "epoch": 59.40054495912806, + "grad_norm": 3.8222544193267822, + "learning_rate": 7.469038036741358e-06, + "loss": 0.1102, + "step": 21800 + }, + { + "epoch": 59.403269754768395, + "grad_norm": 3.2217648029327393, + "learning_rate": 7.468184285001645e-06, + "loss": 0.2023, + "step": 21801 + }, + { + "epoch": 59.40599455040872, + "grad_norm": 4.229472637176514, + "learning_rate": 7.467330552979635e-06, + "loss": 0.0896, + "step": 21802 + }, + { + "epoch": 59.40871934604905, + "grad_norm": 4.491195201873779, + "learning_rate": 7.4664768406819685e-06, + "loss": 0.1437, + "step": 21803 + }, + { + "epoch": 59.41144414168937, + "grad_norm": 3.7320375442504883, + "learning_rate": 7.465623148115302e-06, + "loss": 0.0935, + "step": 21804 + }, + { + "epoch": 59.4141689373297, + "grad_norm": 4.812129974365234, + "learning_rate": 7.46476947528628e-06, + "loss": 0.1163, + "step": 21805 + }, + { + "epoch": 59.416893732970024, + "grad_norm": 5.116265773773193, + "learning_rate": 7.463915822201552e-06, + "loss": 0.0648, + "step": 21806 + }, + { + "epoch": 59.41961852861036, + "grad_norm": 4.548985481262207, + "learning_rate": 7.463062188867764e-06, + "loss": 0.0927, + "step": 21807 + }, + { + "epoch": 59.42234332425068, + "grad_norm": 5.495615005493164, + "learning_rate": 7.462208575291567e-06, + "loss": 0.0849, + "step": 21808 + }, + { + "epoch": 59.42506811989101, + "grad_norm": 3.476064443588257, + "learning_rate": 7.461354981479605e-06, + "loss": 0.1317, + "step": 21809 + }, + { + "epoch": 59.427792915531334, + "grad_norm": 4.945058822631836, + "learning_rate": 7.460501407438533e-06, + "loss": 0.093, + "step": 21810 + }, + { + "epoch": 59.43051771117166, + "grad_norm": 4.617724418640137, + "learning_rate": 7.459647853174993e-06, + "loss": 0.0963, + "step": 21811 + }, + { + "epoch": 59.433242506811986, + "grad_norm": 3.9213743209838867, + "learning_rate": 7.458794318695635e-06, + "loss": 0.0577, + "step": 21812 + }, + { + "epoch": 59.43596730245232, + "grad_norm": 3.279602289199829, + "learning_rate": 7.457940804007104e-06, + "loss": 0.1098, + "step": 21813 + }, + { + "epoch": 59.438692098092645, + "grad_norm": 4.74573278427124, + "learning_rate": 7.457087309116049e-06, + "loss": 0.082, + "step": 21814 + }, + { + "epoch": 59.44141689373297, + "grad_norm": 7.025487422943115, + "learning_rate": 7.456233834029114e-06, + "loss": 0.0725, + "step": 21815 + }, + { + "epoch": 59.444141689373296, + "grad_norm": 4.187443256378174, + "learning_rate": 7.455380378752951e-06, + "loss": 0.067, + "step": 21816 + }, + { + "epoch": 59.44686648501362, + "grad_norm": 3.6091067790985107, + "learning_rate": 7.454526943294201e-06, + "loss": 0.0634, + "step": 21817 + }, + { + "epoch": 59.44959128065395, + "grad_norm": 4.672299385070801, + "learning_rate": 7.4536735276595165e-06, + "loss": 0.0685, + "step": 21818 + }, + { + "epoch": 59.45231607629428, + "grad_norm": 4.091929912567139, + "learning_rate": 7.452820131855538e-06, + "loss": 0.1621, + "step": 21819 + }, + { + "epoch": 59.45504087193461, + "grad_norm": 3.060480833053589, + "learning_rate": 7.451966755888915e-06, + "loss": 0.0589, + "step": 21820 + }, + { + "epoch": 59.45776566757493, + "grad_norm": 3.5286495685577393, + "learning_rate": 7.451113399766292e-06, + "loss": 0.1765, + "step": 21821 + }, + { + "epoch": 59.46049046321526, + "grad_norm": 4.204300403594971, + "learning_rate": 7.450260063494319e-06, + "loss": 0.0821, + "step": 21822 + }, + { + "epoch": 59.463215258855584, + "grad_norm": 3.3798656463623047, + "learning_rate": 7.449406747079635e-06, + "loss": 0.1145, + "step": 21823 + }, + { + "epoch": 59.46594005449591, + "grad_norm": 3.8153555393218994, + "learning_rate": 7.448553450528891e-06, + "loss": 0.0652, + "step": 21824 + }, + { + "epoch": 59.46866485013624, + "grad_norm": 3.8584842681884766, + "learning_rate": 7.447700173848729e-06, + "loss": 0.0803, + "step": 21825 + }, + { + "epoch": 59.47138964577657, + "grad_norm": 4.309252738952637, + "learning_rate": 7.446846917045793e-06, + "loss": 0.193, + "step": 21826 + }, + { + "epoch": 59.474114441416894, + "grad_norm": 4.435990333557129, + "learning_rate": 7.445993680126735e-06, + "loss": 0.0748, + "step": 21827 + }, + { + "epoch": 59.47683923705722, + "grad_norm": 4.829715728759766, + "learning_rate": 7.445140463098197e-06, + "loss": 0.1138, + "step": 21828 + }, + { + "epoch": 59.479564032697546, + "grad_norm": 3.765371561050415, + "learning_rate": 7.444287265966821e-06, + "loss": 0.0964, + "step": 21829 + }, + { + "epoch": 59.48228882833787, + "grad_norm": 3.971548557281494, + "learning_rate": 7.443434088739256e-06, + "loss": 0.1511, + "step": 21830 + }, + { + "epoch": 59.485013623978205, + "grad_norm": 4.259155750274658, + "learning_rate": 7.442580931422141e-06, + "loss": 0.1125, + "step": 21831 + }, + { + "epoch": 59.48773841961853, + "grad_norm": 3.840143918991089, + "learning_rate": 7.441727794022126e-06, + "loss": 0.0983, + "step": 21832 + }, + { + "epoch": 59.490463215258856, + "grad_norm": 4.222861289978027, + "learning_rate": 7.44087467654585e-06, + "loss": 0.0993, + "step": 21833 + }, + { + "epoch": 59.49318801089918, + "grad_norm": 2.950629711151123, + "learning_rate": 7.440021578999963e-06, + "loss": 0.1224, + "step": 21834 + }, + { + "epoch": 59.49591280653951, + "grad_norm": 3.4389383792877197, + "learning_rate": 7.439168501391103e-06, + "loss": 0.1837, + "step": 21835 + }, + { + "epoch": 59.49863760217983, + "grad_norm": 4.719254493713379, + "learning_rate": 7.438315443725919e-06, + "loss": 0.0572, + "step": 21836 + }, + { + "epoch": 59.50136239782017, + "grad_norm": 3.35953950881958, + "learning_rate": 7.437462406011048e-06, + "loss": 0.074, + "step": 21837 + }, + { + "epoch": 59.50408719346049, + "grad_norm": 4.480406761169434, + "learning_rate": 7.43660938825314e-06, + "loss": 0.0826, + "step": 21838 + }, + { + "epoch": 59.50681198910082, + "grad_norm": 4.066308498382568, + "learning_rate": 7.435756390458834e-06, + "loss": 0.089, + "step": 21839 + }, + { + "epoch": 59.509536784741144, + "grad_norm": 4.58651065826416, + "learning_rate": 7.4349034126347765e-06, + "loss": 0.1235, + "step": 21840 + }, + { + "epoch": 59.51226158038147, + "grad_norm": 3.3988780975341797, + "learning_rate": 7.4340504547876066e-06, + "loss": 0.196, + "step": 21841 + }, + { + "epoch": 59.514986376021795, + "grad_norm": 3.3992702960968018, + "learning_rate": 7.433197516923971e-06, + "loss": 0.1059, + "step": 21842 + }, + { + "epoch": 59.51771117166213, + "grad_norm": 3.836113929748535, + "learning_rate": 7.432344599050507e-06, + "loss": 0.0917, + "step": 21843 + }, + { + "epoch": 59.520435967302454, + "grad_norm": 3.456178665161133, + "learning_rate": 7.431491701173862e-06, + "loss": 0.1329, + "step": 21844 + }, + { + "epoch": 59.52316076294278, + "grad_norm": 3.428816318511963, + "learning_rate": 7.43063882330068e-06, + "loss": 0.1099, + "step": 21845 + }, + { + "epoch": 59.525885558583106, + "grad_norm": 3.238723039627075, + "learning_rate": 7.429785965437597e-06, + "loss": 0.13, + "step": 21846 + }, + { + "epoch": 59.52861035422343, + "grad_norm": 4.485742092132568, + "learning_rate": 7.42893312759126e-06, + "loss": 0.1619, + "step": 21847 + }, + { + "epoch": 59.53133514986376, + "grad_norm": 3.8060503005981445, + "learning_rate": 7.4280803097683086e-06, + "loss": 0.0648, + "step": 21848 + }, + { + "epoch": 59.53405994550409, + "grad_norm": 3.3967173099517822, + "learning_rate": 7.427227511975383e-06, + "loss": 0.0954, + "step": 21849 + }, + { + "epoch": 59.536784741144416, + "grad_norm": 3.5591654777526855, + "learning_rate": 7.426374734219131e-06, + "loss": 0.076, + "step": 21850 + }, + { + "epoch": 59.53950953678474, + "grad_norm": 6.30497407913208, + "learning_rate": 7.425521976506186e-06, + "loss": 0.1958, + "step": 21851 + }, + { + "epoch": 59.54223433242507, + "grad_norm": 3.986257553100586, + "learning_rate": 7.424669238843195e-06, + "loss": 0.1863, + "step": 21852 + }, + { + "epoch": 59.54495912806539, + "grad_norm": 3.7997138500213623, + "learning_rate": 7.423816521236795e-06, + "loss": 0.1201, + "step": 21853 + }, + { + "epoch": 59.54768392370572, + "grad_norm": 4.160584449768066, + "learning_rate": 7.4229638236936315e-06, + "loss": 0.1436, + "step": 21854 + }, + { + "epoch": 59.55040871934605, + "grad_norm": 4.1414618492126465, + "learning_rate": 7.422111146220342e-06, + "loss": 0.0686, + "step": 21855 + }, + { + "epoch": 59.55313351498638, + "grad_norm": 3.886396884918213, + "learning_rate": 7.421258488823568e-06, + "loss": 0.0863, + "step": 21856 + }, + { + "epoch": 59.555858310626704, + "grad_norm": 4.574501037597656, + "learning_rate": 7.42040585150995e-06, + "loss": 0.0976, + "step": 21857 + }, + { + "epoch": 59.55858310626703, + "grad_norm": 3.625762701034546, + "learning_rate": 7.419553234286129e-06, + "loss": 0.0833, + "step": 21858 + }, + { + "epoch": 59.561307901907355, + "grad_norm": 3.206472158432007, + "learning_rate": 7.418700637158742e-06, + "loss": 0.1783, + "step": 21859 + }, + { + "epoch": 59.56403269754768, + "grad_norm": 3.9687817096710205, + "learning_rate": 7.417848060134429e-06, + "loss": 0.2486, + "step": 21860 + }, + { + "epoch": 59.566757493188014, + "grad_norm": 3.5982322692871094, + "learning_rate": 7.416995503219837e-06, + "loss": 0.0667, + "step": 21861 + }, + { + "epoch": 59.56948228882834, + "grad_norm": 3.204102039337158, + "learning_rate": 7.416142966421599e-06, + "loss": 0.0469, + "step": 21862 + }, + { + "epoch": 59.572207084468666, + "grad_norm": 3.5523905754089355, + "learning_rate": 7.4152904497463575e-06, + "loss": 0.2118, + "step": 21863 + }, + { + "epoch": 59.57493188010899, + "grad_norm": 3.9007256031036377, + "learning_rate": 7.414437953200751e-06, + "loss": 0.0643, + "step": 21864 + }, + { + "epoch": 59.57765667574932, + "grad_norm": 5.8959736824035645, + "learning_rate": 7.413585476791418e-06, + "loss": 0.1617, + "step": 21865 + }, + { + "epoch": 59.58038147138964, + "grad_norm": 4.635599613189697, + "learning_rate": 7.412733020524997e-06, + "loss": 0.0736, + "step": 21866 + }, + { + "epoch": 59.583106267029976, + "grad_norm": 3.5214428901672363, + "learning_rate": 7.411880584408131e-06, + "loss": 0.2338, + "step": 21867 + }, + { + "epoch": 59.5858310626703, + "grad_norm": 4.32875394821167, + "learning_rate": 7.4110281684474515e-06, + "loss": 0.1346, + "step": 21868 + }, + { + "epoch": 59.58855585831063, + "grad_norm": 3.2541072368621826, + "learning_rate": 7.410175772649605e-06, + "loss": 0.1198, + "step": 21869 + }, + { + "epoch": 59.59128065395095, + "grad_norm": 5.001347064971924, + "learning_rate": 7.4093233970212245e-06, + "loss": 0.0656, + "step": 21870 + }, + { + "epoch": 59.59400544959128, + "grad_norm": 4.108007431030273, + "learning_rate": 7.40847104156895e-06, + "loss": 0.061, + "step": 21871 + }, + { + "epoch": 59.596730245231605, + "grad_norm": 3.7400007247924805, + "learning_rate": 7.40761870629942e-06, + "loss": 0.0729, + "step": 21872 + }, + { + "epoch": 59.59945504087194, + "grad_norm": 3.1615638732910156, + "learning_rate": 7.40676639121927e-06, + "loss": 0.1703, + "step": 21873 + }, + { + "epoch": 59.60217983651226, + "grad_norm": 4.166745185852051, + "learning_rate": 7.405914096335143e-06, + "loss": 0.131, + "step": 21874 + }, + { + "epoch": 59.60490463215259, + "grad_norm": 3.6109678745269775, + "learning_rate": 7.405061821653672e-06, + "loss": 0.1533, + "step": 21875 + }, + { + "epoch": 59.607629427792915, + "grad_norm": 4.113295078277588, + "learning_rate": 7.404209567181497e-06, + "loss": 0.159, + "step": 21876 + }, + { + "epoch": 59.61035422343324, + "grad_norm": 2.682974338531494, + "learning_rate": 7.403357332925251e-06, + "loss": 0.0432, + "step": 21877 + }, + { + "epoch": 59.61307901907357, + "grad_norm": 4.304617404937744, + "learning_rate": 7.402505118891575e-06, + "loss": 0.1348, + "step": 21878 + }, + { + "epoch": 59.6158038147139, + "grad_norm": 4.079246520996094, + "learning_rate": 7.40165292508711e-06, + "loss": 0.0517, + "step": 21879 + }, + { + "epoch": 59.618528610354225, + "grad_norm": 4.5099568367004395, + "learning_rate": 7.400800751518484e-06, + "loss": 0.0699, + "step": 21880 + }, + { + "epoch": 59.62125340599455, + "grad_norm": 4.95874547958374, + "learning_rate": 7.399948598192341e-06, + "loss": 0.0891, + "step": 21881 + }, + { + "epoch": 59.62397820163488, + "grad_norm": 3.754046678543091, + "learning_rate": 7.3990964651153144e-06, + "loss": 0.1493, + "step": 21882 + }, + { + "epoch": 59.6267029972752, + "grad_norm": 4.105714797973633, + "learning_rate": 7.39824435229404e-06, + "loss": 0.224, + "step": 21883 + }, + { + "epoch": 59.62942779291553, + "grad_norm": 3.4785470962524414, + "learning_rate": 7.397392259735155e-06, + "loss": 0.1122, + "step": 21884 + }, + { + "epoch": 59.63215258855586, + "grad_norm": 4.887084484100342, + "learning_rate": 7.396540187445296e-06, + "loss": 0.2015, + "step": 21885 + }, + { + "epoch": 59.63487738419619, + "grad_norm": 3.4088008403778076, + "learning_rate": 7.395688135431096e-06, + "loss": 0.1561, + "step": 21886 + }, + { + "epoch": 59.63760217983651, + "grad_norm": 6.81312894821167, + "learning_rate": 7.394836103699197e-06, + "loss": 0.1588, + "step": 21887 + }, + { + "epoch": 59.64032697547684, + "grad_norm": 4.069431781768799, + "learning_rate": 7.393984092256227e-06, + "loss": 0.1011, + "step": 21888 + }, + { + "epoch": 59.643051771117165, + "grad_norm": 6.171210289001465, + "learning_rate": 7.393132101108827e-06, + "loss": 0.1744, + "step": 21889 + }, + { + "epoch": 59.64577656675749, + "grad_norm": 3.589771032333374, + "learning_rate": 7.392280130263628e-06, + "loss": 0.0546, + "step": 21890 + }, + { + "epoch": 59.64850136239782, + "grad_norm": 3.006995677947998, + "learning_rate": 7.39142817972727e-06, + "loss": 0.0706, + "step": 21891 + }, + { + "epoch": 59.65122615803815, + "grad_norm": 2.884824752807617, + "learning_rate": 7.390576249506384e-06, + "loss": 0.05, + "step": 21892 + }, + { + "epoch": 59.653950953678475, + "grad_norm": 4.403576850891113, + "learning_rate": 7.389724339607606e-06, + "loss": 0.2201, + "step": 21893 + }, + { + "epoch": 59.6566757493188, + "grad_norm": 4.115321636199951, + "learning_rate": 7.388872450037572e-06, + "loss": 0.1991, + "step": 21894 + }, + { + "epoch": 59.65940054495913, + "grad_norm": 5.070188522338867, + "learning_rate": 7.38802058080291e-06, + "loss": 0.1135, + "step": 21895 + }, + { + "epoch": 59.66212534059945, + "grad_norm": 3.9264934062957764, + "learning_rate": 7.387168731910264e-06, + "loss": 0.2953, + "step": 21896 + }, + { + "epoch": 59.664850136239785, + "grad_norm": 23.98346710205078, + "learning_rate": 7.386316903366266e-06, + "loss": 0.0699, + "step": 21897 + }, + { + "epoch": 59.66757493188011, + "grad_norm": 4.844391345977783, + "learning_rate": 7.385465095177544e-06, + "loss": 0.1196, + "step": 21898 + }, + { + "epoch": 59.67029972752044, + "grad_norm": 3.194143533706665, + "learning_rate": 7.384613307350739e-06, + "loss": 0.0528, + "step": 21899 + }, + { + "epoch": 59.67302452316076, + "grad_norm": 4.888129234313965, + "learning_rate": 7.38376153989248e-06, + "loss": 0.1125, + "step": 21900 + }, + { + "epoch": 59.67574931880109, + "grad_norm": 4.619625568389893, + "learning_rate": 7.382909792809403e-06, + "loss": 0.1219, + "step": 21901 + }, + { + "epoch": 59.678474114441414, + "grad_norm": 3.538721799850464, + "learning_rate": 7.3820580661081375e-06, + "loss": 0.0601, + "step": 21902 + }, + { + "epoch": 59.68119891008175, + "grad_norm": 3.7365593910217285, + "learning_rate": 7.381206359795323e-06, + "loss": 0.0731, + "step": 21903 + }, + { + "epoch": 59.68392370572207, + "grad_norm": 3.50585675239563, + "learning_rate": 7.380354673877585e-06, + "loss": 0.1768, + "step": 21904 + }, + { + "epoch": 59.6866485013624, + "grad_norm": 4.8301239013671875, + "learning_rate": 7.379503008361565e-06, + "loss": 0.1422, + "step": 21905 + }, + { + "epoch": 59.689373297002724, + "grad_norm": 2.799285650253296, + "learning_rate": 7.378651363253888e-06, + "loss": 0.0722, + "step": 21906 + }, + { + "epoch": 59.69209809264305, + "grad_norm": 3.759619951248169, + "learning_rate": 7.377799738561192e-06, + "loss": 0.0821, + "step": 21907 + }, + { + "epoch": 59.694822888283376, + "grad_norm": 3.615964412689209, + "learning_rate": 7.376948134290105e-06, + "loss": 0.1244, + "step": 21908 + }, + { + "epoch": 59.69754768392371, + "grad_norm": 3.153252601623535, + "learning_rate": 7.376096550447265e-06, + "loss": 0.0886, + "step": 21909 + }, + { + "epoch": 59.700272479564035, + "grad_norm": 2.7910876274108887, + "learning_rate": 7.375244987039296e-06, + "loss": 0.0422, + "step": 21910 + }, + { + "epoch": 59.70299727520436, + "grad_norm": 4.728867530822754, + "learning_rate": 7.3743934440728385e-06, + "loss": 0.2137, + "step": 21911 + }, + { + "epoch": 59.705722070844686, + "grad_norm": 2.8954384326934814, + "learning_rate": 7.373541921554515e-06, + "loss": 0.0603, + "step": 21912 + }, + { + "epoch": 59.70844686648501, + "grad_norm": 3.641709566116333, + "learning_rate": 7.3726904194909655e-06, + "loss": 0.1728, + "step": 21913 + }, + { + "epoch": 59.71117166212534, + "grad_norm": 3.848088026046753, + "learning_rate": 7.3718389378888175e-06, + "loss": 0.1199, + "step": 21914 + }, + { + "epoch": 59.71389645776567, + "grad_norm": 3.926086187362671, + "learning_rate": 7.370987476754707e-06, + "loss": 0.0781, + "step": 21915 + }, + { + "epoch": 59.716621253406, + "grad_norm": 3.1481707096099854, + "learning_rate": 7.370136036095258e-06, + "loss": 0.1687, + "step": 21916 + }, + { + "epoch": 59.71934604904632, + "grad_norm": 3.281507968902588, + "learning_rate": 7.369284615917107e-06, + "loss": 0.3074, + "step": 21917 + }, + { + "epoch": 59.72207084468665, + "grad_norm": 3.6226589679718018, + "learning_rate": 7.368433216226881e-06, + "loss": 0.1139, + "step": 21918 + }, + { + "epoch": 59.724795640326974, + "grad_norm": 3.5362019538879395, + "learning_rate": 7.3675818370312145e-06, + "loss": 0.1129, + "step": 21919 + }, + { + "epoch": 59.7275204359673, + "grad_norm": 5.129333019256592, + "learning_rate": 7.3667304783367345e-06, + "loss": 0.2957, + "step": 21920 + }, + { + "epoch": 59.73024523160763, + "grad_norm": 3.0170693397521973, + "learning_rate": 7.365879140150074e-06, + "loss": 0.0705, + "step": 21921 + }, + { + "epoch": 59.73297002724796, + "grad_norm": 4.153504371643066, + "learning_rate": 7.36502782247786e-06, + "loss": 0.1186, + "step": 21922 + }, + { + "epoch": 59.735694822888284, + "grad_norm": 3.5138421058654785, + "learning_rate": 7.364176525326726e-06, + "loss": 0.1865, + "step": 21923 + }, + { + "epoch": 59.73841961852861, + "grad_norm": 3.734121561050415, + "learning_rate": 7.3633252487032995e-06, + "loss": 0.151, + "step": 21924 + }, + { + "epoch": 59.741144414168936, + "grad_norm": 4.205217361450195, + "learning_rate": 7.362473992614212e-06, + "loss": 0.1132, + "step": 21925 + }, + { + "epoch": 59.74386920980926, + "grad_norm": 3.6806509494781494, + "learning_rate": 7.361622757066092e-06, + "loss": 0.0675, + "step": 21926 + }, + { + "epoch": 59.746594005449595, + "grad_norm": 3.2617616653442383, + "learning_rate": 7.360771542065569e-06, + "loss": 0.0991, + "step": 21927 + }, + { + "epoch": 59.74931880108992, + "grad_norm": 5.201332092285156, + "learning_rate": 7.3599203476192716e-06, + "loss": 0.1436, + "step": 21928 + }, + { + "epoch": 59.752043596730246, + "grad_norm": 3.168055534362793, + "learning_rate": 7.3590691737338264e-06, + "loss": 0.1375, + "step": 21929 + }, + { + "epoch": 59.75476839237057, + "grad_norm": 3.6250600814819336, + "learning_rate": 7.35821802041587e-06, + "loss": 0.0624, + "step": 21930 + }, + { + "epoch": 59.7574931880109, + "grad_norm": 4.313841342926025, + "learning_rate": 7.357366887672025e-06, + "loss": 0.1178, + "step": 21931 + }, + { + "epoch": 59.76021798365122, + "grad_norm": 4.536067008972168, + "learning_rate": 7.356515775508924e-06, + "loss": 0.2123, + "step": 21932 + }, + { + "epoch": 59.762942779291556, + "grad_norm": 3.065178394317627, + "learning_rate": 7.35566468393319e-06, + "loss": 0.0482, + "step": 21933 + }, + { + "epoch": 59.76566757493188, + "grad_norm": 4.149610996246338, + "learning_rate": 7.354813612951457e-06, + "loss": 0.1382, + "step": 21934 + }, + { + "epoch": 59.76839237057221, + "grad_norm": 3.3267109394073486, + "learning_rate": 7.353962562570347e-06, + "loss": 0.0592, + "step": 21935 + }, + { + "epoch": 59.771117166212534, + "grad_norm": 3.2652664184570312, + "learning_rate": 7.353111532796493e-06, + "loss": 0.1259, + "step": 21936 + }, + { + "epoch": 59.77384196185286, + "grad_norm": 3.761549949645996, + "learning_rate": 7.352260523636523e-06, + "loss": 0.1538, + "step": 21937 + }, + { + "epoch": 59.776566757493185, + "grad_norm": 3.6344947814941406, + "learning_rate": 7.351409535097061e-06, + "loss": 0.0993, + "step": 21938 + }, + { + "epoch": 59.77929155313352, + "grad_norm": 5.851442337036133, + "learning_rate": 7.350558567184738e-06, + "loss": 0.1137, + "step": 21939 + }, + { + "epoch": 59.782016348773844, + "grad_norm": 3.915271282196045, + "learning_rate": 7.349707619906177e-06, + "loss": 0.0746, + "step": 21940 + }, + { + "epoch": 59.78474114441417, + "grad_norm": 4.664577484130859, + "learning_rate": 7.348856693268011e-06, + "loss": 0.0618, + "step": 21941 + }, + { + "epoch": 59.787465940054496, + "grad_norm": 3.6140897274017334, + "learning_rate": 7.348005787276861e-06, + "loss": 0.0537, + "step": 21942 + }, + { + "epoch": 59.79019073569482, + "grad_norm": 2.723332643508911, + "learning_rate": 7.347154901939358e-06, + "loss": 0.0602, + "step": 21943 + }, + { + "epoch": 59.79291553133515, + "grad_norm": 3.181187152862549, + "learning_rate": 7.346304037262127e-06, + "loss": 0.0488, + "step": 21944 + }, + { + "epoch": 59.79564032697548, + "grad_norm": 5.005062580108643, + "learning_rate": 7.345453193251795e-06, + "loss": 0.0624, + "step": 21945 + }, + { + "epoch": 59.798365122615806, + "grad_norm": 4.6376423835754395, + "learning_rate": 7.344602369914984e-06, + "loss": 0.1224, + "step": 21946 + }, + { + "epoch": 59.80108991825613, + "grad_norm": 5.750683784484863, + "learning_rate": 7.343751567258328e-06, + "loss": 0.1832, + "step": 21947 + }, + { + "epoch": 59.80381471389646, + "grad_norm": 3.7080774307250977, + "learning_rate": 7.34290078528845e-06, + "loss": 0.1166, + "step": 21948 + }, + { + "epoch": 59.80653950953678, + "grad_norm": 4.58156681060791, + "learning_rate": 7.342050024011973e-06, + "loss": 0.144, + "step": 21949 + }, + { + "epoch": 59.80926430517711, + "grad_norm": 2.935380458831787, + "learning_rate": 7.3411992834355276e-06, + "loss": 0.053, + "step": 21950 + }, + { + "epoch": 59.81198910081744, + "grad_norm": 5.052936553955078, + "learning_rate": 7.340348563565735e-06, + "loss": 0.1395, + "step": 21951 + }, + { + "epoch": 59.81471389645777, + "grad_norm": 4.201597213745117, + "learning_rate": 7.339497864409223e-06, + "loss": 0.0573, + "step": 21952 + }, + { + "epoch": 59.817438692098094, + "grad_norm": 3.823265790939331, + "learning_rate": 7.338647185972614e-06, + "loss": 0.0551, + "step": 21953 + }, + { + "epoch": 59.82016348773842, + "grad_norm": 4.828398704528809, + "learning_rate": 7.337796528262537e-06, + "loss": 0.1576, + "step": 21954 + }, + { + "epoch": 59.822888283378745, + "grad_norm": 3.4092397689819336, + "learning_rate": 7.336945891285614e-06, + "loss": 0.05, + "step": 21955 + }, + { + "epoch": 59.82561307901907, + "grad_norm": 5.1029863357543945, + "learning_rate": 7.336095275048474e-06, + "loss": 0.1454, + "step": 21956 + }, + { + "epoch": 59.828337874659404, + "grad_norm": 3.9042434692382812, + "learning_rate": 7.3352446795577336e-06, + "loss": 0.1659, + "step": 21957 + }, + { + "epoch": 59.83106267029973, + "grad_norm": 3.6238622665405273, + "learning_rate": 7.334394104820024e-06, + "loss": 0.0742, + "step": 21958 + }, + { + "epoch": 59.833787465940055, + "grad_norm": 12.98780345916748, + "learning_rate": 7.333543550841966e-06, + "loss": 0.1047, + "step": 21959 + }, + { + "epoch": 59.83651226158038, + "grad_norm": 6.426098823547363, + "learning_rate": 7.332693017630185e-06, + "loss": 0.1479, + "step": 21960 + }, + { + "epoch": 59.83923705722071, + "grad_norm": 3.744154214859009, + "learning_rate": 7.331842505191308e-06, + "loss": 0.0855, + "step": 21961 + }, + { + "epoch": 59.84196185286103, + "grad_norm": 8.704964637756348, + "learning_rate": 7.330992013531952e-06, + "loss": 0.1569, + "step": 21962 + }, + { + "epoch": 59.844686648501366, + "grad_norm": 5.0485944747924805, + "learning_rate": 7.330141542658747e-06, + "loss": 0.1304, + "step": 21963 + }, + { + "epoch": 59.84741144414169, + "grad_norm": 4.686516761779785, + "learning_rate": 7.32929109257831e-06, + "loss": 0.0861, + "step": 21964 + }, + { + "epoch": 59.85013623978202, + "grad_norm": 4.361832618713379, + "learning_rate": 7.328440663297269e-06, + "loss": 0.2178, + "step": 21965 + }, + { + "epoch": 59.85286103542234, + "grad_norm": 4.1770501136779785, + "learning_rate": 7.32759025482225e-06, + "loss": 0.098, + "step": 21966 + }, + { + "epoch": 59.85558583106267, + "grad_norm": 2.7962067127227783, + "learning_rate": 7.3267398671598685e-06, + "loss": 0.0984, + "step": 21967 + }, + { + "epoch": 59.858310626702995, + "grad_norm": 3.77594256401062, + "learning_rate": 7.325889500316754e-06, + "loss": 0.169, + "step": 21968 + }, + { + "epoch": 59.86103542234333, + "grad_norm": 5.534327507019043, + "learning_rate": 7.325039154299522e-06, + "loss": 0.2511, + "step": 21969 + }, + { + "epoch": 59.86376021798365, + "grad_norm": 3.6949567794799805, + "learning_rate": 7.324188829114804e-06, + "loss": 0.2434, + "step": 21970 + }, + { + "epoch": 59.86648501362398, + "grad_norm": 6.855175018310547, + "learning_rate": 7.323338524769212e-06, + "loss": 0.0748, + "step": 21971 + }, + { + "epoch": 59.869209809264305, + "grad_norm": 3.2030975818634033, + "learning_rate": 7.322488241269379e-06, + "loss": 0.0537, + "step": 21972 + }, + { + "epoch": 59.87193460490463, + "grad_norm": 5.0401387214660645, + "learning_rate": 7.321637978621916e-06, + "loss": 0.1184, + "step": 21973 + }, + { + "epoch": 59.87465940054496, + "grad_norm": 4.25337553024292, + "learning_rate": 7.320787736833455e-06, + "loss": 0.1038, + "step": 21974 + }, + { + "epoch": 59.87738419618529, + "grad_norm": 4.143477439880371, + "learning_rate": 7.319937515910609e-06, + "loss": 0.1226, + "step": 21975 + }, + { + "epoch": 59.880108991825615, + "grad_norm": 4.022922515869141, + "learning_rate": 7.319087315860005e-06, + "loss": 0.0766, + "step": 21976 + }, + { + "epoch": 59.88283378746594, + "grad_norm": 3.7847626209259033, + "learning_rate": 7.318237136688262e-06, + "loss": 0.0651, + "step": 21977 + }, + { + "epoch": 59.88555858310627, + "grad_norm": 3.106093645095825, + "learning_rate": 7.317386978402003e-06, + "loss": 0.0693, + "step": 21978 + }, + { + "epoch": 59.88828337874659, + "grad_norm": 4.657619953155518, + "learning_rate": 7.316536841007847e-06, + "loss": 0.1568, + "step": 21979 + }, + { + "epoch": 59.89100817438692, + "grad_norm": 4.844773292541504, + "learning_rate": 7.3156867245124175e-06, + "loss": 0.1726, + "step": 21980 + }, + { + "epoch": 59.89373297002725, + "grad_norm": 2.992464303970337, + "learning_rate": 7.314836628922326e-06, + "loss": 0.1088, + "step": 21981 + }, + { + "epoch": 59.89645776566758, + "grad_norm": 4.16619348526001, + "learning_rate": 7.313986554244208e-06, + "loss": 0.1272, + "step": 21982 + }, + { + "epoch": 59.8991825613079, + "grad_norm": 3.4509432315826416, + "learning_rate": 7.313136500484673e-06, + "loss": 0.0958, + "step": 21983 + }, + { + "epoch": 59.90190735694823, + "grad_norm": 3.953277111053467, + "learning_rate": 7.312286467650347e-06, + "loss": 0.0955, + "step": 21984 + }, + { + "epoch": 59.904632152588555, + "grad_norm": 3.0407843589782715, + "learning_rate": 7.311436455747847e-06, + "loss": 0.0777, + "step": 21985 + }, + { + "epoch": 59.90735694822888, + "grad_norm": 3.9172523021698, + "learning_rate": 7.3105864647837934e-06, + "loss": 0.0896, + "step": 21986 + }, + { + "epoch": 59.91008174386921, + "grad_norm": 5.004632472991943, + "learning_rate": 7.309736494764804e-06, + "loss": 0.1148, + "step": 21987 + }, + { + "epoch": 59.91280653950954, + "grad_norm": 3.2358882427215576, + "learning_rate": 7.308886545697502e-06, + "loss": 0.2064, + "step": 21988 + }, + { + "epoch": 59.915531335149865, + "grad_norm": 4.379899501800537, + "learning_rate": 7.308036617588504e-06, + "loss": 0.0795, + "step": 21989 + }, + { + "epoch": 59.91825613079019, + "grad_norm": 3.341609477996826, + "learning_rate": 7.307186710444432e-06, + "loss": 0.1664, + "step": 21990 + }, + { + "epoch": 59.920980926430516, + "grad_norm": 3.8921256065368652, + "learning_rate": 7.3063368242719005e-06, + "loss": 0.1101, + "step": 21991 + }, + { + "epoch": 59.92370572207084, + "grad_norm": 3.9960689544677734, + "learning_rate": 7.3054869590775344e-06, + "loss": 0.0649, + "step": 21992 + }, + { + "epoch": 59.926430517711175, + "grad_norm": 3.2175517082214355, + "learning_rate": 7.304637114867946e-06, + "loss": 0.1003, + "step": 21993 + }, + { + "epoch": 59.9291553133515, + "grad_norm": 3.395170211791992, + "learning_rate": 7.30378729164976e-06, + "loss": 0.0413, + "step": 21994 + }, + { + "epoch": 59.93188010899183, + "grad_norm": 4.161465167999268, + "learning_rate": 7.302937489429589e-06, + "loss": 0.0669, + "step": 21995 + }, + { + "epoch": 59.93460490463215, + "grad_norm": 3.115039587020874, + "learning_rate": 7.302087708214056e-06, + "loss": 0.1485, + "step": 21996 + }, + { + "epoch": 59.93732970027248, + "grad_norm": 3.1612086296081543, + "learning_rate": 7.301237948009775e-06, + "loss": 0.0508, + "step": 21997 + }, + { + "epoch": 59.940054495912804, + "grad_norm": 6.413022518157959, + "learning_rate": 7.3003882088233635e-06, + "loss": 0.2392, + "step": 21998 + }, + { + "epoch": 59.94277929155314, + "grad_norm": 4.683806419372559, + "learning_rate": 7.299538490661446e-06, + "loss": 0.1101, + "step": 21999 + }, + { + "epoch": 59.94550408719346, + "grad_norm": 4.365520000457764, + "learning_rate": 7.298688793530635e-06, + "loss": 0.1686, + "step": 22000 + }, + { + "epoch": 59.94822888283379, + "grad_norm": 3.62276554107666, + "learning_rate": 7.297839117437549e-06, + "loss": 0.1164, + "step": 22001 + }, + { + "epoch": 59.950953678474114, + "grad_norm": 4.794510364532471, + "learning_rate": 7.296989462388806e-06, + "loss": 0.2839, + "step": 22002 + }, + { + "epoch": 59.95367847411444, + "grad_norm": 3.246356964111328, + "learning_rate": 7.2961398283910204e-06, + "loss": 0.1993, + "step": 22003 + }, + { + "epoch": 59.956403269754766, + "grad_norm": 4.223857879638672, + "learning_rate": 7.295290215450812e-06, + "loss": 0.0891, + "step": 22004 + }, + { + "epoch": 59.95912806539509, + "grad_norm": 5.262650966644287, + "learning_rate": 7.2944406235747945e-06, + "loss": 0.1266, + "step": 22005 + }, + { + "epoch": 59.961852861035425, + "grad_norm": 3.6192314624786377, + "learning_rate": 7.293591052769589e-06, + "loss": 0.1053, + "step": 22006 + }, + { + "epoch": 59.96457765667575, + "grad_norm": 3.421889543533325, + "learning_rate": 7.292741503041807e-06, + "loss": 0.0818, + "step": 22007 + }, + { + "epoch": 59.967302452316076, + "grad_norm": 3.889723777770996, + "learning_rate": 7.2918919743980685e-06, + "loss": 0.1904, + "step": 22008 + }, + { + "epoch": 59.9700272479564, + "grad_norm": 7.882750511169434, + "learning_rate": 7.291042466844986e-06, + "loss": 0.0924, + "step": 22009 + }, + { + "epoch": 59.97275204359673, + "grad_norm": 4.6614670753479, + "learning_rate": 7.290192980389182e-06, + "loss": 0.1675, + "step": 22010 + }, + { + "epoch": 59.97547683923706, + "grad_norm": 4.777350902557373, + "learning_rate": 7.289343515037263e-06, + "loss": 0.1633, + "step": 22011 + }, + { + "epoch": 59.97820163487739, + "grad_norm": 3.8556883335113525, + "learning_rate": 7.288494070795853e-06, + "loss": 0.0764, + "step": 22012 + }, + { + "epoch": 59.98092643051771, + "grad_norm": 2.663574695587158, + "learning_rate": 7.287644647671561e-06, + "loss": 0.1514, + "step": 22013 + }, + { + "epoch": 59.98365122615804, + "grad_norm": 3.57833194732666, + "learning_rate": 7.2867952456710075e-06, + "loss": 0.1716, + "step": 22014 + }, + { + "epoch": 59.986376021798364, + "grad_norm": 4.133760929107666, + "learning_rate": 7.2859458648008005e-06, + "loss": 0.1235, + "step": 22015 + }, + { + "epoch": 59.98910081743869, + "grad_norm": 3.7926201820373535, + "learning_rate": 7.285096505067564e-06, + "loss": 0.2471, + "step": 22016 + }, + { + "epoch": 59.991825613079016, + "grad_norm": 5.786928176879883, + "learning_rate": 7.284247166477909e-06, + "loss": 0.1275, + "step": 22017 + }, + { + "epoch": 59.99455040871935, + "grad_norm": 4.353601932525635, + "learning_rate": 7.283397849038447e-06, + "loss": 0.232, + "step": 22018 + }, + { + "epoch": 59.997275204359674, + "grad_norm": 3.548330307006836, + "learning_rate": 7.282548552755799e-06, + "loss": 0.0597, + "step": 22019 + }, + { + "epoch": 60.0, + "grad_norm": 4.561960697174072, + "learning_rate": 7.2816992776365714e-06, + "loss": 0.064, + "step": 22020 + }, + { + "epoch": 60.002724795640326, + "grad_norm": 9.981670379638672, + "learning_rate": 7.280850023687387e-06, + "loss": 0.1695, + "step": 22021 + }, + { + "epoch": 60.00544959128065, + "grad_norm": 5.571465492248535, + "learning_rate": 7.280000790914851e-06, + "loss": 0.1023, + "step": 22022 + }, + { + "epoch": 60.00817438692098, + "grad_norm": 2.7264788150787354, + "learning_rate": 7.27915157932558e-06, + "loss": 0.2045, + "step": 22023 + }, + { + "epoch": 60.01089918256131, + "grad_norm": 3.745054244995117, + "learning_rate": 7.278302388926194e-06, + "loss": 0.068, + "step": 22024 + }, + { + "epoch": 60.013623978201636, + "grad_norm": 4.376850605010986, + "learning_rate": 7.277453219723298e-06, + "loss": 0.1635, + "step": 22025 + }, + { + "epoch": 60.01634877384196, + "grad_norm": 12.780744552612305, + "learning_rate": 7.276604071723511e-06, + "loss": 0.1066, + "step": 22026 + }, + { + "epoch": 60.01907356948229, + "grad_norm": 3.120161771774292, + "learning_rate": 7.275754944933442e-06, + "loss": 0.0925, + "step": 22027 + }, + { + "epoch": 60.02179836512261, + "grad_norm": 4.451543807983398, + "learning_rate": 7.274905839359707e-06, + "loss": 0.0965, + "step": 22028 + }, + { + "epoch": 60.02452316076294, + "grad_norm": 3.282378911972046, + "learning_rate": 7.274056755008916e-06, + "loss": 0.3144, + "step": 22029 + }, + { + "epoch": 60.02724795640327, + "grad_norm": 4.26405143737793, + "learning_rate": 7.273207691887685e-06, + "loss": 0.106, + "step": 22030 + }, + { + "epoch": 60.0299727520436, + "grad_norm": 4.883692741394043, + "learning_rate": 7.272358650002623e-06, + "loss": 0.1461, + "step": 22031 + }, + { + "epoch": 60.032697547683924, + "grad_norm": 2.7487285137176514, + "learning_rate": 7.271509629360343e-06, + "loss": 0.0393, + "step": 22032 + }, + { + "epoch": 60.03542234332425, + "grad_norm": 2.9640891551971436, + "learning_rate": 7.270660629967461e-06, + "loss": 0.0767, + "step": 22033 + }, + { + "epoch": 60.038147138964575, + "grad_norm": 3.9891130924224854, + "learning_rate": 7.269811651830584e-06, + "loss": 0.0686, + "step": 22034 + }, + { + "epoch": 60.0408719346049, + "grad_norm": 6.4960103034973145, + "learning_rate": 7.268962694956329e-06, + "loss": 0.221, + "step": 22035 + }, + { + "epoch": 60.043596730245234, + "grad_norm": 2.927238941192627, + "learning_rate": 7.2681137593513005e-06, + "loss": 0.1274, + "step": 22036 + }, + { + "epoch": 60.04632152588556, + "grad_norm": 2.9344594478607178, + "learning_rate": 7.2672648450221195e-06, + "loss": 0.0531, + "step": 22037 + }, + { + "epoch": 60.049046321525886, + "grad_norm": 6.458965301513672, + "learning_rate": 7.266415951975388e-06, + "loss": 0.1501, + "step": 22038 + }, + { + "epoch": 60.05177111716621, + "grad_norm": 2.0938048362731934, + "learning_rate": 7.265567080217723e-06, + "loss": 0.0368, + "step": 22039 + }, + { + "epoch": 60.05449591280654, + "grad_norm": 6.481177806854248, + "learning_rate": 7.264718229755731e-06, + "loss": 0.0939, + "step": 22040 + }, + { + "epoch": 60.05722070844686, + "grad_norm": 3.4094817638397217, + "learning_rate": 7.263869400596028e-06, + "loss": 0.1864, + "step": 22041 + }, + { + "epoch": 60.059945504087196, + "grad_norm": 3.0574076175689697, + "learning_rate": 7.26302059274522e-06, + "loss": 0.0507, + "step": 22042 + }, + { + "epoch": 60.06267029972752, + "grad_norm": 3.760446310043335, + "learning_rate": 7.262171806209924e-06, + "loss": 0.0899, + "step": 22043 + }, + { + "epoch": 60.06539509536785, + "grad_norm": 4.761295318603516, + "learning_rate": 7.261323040996739e-06, + "loss": 0.1372, + "step": 22044 + }, + { + "epoch": 60.06811989100817, + "grad_norm": 4.419173717498779, + "learning_rate": 7.260474297112286e-06, + "loss": 0.1579, + "step": 22045 + }, + { + "epoch": 60.0708446866485, + "grad_norm": 3.5458569526672363, + "learning_rate": 7.259625574563172e-06, + "loss": 0.055, + "step": 22046 + }, + { + "epoch": 60.073569482288825, + "grad_norm": 5.580803394317627, + "learning_rate": 7.258776873356003e-06, + "loss": 0.054, + "step": 22047 + }, + { + "epoch": 60.07629427792916, + "grad_norm": 4.740196228027344, + "learning_rate": 7.257928193497394e-06, + "loss": 0.1395, + "step": 22048 + }, + { + "epoch": 60.079019073569484, + "grad_norm": 3.0760657787323, + "learning_rate": 7.257079534993949e-06, + "loss": 0.1613, + "step": 22049 + }, + { + "epoch": 60.08174386920981, + "grad_norm": 5.045286178588867, + "learning_rate": 7.2562308978522784e-06, + "loss": 0.1632, + "step": 22050 + }, + { + "epoch": 60.084468664850135, + "grad_norm": 3.709996461868286, + "learning_rate": 7.255382282079e-06, + "loss": 0.0966, + "step": 22051 + }, + { + "epoch": 60.08719346049046, + "grad_norm": 2.9020793437957764, + "learning_rate": 7.254533687680712e-06, + "loss": 0.0437, + "step": 22052 + }, + { + "epoch": 60.08991825613079, + "grad_norm": 6.386335849761963, + "learning_rate": 7.253685114664029e-06, + "loss": 0.1422, + "step": 22053 + }, + { + "epoch": 60.09264305177112, + "grad_norm": 5.222840309143066, + "learning_rate": 7.252836563035557e-06, + "loss": 0.1472, + "step": 22054 + }, + { + "epoch": 60.095367847411445, + "grad_norm": 8.410630226135254, + "learning_rate": 7.251988032801906e-06, + "loss": 0.1042, + "step": 22055 + }, + { + "epoch": 60.09809264305177, + "grad_norm": 4.177931308746338, + "learning_rate": 7.251139523969683e-06, + "loss": 0.0703, + "step": 22056 + }, + { + "epoch": 60.1008174386921, + "grad_norm": 5.191798210144043, + "learning_rate": 7.2502910365454985e-06, + "loss": 0.2655, + "step": 22057 + }, + { + "epoch": 60.10354223433242, + "grad_norm": 3.9571166038513184, + "learning_rate": 7.249442570535956e-06, + "loss": 0.31, + "step": 22058 + }, + { + "epoch": 60.10626702997275, + "grad_norm": 3.569178342819214, + "learning_rate": 7.24859412594767e-06, + "loss": 0.1664, + "step": 22059 + }, + { + "epoch": 60.10899182561308, + "grad_norm": 2.9958372116088867, + "learning_rate": 7.247745702787241e-06, + "loss": 0.0885, + "step": 22060 + }, + { + "epoch": 60.11171662125341, + "grad_norm": 3.663642168045044, + "learning_rate": 7.246897301061282e-06, + "loss": 0.2168, + "step": 22061 + }, + { + "epoch": 60.11444141689373, + "grad_norm": 3.5634939670562744, + "learning_rate": 7.2460489207763965e-06, + "loss": 0.117, + "step": 22062 + }, + { + "epoch": 60.11716621253406, + "grad_norm": 4.0436482429504395, + "learning_rate": 7.245200561939196e-06, + "loss": 0.0934, + "step": 22063 + }, + { + "epoch": 60.119891008174385, + "grad_norm": 3.052210807800293, + "learning_rate": 7.244352224556281e-06, + "loss": 0.1476, + "step": 22064 + }, + { + "epoch": 60.12261580381471, + "grad_norm": 3.5404224395751953, + "learning_rate": 7.243503908634266e-06, + "loss": 0.0699, + "step": 22065 + }, + { + "epoch": 60.12534059945504, + "grad_norm": 2.996366500854492, + "learning_rate": 7.2426556141797525e-06, + "loss": 0.1023, + "step": 22066 + }, + { + "epoch": 60.12806539509537, + "grad_norm": 4.221047401428223, + "learning_rate": 7.241807341199345e-06, + "loss": 0.2897, + "step": 22067 + }, + { + "epoch": 60.130790190735695, + "grad_norm": 4.326673984527588, + "learning_rate": 7.240959089699655e-06, + "loss": 0.1031, + "step": 22068 + }, + { + "epoch": 60.13351498637602, + "grad_norm": 3.4288883209228516, + "learning_rate": 7.2401108596872885e-06, + "loss": 0.0897, + "step": 22069 + }, + { + "epoch": 60.13623978201635, + "grad_norm": 2.740156650543213, + "learning_rate": 7.239262651168848e-06, + "loss": 0.0967, + "step": 22070 + }, + { + "epoch": 60.13896457765667, + "grad_norm": 3.2299089431762695, + "learning_rate": 7.238414464150945e-06, + "loss": 0.0601, + "step": 22071 + }, + { + "epoch": 60.141689373297005, + "grad_norm": 3.3907079696655273, + "learning_rate": 7.237566298640178e-06, + "loss": 0.1046, + "step": 22072 + }, + { + "epoch": 60.14441416893733, + "grad_norm": 6.267420768737793, + "learning_rate": 7.2367181546431565e-06, + "loss": 0.0843, + "step": 22073 + }, + { + "epoch": 60.14713896457766, + "grad_norm": 3.6383748054504395, + "learning_rate": 7.2358700321664845e-06, + "loss": 0.0925, + "step": 22074 + }, + { + "epoch": 60.14986376021798, + "grad_norm": 4.796145439147949, + "learning_rate": 7.2350219312167695e-06, + "loss": 0.0666, + "step": 22075 + }, + { + "epoch": 60.15258855585831, + "grad_norm": 3.1013946533203125, + "learning_rate": 7.234173851800612e-06, + "loss": 0.1023, + "step": 22076 + }, + { + "epoch": 60.155313351498634, + "grad_norm": 3.4992892742156982, + "learning_rate": 7.2333257939246226e-06, + "loss": 0.0661, + "step": 22077 + }, + { + "epoch": 60.15803814713897, + "grad_norm": 3.698241949081421, + "learning_rate": 7.2324777575954e-06, + "loss": 0.0531, + "step": 22078 + }, + { + "epoch": 60.16076294277929, + "grad_norm": 4.444230079650879, + "learning_rate": 7.231629742819554e-06, + "loss": 0.143, + "step": 22079 + }, + { + "epoch": 60.16348773841962, + "grad_norm": 4.365219593048096, + "learning_rate": 7.230781749603685e-06, + "loss": 0.0715, + "step": 22080 + }, + { + "epoch": 60.166212534059945, + "grad_norm": 3.577834129333496, + "learning_rate": 7.2299337779543995e-06, + "loss": 0.2797, + "step": 22081 + }, + { + "epoch": 60.16893732970027, + "grad_norm": 4.878407001495361, + "learning_rate": 7.2290858278783e-06, + "loss": 0.1666, + "step": 22082 + }, + { + "epoch": 60.171662125340596, + "grad_norm": 4.7122802734375, + "learning_rate": 7.2282378993819916e-06, + "loss": 0.0753, + "step": 22083 + }, + { + "epoch": 60.17438692098093, + "grad_norm": 3.255444288253784, + "learning_rate": 7.227389992472073e-06, + "loss": 0.1144, + "step": 22084 + }, + { + "epoch": 60.177111716621255, + "grad_norm": 4.510351181030273, + "learning_rate": 7.226542107155154e-06, + "loss": 0.1177, + "step": 22085 + }, + { + "epoch": 60.17983651226158, + "grad_norm": 6.7560601234436035, + "learning_rate": 7.2256942434378395e-06, + "loss": 0.089, + "step": 22086 + }, + { + "epoch": 60.182561307901906, + "grad_norm": 2.752912998199463, + "learning_rate": 7.224846401326725e-06, + "loss": 0.0446, + "step": 22087 + }, + { + "epoch": 60.18528610354223, + "grad_norm": 3.046994924545288, + "learning_rate": 7.223998580828418e-06, + "loss": 0.1037, + "step": 22088 + }, + { + "epoch": 60.18801089918256, + "grad_norm": 3.984055757522583, + "learning_rate": 7.223150781949524e-06, + "loss": 0.1455, + "step": 22089 + }, + { + "epoch": 60.19073569482289, + "grad_norm": 3.351414918899536, + "learning_rate": 7.222303004696638e-06, + "loss": 0.0956, + "step": 22090 + }, + { + "epoch": 60.19346049046322, + "grad_norm": 3.3346078395843506, + "learning_rate": 7.22145524907637e-06, + "loss": 0.0917, + "step": 22091 + }, + { + "epoch": 60.19618528610354, + "grad_norm": 2.8271543979644775, + "learning_rate": 7.220607515095317e-06, + "loss": 0.1488, + "step": 22092 + }, + { + "epoch": 60.19891008174387, + "grad_norm": 2.8824541568756104, + "learning_rate": 7.219759802760085e-06, + "loss": 0.0432, + "step": 22093 + }, + { + "epoch": 60.201634877384194, + "grad_norm": 3.8971989154815674, + "learning_rate": 7.2189121120772735e-06, + "loss": 0.0515, + "step": 22094 + }, + { + "epoch": 60.20435967302452, + "grad_norm": 5.140842437744141, + "learning_rate": 7.218064443053485e-06, + "loss": 0.0583, + "step": 22095 + }, + { + "epoch": 60.20708446866485, + "grad_norm": 5.072154521942139, + "learning_rate": 7.217216795695321e-06, + "loss": 0.0774, + "step": 22096 + }, + { + "epoch": 60.20980926430518, + "grad_norm": 2.937187910079956, + "learning_rate": 7.216369170009384e-06, + "loss": 0.0567, + "step": 22097 + }, + { + "epoch": 60.212534059945504, + "grad_norm": 6.213933944702148, + "learning_rate": 7.215521566002273e-06, + "loss": 0.119, + "step": 22098 + }, + { + "epoch": 60.21525885558583, + "grad_norm": 3.187241554260254, + "learning_rate": 7.214673983680591e-06, + "loss": 0.0503, + "step": 22099 + }, + { + "epoch": 60.217983651226156, + "grad_norm": 3.052718162536621, + "learning_rate": 7.213826423050937e-06, + "loss": 0.1028, + "step": 22100 + }, + { + "epoch": 60.22070844686648, + "grad_norm": 3.518193006515503, + "learning_rate": 7.212978884119911e-06, + "loss": 0.1897, + "step": 22101 + }, + { + "epoch": 60.223433242506815, + "grad_norm": 2.903453826904297, + "learning_rate": 7.212131366894121e-06, + "loss": 0.0758, + "step": 22102 + }, + { + "epoch": 60.22615803814714, + "grad_norm": 4.256850242614746, + "learning_rate": 7.211283871380159e-06, + "loss": 0.2743, + "step": 22103 + }, + { + "epoch": 60.228882833787466, + "grad_norm": 3.5818071365356445, + "learning_rate": 7.21043639758463e-06, + "loss": 0.0663, + "step": 22104 + }, + { + "epoch": 60.23160762942779, + "grad_norm": 5.526252746582031, + "learning_rate": 7.2095889455141325e-06, + "loss": 0.1409, + "step": 22105 + }, + { + "epoch": 60.23433242506812, + "grad_norm": 4.099296569824219, + "learning_rate": 7.208741515175266e-06, + "loss": 0.118, + "step": 22106 + }, + { + "epoch": 60.237057220708444, + "grad_norm": 3.241194725036621, + "learning_rate": 7.207894106574631e-06, + "loss": 0.0593, + "step": 22107 + }, + { + "epoch": 60.23978201634878, + "grad_norm": 3.287278413772583, + "learning_rate": 7.207046719718827e-06, + "loss": 0.1654, + "step": 22108 + }, + { + "epoch": 60.2425068119891, + "grad_norm": 3.462165117263794, + "learning_rate": 7.206199354614453e-06, + "loss": 0.0911, + "step": 22109 + }, + { + "epoch": 60.24523160762943, + "grad_norm": 6.26113224029541, + "learning_rate": 7.205352011268107e-06, + "loss": 0.0879, + "step": 22110 + }, + { + "epoch": 60.247956403269754, + "grad_norm": 2.651669502258301, + "learning_rate": 7.204504689686392e-06, + "loss": 0.0418, + "step": 22111 + }, + { + "epoch": 60.25068119891008, + "grad_norm": 5.0154805183410645, + "learning_rate": 7.203657389875902e-06, + "loss": 0.0581, + "step": 22112 + }, + { + "epoch": 60.253405994550405, + "grad_norm": 4.798368453979492, + "learning_rate": 7.2028101118432414e-06, + "loss": 0.0945, + "step": 22113 + }, + { + "epoch": 60.25613079019074, + "grad_norm": 3.665332794189453, + "learning_rate": 7.201962855595004e-06, + "loss": 0.0734, + "step": 22114 + }, + { + "epoch": 60.258855585831064, + "grad_norm": 2.9860355854034424, + "learning_rate": 7.2011156211377904e-06, + "loss": 0.0616, + "step": 22115 + }, + { + "epoch": 60.26158038147139, + "grad_norm": 3.9235002994537354, + "learning_rate": 7.200268408478197e-06, + "loss": 0.0806, + "step": 22116 + }, + { + "epoch": 60.264305177111716, + "grad_norm": 5.279658317565918, + "learning_rate": 7.199421217622825e-06, + "loss": 0.0655, + "step": 22117 + }, + { + "epoch": 60.26702997275204, + "grad_norm": 3.8670432567596436, + "learning_rate": 7.198574048578268e-06, + "loss": 0.0725, + "step": 22118 + }, + { + "epoch": 60.26975476839237, + "grad_norm": 3.356159210205078, + "learning_rate": 7.1977269013511254e-06, + "loss": 0.2106, + "step": 22119 + }, + { + "epoch": 60.2724795640327, + "grad_norm": 3.390110731124878, + "learning_rate": 7.196879775947998e-06, + "loss": 0.1548, + "step": 22120 + }, + { + "epoch": 60.275204359673026, + "grad_norm": 5.2056074142456055, + "learning_rate": 7.196032672375479e-06, + "loss": 0.1162, + "step": 22121 + }, + { + "epoch": 60.27792915531335, + "grad_norm": 5.498204708099365, + "learning_rate": 7.19518559064017e-06, + "loss": 0.1115, + "step": 22122 + }, + { + "epoch": 60.28065395095368, + "grad_norm": 3.208754062652588, + "learning_rate": 7.194338530748663e-06, + "loss": 0.0471, + "step": 22123 + }, + { + "epoch": 60.283378746594, + "grad_norm": 3.2935304641723633, + "learning_rate": 7.1934914927075595e-06, + "loss": 0.0933, + "step": 22124 + }, + { + "epoch": 60.28610354223433, + "grad_norm": 2.8551547527313232, + "learning_rate": 7.1926444765234515e-06, + "loss": 0.0838, + "step": 22125 + }, + { + "epoch": 60.28882833787466, + "grad_norm": 3.8854739665985107, + "learning_rate": 7.19179748220294e-06, + "loss": 0.13, + "step": 22126 + }, + { + "epoch": 60.29155313351499, + "grad_norm": 3.63547945022583, + "learning_rate": 7.190950509752617e-06, + "loss": 0.2624, + "step": 22127 + }, + { + "epoch": 60.294277929155314, + "grad_norm": 3.5233612060546875, + "learning_rate": 7.190103559179085e-06, + "loss": 0.1408, + "step": 22128 + }, + { + "epoch": 60.29700272479564, + "grad_norm": 4.2197675704956055, + "learning_rate": 7.1892566304889315e-06, + "loss": 0.1865, + "step": 22129 + }, + { + "epoch": 60.299727520435965, + "grad_norm": 2.6265814304351807, + "learning_rate": 7.188409723688759e-06, + "loss": 0.0843, + "step": 22130 + }, + { + "epoch": 60.30245231607629, + "grad_norm": 3.485671043395996, + "learning_rate": 7.18756283878516e-06, + "loss": 0.0534, + "step": 22131 + }, + { + "epoch": 60.305177111716624, + "grad_norm": 3.559150218963623, + "learning_rate": 7.186715975784731e-06, + "loss": 0.1518, + "step": 22132 + }, + { + "epoch": 60.30790190735695, + "grad_norm": 3.630086660385132, + "learning_rate": 7.18586913469407e-06, + "loss": 0.0574, + "step": 22133 + }, + { + "epoch": 60.310626702997276, + "grad_norm": 4.573139667510986, + "learning_rate": 7.185022315519768e-06, + "loss": 0.1498, + "step": 22134 + }, + { + "epoch": 60.3133514986376, + "grad_norm": 3.360421895980835, + "learning_rate": 7.1841755182684215e-06, + "loss": 0.0763, + "step": 22135 + }, + { + "epoch": 60.31607629427793, + "grad_norm": 5.917803764343262, + "learning_rate": 7.183328742946623e-06, + "loss": 0.1306, + "step": 22136 + }, + { + "epoch": 60.31880108991825, + "grad_norm": 3.198390007019043, + "learning_rate": 7.182481989560971e-06, + "loss": 0.0556, + "step": 22137 + }, + { + "epoch": 60.321525885558586, + "grad_norm": 4.424189567565918, + "learning_rate": 7.18163525811806e-06, + "loss": 0.1054, + "step": 22138 + }, + { + "epoch": 60.32425068119891, + "grad_norm": 3.526097059249878, + "learning_rate": 7.180788548624482e-06, + "loss": 0.1707, + "step": 22139 + }, + { + "epoch": 60.32697547683924, + "grad_norm": 4.693763732910156, + "learning_rate": 7.179941861086834e-06, + "loss": 0.1795, + "step": 22140 + }, + { + "epoch": 60.32970027247956, + "grad_norm": 4.731674671173096, + "learning_rate": 7.179095195511707e-06, + "loss": 0.1277, + "step": 22141 + }, + { + "epoch": 60.33242506811989, + "grad_norm": 4.0111165046691895, + "learning_rate": 7.178248551905696e-06, + "loss": 0.09, + "step": 22142 + }, + { + "epoch": 60.335149863760215, + "grad_norm": 4.440929889678955, + "learning_rate": 7.177401930275394e-06, + "loss": 0.058, + "step": 22143 + }, + { + "epoch": 60.33787465940055, + "grad_norm": 3.536142349243164, + "learning_rate": 7.176555330627395e-06, + "loss": 0.117, + "step": 22144 + }, + { + "epoch": 60.34059945504087, + "grad_norm": 3.8005049228668213, + "learning_rate": 7.175708752968291e-06, + "loss": 0.2346, + "step": 22145 + }, + { + "epoch": 60.3433242506812, + "grad_norm": 4.1204657554626465, + "learning_rate": 7.174862197304679e-06, + "loss": 0.1546, + "step": 22146 + }, + { + "epoch": 60.346049046321525, + "grad_norm": 3.4227209091186523, + "learning_rate": 7.174015663643147e-06, + "loss": 0.0885, + "step": 22147 + }, + { + "epoch": 60.34877384196185, + "grad_norm": 3.576946496963501, + "learning_rate": 7.173169151990291e-06, + "loss": 0.0629, + "step": 22148 + }, + { + "epoch": 60.35149863760218, + "grad_norm": 4.644906520843506, + "learning_rate": 7.172322662352702e-06, + "loss": 0.0993, + "step": 22149 + }, + { + "epoch": 60.35422343324251, + "grad_norm": 5.073850631713867, + "learning_rate": 7.171476194736975e-06, + "loss": 0.1712, + "step": 22150 + }, + { + "epoch": 60.356948228882835, + "grad_norm": 2.734004259109497, + "learning_rate": 7.170629749149698e-06, + "loss": 0.0679, + "step": 22151 + }, + { + "epoch": 60.35967302452316, + "grad_norm": 3.039759635925293, + "learning_rate": 7.169783325597468e-06, + "loss": 0.0629, + "step": 22152 + }, + { + "epoch": 60.36239782016349, + "grad_norm": 6.838952541351318, + "learning_rate": 7.168936924086866e-06, + "loss": 0.1168, + "step": 22153 + }, + { + "epoch": 60.36512261580381, + "grad_norm": 3.255216121673584, + "learning_rate": 7.168090544624501e-06, + "loss": 0.1238, + "step": 22154 + }, + { + "epoch": 60.36784741144414, + "grad_norm": 2.8387744426727295, + "learning_rate": 7.167244187216953e-06, + "loss": 0.1882, + "step": 22155 + }, + { + "epoch": 60.37057220708447, + "grad_norm": 3.734137535095215, + "learning_rate": 7.166397851870816e-06, + "loss": 0.1078, + "step": 22156 + }, + { + "epoch": 60.3732970027248, + "grad_norm": 3.122952461242676, + "learning_rate": 7.165551538592682e-06, + "loss": 0.146, + "step": 22157 + }, + { + "epoch": 60.37602179836512, + "grad_norm": 4.570494651794434, + "learning_rate": 7.164705247389143e-06, + "loss": 0.1751, + "step": 22158 + }, + { + "epoch": 60.37874659400545, + "grad_norm": 3.697592258453369, + "learning_rate": 7.163858978266786e-06, + "loss": 0.0641, + "step": 22159 + }, + { + "epoch": 60.381471389645775, + "grad_norm": 4.88624382019043, + "learning_rate": 7.163012731232206e-06, + "loss": 0.0748, + "step": 22160 + }, + { + "epoch": 60.3841961852861, + "grad_norm": 4.610586643218994, + "learning_rate": 7.162166506291988e-06, + "loss": 0.1797, + "step": 22161 + }, + { + "epoch": 60.38692098092643, + "grad_norm": 3.272887706756592, + "learning_rate": 7.16132030345273e-06, + "loss": 0.1669, + "step": 22162 + }, + { + "epoch": 60.38964577656676, + "grad_norm": 3.7306933403015137, + "learning_rate": 7.160474122721015e-06, + "loss": 0.2393, + "step": 22163 + }, + { + "epoch": 60.392370572207085, + "grad_norm": 2.8864564895629883, + "learning_rate": 7.159627964103439e-06, + "loss": 0.0601, + "step": 22164 + }, + { + "epoch": 60.39509536784741, + "grad_norm": 4.231517791748047, + "learning_rate": 7.158781827606587e-06, + "loss": 0.1163, + "step": 22165 + }, + { + "epoch": 60.39782016348774, + "grad_norm": 3.783748149871826, + "learning_rate": 7.157935713237052e-06, + "loss": 0.1739, + "step": 22166 + }, + { + "epoch": 60.40054495912806, + "grad_norm": 3.2768189907073975, + "learning_rate": 7.15708962100142e-06, + "loss": 0.0844, + "step": 22167 + }, + { + "epoch": 60.403269754768395, + "grad_norm": 4.838784694671631, + "learning_rate": 7.156243550906285e-06, + "loss": 0.1401, + "step": 22168 + }, + { + "epoch": 60.40599455040872, + "grad_norm": 3.03964900970459, + "learning_rate": 7.155397502958231e-06, + "loss": 0.0579, + "step": 22169 + }, + { + "epoch": 60.40871934604905, + "grad_norm": 2.7429299354553223, + "learning_rate": 7.154551477163848e-06, + "loss": 0.0578, + "step": 22170 + }, + { + "epoch": 60.41144414168937, + "grad_norm": 5.089840412139893, + "learning_rate": 7.153705473529731e-06, + "loss": 0.1068, + "step": 22171 + }, + { + "epoch": 60.4141689373297, + "grad_norm": 3.6841890811920166, + "learning_rate": 7.152859492062462e-06, + "loss": 0.0485, + "step": 22172 + }, + { + "epoch": 60.416893732970024, + "grad_norm": 3.1107046604156494, + "learning_rate": 7.152013532768633e-06, + "loss": 0.1558, + "step": 22173 + }, + { + "epoch": 60.41961852861036, + "grad_norm": 2.3434879779815674, + "learning_rate": 7.15116759565483e-06, + "loss": 0.0388, + "step": 22174 + }, + { + "epoch": 60.42234332425068, + "grad_norm": 4.760533332824707, + "learning_rate": 7.150321680727641e-06, + "loss": 0.152, + "step": 22175 + }, + { + "epoch": 60.42506811989101, + "grad_norm": 6.486580848693848, + "learning_rate": 7.149475787993658e-06, + "loss": 0.1653, + "step": 22176 + }, + { + "epoch": 60.427792915531334, + "grad_norm": 3.468561887741089, + "learning_rate": 7.148629917459464e-06, + "loss": 0.1182, + "step": 22177 + }, + { + "epoch": 60.43051771117166, + "grad_norm": 4.1860480308532715, + "learning_rate": 7.147784069131649e-06, + "loss": 0.2068, + "step": 22178 + }, + { + "epoch": 60.433242506811986, + "grad_norm": 8.364831924438477, + "learning_rate": 7.146938243016799e-06, + "loss": 0.1613, + "step": 22179 + }, + { + "epoch": 60.43596730245232, + "grad_norm": 3.9601993560791016, + "learning_rate": 7.146092439121504e-06, + "loss": 0.0836, + "step": 22180 + }, + { + "epoch": 60.438692098092645, + "grad_norm": 3.8030402660369873, + "learning_rate": 7.145246657452347e-06, + "loss": 0.0639, + "step": 22181 + }, + { + "epoch": 60.44141689373297, + "grad_norm": 3.136075258255005, + "learning_rate": 7.144400898015919e-06, + "loss": 0.0527, + "step": 22182 + }, + { + "epoch": 60.444141689373296, + "grad_norm": 3.5900537967681885, + "learning_rate": 7.1435551608188035e-06, + "loss": 0.1179, + "step": 22183 + }, + { + "epoch": 60.44686648501362, + "grad_norm": 3.3428232669830322, + "learning_rate": 7.14270944586759e-06, + "loss": 0.1567, + "step": 22184 + }, + { + "epoch": 60.44959128065395, + "grad_norm": 3.301100492477417, + "learning_rate": 7.141863753168861e-06, + "loss": 0.1342, + "step": 22185 + }, + { + "epoch": 60.45231607629428, + "grad_norm": 2.8534092903137207, + "learning_rate": 7.141018082729208e-06, + "loss": 0.0732, + "step": 22186 + }, + { + "epoch": 60.45504087193461, + "grad_norm": 2.955643892288208, + "learning_rate": 7.14017243455521e-06, + "loss": 0.0669, + "step": 22187 + }, + { + "epoch": 60.45776566757493, + "grad_norm": 3.058328628540039, + "learning_rate": 7.13932680865346e-06, + "loss": 0.0651, + "step": 22188 + }, + { + "epoch": 60.46049046321526, + "grad_norm": 3.639937162399292, + "learning_rate": 7.1384812050305404e-06, + "loss": 0.1457, + "step": 22189 + }, + { + "epoch": 60.463215258855584, + "grad_norm": 3.513044595718384, + "learning_rate": 7.137635623693036e-06, + "loss": 0.1729, + "step": 22190 + }, + { + "epoch": 60.46594005449591, + "grad_norm": 5.378262042999268, + "learning_rate": 7.136790064647536e-06, + "loss": 0.1175, + "step": 22191 + }, + { + "epoch": 60.46866485013624, + "grad_norm": 3.233370304107666, + "learning_rate": 7.1359445279006205e-06, + "loss": 0.0607, + "step": 22192 + }, + { + "epoch": 60.47138964577657, + "grad_norm": 4.573462963104248, + "learning_rate": 7.135099013458879e-06, + "loss": 0.1568, + "step": 22193 + }, + { + "epoch": 60.474114441416894, + "grad_norm": 6.657225131988525, + "learning_rate": 7.134253521328891e-06, + "loss": 0.109, + "step": 22194 + }, + { + "epoch": 60.47683923705722, + "grad_norm": 4.017292022705078, + "learning_rate": 7.133408051517247e-06, + "loss": 0.0874, + "step": 22195 + }, + { + "epoch": 60.479564032697546, + "grad_norm": 4.407981872558594, + "learning_rate": 7.1325626040305275e-06, + "loss": 0.1247, + "step": 22196 + }, + { + "epoch": 60.48228882833787, + "grad_norm": 2.8455512523651123, + "learning_rate": 7.131717178875317e-06, + "loss": 0.056, + "step": 22197 + }, + { + "epoch": 60.485013623978205, + "grad_norm": 4.186744689941406, + "learning_rate": 7.130871776058204e-06, + "loss": 0.0763, + "step": 22198 + }, + { + "epoch": 60.48773841961853, + "grad_norm": 3.396908760070801, + "learning_rate": 7.130026395585766e-06, + "loss": 0.0671, + "step": 22199 + }, + { + "epoch": 60.490463215258856, + "grad_norm": 3.2078208923339844, + "learning_rate": 7.129181037464593e-06, + "loss": 0.0563, + "step": 22200 + }, + { + "epoch": 60.49318801089918, + "grad_norm": 3.7207226753234863, + "learning_rate": 7.1283357017012635e-06, + "loss": 0.1127, + "step": 22201 + }, + { + "epoch": 60.49591280653951, + "grad_norm": 3.3196473121643066, + "learning_rate": 7.127490388302365e-06, + "loss": 0.1172, + "step": 22202 + }, + { + "epoch": 60.49863760217983, + "grad_norm": 3.7749881744384766, + "learning_rate": 7.126645097274477e-06, + "loss": 0.0881, + "step": 22203 + }, + { + "epoch": 60.50136239782017, + "grad_norm": 5.279852390289307, + "learning_rate": 7.125799828624187e-06, + "loss": 0.0739, + "step": 22204 + }, + { + "epoch": 60.50408719346049, + "grad_norm": 3.02209210395813, + "learning_rate": 7.12495458235807e-06, + "loss": 0.1081, + "step": 22205 + }, + { + "epoch": 60.50681198910082, + "grad_norm": 2.5446105003356934, + "learning_rate": 7.1241093584827185e-06, + "loss": 0.0489, + "step": 22206 + }, + { + "epoch": 60.509536784741144, + "grad_norm": 6.3202056884765625, + "learning_rate": 7.12326415700471e-06, + "loss": 0.0687, + "step": 22207 + }, + { + "epoch": 60.51226158038147, + "grad_norm": 4.158862113952637, + "learning_rate": 7.122418977930628e-06, + "loss": 0.1117, + "step": 22208 + }, + { + "epoch": 60.514986376021795, + "grad_norm": 3.6309733390808105, + "learning_rate": 7.121573821267055e-06, + "loss": 0.1504, + "step": 22209 + }, + { + "epoch": 60.51771117166213, + "grad_norm": 8.954504013061523, + "learning_rate": 7.120728687020571e-06, + "loss": 0.1151, + "step": 22210 + }, + { + "epoch": 60.520435967302454, + "grad_norm": 2.6598422527313232, + "learning_rate": 7.1198835751977615e-06, + "loss": 0.1323, + "step": 22211 + }, + { + "epoch": 60.52316076294278, + "grad_norm": 3.196981906890869, + "learning_rate": 7.119038485805203e-06, + "loss": 0.1082, + "step": 22212 + }, + { + "epoch": 60.525885558583106, + "grad_norm": 4.38768196105957, + "learning_rate": 7.118193418849483e-06, + "loss": 0.0946, + "step": 22213 + }, + { + "epoch": 60.52861035422343, + "grad_norm": 3.1019296646118164, + "learning_rate": 7.1173483743371775e-06, + "loss": 0.0557, + "step": 22214 + }, + { + "epoch": 60.53133514986376, + "grad_norm": 3.9349355697631836, + "learning_rate": 7.116503352274873e-06, + "loss": 0.0742, + "step": 22215 + }, + { + "epoch": 60.53405994550409, + "grad_norm": 3.114135503768921, + "learning_rate": 7.115658352669143e-06, + "loss": 0.0707, + "step": 22216 + }, + { + "epoch": 60.536784741144416, + "grad_norm": 2.8861827850341797, + "learning_rate": 7.114813375526577e-06, + "loss": 0.0675, + "step": 22217 + }, + { + "epoch": 60.53950953678474, + "grad_norm": 3.6690704822540283, + "learning_rate": 7.113968420853749e-06, + "loss": 0.07, + "step": 22218 + }, + { + "epoch": 60.54223433242507, + "grad_norm": 3.5133728981018066, + "learning_rate": 7.113123488657243e-06, + "loss": 0.216, + "step": 22219 + }, + { + "epoch": 60.54495912806539, + "grad_norm": 3.4835526943206787, + "learning_rate": 7.11227857894364e-06, + "loss": 0.0794, + "step": 22220 + }, + { + "epoch": 60.54768392370572, + "grad_norm": 3.0973880290985107, + "learning_rate": 7.111433691719516e-06, + "loss": 0.0509, + "step": 22221 + }, + { + "epoch": 60.55040871934605, + "grad_norm": 3.050398826599121, + "learning_rate": 7.110588826991451e-06, + "loss": 0.0558, + "step": 22222 + }, + { + "epoch": 60.55313351498638, + "grad_norm": 3.540860414505005, + "learning_rate": 7.109743984766032e-06, + "loss": 0.134, + "step": 22223 + }, + { + "epoch": 60.555858310626704, + "grad_norm": 3.0423455238342285, + "learning_rate": 7.108899165049832e-06, + "loss": 0.1101, + "step": 22224 + }, + { + "epoch": 60.55858310626703, + "grad_norm": 2.595421314239502, + "learning_rate": 7.108054367849434e-06, + "loss": 0.1572, + "step": 22225 + }, + { + "epoch": 60.561307901907355, + "grad_norm": 3.4921460151672363, + "learning_rate": 7.107209593171414e-06, + "loss": 0.0852, + "step": 22226 + }, + { + "epoch": 60.56403269754768, + "grad_norm": 2.6923108100891113, + "learning_rate": 7.106364841022353e-06, + "loss": 0.1585, + "step": 22227 + }, + { + "epoch": 60.566757493188014, + "grad_norm": 3.6124486923217773, + "learning_rate": 7.105520111408828e-06, + "loss": 0.0763, + "step": 22228 + }, + { + "epoch": 60.56948228882834, + "grad_norm": 3.460284471511841, + "learning_rate": 7.104675404337422e-06, + "loss": 0.0548, + "step": 22229 + }, + { + "epoch": 60.572207084468666, + "grad_norm": 3.73207950592041, + "learning_rate": 7.103830719814708e-06, + "loss": 0.1149, + "step": 22230 + }, + { + "epoch": 60.57493188010899, + "grad_norm": 3.1647777557373047, + "learning_rate": 7.102986057847269e-06, + "loss": 0.0626, + "step": 22231 + }, + { + "epoch": 60.57765667574932, + "grad_norm": 3.840442419052124, + "learning_rate": 7.102141418441681e-06, + "loss": 0.1868, + "step": 22232 + }, + { + "epoch": 60.58038147138964, + "grad_norm": 2.726717710494995, + "learning_rate": 7.101296801604525e-06, + "loss": 0.1371, + "step": 22233 + }, + { + "epoch": 60.583106267029976, + "grad_norm": 4.018718242645264, + "learning_rate": 7.100452207342372e-06, + "loss": 0.0779, + "step": 22234 + }, + { + "epoch": 60.5858310626703, + "grad_norm": 3.435814619064331, + "learning_rate": 7.099607635661806e-06, + "loss": 0.0674, + "step": 22235 + }, + { + "epoch": 60.58855585831063, + "grad_norm": 5.884005546569824, + "learning_rate": 7.0987630865694e-06, + "loss": 0.1441, + "step": 22236 + }, + { + "epoch": 60.59128065395095, + "grad_norm": 4.433471202850342, + "learning_rate": 7.097918560071737e-06, + "loss": 0.1748, + "step": 22237 + }, + { + "epoch": 60.59400544959128, + "grad_norm": 1.9378094673156738, + "learning_rate": 7.0970740561753884e-06, + "loss": 0.1367, + "step": 22238 + }, + { + "epoch": 60.596730245231605, + "grad_norm": 2.8464200496673584, + "learning_rate": 7.0962295748869314e-06, + "loss": 0.2006, + "step": 22239 + }, + { + "epoch": 60.59945504087194, + "grad_norm": 3.6421751976013184, + "learning_rate": 7.095385116212947e-06, + "loss": 0.1616, + "step": 22240 + }, + { + "epoch": 60.60217983651226, + "grad_norm": 4.609543800354004, + "learning_rate": 7.094540680160013e-06, + "loss": 0.1867, + "step": 22241 + }, + { + "epoch": 60.60490463215259, + "grad_norm": 4.839238166809082, + "learning_rate": 7.0936962667347e-06, + "loss": 0.0766, + "step": 22242 + }, + { + "epoch": 60.607629427792915, + "grad_norm": 4.464300155639648, + "learning_rate": 7.092851875943587e-06, + "loss": 0.1777, + "step": 22243 + }, + { + "epoch": 60.61035422343324, + "grad_norm": 4.258381366729736, + "learning_rate": 7.09200750779325e-06, + "loss": 0.0482, + "step": 22244 + }, + { + "epoch": 60.61307901907357, + "grad_norm": 3.4603633880615234, + "learning_rate": 7.091163162290266e-06, + "loss": 0.0709, + "step": 22245 + }, + { + "epoch": 60.6158038147139, + "grad_norm": 2.9299049377441406, + "learning_rate": 7.090318839441209e-06, + "loss": 0.117, + "step": 22246 + }, + { + "epoch": 60.618528610354225, + "grad_norm": 3.896228790283203, + "learning_rate": 7.089474539252656e-06, + "loss": 0.1283, + "step": 22247 + }, + { + "epoch": 60.62125340599455, + "grad_norm": 3.1333820819854736, + "learning_rate": 7.088630261731181e-06, + "loss": 0.1385, + "step": 22248 + }, + { + "epoch": 60.62397820163488, + "grad_norm": 3.3098950386047363, + "learning_rate": 7.087786006883362e-06, + "loss": 0.1398, + "step": 22249 + }, + { + "epoch": 60.6267029972752, + "grad_norm": 3.3676881790161133, + "learning_rate": 7.086941774715767e-06, + "loss": 0.097, + "step": 22250 + }, + { + "epoch": 60.62942779291553, + "grad_norm": 3.3836073875427246, + "learning_rate": 7.08609756523498e-06, + "loss": 0.0805, + "step": 22251 + }, + { + "epoch": 60.63215258855586, + "grad_norm": 4.441920280456543, + "learning_rate": 7.0852533784475695e-06, + "loss": 0.1654, + "step": 22252 + }, + { + "epoch": 60.63487738419619, + "grad_norm": 3.9132440090179443, + "learning_rate": 7.084409214360113e-06, + "loss": 0.0749, + "step": 22253 + }, + { + "epoch": 60.63760217983651, + "grad_norm": 3.0047171115875244, + "learning_rate": 7.083565072979182e-06, + "loss": 0.0818, + "step": 22254 + }, + { + "epoch": 60.64032697547684, + "grad_norm": 3.052492141723633, + "learning_rate": 7.082720954311354e-06, + "loss": 0.0597, + "step": 22255 + }, + { + "epoch": 60.643051771117165, + "grad_norm": 3.1172616481781006, + "learning_rate": 7.081876858363197e-06, + "loss": 0.0921, + "step": 22256 + }, + { + "epoch": 60.64577656675749, + "grad_norm": 2.963144302368164, + "learning_rate": 7.081032785141292e-06, + "loss": 0.2355, + "step": 22257 + }, + { + "epoch": 60.64850136239782, + "grad_norm": 3.6875598430633545, + "learning_rate": 7.0801887346522116e-06, + "loss": 0.0915, + "step": 22258 + }, + { + "epoch": 60.65122615803815, + "grad_norm": 2.982158899307251, + "learning_rate": 7.079344706902525e-06, + "loss": 0.0556, + "step": 22259 + }, + { + "epoch": 60.653950953678475, + "grad_norm": 3.083127021789551, + "learning_rate": 7.0785007018988095e-06, + "loss": 0.0559, + "step": 22260 + }, + { + "epoch": 60.6566757493188, + "grad_norm": 2.750852346420288, + "learning_rate": 7.077656719647636e-06, + "loss": 0.1345, + "step": 22261 + }, + { + "epoch": 60.65940054495913, + "grad_norm": 3.7517549991607666, + "learning_rate": 7.076812760155576e-06, + "loss": 0.0534, + "step": 22262 + }, + { + "epoch": 60.66212534059945, + "grad_norm": 4.5389556884765625, + "learning_rate": 7.075968823429207e-06, + "loss": 0.1213, + "step": 22263 + }, + { + "epoch": 60.664850136239785, + "grad_norm": 3.5940957069396973, + "learning_rate": 7.075124909475097e-06, + "loss": 0.049, + "step": 22264 + }, + { + "epoch": 60.66757493188011, + "grad_norm": 2.6097493171691895, + "learning_rate": 7.074281018299822e-06, + "loss": 0.092, + "step": 22265 + }, + { + "epoch": 60.67029972752044, + "grad_norm": 4.9819655418396, + "learning_rate": 7.07343714990995e-06, + "loss": 0.0739, + "step": 22266 + }, + { + "epoch": 60.67302452316076, + "grad_norm": 3.7648372650146484, + "learning_rate": 7.072593304312057e-06, + "loss": 0.0592, + "step": 22267 + }, + { + "epoch": 60.67574931880109, + "grad_norm": 2.8173046112060547, + "learning_rate": 7.071749481512712e-06, + "loss": 0.083, + "step": 22268 + }, + { + "epoch": 60.678474114441414, + "grad_norm": 4.30924129486084, + "learning_rate": 7.070905681518489e-06, + "loss": 0.2088, + "step": 22269 + }, + { + "epoch": 60.68119891008175, + "grad_norm": 3.3528645038604736, + "learning_rate": 7.070061904335956e-06, + "loss": 0.0917, + "step": 22270 + }, + { + "epoch": 60.68392370572207, + "grad_norm": 3.794343948364258, + "learning_rate": 7.0692181499716905e-06, + "loss": 0.0905, + "step": 22271 + }, + { + "epoch": 60.6866485013624, + "grad_norm": 3.7777822017669678, + "learning_rate": 7.0683744184322554e-06, + "loss": 0.0592, + "step": 22272 + }, + { + "epoch": 60.689373297002724, + "grad_norm": 3.484302043914795, + "learning_rate": 7.067530709724226e-06, + "loss": 0.2144, + "step": 22273 + }, + { + "epoch": 60.69209809264305, + "grad_norm": 3.621645927429199, + "learning_rate": 7.066687023854175e-06, + "loss": 0.0953, + "step": 22274 + }, + { + "epoch": 60.694822888283376, + "grad_norm": 4.2324018478393555, + "learning_rate": 7.06584336082867e-06, + "loss": 0.0622, + "step": 22275 + }, + { + "epoch": 60.69754768392371, + "grad_norm": 3.1080031394958496, + "learning_rate": 7.0649997206542855e-06, + "loss": 0.083, + "step": 22276 + }, + { + "epoch": 60.700272479564035, + "grad_norm": 17.693635940551758, + "learning_rate": 7.064156103337585e-06, + "loss": 0.1117, + "step": 22277 + }, + { + "epoch": 60.70299727520436, + "grad_norm": 3.959184169769287, + "learning_rate": 7.063312508885145e-06, + "loss": 0.1859, + "step": 22278 + }, + { + "epoch": 60.705722070844686, + "grad_norm": 3.653937339782715, + "learning_rate": 7.06246893730353e-06, + "loss": 0.1018, + "step": 22279 + }, + { + "epoch": 60.70844686648501, + "grad_norm": 4.431345462799072, + "learning_rate": 7.061625388599316e-06, + "loss": 0.134, + "step": 22280 + }, + { + "epoch": 60.71117166212534, + "grad_norm": 2.741877317428589, + "learning_rate": 7.060781862779067e-06, + "loss": 0.0766, + "step": 22281 + }, + { + "epoch": 60.71389645776567, + "grad_norm": 3.2073557376861572, + "learning_rate": 7.0599383598493545e-06, + "loss": 0.0572, + "step": 22282 + }, + { + "epoch": 60.716621253406, + "grad_norm": 4.956356048583984, + "learning_rate": 7.059094879816746e-06, + "loss": 0.1087, + "step": 22283 + }, + { + "epoch": 60.71934604904632, + "grad_norm": 3.5810546875, + "learning_rate": 7.058251422687812e-06, + "loss": 0.1391, + "step": 22284 + }, + { + "epoch": 60.72207084468665, + "grad_norm": 2.8752553462982178, + "learning_rate": 7.057407988469123e-06, + "loss": 0.1421, + "step": 22285 + }, + { + "epoch": 60.724795640326974, + "grad_norm": 4.71677303314209, + "learning_rate": 7.056564577167244e-06, + "loss": 0.1228, + "step": 22286 + }, + { + "epoch": 60.7275204359673, + "grad_norm": 3.7873075008392334, + "learning_rate": 7.055721188788749e-06, + "loss": 0.0911, + "step": 22287 + }, + { + "epoch": 60.73024523160763, + "grad_norm": 4.778517723083496, + "learning_rate": 7.054877823340199e-06, + "loss": 0.2246, + "step": 22288 + }, + { + "epoch": 60.73297002724796, + "grad_norm": 5.951353549957275, + "learning_rate": 7.054034480828167e-06, + "loss": 0.12, + "step": 22289 + }, + { + "epoch": 60.735694822888284, + "grad_norm": 4.711767196655273, + "learning_rate": 7.0531911612592184e-06, + "loss": 0.1744, + "step": 22290 + }, + { + "epoch": 60.73841961852861, + "grad_norm": 3.759284496307373, + "learning_rate": 7.052347864639921e-06, + "loss": 0.0527, + "step": 22291 + }, + { + "epoch": 60.741144414168936, + "grad_norm": 4.224436283111572, + "learning_rate": 7.051504590976847e-06, + "loss": 0.0721, + "step": 22292 + }, + { + "epoch": 60.74386920980926, + "grad_norm": 3.3867928981781006, + "learning_rate": 7.050661340276558e-06, + "loss": 0.0701, + "step": 22293 + }, + { + "epoch": 60.746594005449595, + "grad_norm": 3.020172119140625, + "learning_rate": 7.049818112545626e-06, + "loss": 0.0398, + "step": 22294 + }, + { + "epoch": 60.74931880108992, + "grad_norm": 4.343257427215576, + "learning_rate": 7.048974907790613e-06, + "loss": 0.1534, + "step": 22295 + }, + { + "epoch": 60.752043596730246, + "grad_norm": 2.9345269203186035, + "learning_rate": 7.0481317260180905e-06, + "loss": 0.0415, + "step": 22296 + }, + { + "epoch": 60.75476839237057, + "grad_norm": 3.8636176586151123, + "learning_rate": 7.047288567234621e-06, + "loss": 0.1054, + "step": 22297 + }, + { + "epoch": 60.7574931880109, + "grad_norm": 4.413434028625488, + "learning_rate": 7.046445431446775e-06, + "loss": 0.0801, + "step": 22298 + }, + { + "epoch": 60.76021798365122, + "grad_norm": 10.045730590820312, + "learning_rate": 7.045602318661117e-06, + "loss": 0.1175, + "step": 22299 + }, + { + "epoch": 60.762942779291556, + "grad_norm": 4.641239643096924, + "learning_rate": 7.044759228884212e-06, + "loss": 0.1289, + "step": 22300 + }, + { + "epoch": 60.76566757493188, + "grad_norm": 3.2659778594970703, + "learning_rate": 7.043916162122628e-06, + "loss": 0.0746, + "step": 22301 + }, + { + "epoch": 60.76839237057221, + "grad_norm": 3.401627540588379, + "learning_rate": 7.0430731183829305e-06, + "loss": 0.1623, + "step": 22302 + }, + { + "epoch": 60.771117166212534, + "grad_norm": 4.0639190673828125, + "learning_rate": 7.042230097671681e-06, + "loss": 0.1029, + "step": 22303 + }, + { + "epoch": 60.77384196185286, + "grad_norm": 4.258162498474121, + "learning_rate": 7.0413870999954525e-06, + "loss": 0.0601, + "step": 22304 + }, + { + "epoch": 60.776566757493185, + "grad_norm": 3.7025859355926514, + "learning_rate": 7.040544125360802e-06, + "loss": 0.0993, + "step": 22305 + }, + { + "epoch": 60.77929155313352, + "grad_norm": 2.8596882820129395, + "learning_rate": 7.0397011737743e-06, + "loss": 0.0642, + "step": 22306 + }, + { + "epoch": 60.782016348773844, + "grad_norm": 4.452273845672607, + "learning_rate": 7.038858245242513e-06, + "loss": 0.1547, + "step": 22307 + }, + { + "epoch": 60.78474114441417, + "grad_norm": 4.354523658752441, + "learning_rate": 7.038015339771996e-06, + "loss": 0.1604, + "step": 22308 + }, + { + "epoch": 60.787465940054496, + "grad_norm": 3.5376999378204346, + "learning_rate": 7.037172457369324e-06, + "loss": 0.06, + "step": 22309 + }, + { + "epoch": 60.79019073569482, + "grad_norm": 3.7299249172210693, + "learning_rate": 7.036329598041058e-06, + "loss": 0.0904, + "step": 22310 + }, + { + "epoch": 60.79291553133515, + "grad_norm": 4.104896545410156, + "learning_rate": 7.035486761793762e-06, + "loss": 0.1193, + "step": 22311 + }, + { + "epoch": 60.79564032697548, + "grad_norm": 4.079039096832275, + "learning_rate": 7.034643948634e-06, + "loss": 0.0749, + "step": 22312 + }, + { + "epoch": 60.798365122615806, + "grad_norm": 3.414623975753784, + "learning_rate": 7.033801158568334e-06, + "loss": 0.0761, + "step": 22313 + }, + { + "epoch": 60.80108991825613, + "grad_norm": 2.737549066543579, + "learning_rate": 7.03295839160333e-06, + "loss": 0.1327, + "step": 22314 + }, + { + "epoch": 60.80381471389646, + "grad_norm": 3.315855026245117, + "learning_rate": 7.03211564774555e-06, + "loss": 0.1702, + "step": 22315 + }, + { + "epoch": 60.80653950953678, + "grad_norm": 3.430767059326172, + "learning_rate": 7.03127292700156e-06, + "loss": 0.1141, + "step": 22316 + }, + { + "epoch": 60.80926430517711, + "grad_norm": 3.510793924331665, + "learning_rate": 7.030430229377918e-06, + "loss": 0.0642, + "step": 22317 + }, + { + "epoch": 60.81198910081744, + "grad_norm": 3.1327335834503174, + "learning_rate": 7.029587554881192e-06, + "loss": 0.0691, + "step": 22318 + }, + { + "epoch": 60.81471389645777, + "grad_norm": 2.9371345043182373, + "learning_rate": 7.028744903517941e-06, + "loss": 0.118, + "step": 22319 + }, + { + "epoch": 60.817438692098094, + "grad_norm": 4.144138813018799, + "learning_rate": 7.027902275294731e-06, + "loss": 0.1529, + "step": 22320 + }, + { + "epoch": 60.82016348773842, + "grad_norm": 3.3764593601226807, + "learning_rate": 7.027059670218119e-06, + "loss": 0.185, + "step": 22321 + }, + { + "epoch": 60.822888283378745, + "grad_norm": 3.683173894882202, + "learning_rate": 7.026217088294674e-06, + "loss": 0.0987, + "step": 22322 + }, + { + "epoch": 60.82561307901907, + "grad_norm": 3.99582576751709, + "learning_rate": 7.025374529530952e-06, + "loss": 0.1898, + "step": 22323 + }, + { + "epoch": 60.828337874659404, + "grad_norm": 4.927083969116211, + "learning_rate": 7.024531993933521e-06, + "loss": 0.1131, + "step": 22324 + }, + { + "epoch": 60.83106267029973, + "grad_norm": 6.777295112609863, + "learning_rate": 7.023689481508931e-06, + "loss": 0.1139, + "step": 22325 + }, + { + "epoch": 60.833787465940055, + "grad_norm": 4.779987812042236, + "learning_rate": 7.0228469922637586e-06, + "loss": 0.0963, + "step": 22326 + }, + { + "epoch": 60.83651226158038, + "grad_norm": 3.708977460861206, + "learning_rate": 7.0220045262045555e-06, + "loss": 0.0673, + "step": 22327 + }, + { + "epoch": 60.83923705722071, + "grad_norm": 4.627310752868652, + "learning_rate": 7.021162083337888e-06, + "loss": 0.255, + "step": 22328 + }, + { + "epoch": 60.84196185286103, + "grad_norm": 3.8745877742767334, + "learning_rate": 7.020319663670312e-06, + "loss": 0.1111, + "step": 22329 + }, + { + "epoch": 60.844686648501366, + "grad_norm": 4.898205757141113, + "learning_rate": 7.019477267208392e-06, + "loss": 0.1139, + "step": 22330 + }, + { + "epoch": 60.84741144414169, + "grad_norm": 4.8633952140808105, + "learning_rate": 7.018634893958686e-06, + "loss": 0.254, + "step": 22331 + }, + { + "epoch": 60.85013623978202, + "grad_norm": 3.453780174255371, + "learning_rate": 7.0177925439277574e-06, + "loss": 0.0698, + "step": 22332 + }, + { + "epoch": 60.85286103542234, + "grad_norm": 3.9543163776397705, + "learning_rate": 7.016950217122162e-06, + "loss": 0.1174, + "step": 22333 + }, + { + "epoch": 60.85558583106267, + "grad_norm": 4.60977029800415, + "learning_rate": 7.016107913548465e-06, + "loss": 0.1254, + "step": 22334 + }, + { + "epoch": 60.858310626702995, + "grad_norm": 4.855064868927002, + "learning_rate": 7.01526563321322e-06, + "loss": 0.1817, + "step": 22335 + }, + { + "epoch": 60.86103542234333, + "grad_norm": 3.0899245738983154, + "learning_rate": 7.014423376122993e-06, + "loss": 0.1541, + "step": 22336 + }, + { + "epoch": 60.86376021798365, + "grad_norm": 5.996626377105713, + "learning_rate": 7.0135811422843384e-06, + "loss": 0.065, + "step": 22337 + }, + { + "epoch": 60.86648501362398, + "grad_norm": 4.739663600921631, + "learning_rate": 7.0127389317038205e-06, + "loss": 0.1193, + "step": 22338 + }, + { + "epoch": 60.869209809264305, + "grad_norm": 3.998300552368164, + "learning_rate": 7.011896744387993e-06, + "loss": 0.1159, + "step": 22339 + }, + { + "epoch": 60.87193460490463, + "grad_norm": 3.2619245052337646, + "learning_rate": 7.011054580343421e-06, + "loss": 0.0794, + "step": 22340 + }, + { + "epoch": 60.87465940054496, + "grad_norm": 3.9167654514312744, + "learning_rate": 7.010212439576656e-06, + "loss": 0.0969, + "step": 22341 + }, + { + "epoch": 60.87738419618529, + "grad_norm": 3.9060447216033936, + "learning_rate": 7.009370322094258e-06, + "loss": 0.0973, + "step": 22342 + }, + { + "epoch": 60.880108991825615, + "grad_norm": 3.3744008541107178, + "learning_rate": 7.008528227902793e-06, + "loss": 0.1455, + "step": 22343 + }, + { + "epoch": 60.88283378746594, + "grad_norm": 3.30375075340271, + "learning_rate": 7.00768615700881e-06, + "loss": 0.0569, + "step": 22344 + }, + { + "epoch": 60.88555858310627, + "grad_norm": 2.545348644256592, + "learning_rate": 7.006844109418876e-06, + "loss": 0.0956, + "step": 22345 + }, + { + "epoch": 60.88828337874659, + "grad_norm": 5.121275901794434, + "learning_rate": 7.0060020851395395e-06, + "loss": 0.2386, + "step": 22346 + }, + { + "epoch": 60.89100817438692, + "grad_norm": 3.8333396911621094, + "learning_rate": 7.005160084177365e-06, + "loss": 0.1525, + "step": 22347 + }, + { + "epoch": 60.89373297002725, + "grad_norm": 5.419399261474609, + "learning_rate": 7.0043181065389055e-06, + "loss": 0.1043, + "step": 22348 + }, + { + "epoch": 60.89645776566758, + "grad_norm": 3.4094061851501465, + "learning_rate": 7.003476152230719e-06, + "loss": 0.327, + "step": 22349 + }, + { + "epoch": 60.8991825613079, + "grad_norm": 3.9822192192077637, + "learning_rate": 7.0026342212593674e-06, + "loss": 0.0889, + "step": 22350 + }, + { + "epoch": 60.90190735694823, + "grad_norm": 3.1728477478027344, + "learning_rate": 7.001792313631401e-06, + "loss": 0.0861, + "step": 22351 + }, + { + "epoch": 60.904632152588555, + "grad_norm": 3.60927414894104, + "learning_rate": 7.000950429353382e-06, + "loss": 0.0656, + "step": 22352 + }, + { + "epoch": 60.90735694822888, + "grad_norm": 3.099705696105957, + "learning_rate": 7.000108568431863e-06, + "loss": 0.0534, + "step": 22353 + }, + { + "epoch": 60.91008174386921, + "grad_norm": 5.447761058807373, + "learning_rate": 6.999266730873403e-06, + "loss": 0.0543, + "step": 22354 + }, + { + "epoch": 60.91280653950954, + "grad_norm": 3.7554986476898193, + "learning_rate": 6.998424916684557e-06, + "loss": 0.1462, + "step": 22355 + }, + { + "epoch": 60.915531335149865, + "grad_norm": 2.8073854446411133, + "learning_rate": 6.997583125871881e-06, + "loss": 0.057, + "step": 22356 + }, + { + "epoch": 60.91825613079019, + "grad_norm": 3.9090890884399414, + "learning_rate": 6.996741358441928e-06, + "loss": 0.0587, + "step": 22357 + }, + { + "epoch": 60.920980926430516, + "grad_norm": 5.497412204742432, + "learning_rate": 6.995899614401261e-06, + "loss": 0.1058, + "step": 22358 + }, + { + "epoch": 60.92370572207084, + "grad_norm": 5.184669017791748, + "learning_rate": 6.9950578937564265e-06, + "loss": 0.1425, + "step": 22359 + }, + { + "epoch": 60.926430517711175, + "grad_norm": 4.452134132385254, + "learning_rate": 6.994216196513985e-06, + "loss": 0.1044, + "step": 22360 + }, + { + "epoch": 60.9291553133515, + "grad_norm": 3.787231206893921, + "learning_rate": 6.9933745226804965e-06, + "loss": 0.1101, + "step": 22361 + }, + { + "epoch": 60.93188010899183, + "grad_norm": 5.098844051361084, + "learning_rate": 6.992532872262505e-06, + "loss": 0.1892, + "step": 22362 + }, + { + "epoch": 60.93460490463215, + "grad_norm": 2.834341287612915, + "learning_rate": 6.991691245266574e-06, + "loss": 0.0508, + "step": 22363 + }, + { + "epoch": 60.93732970027248, + "grad_norm": 3.818565607070923, + "learning_rate": 6.990849641699254e-06, + "loss": 0.071, + "step": 22364 + }, + { + "epoch": 60.940054495912804, + "grad_norm": 3.319694757461548, + "learning_rate": 6.9900080615671e-06, + "loss": 0.1031, + "step": 22365 + }, + { + "epoch": 60.94277929155314, + "grad_norm": 4.184003829956055, + "learning_rate": 6.989166504876665e-06, + "loss": 0.1331, + "step": 22366 + }, + { + "epoch": 60.94550408719346, + "grad_norm": 3.072000741958618, + "learning_rate": 6.988324971634506e-06, + "loss": 0.0658, + "step": 22367 + }, + { + "epoch": 60.94822888283379, + "grad_norm": 5.3535943031311035, + "learning_rate": 6.987483461847174e-06, + "loss": 0.1483, + "step": 22368 + }, + { + "epoch": 60.950953678474114, + "grad_norm": 3.907127618789673, + "learning_rate": 6.9866419755212264e-06, + "loss": 0.0844, + "step": 22369 + }, + { + "epoch": 60.95367847411444, + "grad_norm": 4.069503307342529, + "learning_rate": 6.98580051266321e-06, + "loss": 0.108, + "step": 22370 + }, + { + "epoch": 60.956403269754766, + "grad_norm": 4.840079307556152, + "learning_rate": 6.9849590732796845e-06, + "loss": 0.0725, + "step": 22371 + }, + { + "epoch": 60.95912806539509, + "grad_norm": 4.470433712005615, + "learning_rate": 6.9841176573772005e-06, + "loss": 0.2054, + "step": 22372 + }, + { + "epoch": 60.961852861035425, + "grad_norm": 3.4157469272613525, + "learning_rate": 6.983276264962311e-06, + "loss": 0.1004, + "step": 22373 + }, + { + "epoch": 60.96457765667575, + "grad_norm": 3.0583250522613525, + "learning_rate": 6.98243489604157e-06, + "loss": 0.0575, + "step": 22374 + }, + { + "epoch": 60.967302452316076, + "grad_norm": 4.783733367919922, + "learning_rate": 6.981593550621528e-06, + "loss": 0.1084, + "step": 22375 + }, + { + "epoch": 60.9700272479564, + "grad_norm": 4.70540714263916, + "learning_rate": 6.980752228708738e-06, + "loss": 0.0414, + "step": 22376 + }, + { + "epoch": 60.97275204359673, + "grad_norm": 5.025938034057617, + "learning_rate": 6.97991093030975e-06, + "loss": 0.0565, + "step": 22377 + }, + { + "epoch": 60.97547683923706, + "grad_norm": 3.380636692047119, + "learning_rate": 6.979069655431121e-06, + "loss": 0.0724, + "step": 22378 + }, + { + "epoch": 60.97820163487739, + "grad_norm": 2.896272897720337, + "learning_rate": 6.978228404079401e-06, + "loss": 0.0569, + "step": 22379 + }, + { + "epoch": 60.98092643051771, + "grad_norm": 5.541884422302246, + "learning_rate": 6.97738717626114e-06, + "loss": 0.0641, + "step": 22380 + }, + { + "epoch": 60.98365122615804, + "grad_norm": 3.4038572311401367, + "learning_rate": 6.976545971982892e-06, + "loss": 0.1173, + "step": 22381 + }, + { + "epoch": 60.986376021798364, + "grad_norm": 4.201849460601807, + "learning_rate": 6.975704791251205e-06, + "loss": 0.0852, + "step": 22382 + }, + { + "epoch": 60.98910081743869, + "grad_norm": 3.5013699531555176, + "learning_rate": 6.974863634072633e-06, + "loss": 0.1106, + "step": 22383 + }, + { + "epoch": 60.991825613079016, + "grad_norm": 2.2500011920928955, + "learning_rate": 6.974022500453723e-06, + "loss": 0.0475, + "step": 22384 + }, + { + "epoch": 60.99455040871935, + "grad_norm": 5.096434593200684, + "learning_rate": 6.973181390401031e-06, + "loss": 0.087, + "step": 22385 + }, + { + "epoch": 60.997275204359674, + "grad_norm": 3.684089422225952, + "learning_rate": 6.972340303921105e-06, + "loss": 0.1392, + "step": 22386 + }, + { + "epoch": 61.0, + "grad_norm": 3.029940128326416, + "learning_rate": 6.971499241020495e-06, + "loss": 0.0491, + "step": 22387 + }, + { + "epoch": 61.002724795640326, + "grad_norm": 3.285654306411743, + "learning_rate": 6.97065820170575e-06, + "loss": 0.046, + "step": 22388 + }, + { + "epoch": 61.00544959128065, + "grad_norm": 4.274191856384277, + "learning_rate": 6.969817185983423e-06, + "loss": 0.1853, + "step": 22389 + }, + { + "epoch": 61.00817438692098, + "grad_norm": 3.9813826084136963, + "learning_rate": 6.968976193860061e-06, + "loss": 0.0845, + "step": 22390 + }, + { + "epoch": 61.01089918256131, + "grad_norm": 3.7100205421447754, + "learning_rate": 6.968135225342216e-06, + "loss": 0.0688, + "step": 22391 + }, + { + "epoch": 61.013623978201636, + "grad_norm": 2.5532753467559814, + "learning_rate": 6.967294280436435e-06, + "loss": 0.0678, + "step": 22392 + }, + { + "epoch": 61.01634877384196, + "grad_norm": 13.749371528625488, + "learning_rate": 6.9664533591492676e-06, + "loss": 0.1025, + "step": 22393 + }, + { + "epoch": 61.01907356948229, + "grad_norm": 5.873416900634766, + "learning_rate": 6.965612461487263e-06, + "loss": 0.1202, + "step": 22394 + }, + { + "epoch": 61.02179836512261, + "grad_norm": 3.4473066329956055, + "learning_rate": 6.9647715874569744e-06, + "loss": 0.0517, + "step": 22395 + }, + { + "epoch": 61.02452316076294, + "grad_norm": 3.542557716369629, + "learning_rate": 6.963930737064946e-06, + "loss": 0.1713, + "step": 22396 + }, + { + "epoch": 61.02724795640327, + "grad_norm": 3.8530821800231934, + "learning_rate": 6.9630899103177275e-06, + "loss": 0.0548, + "step": 22397 + }, + { + "epoch": 61.0299727520436, + "grad_norm": 3.076282501220703, + "learning_rate": 6.962249107221865e-06, + "loss": 0.0881, + "step": 22398 + }, + { + "epoch": 61.032697547683924, + "grad_norm": 3.455415964126587, + "learning_rate": 6.961408327783911e-06, + "loss": 0.1036, + "step": 22399 + }, + { + "epoch": 61.03542234332425, + "grad_norm": 3.222121477127075, + "learning_rate": 6.9605675720104105e-06, + "loss": 0.1229, + "step": 22400 + }, + { + "epoch": 61.038147138964575, + "grad_norm": 4.793354511260986, + "learning_rate": 6.959726839907914e-06, + "loss": 0.1207, + "step": 22401 + }, + { + "epoch": 61.0408719346049, + "grad_norm": 4.104300498962402, + "learning_rate": 6.958886131482964e-06, + "loss": 0.0864, + "step": 22402 + }, + { + "epoch": 61.043596730245234, + "grad_norm": 3.9924874305725098, + "learning_rate": 6.958045446742112e-06, + "loss": 0.0618, + "step": 22403 + }, + { + "epoch": 61.04632152588556, + "grad_norm": 2.7155587673187256, + "learning_rate": 6.957204785691905e-06, + "loss": 0.0994, + "step": 22404 + }, + { + "epoch": 61.049046321525886, + "grad_norm": 3.9910666942596436, + "learning_rate": 6.956364148338888e-06, + "loss": 0.0863, + "step": 22405 + }, + { + "epoch": 61.05177111716621, + "grad_norm": 3.0680413246154785, + "learning_rate": 6.955523534689609e-06, + "loss": 0.0805, + "step": 22406 + }, + { + "epoch": 61.05449591280654, + "grad_norm": 4.468904495239258, + "learning_rate": 6.954682944750616e-06, + "loss": 0.0771, + "step": 22407 + }, + { + "epoch": 61.05722070844686, + "grad_norm": 2.7519149780273438, + "learning_rate": 6.9538423785284524e-06, + "loss": 0.1257, + "step": 22408 + }, + { + "epoch": 61.059945504087196, + "grad_norm": 4.085991382598877, + "learning_rate": 6.953001836029668e-06, + "loss": 0.1341, + "step": 22409 + }, + { + "epoch": 61.06267029972752, + "grad_norm": 3.700883626937866, + "learning_rate": 6.952161317260806e-06, + "loss": 0.1026, + "step": 22410 + }, + { + "epoch": 61.06539509536785, + "grad_norm": 2.7471423149108887, + "learning_rate": 6.951320822228411e-06, + "loss": 0.0779, + "step": 22411 + }, + { + "epoch": 61.06811989100817, + "grad_norm": 3.2887837886810303, + "learning_rate": 6.9504803509390324e-06, + "loss": 0.0651, + "step": 22412 + }, + { + "epoch": 61.0708446866485, + "grad_norm": 4.459373950958252, + "learning_rate": 6.949639903399219e-06, + "loss": 0.0993, + "step": 22413 + }, + { + "epoch": 61.073569482288825, + "grad_norm": 3.905278205871582, + "learning_rate": 6.948799479615508e-06, + "loss": 0.183, + "step": 22414 + }, + { + "epoch": 61.07629427792916, + "grad_norm": 4.412621974945068, + "learning_rate": 6.947959079594451e-06, + "loss": 0.0534, + "step": 22415 + }, + { + "epoch": 61.079019073569484, + "grad_norm": 3.1119372844696045, + "learning_rate": 6.947118703342588e-06, + "loss": 0.0983, + "step": 22416 + }, + { + "epoch": 61.08174386920981, + "grad_norm": 3.1814849376678467, + "learning_rate": 6.9462783508664685e-06, + "loss": 0.0478, + "step": 22417 + }, + { + "epoch": 61.084468664850135, + "grad_norm": 3.6415998935699463, + "learning_rate": 6.9454380221726335e-06, + "loss": 0.2283, + "step": 22418 + }, + { + "epoch": 61.08719346049046, + "grad_norm": 3.1991705894470215, + "learning_rate": 6.9445977172676315e-06, + "loss": 0.1656, + "step": 22419 + }, + { + "epoch": 61.08991825613079, + "grad_norm": 3.5609500408172607, + "learning_rate": 6.943757436158001e-06, + "loss": 0.2535, + "step": 22420 + }, + { + "epoch": 61.09264305177112, + "grad_norm": 3.4742014408111572, + "learning_rate": 6.94291717885029e-06, + "loss": 0.0565, + "step": 22421 + }, + { + "epoch": 61.095367847411445, + "grad_norm": 5.54591703414917, + "learning_rate": 6.9420769453510415e-06, + "loss": 0.0777, + "step": 22422 + }, + { + "epoch": 61.09809264305177, + "grad_norm": 3.9256865978240967, + "learning_rate": 6.941236735666801e-06, + "loss": 0.1117, + "step": 22423 + }, + { + "epoch": 61.1008174386921, + "grad_norm": 4.0424017906188965, + "learning_rate": 6.9403965498041084e-06, + "loss": 0.1486, + "step": 22424 + }, + { + "epoch": 61.10354223433242, + "grad_norm": 3.375750780105591, + "learning_rate": 6.939556387769511e-06, + "loss": 0.3533, + "step": 22425 + }, + { + "epoch": 61.10626702997275, + "grad_norm": 3.0661110877990723, + "learning_rate": 6.9387162495695485e-06, + "loss": 0.2026, + "step": 22426 + }, + { + "epoch": 61.10899182561308, + "grad_norm": 3.263305902481079, + "learning_rate": 6.937876135210766e-06, + "loss": 0.1391, + "step": 22427 + }, + { + "epoch": 61.11171662125341, + "grad_norm": 6.555750370025635, + "learning_rate": 6.937036044699701e-06, + "loss": 0.085, + "step": 22428 + }, + { + "epoch": 61.11444141689373, + "grad_norm": 2.908816337585449, + "learning_rate": 6.936195978042904e-06, + "loss": 0.157, + "step": 22429 + }, + { + "epoch": 61.11716621253406, + "grad_norm": 3.787827253341675, + "learning_rate": 6.9353559352469165e-06, + "loss": 0.1936, + "step": 22430 + }, + { + "epoch": 61.119891008174385, + "grad_norm": 3.831509590148926, + "learning_rate": 6.934515916318276e-06, + "loss": 0.0693, + "step": 22431 + }, + { + "epoch": 61.12261580381471, + "grad_norm": 5.685774326324463, + "learning_rate": 6.9336759212635285e-06, + "loss": 0.0648, + "step": 22432 + }, + { + "epoch": 61.12534059945504, + "grad_norm": 3.847019672393799, + "learning_rate": 6.932835950089211e-06, + "loss": 0.126, + "step": 22433 + }, + { + "epoch": 61.12806539509537, + "grad_norm": 2.8347580432891846, + "learning_rate": 6.93199600280187e-06, + "loss": 0.0598, + "step": 22434 + }, + { + "epoch": 61.130790190735695, + "grad_norm": 2.3914573192596436, + "learning_rate": 6.931156079408048e-06, + "loss": 0.0418, + "step": 22435 + }, + { + "epoch": 61.13351498637602, + "grad_norm": 3.817255973815918, + "learning_rate": 6.930316179914281e-06, + "loss": 0.1644, + "step": 22436 + }, + { + "epoch": 61.13623978201635, + "grad_norm": 3.574416160583496, + "learning_rate": 6.9294763043271156e-06, + "loss": 0.1007, + "step": 22437 + }, + { + "epoch": 61.13896457765667, + "grad_norm": 3.91249942779541, + "learning_rate": 6.928636452653086e-06, + "loss": 0.1997, + "step": 22438 + }, + { + "epoch": 61.141689373297005, + "grad_norm": 4.053663730621338, + "learning_rate": 6.9277966248987405e-06, + "loss": 0.1863, + "step": 22439 + }, + { + "epoch": 61.14441416893733, + "grad_norm": 3.43363881111145, + "learning_rate": 6.926956821070614e-06, + "loss": 0.1179, + "step": 22440 + }, + { + "epoch": 61.14713896457766, + "grad_norm": 3.894035816192627, + "learning_rate": 6.92611704117525e-06, + "loss": 0.0746, + "step": 22441 + }, + { + "epoch": 61.14986376021798, + "grad_norm": 3.0605595111846924, + "learning_rate": 6.925277285219185e-06, + "loss": 0.0626, + "step": 22442 + }, + { + "epoch": 61.15258855585831, + "grad_norm": 4.345304012298584, + "learning_rate": 6.924437553208965e-06, + "loss": 0.1464, + "step": 22443 + }, + { + "epoch": 61.155313351498634, + "grad_norm": 4.668532848358154, + "learning_rate": 6.923597845151124e-06, + "loss": 0.1101, + "step": 22444 + }, + { + "epoch": 61.15803814713897, + "grad_norm": 3.243645429611206, + "learning_rate": 6.922758161052201e-06, + "loss": 0.0891, + "step": 22445 + }, + { + "epoch": 61.16076294277929, + "grad_norm": 4.130244731903076, + "learning_rate": 6.921918500918743e-06, + "loss": 0.1457, + "step": 22446 + }, + { + "epoch": 61.16348773841962, + "grad_norm": 4.43756628036499, + "learning_rate": 6.921078864757282e-06, + "loss": 0.1449, + "step": 22447 + }, + { + "epoch": 61.166212534059945, + "grad_norm": 3.9297196865081787, + "learning_rate": 6.920239252574364e-06, + "loss": 0.0579, + "step": 22448 + }, + { + "epoch": 61.16893732970027, + "grad_norm": 4.997093200683594, + "learning_rate": 6.9193996643765195e-06, + "loss": 0.1195, + "step": 22449 + }, + { + "epoch": 61.171662125340596, + "grad_norm": 3.6902146339416504, + "learning_rate": 6.918560100170293e-06, + "loss": 0.11, + "step": 22450 + }, + { + "epoch": 61.17438692098093, + "grad_norm": 2.218496322631836, + "learning_rate": 6.91772055996222e-06, + "loss": 0.0283, + "step": 22451 + }, + { + "epoch": 61.177111716621255, + "grad_norm": 4.0584211349487305, + "learning_rate": 6.916881043758843e-06, + "loss": 0.1857, + "step": 22452 + }, + { + "epoch": 61.17983651226158, + "grad_norm": 5.4693193435668945, + "learning_rate": 6.916041551566695e-06, + "loss": 0.0712, + "step": 22453 + }, + { + "epoch": 61.182561307901906, + "grad_norm": 2.8290891647338867, + "learning_rate": 6.915202083392316e-06, + "loss": 0.0834, + "step": 22454 + }, + { + "epoch": 61.18528610354223, + "grad_norm": 4.029819488525391, + "learning_rate": 6.9143626392422446e-06, + "loss": 0.1181, + "step": 22455 + }, + { + "epoch": 61.18801089918256, + "grad_norm": 2.920246124267578, + "learning_rate": 6.9135232191230176e-06, + "loss": 0.0597, + "step": 22456 + }, + { + "epoch": 61.19073569482289, + "grad_norm": 3.2647705078125, + "learning_rate": 6.912683823041171e-06, + "loss": 0.1243, + "step": 22457 + }, + { + "epoch": 61.19346049046322, + "grad_norm": 4.116549968719482, + "learning_rate": 6.911844451003244e-06, + "loss": 0.1568, + "step": 22458 + }, + { + "epoch": 61.19618528610354, + "grad_norm": 3.7574572563171387, + "learning_rate": 6.911005103015775e-06, + "loss": 0.2098, + "step": 22459 + }, + { + "epoch": 61.19891008174387, + "grad_norm": 3.683820962905884, + "learning_rate": 6.910165779085296e-06, + "loss": 0.1229, + "step": 22460 + }, + { + "epoch": 61.201634877384194, + "grad_norm": 4.492462158203125, + "learning_rate": 6.90932647921835e-06, + "loss": 0.1008, + "step": 22461 + }, + { + "epoch": 61.20435967302452, + "grad_norm": 3.6631996631622314, + "learning_rate": 6.908487203421465e-06, + "loss": 0.0954, + "step": 22462 + }, + { + "epoch": 61.20708446866485, + "grad_norm": 2.686357021331787, + "learning_rate": 6.907647951701183e-06, + "loss": 0.0509, + "step": 22463 + }, + { + "epoch": 61.20980926430518, + "grad_norm": 3.2772693634033203, + "learning_rate": 6.906808724064043e-06, + "loss": 0.054, + "step": 22464 + }, + { + "epoch": 61.212534059945504, + "grad_norm": 3.1622159481048584, + "learning_rate": 6.905969520516573e-06, + "loss": 0.0817, + "step": 22465 + }, + { + "epoch": 61.21525885558583, + "grad_norm": 3.74229097366333, + "learning_rate": 6.905130341065317e-06, + "loss": 0.0751, + "step": 22466 + }, + { + "epoch": 61.217983651226156, + "grad_norm": 3.26526141166687, + "learning_rate": 6.904291185716802e-06, + "loss": 0.0645, + "step": 22467 + }, + { + "epoch": 61.22070844686648, + "grad_norm": 3.589921236038208, + "learning_rate": 6.903452054477573e-06, + "loss": 0.0629, + "step": 22468 + }, + { + "epoch": 61.223433242506815, + "grad_norm": 5.118885040283203, + "learning_rate": 6.902612947354155e-06, + "loss": 0.1421, + "step": 22469 + }, + { + "epoch": 61.22615803814714, + "grad_norm": 3.6298789978027344, + "learning_rate": 6.9017738643530905e-06, + "loss": 0.0704, + "step": 22470 + }, + { + "epoch": 61.228882833787466, + "grad_norm": 3.2231998443603516, + "learning_rate": 6.90093480548091e-06, + "loss": 0.0662, + "step": 22471 + }, + { + "epoch": 61.23160762942779, + "grad_norm": 2.864978313446045, + "learning_rate": 6.9000957707441505e-06, + "loss": 0.1268, + "step": 22472 + }, + { + "epoch": 61.23433242506812, + "grad_norm": 3.8802876472473145, + "learning_rate": 6.899256760149345e-06, + "loss": 0.0984, + "step": 22473 + }, + { + "epoch": 61.237057220708444, + "grad_norm": 2.5116190910339355, + "learning_rate": 6.898417773703028e-06, + "loss": 0.0491, + "step": 22474 + }, + { + "epoch": 61.23978201634878, + "grad_norm": 3.569486141204834, + "learning_rate": 6.897578811411732e-06, + "loss": 0.0665, + "step": 22475 + }, + { + "epoch": 61.2425068119891, + "grad_norm": 3.417987823486328, + "learning_rate": 6.896739873281995e-06, + "loss": 0.1306, + "step": 22476 + }, + { + "epoch": 61.24523160762943, + "grad_norm": 3.795724868774414, + "learning_rate": 6.8959009593203454e-06, + "loss": 0.2253, + "step": 22477 + }, + { + "epoch": 61.247956403269754, + "grad_norm": 4.208312511444092, + "learning_rate": 6.895062069533322e-06, + "loss": 0.1128, + "step": 22478 + }, + { + "epoch": 61.25068119891008, + "grad_norm": 4.227952480316162, + "learning_rate": 6.894223203927452e-06, + "loss": 0.1524, + "step": 22479 + }, + { + "epoch": 61.253405994550405, + "grad_norm": 5.267580509185791, + "learning_rate": 6.8933843625092715e-06, + "loss": 0.0809, + "step": 22480 + }, + { + "epoch": 61.25613079019074, + "grad_norm": 3.6058425903320312, + "learning_rate": 6.892545545285314e-06, + "loss": 0.0906, + "step": 22481 + }, + { + "epoch": 61.258855585831064, + "grad_norm": 7.454145431518555, + "learning_rate": 6.891706752262115e-06, + "loss": 0.1498, + "step": 22482 + }, + { + "epoch": 61.26158038147139, + "grad_norm": 3.4177675247192383, + "learning_rate": 6.890867983446201e-06, + "loss": 0.0654, + "step": 22483 + }, + { + "epoch": 61.264305177111716, + "grad_norm": 2.882645606994629, + "learning_rate": 6.8900292388441095e-06, + "loss": 0.0957, + "step": 22484 + }, + { + "epoch": 61.26702997275204, + "grad_norm": 3.294074773788452, + "learning_rate": 6.889190518462368e-06, + "loss": 0.0733, + "step": 22485 + }, + { + "epoch": 61.26975476839237, + "grad_norm": 3.619446039199829, + "learning_rate": 6.888351822307513e-06, + "loss": 0.0694, + "step": 22486 + }, + { + "epoch": 61.2724795640327, + "grad_norm": 3.25736141204834, + "learning_rate": 6.887513150386072e-06, + "loss": 0.0637, + "step": 22487 + }, + { + "epoch": 61.275204359673026, + "grad_norm": 4.02907657623291, + "learning_rate": 6.886674502704579e-06, + "loss": 0.1833, + "step": 22488 + }, + { + "epoch": 61.27792915531335, + "grad_norm": 3.1237282752990723, + "learning_rate": 6.885835879269564e-06, + "loss": 0.0694, + "step": 22489 + }, + { + "epoch": 61.28065395095368, + "grad_norm": 8.443364143371582, + "learning_rate": 6.88499728008756e-06, + "loss": 0.1257, + "step": 22490 + }, + { + "epoch": 61.283378746594, + "grad_norm": 4.005463600158691, + "learning_rate": 6.884158705165096e-06, + "loss": 0.0746, + "step": 22491 + }, + { + "epoch": 61.28610354223433, + "grad_norm": 3.8555893898010254, + "learning_rate": 6.883320154508705e-06, + "loss": 0.0707, + "step": 22492 + }, + { + "epoch": 61.28882833787466, + "grad_norm": 2.8718743324279785, + "learning_rate": 6.882481628124915e-06, + "loss": 0.0623, + "step": 22493 + }, + { + "epoch": 61.29155313351499, + "grad_norm": 3.9258992671966553, + "learning_rate": 6.881643126020259e-06, + "loss": 0.1837, + "step": 22494 + }, + { + "epoch": 61.294277929155314, + "grad_norm": 7.436041355133057, + "learning_rate": 6.8808046482012645e-06, + "loss": 0.0849, + "step": 22495 + }, + { + "epoch": 61.29700272479564, + "grad_norm": 3.05180287361145, + "learning_rate": 6.8799661946744646e-06, + "loss": 0.106, + "step": 22496 + }, + { + "epoch": 61.299727520435965, + "grad_norm": 3.570476531982422, + "learning_rate": 6.879127765446383e-06, + "loss": 0.2072, + "step": 22497 + }, + { + "epoch": 61.30245231607629, + "grad_norm": 2.7125468254089355, + "learning_rate": 6.878289360523556e-06, + "loss": 0.0435, + "step": 22498 + }, + { + "epoch": 61.305177111716624, + "grad_norm": 6.026636600494385, + "learning_rate": 6.877450979912512e-06, + "loss": 0.0725, + "step": 22499 + }, + { + "epoch": 61.30790190735695, + "grad_norm": 3.470548391342163, + "learning_rate": 6.876612623619782e-06, + "loss": 0.059, + "step": 22500 + }, + { + "epoch": 61.310626702997276, + "grad_norm": 3.3297195434570312, + "learning_rate": 6.875774291651889e-06, + "loss": 0.1602, + "step": 22501 + }, + { + "epoch": 61.3133514986376, + "grad_norm": 2.9722609519958496, + "learning_rate": 6.874935984015367e-06, + "loss": 0.098, + "step": 22502 + }, + { + "epoch": 61.31607629427793, + "grad_norm": 4.761186122894287, + "learning_rate": 6.874097700716742e-06, + "loss": 0.1268, + "step": 22503 + }, + { + "epoch": 61.31880108991825, + "grad_norm": 3.75443434715271, + "learning_rate": 6.873259441762545e-06, + "loss": 0.0661, + "step": 22504 + }, + { + "epoch": 61.321525885558586, + "grad_norm": 3.4605464935302734, + "learning_rate": 6.872421207159301e-06, + "loss": 0.0559, + "step": 22505 + }, + { + "epoch": 61.32425068119891, + "grad_norm": 2.499070644378662, + "learning_rate": 6.871582996913542e-06, + "loss": 0.0584, + "step": 22506 + }, + { + "epoch": 61.32697547683924, + "grad_norm": 4.2966437339782715, + "learning_rate": 6.870744811031791e-06, + "loss": 0.0485, + "step": 22507 + }, + { + "epoch": 61.32970027247956, + "grad_norm": 8.06656551361084, + "learning_rate": 6.869906649520581e-06, + "loss": 0.1118, + "step": 22508 + }, + { + "epoch": 61.33242506811989, + "grad_norm": 3.6609208583831787, + "learning_rate": 6.869068512386436e-06, + "loss": 0.0799, + "step": 22509 + }, + { + "epoch": 61.335149863760215, + "grad_norm": 2.774722099304199, + "learning_rate": 6.868230399635887e-06, + "loss": 0.1738, + "step": 22510 + }, + { + "epoch": 61.33787465940055, + "grad_norm": 3.4997575283050537, + "learning_rate": 6.867392311275456e-06, + "loss": 0.1908, + "step": 22511 + }, + { + "epoch": 61.34059945504087, + "grad_norm": 2.995242118835449, + "learning_rate": 6.866554247311676e-06, + "loss": 0.1446, + "step": 22512 + }, + { + "epoch": 61.3433242506812, + "grad_norm": 2.2353782653808594, + "learning_rate": 6.865716207751068e-06, + "loss": 0.0471, + "step": 22513 + }, + { + "epoch": 61.346049046321525, + "grad_norm": 4.911764144897461, + "learning_rate": 6.864878192600158e-06, + "loss": 0.1985, + "step": 22514 + }, + { + "epoch": 61.34877384196185, + "grad_norm": 4.077296733856201, + "learning_rate": 6.864040201865481e-06, + "loss": 0.0599, + "step": 22515 + }, + { + "epoch": 61.35149863760218, + "grad_norm": 5.075759410858154, + "learning_rate": 6.863202235553557e-06, + "loss": 0.0898, + "step": 22516 + }, + { + "epoch": 61.35422343324251, + "grad_norm": 3.448331594467163, + "learning_rate": 6.862364293670913e-06, + "loss": 0.0492, + "step": 22517 + }, + { + "epoch": 61.356948228882835, + "grad_norm": 2.8780722618103027, + "learning_rate": 6.8615263762240735e-06, + "loss": 0.124, + "step": 22518 + }, + { + "epoch": 61.35967302452316, + "grad_norm": 3.84973406791687, + "learning_rate": 6.860688483219569e-06, + "loss": 0.1241, + "step": 22519 + }, + { + "epoch": 61.36239782016349, + "grad_norm": 3.990999698638916, + "learning_rate": 6.859850614663916e-06, + "loss": 0.1081, + "step": 22520 + }, + { + "epoch": 61.36512261580381, + "grad_norm": 3.954577922821045, + "learning_rate": 6.859012770563649e-06, + "loss": 0.0656, + "step": 22521 + }, + { + "epoch": 61.36784741144414, + "grad_norm": 4.023142337799072, + "learning_rate": 6.858174950925289e-06, + "loss": 0.0796, + "step": 22522 + }, + { + "epoch": 61.37057220708447, + "grad_norm": 3.638831853866577, + "learning_rate": 6.857337155755362e-06, + "loss": 0.0473, + "step": 22523 + }, + { + "epoch": 61.3732970027248, + "grad_norm": 3.5866053104400635, + "learning_rate": 6.856499385060392e-06, + "loss": 0.1376, + "step": 22524 + }, + { + "epoch": 61.37602179836512, + "grad_norm": 3.0281224250793457, + "learning_rate": 6.855661638846902e-06, + "loss": 0.0581, + "step": 22525 + }, + { + "epoch": 61.37874659400545, + "grad_norm": 3.867025375366211, + "learning_rate": 6.854823917121421e-06, + "loss": 0.0782, + "step": 22526 + }, + { + "epoch": 61.381471389645775, + "grad_norm": 4.331473350524902, + "learning_rate": 6.853986219890467e-06, + "loss": 0.0702, + "step": 22527 + }, + { + "epoch": 61.3841961852861, + "grad_norm": 3.835432291030884, + "learning_rate": 6.853148547160568e-06, + "loss": 0.0706, + "step": 22528 + }, + { + "epoch": 61.38692098092643, + "grad_norm": 5.395134449005127, + "learning_rate": 6.852310898938248e-06, + "loss": 0.1446, + "step": 22529 + }, + { + "epoch": 61.38964577656676, + "grad_norm": 3.941890239715576, + "learning_rate": 6.85147327523003e-06, + "loss": 0.1196, + "step": 22530 + }, + { + "epoch": 61.392370572207085, + "grad_norm": 3.325962781906128, + "learning_rate": 6.850635676042432e-06, + "loss": 0.0991, + "step": 22531 + }, + { + "epoch": 61.39509536784741, + "grad_norm": 4.40023946762085, + "learning_rate": 6.849798101381984e-06, + "loss": 0.0587, + "step": 22532 + }, + { + "epoch": 61.39782016348774, + "grad_norm": 3.027614116668701, + "learning_rate": 6.848960551255208e-06, + "loss": 0.049, + "step": 22533 + }, + { + "epoch": 61.40054495912806, + "grad_norm": 5.605319499969482, + "learning_rate": 6.848123025668626e-06, + "loss": 0.2438, + "step": 22534 + }, + { + "epoch": 61.403269754768395, + "grad_norm": 5.745209217071533, + "learning_rate": 6.847285524628762e-06, + "loss": 0.0956, + "step": 22535 + }, + { + "epoch": 61.40599455040872, + "grad_norm": 3.1595828533172607, + "learning_rate": 6.846448048142134e-06, + "loss": 0.0941, + "step": 22536 + }, + { + "epoch": 61.40871934604905, + "grad_norm": 2.9316658973693848, + "learning_rate": 6.84561059621527e-06, + "loss": 0.1674, + "step": 22537 + }, + { + "epoch": 61.41144414168937, + "grad_norm": 5.271034240722656, + "learning_rate": 6.844773168854686e-06, + "loss": 0.1526, + "step": 22538 + }, + { + "epoch": 61.4141689373297, + "grad_norm": 3.7947235107421875, + "learning_rate": 6.843935766066911e-06, + "loss": 0.0582, + "step": 22539 + }, + { + "epoch": 61.416893732970024, + "grad_norm": 3.0826029777526855, + "learning_rate": 6.8430983878584585e-06, + "loss": 0.0697, + "step": 22540 + }, + { + "epoch": 61.41961852861036, + "grad_norm": 3.8238813877105713, + "learning_rate": 6.842261034235858e-06, + "loss": 0.1339, + "step": 22541 + }, + { + "epoch": 61.42234332425068, + "grad_norm": 4.125527381896973, + "learning_rate": 6.841423705205623e-06, + "loss": 0.1194, + "step": 22542 + }, + { + "epoch": 61.42506811989101, + "grad_norm": 4.080195426940918, + "learning_rate": 6.840586400774282e-06, + "loss": 0.1927, + "step": 22543 + }, + { + "epoch": 61.427792915531334, + "grad_norm": 4.2366228103637695, + "learning_rate": 6.839749120948349e-06, + "loss": 0.1214, + "step": 22544 + }, + { + "epoch": 61.43051771117166, + "grad_norm": 3.4900057315826416, + "learning_rate": 6.8389118657343505e-06, + "loss": 0.0864, + "step": 22545 + }, + { + "epoch": 61.433242506811986, + "grad_norm": 3.958977460861206, + "learning_rate": 6.838074635138805e-06, + "loss": 0.0958, + "step": 22546 + }, + { + "epoch": 61.43596730245232, + "grad_norm": 6.551956653594971, + "learning_rate": 6.8372374291682306e-06, + "loss": 0.2499, + "step": 22547 + }, + { + "epoch": 61.438692098092645, + "grad_norm": 4.2710371017456055, + "learning_rate": 6.836400247829151e-06, + "loss": 0.0968, + "step": 22548 + }, + { + "epoch": 61.44141689373297, + "grad_norm": 2.7208895683288574, + "learning_rate": 6.835563091128081e-06, + "loss": 0.1067, + "step": 22549 + }, + { + "epoch": 61.444141689373296, + "grad_norm": 4.0786285400390625, + "learning_rate": 6.834725959071546e-06, + "loss": 0.1261, + "step": 22550 + }, + { + "epoch": 61.44686648501362, + "grad_norm": 4.6377105712890625, + "learning_rate": 6.833888851666064e-06, + "loss": 0.0836, + "step": 22551 + }, + { + "epoch": 61.44959128065395, + "grad_norm": 3.952730894088745, + "learning_rate": 6.8330517689181534e-06, + "loss": 0.1789, + "step": 22552 + }, + { + "epoch": 61.45231607629428, + "grad_norm": 7.379684925079346, + "learning_rate": 6.832214710834335e-06, + "loss": 0.1058, + "step": 22553 + }, + { + "epoch": 61.45504087193461, + "grad_norm": 4.6327223777771, + "learning_rate": 6.831377677421125e-06, + "loss": 0.131, + "step": 22554 + }, + { + "epoch": 61.45776566757493, + "grad_norm": 2.3379297256469727, + "learning_rate": 6.830540668685045e-06, + "loss": 0.0889, + "step": 22555 + }, + { + "epoch": 61.46049046321526, + "grad_norm": 2.2440812587738037, + "learning_rate": 6.82970368463261e-06, + "loss": 0.1082, + "step": 22556 + }, + { + "epoch": 61.463215258855584, + "grad_norm": 4.8782877922058105, + "learning_rate": 6.8288667252703435e-06, + "loss": 0.0587, + "step": 22557 + }, + { + "epoch": 61.46594005449591, + "grad_norm": 3.6590161323547363, + "learning_rate": 6.828029790604757e-06, + "loss": 0.2096, + "step": 22558 + }, + { + "epoch": 61.46866485013624, + "grad_norm": 3.6848299503326416, + "learning_rate": 6.827192880642377e-06, + "loss": 0.0511, + "step": 22559 + }, + { + "epoch": 61.47138964577657, + "grad_norm": 5.054895877838135, + "learning_rate": 6.826355995389714e-06, + "loss": 0.1669, + "step": 22560 + }, + { + "epoch": 61.474114441416894, + "grad_norm": 3.6900060176849365, + "learning_rate": 6.82551913485329e-06, + "loss": 0.1283, + "step": 22561 + }, + { + "epoch": 61.47683923705722, + "grad_norm": 3.7525711059570312, + "learning_rate": 6.824682299039619e-06, + "loss": 0.0659, + "step": 22562 + }, + { + "epoch": 61.479564032697546, + "grad_norm": 4.069061756134033, + "learning_rate": 6.823845487955222e-06, + "loss": 0.1744, + "step": 22563 + }, + { + "epoch": 61.48228882833787, + "grad_norm": 4.4344096183776855, + "learning_rate": 6.823008701606612e-06, + "loss": 0.1213, + "step": 22564 + }, + { + "epoch": 61.485013623978205, + "grad_norm": 3.128112316131592, + "learning_rate": 6.822171940000311e-06, + "loss": 0.0555, + "step": 22565 + }, + { + "epoch": 61.48773841961853, + "grad_norm": 5.1781110763549805, + "learning_rate": 6.821335203142825e-06, + "loss": 0.0946, + "step": 22566 + }, + { + "epoch": 61.490463215258856, + "grad_norm": 3.098604917526245, + "learning_rate": 6.820498491040684e-06, + "loss": 0.1108, + "step": 22567 + }, + { + "epoch": 61.49318801089918, + "grad_norm": 5.4357075691223145, + "learning_rate": 6.819661803700397e-06, + "loss": 0.0706, + "step": 22568 + }, + { + "epoch": 61.49591280653951, + "grad_norm": 4.7054266929626465, + "learning_rate": 6.818825141128484e-06, + "loss": 0.0891, + "step": 22569 + }, + { + "epoch": 61.49863760217983, + "grad_norm": 5.830087184906006, + "learning_rate": 6.817988503331456e-06, + "loss": 0.303, + "step": 22570 + }, + { + "epoch": 61.50136239782017, + "grad_norm": 4.259527206420898, + "learning_rate": 6.817151890315834e-06, + "loss": 0.2109, + "step": 22571 + }, + { + "epoch": 61.50408719346049, + "grad_norm": 3.3473060131073, + "learning_rate": 6.816315302088128e-06, + "loss": 0.0757, + "step": 22572 + }, + { + "epoch": 61.50681198910082, + "grad_norm": 6.24845552444458, + "learning_rate": 6.815478738654857e-06, + "loss": 0.1215, + "step": 22573 + }, + { + "epoch": 61.509536784741144, + "grad_norm": 5.4939351081848145, + "learning_rate": 6.814642200022534e-06, + "loss": 0.1916, + "step": 22574 + }, + { + "epoch": 61.51226158038147, + "grad_norm": 3.96571946144104, + "learning_rate": 6.813805686197677e-06, + "loss": 0.1267, + "step": 22575 + }, + { + "epoch": 61.514986376021795, + "grad_norm": 3.6861422061920166, + "learning_rate": 6.812969197186796e-06, + "loss": 0.0727, + "step": 22576 + }, + { + "epoch": 61.51771117166213, + "grad_norm": 3.844547986984253, + "learning_rate": 6.8121327329964116e-06, + "loss": 0.1031, + "step": 22577 + }, + { + "epoch": 61.520435967302454, + "grad_norm": 3.123567581176758, + "learning_rate": 6.811296293633032e-06, + "loss": 0.1303, + "step": 22578 + }, + { + "epoch": 61.52316076294278, + "grad_norm": 2.9488346576690674, + "learning_rate": 6.810459879103177e-06, + "loss": 0.0529, + "step": 22579 + }, + { + "epoch": 61.525885558583106, + "grad_norm": 3.1225693225860596, + "learning_rate": 6.8096234894133554e-06, + "loss": 0.0552, + "step": 22580 + }, + { + "epoch": 61.52861035422343, + "grad_norm": 7.820192337036133, + "learning_rate": 6.808787124570086e-06, + "loss": 0.1403, + "step": 22581 + }, + { + "epoch": 61.53133514986376, + "grad_norm": 3.2657599449157715, + "learning_rate": 6.8079507845798754e-06, + "loss": 0.1341, + "step": 22582 + }, + { + "epoch": 61.53405994550409, + "grad_norm": 8.19572639465332, + "learning_rate": 6.807114469449242e-06, + "loss": 0.1402, + "step": 22583 + }, + { + "epoch": 61.536784741144416, + "grad_norm": 5.6479291915893555, + "learning_rate": 6.806278179184701e-06, + "loss": 0.0685, + "step": 22584 + }, + { + "epoch": 61.53950953678474, + "grad_norm": 6.213305473327637, + "learning_rate": 6.805441913792761e-06, + "loss": 0.0791, + "step": 22585 + }, + { + "epoch": 61.54223433242507, + "grad_norm": 3.350292444229126, + "learning_rate": 6.804605673279937e-06, + "loss": 0.1291, + "step": 22586 + }, + { + "epoch": 61.54495912806539, + "grad_norm": 3.873460054397583, + "learning_rate": 6.803769457652743e-06, + "loss": 0.0658, + "step": 22587 + }, + { + "epoch": 61.54768392370572, + "grad_norm": 3.1772074699401855, + "learning_rate": 6.802933266917687e-06, + "loss": 0.1259, + "step": 22588 + }, + { + "epoch": 61.55040871934605, + "grad_norm": 4.587749004364014, + "learning_rate": 6.802097101081286e-06, + "loss": 0.1125, + "step": 22589 + }, + { + "epoch": 61.55313351498638, + "grad_norm": 4.840493202209473, + "learning_rate": 6.801260960150049e-06, + "loss": 0.0879, + "step": 22590 + }, + { + "epoch": 61.555858310626704, + "grad_norm": 3.0096285343170166, + "learning_rate": 6.80042484413049e-06, + "loss": 0.119, + "step": 22591 + }, + { + "epoch": 61.55858310626703, + "grad_norm": 3.6800713539123535, + "learning_rate": 6.799588753029116e-06, + "loss": 0.0525, + "step": 22592 + }, + { + "epoch": 61.561307901907355, + "grad_norm": 4.493557453155518, + "learning_rate": 6.798752686852445e-06, + "loss": 0.1426, + "step": 22593 + }, + { + "epoch": 61.56403269754768, + "grad_norm": 3.826521158218384, + "learning_rate": 6.797916645606984e-06, + "loss": 0.1073, + "step": 22594 + }, + { + "epoch": 61.566757493188014, + "grad_norm": 4.606961250305176, + "learning_rate": 6.797080629299246e-06, + "loss": 0.0999, + "step": 22595 + }, + { + "epoch": 61.56948228882834, + "grad_norm": 3.625265598297119, + "learning_rate": 6.796244637935738e-06, + "loss": 0.1786, + "step": 22596 + }, + { + "epoch": 61.572207084468666, + "grad_norm": 3.434013605117798, + "learning_rate": 6.7954086715229785e-06, + "loss": 0.1318, + "step": 22597 + }, + { + "epoch": 61.57493188010899, + "grad_norm": 4.323663234710693, + "learning_rate": 6.794572730067468e-06, + "loss": 0.0674, + "step": 22598 + }, + { + "epoch": 61.57765667574932, + "grad_norm": 4.009775638580322, + "learning_rate": 6.793736813575726e-06, + "loss": 0.1404, + "step": 22599 + }, + { + "epoch": 61.58038147138964, + "grad_norm": 3.958038568496704, + "learning_rate": 6.792900922054253e-06, + "loss": 0.0547, + "step": 22600 + }, + { + "epoch": 61.583106267029976, + "grad_norm": 5.43556022644043, + "learning_rate": 6.792065055509567e-06, + "loss": 0.104, + "step": 22601 + }, + { + "epoch": 61.5858310626703, + "grad_norm": 3.598926067352295, + "learning_rate": 6.791229213948178e-06, + "loss": 0.0685, + "step": 22602 + }, + { + "epoch": 61.58855585831063, + "grad_norm": 3.2011067867279053, + "learning_rate": 6.79039339737659e-06, + "loss": 0.066, + "step": 22603 + }, + { + "epoch": 61.59128065395095, + "grad_norm": 4.33527135848999, + "learning_rate": 6.7895576058013165e-06, + "loss": 0.1314, + "step": 22604 + }, + { + "epoch": 61.59400544959128, + "grad_norm": 4.108130931854248, + "learning_rate": 6.788721839228863e-06, + "loss": 0.0926, + "step": 22605 + }, + { + "epoch": 61.596730245231605, + "grad_norm": 3.942216157913208, + "learning_rate": 6.787886097665744e-06, + "loss": 0.0581, + "step": 22606 + }, + { + "epoch": 61.59945504087194, + "grad_norm": 4.376565933227539, + "learning_rate": 6.787050381118461e-06, + "loss": 0.0901, + "step": 22607 + }, + { + "epoch": 61.60217983651226, + "grad_norm": 9.13692569732666, + "learning_rate": 6.786214689593527e-06, + "loss": 0.1621, + "step": 22608 + }, + { + "epoch": 61.60490463215259, + "grad_norm": 3.2546372413635254, + "learning_rate": 6.785379023097451e-06, + "loss": 0.1854, + "step": 22609 + }, + { + "epoch": 61.607629427792915, + "grad_norm": 3.8960635662078857, + "learning_rate": 6.784543381636738e-06, + "loss": 0.072, + "step": 22610 + }, + { + "epoch": 61.61035422343324, + "grad_norm": 3.6300668716430664, + "learning_rate": 6.783707765217899e-06, + "loss": 0.0814, + "step": 22611 + }, + { + "epoch": 61.61307901907357, + "grad_norm": 4.188830852508545, + "learning_rate": 6.782872173847439e-06, + "loss": 0.1216, + "step": 22612 + }, + { + "epoch": 61.6158038147139, + "grad_norm": 4.343804359436035, + "learning_rate": 6.78203660753187e-06, + "loss": 0.0654, + "step": 22613 + }, + { + "epoch": 61.618528610354225, + "grad_norm": 4.386777877807617, + "learning_rate": 6.781201066277693e-06, + "loss": 0.1287, + "step": 22614 + }, + { + "epoch": 61.62125340599455, + "grad_norm": 3.194927215576172, + "learning_rate": 6.780365550091421e-06, + "loss": 0.1733, + "step": 22615 + }, + { + "epoch": 61.62397820163488, + "grad_norm": 2.8710696697235107, + "learning_rate": 6.779530058979555e-06, + "loss": 0.0936, + "step": 22616 + }, + { + "epoch": 61.6267029972752, + "grad_norm": 4.807511806488037, + "learning_rate": 6.778694592948605e-06, + "loss": 0.0514, + "step": 22617 + }, + { + "epoch": 61.62942779291553, + "grad_norm": 3.2285690307617188, + "learning_rate": 6.777859152005082e-06, + "loss": 0.1046, + "step": 22618 + }, + { + "epoch": 61.63215258855586, + "grad_norm": 6.532040119171143, + "learning_rate": 6.777023736155486e-06, + "loss": 0.1783, + "step": 22619 + }, + { + "epoch": 61.63487738419619, + "grad_norm": 3.0889177322387695, + "learning_rate": 6.776188345406327e-06, + "loss": 0.0656, + "step": 22620 + }, + { + "epoch": 61.63760217983651, + "grad_norm": 4.285674095153809, + "learning_rate": 6.775352979764107e-06, + "loss": 0.0695, + "step": 22621 + }, + { + "epoch": 61.64032697547684, + "grad_norm": 5.0756001472473145, + "learning_rate": 6.7745176392353365e-06, + "loss": 0.0649, + "step": 22622 + }, + { + "epoch": 61.643051771117165, + "grad_norm": 4.603452682495117, + "learning_rate": 6.773682323826517e-06, + "loss": 0.1991, + "step": 22623 + }, + { + "epoch": 61.64577656675749, + "grad_norm": 3.4590930938720703, + "learning_rate": 6.772847033544157e-06, + "loss": 0.0685, + "step": 22624 + }, + { + "epoch": 61.64850136239782, + "grad_norm": 3.503081798553467, + "learning_rate": 6.77201176839476e-06, + "loss": 0.107, + "step": 22625 + }, + { + "epoch": 61.65122615803815, + "grad_norm": 2.494121551513672, + "learning_rate": 6.771176528384833e-06, + "loss": 0.0417, + "step": 22626 + }, + { + "epoch": 61.653950953678475, + "grad_norm": 5.950601100921631, + "learning_rate": 6.770341313520877e-06, + "loss": 0.1306, + "step": 22627 + }, + { + "epoch": 61.6566757493188, + "grad_norm": 2.828500270843506, + "learning_rate": 6.7695061238094e-06, + "loss": 0.0437, + "step": 22628 + }, + { + "epoch": 61.65940054495913, + "grad_norm": 2.743598461151123, + "learning_rate": 6.7686709592569046e-06, + "loss": 0.0455, + "step": 22629 + }, + { + "epoch": 61.66212534059945, + "grad_norm": 2.979541301727295, + "learning_rate": 6.767835819869897e-06, + "loss": 0.0521, + "step": 22630 + }, + { + "epoch": 61.664850136239785, + "grad_norm": 3.4339613914489746, + "learning_rate": 6.767000705654878e-06, + "loss": 0.2072, + "step": 22631 + }, + { + "epoch": 61.66757493188011, + "grad_norm": 4.0011162757873535, + "learning_rate": 6.766165616618354e-06, + "loss": 0.1283, + "step": 22632 + }, + { + "epoch": 61.67029972752044, + "grad_norm": 3.5324370861053467, + "learning_rate": 6.76533055276683e-06, + "loss": 0.1995, + "step": 22633 + }, + { + "epoch": 61.67302452316076, + "grad_norm": 2.553166627883911, + "learning_rate": 6.764495514106806e-06, + "loss": 0.0326, + "step": 22634 + }, + { + "epoch": 61.67574931880109, + "grad_norm": 4.523924350738525, + "learning_rate": 6.763660500644783e-06, + "loss": 0.0511, + "step": 22635 + }, + { + "epoch": 61.678474114441414, + "grad_norm": 4.016600608825684, + "learning_rate": 6.762825512387273e-06, + "loss": 0.1556, + "step": 22636 + }, + { + "epoch": 61.68119891008175, + "grad_norm": 5.064176082611084, + "learning_rate": 6.761990549340771e-06, + "loss": 0.1284, + "step": 22637 + }, + { + "epoch": 61.68392370572207, + "grad_norm": 2.2795469760894775, + "learning_rate": 6.761155611511786e-06, + "loss": 0.0496, + "step": 22638 + }, + { + "epoch": 61.6866485013624, + "grad_norm": 3.7937819957733154, + "learning_rate": 6.760320698906815e-06, + "loss": 0.1301, + "step": 22639 + }, + { + "epoch": 61.689373297002724, + "grad_norm": 4.277508735656738, + "learning_rate": 6.7594858115323625e-06, + "loss": 0.0692, + "step": 22640 + }, + { + "epoch": 61.69209809264305, + "grad_norm": 2.199242353439331, + "learning_rate": 6.758650949394929e-06, + "loss": 0.0883, + "step": 22641 + }, + { + "epoch": 61.694822888283376, + "grad_norm": 4.541222095489502, + "learning_rate": 6.757816112501019e-06, + "loss": 0.2393, + "step": 22642 + }, + { + "epoch": 61.69754768392371, + "grad_norm": 3.7574493885040283, + "learning_rate": 6.756981300857131e-06, + "loss": 0.0803, + "step": 22643 + }, + { + "epoch": 61.700272479564035, + "grad_norm": 3.8200643062591553, + "learning_rate": 6.75614651446977e-06, + "loss": 0.1866, + "step": 22644 + }, + { + "epoch": 61.70299727520436, + "grad_norm": 3.394278049468994, + "learning_rate": 6.7553117533454345e-06, + "loss": 0.0454, + "step": 22645 + }, + { + "epoch": 61.705722070844686, + "grad_norm": 3.9583377838134766, + "learning_rate": 6.754477017490628e-06, + "loss": 0.1482, + "step": 22646 + }, + { + "epoch": 61.70844686648501, + "grad_norm": 3.4778318405151367, + "learning_rate": 6.753642306911849e-06, + "loss": 0.0746, + "step": 22647 + }, + { + "epoch": 61.71117166212534, + "grad_norm": 5.393945693969727, + "learning_rate": 6.7528076216156e-06, + "loss": 0.0903, + "step": 22648 + }, + { + "epoch": 61.71389645776567, + "grad_norm": 3.733022689819336, + "learning_rate": 6.751972961608379e-06, + "loss": 0.0537, + "step": 22649 + }, + { + "epoch": 61.716621253406, + "grad_norm": 4.430414199829102, + "learning_rate": 6.75113832689669e-06, + "loss": 0.2244, + "step": 22650 + }, + { + "epoch": 61.71934604904632, + "grad_norm": 3.1594595909118652, + "learning_rate": 6.75030371748703e-06, + "loss": 0.1262, + "step": 22651 + }, + { + "epoch": 61.72207084468665, + "grad_norm": 4.033882141113281, + "learning_rate": 6.7494691333858964e-06, + "loss": 0.0899, + "step": 22652 + }, + { + "epoch": 61.724795640326974, + "grad_norm": 3.0013859272003174, + "learning_rate": 6.748634574599795e-06, + "loss": 0.0946, + "step": 22653 + }, + { + "epoch": 61.7275204359673, + "grad_norm": 3.480828285217285, + "learning_rate": 6.747800041135226e-06, + "loss": 0.0471, + "step": 22654 + }, + { + "epoch": 61.73024523160763, + "grad_norm": 6.171280860900879, + "learning_rate": 6.746965532998684e-06, + "loss": 0.0784, + "step": 22655 + }, + { + "epoch": 61.73297002724796, + "grad_norm": 3.1149210929870605, + "learning_rate": 6.7461310501966695e-06, + "loss": 0.0691, + "step": 22656 + }, + { + "epoch": 61.735694822888284, + "grad_norm": 5.454401969909668, + "learning_rate": 6.745296592735682e-06, + "loss": 0.2389, + "step": 22657 + }, + { + "epoch": 61.73841961852861, + "grad_norm": 4.131072521209717, + "learning_rate": 6.744462160622221e-06, + "loss": 0.1386, + "step": 22658 + }, + { + "epoch": 61.741144414168936, + "grad_norm": 3.9972660541534424, + "learning_rate": 6.7436277538627804e-06, + "loss": 0.1325, + "step": 22659 + }, + { + "epoch": 61.74386920980926, + "grad_norm": 3.5973973274230957, + "learning_rate": 6.742793372463865e-06, + "loss": 0.0751, + "step": 22660 + }, + { + "epoch": 61.746594005449595, + "grad_norm": 2.9896881580352783, + "learning_rate": 6.741959016431969e-06, + "loss": 0.0532, + "step": 22661 + }, + { + "epoch": 61.74931880108992, + "grad_norm": 9.038811683654785, + "learning_rate": 6.741124685773592e-06, + "loss": 0.1706, + "step": 22662 + }, + { + "epoch": 61.752043596730246, + "grad_norm": 4.241949081420898, + "learning_rate": 6.7402903804952304e-06, + "loss": 0.158, + "step": 22663 + }, + { + "epoch": 61.75476839237057, + "grad_norm": 2.5723586082458496, + "learning_rate": 6.739456100603383e-06, + "loss": 0.0453, + "step": 22664 + }, + { + "epoch": 61.7574931880109, + "grad_norm": 2.763686180114746, + "learning_rate": 6.738621846104546e-06, + "loss": 0.0517, + "step": 22665 + }, + { + "epoch": 61.76021798365122, + "grad_norm": 2.9788365364074707, + "learning_rate": 6.737787617005218e-06, + "loss": 0.0671, + "step": 22666 + }, + { + "epoch": 61.762942779291556, + "grad_norm": 4.045244216918945, + "learning_rate": 6.736953413311893e-06, + "loss": 0.2312, + "step": 22667 + }, + { + "epoch": 61.76566757493188, + "grad_norm": 3.8430511951446533, + "learning_rate": 6.736119235031074e-06, + "loss": 0.0478, + "step": 22668 + }, + { + "epoch": 61.76839237057221, + "grad_norm": 3.877647638320923, + "learning_rate": 6.735285082169246e-06, + "loss": 0.0659, + "step": 22669 + }, + { + "epoch": 61.771117166212534, + "grad_norm": 3.7261879444122314, + "learning_rate": 6.734450954732916e-06, + "loss": 0.1214, + "step": 22670 + }, + { + "epoch": 61.77384196185286, + "grad_norm": 3.3089585304260254, + "learning_rate": 6.7336168527285796e-06, + "loss": 0.117, + "step": 22671 + }, + { + "epoch": 61.776566757493185, + "grad_norm": 5.874284744262695, + "learning_rate": 6.732782776162727e-06, + "loss": 0.1129, + "step": 22672 + }, + { + "epoch": 61.77929155313352, + "grad_norm": 3.244377613067627, + "learning_rate": 6.731948725041858e-06, + "loss": 0.0564, + "step": 22673 + }, + { + "epoch": 61.782016348773844, + "grad_norm": 3.3005571365356445, + "learning_rate": 6.73111469937247e-06, + "loss": 0.0891, + "step": 22674 + }, + { + "epoch": 61.78474114441417, + "grad_norm": 4.592073917388916, + "learning_rate": 6.730280699161052e-06, + "loss": 0.0561, + "step": 22675 + }, + { + "epoch": 61.787465940054496, + "grad_norm": 3.6790101528167725, + "learning_rate": 6.729446724414103e-06, + "loss": 0.057, + "step": 22676 + }, + { + "epoch": 61.79019073569482, + "grad_norm": 4.135296821594238, + "learning_rate": 6.7286127751381194e-06, + "loss": 0.1755, + "step": 22677 + }, + { + "epoch": 61.79291553133515, + "grad_norm": 4.67214298248291, + "learning_rate": 6.727778851339592e-06, + "loss": 0.0864, + "step": 22678 + }, + { + "epoch": 61.79564032697548, + "grad_norm": 3.8387014865875244, + "learning_rate": 6.726944953025019e-06, + "loss": 0.1451, + "step": 22679 + }, + { + "epoch": 61.798365122615806, + "grad_norm": 3.663045883178711, + "learning_rate": 6.7261110802008944e-06, + "loss": 0.0599, + "step": 22680 + }, + { + "epoch": 61.80108991825613, + "grad_norm": 3.5640475749969482, + "learning_rate": 6.72527723287371e-06, + "loss": 0.1829, + "step": 22681 + }, + { + "epoch": 61.80381471389646, + "grad_norm": 6.209664821624756, + "learning_rate": 6.724443411049961e-06, + "loss": 0.2145, + "step": 22682 + }, + { + "epoch": 61.80653950953678, + "grad_norm": 4.0792717933654785, + "learning_rate": 6.723609614736142e-06, + "loss": 0.0376, + "step": 22683 + }, + { + "epoch": 61.80926430517711, + "grad_norm": 3.1523070335388184, + "learning_rate": 6.722775843938745e-06, + "loss": 0.0529, + "step": 22684 + }, + { + "epoch": 61.81198910081744, + "grad_norm": 4.342679500579834, + "learning_rate": 6.721942098664264e-06, + "loss": 0.1316, + "step": 22685 + }, + { + "epoch": 61.81471389645777, + "grad_norm": 4.211147308349609, + "learning_rate": 6.72110837891919e-06, + "loss": 0.0855, + "step": 22686 + }, + { + "epoch": 61.817438692098094, + "grad_norm": 5.1515631675720215, + "learning_rate": 6.720274684710023e-06, + "loss": 0.1734, + "step": 22687 + }, + { + "epoch": 61.82016348773842, + "grad_norm": 2.444735050201416, + "learning_rate": 6.719441016043249e-06, + "loss": 0.1014, + "step": 22688 + }, + { + "epoch": 61.822888283378745, + "grad_norm": 3.6656153202056885, + "learning_rate": 6.718607372925365e-06, + "loss": 0.2574, + "step": 22689 + }, + { + "epoch": 61.82561307901907, + "grad_norm": 4.523416996002197, + "learning_rate": 6.717773755362857e-06, + "loss": 0.1183, + "step": 22690 + }, + { + "epoch": 61.828337874659404, + "grad_norm": 3.1440584659576416, + "learning_rate": 6.716940163362227e-06, + "loss": 0.0417, + "step": 22691 + }, + { + "epoch": 61.83106267029973, + "grad_norm": 4.38675594329834, + "learning_rate": 6.716106596929956e-06, + "loss": 0.0693, + "step": 22692 + }, + { + "epoch": 61.833787465940055, + "grad_norm": 4.36245584487915, + "learning_rate": 6.715273056072545e-06, + "loss": 0.0868, + "step": 22693 + }, + { + "epoch": 61.83651226158038, + "grad_norm": 3.322178602218628, + "learning_rate": 6.71443954079648e-06, + "loss": 0.0582, + "step": 22694 + }, + { + "epoch": 61.83923705722071, + "grad_norm": 3.655691385269165, + "learning_rate": 6.713606051108252e-06, + "loss": 0.2231, + "step": 22695 + }, + { + "epoch": 61.84196185286103, + "grad_norm": 3.9152729511260986, + "learning_rate": 6.712772587014359e-06, + "loss": 0.1323, + "step": 22696 + }, + { + "epoch": 61.844686648501366, + "grad_norm": 3.867809534072876, + "learning_rate": 6.711939148521284e-06, + "loss": 0.1256, + "step": 22697 + }, + { + "epoch": 61.84741144414169, + "grad_norm": 3.225816249847412, + "learning_rate": 6.711105735635524e-06, + "loss": 0.1185, + "step": 22698 + }, + { + "epoch": 61.85013623978202, + "grad_norm": 3.8987462520599365, + "learning_rate": 6.710272348363563e-06, + "loss": 0.12, + "step": 22699 + }, + { + "epoch": 61.85286103542234, + "grad_norm": 3.257603645324707, + "learning_rate": 6.709438986711898e-06, + "loss": 0.0507, + "step": 22700 + }, + { + "epoch": 61.85558583106267, + "grad_norm": 3.559697151184082, + "learning_rate": 6.708605650687014e-06, + "loss": 0.0934, + "step": 22701 + }, + { + "epoch": 61.858310626702995, + "grad_norm": 2.652071952819824, + "learning_rate": 6.707772340295404e-06, + "loss": 0.0525, + "step": 22702 + }, + { + "epoch": 61.86103542234333, + "grad_norm": 4.298716068267822, + "learning_rate": 6.706939055543558e-06, + "loss": 0.1298, + "step": 22703 + }, + { + "epoch": 61.86376021798365, + "grad_norm": 6.449079513549805, + "learning_rate": 6.70610579643796e-06, + "loss": 0.0603, + "step": 22704 + }, + { + "epoch": 61.86648501362398, + "grad_norm": 3.8100218772888184, + "learning_rate": 6.70527256298511e-06, + "loss": 0.1174, + "step": 22705 + }, + { + "epoch": 61.869209809264305, + "grad_norm": 5.430166244506836, + "learning_rate": 6.704439355191487e-06, + "loss": 0.1655, + "step": 22706 + }, + { + "epoch": 61.87193460490463, + "grad_norm": 4.131312847137451, + "learning_rate": 6.703606173063588e-06, + "loss": 0.1358, + "step": 22707 + }, + { + "epoch": 61.87465940054496, + "grad_norm": 5.626758098602295, + "learning_rate": 6.702773016607895e-06, + "loss": 0.0786, + "step": 22708 + }, + { + "epoch": 61.87738419618529, + "grad_norm": 3.967013359069824, + "learning_rate": 6.701939885830904e-06, + "loss": 0.1383, + "step": 22709 + }, + { + "epoch": 61.880108991825615, + "grad_norm": 3.8643786907196045, + "learning_rate": 6.701106780739095e-06, + "loss": 0.0678, + "step": 22710 + }, + { + "epoch": 61.88283378746594, + "grad_norm": 4.2384843826293945, + "learning_rate": 6.700273701338962e-06, + "loss": 0.0711, + "step": 22711 + }, + { + "epoch": 61.88555858310627, + "grad_norm": 4.261518478393555, + "learning_rate": 6.69944064763699e-06, + "loss": 0.0486, + "step": 22712 + }, + { + "epoch": 61.88828337874659, + "grad_norm": 3.5158252716064453, + "learning_rate": 6.69860761963967e-06, + "loss": 0.134, + "step": 22713 + }, + { + "epoch": 61.89100817438692, + "grad_norm": 3.4491991996765137, + "learning_rate": 6.697774617353485e-06, + "loss": 0.0877, + "step": 22714 + }, + { + "epoch": 61.89373297002725, + "grad_norm": 2.8204474449157715, + "learning_rate": 6.6969416407849264e-06, + "loss": 0.1753, + "step": 22715 + }, + { + "epoch": 61.89645776566758, + "grad_norm": 6.21249532699585, + "learning_rate": 6.696108689940479e-06, + "loss": 0.0854, + "step": 22716 + }, + { + "epoch": 61.8991825613079, + "grad_norm": 4.418528079986572, + "learning_rate": 6.695275764826633e-06, + "loss": 0.0992, + "step": 22717 + }, + { + "epoch": 61.90190735694823, + "grad_norm": 3.096376895904541, + "learning_rate": 6.694442865449871e-06, + "loss": 0.1378, + "step": 22718 + }, + { + "epoch": 61.904632152588555, + "grad_norm": 4.136012077331543, + "learning_rate": 6.6936099918166805e-06, + "loss": 0.2316, + "step": 22719 + }, + { + "epoch": 61.90735694822888, + "grad_norm": 3.673497438430786, + "learning_rate": 6.692777143933552e-06, + "loss": 0.053, + "step": 22720 + }, + { + "epoch": 61.91008174386921, + "grad_norm": 3.3672080039978027, + "learning_rate": 6.6919443218069645e-06, + "loss": 0.102, + "step": 22721 + }, + { + "epoch": 61.91280653950954, + "grad_norm": 2.9719884395599365, + "learning_rate": 6.69111152544341e-06, + "loss": 0.1133, + "step": 22722 + }, + { + "epoch": 61.915531335149865, + "grad_norm": 3.9197938442230225, + "learning_rate": 6.690278754849374e-06, + "loss": 0.0572, + "step": 22723 + }, + { + "epoch": 61.91825613079019, + "grad_norm": 3.8324594497680664, + "learning_rate": 6.68944601003134e-06, + "loss": 0.1418, + "step": 22724 + }, + { + "epoch": 61.920980926430516, + "grad_norm": 2.728116989135742, + "learning_rate": 6.688613290995794e-06, + "loss": 0.0543, + "step": 22725 + }, + { + "epoch": 61.92370572207084, + "grad_norm": 3.0618062019348145, + "learning_rate": 6.6877805977492205e-06, + "loss": 0.0735, + "step": 22726 + }, + { + "epoch": 61.926430517711175, + "grad_norm": 4.998763561248779, + "learning_rate": 6.686947930298107e-06, + "loss": 0.0668, + "step": 22727 + }, + { + "epoch": 61.9291553133515, + "grad_norm": 4.105166435241699, + "learning_rate": 6.686115288648933e-06, + "loss": 0.0877, + "step": 22728 + }, + { + "epoch": 61.93188010899183, + "grad_norm": 4.189581394195557, + "learning_rate": 6.68528267280819e-06, + "loss": 0.089, + "step": 22729 + }, + { + "epoch": 61.93460490463215, + "grad_norm": 4.31670618057251, + "learning_rate": 6.684450082782357e-06, + "loss": 0.1864, + "step": 22730 + }, + { + "epoch": 61.93732970027248, + "grad_norm": 3.497159957885742, + "learning_rate": 6.6836175185779205e-06, + "loss": 0.138, + "step": 22731 + }, + { + "epoch": 61.940054495912804, + "grad_norm": 3.2771823406219482, + "learning_rate": 6.682784980201363e-06, + "loss": 0.0448, + "step": 22732 + }, + { + "epoch": 61.94277929155314, + "grad_norm": 4.763228893280029, + "learning_rate": 6.681952467659172e-06, + "loss": 0.142, + "step": 22733 + }, + { + "epoch": 61.94550408719346, + "grad_norm": 13.746893882751465, + "learning_rate": 6.681119980957825e-06, + "loss": 0.1821, + "step": 22734 + }, + { + "epoch": 61.94822888283379, + "grad_norm": 3.962510824203491, + "learning_rate": 6.680287520103812e-06, + "loss": 0.0684, + "step": 22735 + }, + { + "epoch": 61.950953678474114, + "grad_norm": 2.830461263656616, + "learning_rate": 6.67945508510361e-06, + "loss": 0.0412, + "step": 22736 + }, + { + "epoch": 61.95367847411444, + "grad_norm": 3.46307635307312, + "learning_rate": 6.678622675963708e-06, + "loss": 0.0438, + "step": 22737 + }, + { + "epoch": 61.956403269754766, + "grad_norm": 3.4912824630737305, + "learning_rate": 6.677790292690578e-06, + "loss": 0.1202, + "step": 22738 + }, + { + "epoch": 61.95912806539509, + "grad_norm": 3.3099188804626465, + "learning_rate": 6.676957935290718e-06, + "loss": 0.0973, + "step": 22739 + }, + { + "epoch": 61.961852861035425, + "grad_norm": 5.242749214172363, + "learning_rate": 6.676125603770599e-06, + "loss": 0.1739, + "step": 22740 + }, + { + "epoch": 61.96457765667575, + "grad_norm": 3.9065499305725098, + "learning_rate": 6.675293298136709e-06, + "loss": 0.0613, + "step": 22741 + }, + { + "epoch": 61.967302452316076, + "grad_norm": 3.916933298110962, + "learning_rate": 6.674461018395527e-06, + "loss": 0.0955, + "step": 22742 + }, + { + "epoch": 61.9700272479564, + "grad_norm": 4.395709037780762, + "learning_rate": 6.6736287645535365e-06, + "loss": 0.1493, + "step": 22743 + }, + { + "epoch": 61.97275204359673, + "grad_norm": 4.850771427154541, + "learning_rate": 6.672796536617218e-06, + "loss": 0.1787, + "step": 22744 + }, + { + "epoch": 61.97547683923706, + "grad_norm": 4.9623613357543945, + "learning_rate": 6.671964334593053e-06, + "loss": 0.0814, + "step": 22745 + }, + { + "epoch": 61.97820163487739, + "grad_norm": 3.231295585632324, + "learning_rate": 6.671132158487521e-06, + "loss": 0.0752, + "step": 22746 + }, + { + "epoch": 61.98092643051771, + "grad_norm": 3.3611910343170166, + "learning_rate": 6.6703000083071065e-06, + "loss": 0.0971, + "step": 22747 + }, + { + "epoch": 61.98365122615804, + "grad_norm": 3.1871542930603027, + "learning_rate": 6.669467884058287e-06, + "loss": 0.1521, + "step": 22748 + }, + { + "epoch": 61.986376021798364, + "grad_norm": 3.035025119781494, + "learning_rate": 6.668635785747547e-06, + "loss": 0.0436, + "step": 22749 + }, + { + "epoch": 61.98910081743869, + "grad_norm": 3.5299737453460693, + "learning_rate": 6.667803713381362e-06, + "loss": 0.1288, + "step": 22750 + }, + { + "epoch": 61.991825613079016, + "grad_norm": 4.229928970336914, + "learning_rate": 6.666971666966216e-06, + "loss": 0.0722, + "step": 22751 + }, + { + "epoch": 61.99455040871935, + "grad_norm": 4.067253112792969, + "learning_rate": 6.6661396465085845e-06, + "loss": 0.087, + "step": 22752 + }, + { + "epoch": 61.997275204359674, + "grad_norm": 4.779962062835693, + "learning_rate": 6.665307652014954e-06, + "loss": 0.1442, + "step": 22753 + }, + { + "epoch": 62.0, + "grad_norm": 3.2834765911102295, + "learning_rate": 6.664475683491797e-06, + "loss": 0.0675, + "step": 22754 + }, + { + "epoch": 62.002724795640326, + "grad_norm": 4.060825347900391, + "learning_rate": 6.663643740945594e-06, + "loss": 0.0841, + "step": 22755 + }, + { + "epoch": 62.00544959128065, + "grad_norm": 2.8694839477539062, + "learning_rate": 6.66281182438283e-06, + "loss": 0.1142, + "step": 22756 + }, + { + "epoch": 62.00817438692098, + "grad_norm": 3.719338893890381, + "learning_rate": 6.6619799338099785e-06, + "loss": 0.1246, + "step": 22757 + }, + { + "epoch": 62.01089918256131, + "grad_norm": 2.9884769916534424, + "learning_rate": 6.661148069233522e-06, + "loss": 0.0321, + "step": 22758 + }, + { + "epoch": 62.013623978201636, + "grad_norm": 3.96706485748291, + "learning_rate": 6.660316230659935e-06, + "loss": 0.1392, + "step": 22759 + }, + { + "epoch": 62.01634877384196, + "grad_norm": 3.522141695022583, + "learning_rate": 6.6594844180956965e-06, + "loss": 0.0771, + "step": 22760 + }, + { + "epoch": 62.01907356948229, + "grad_norm": 3.5420284271240234, + "learning_rate": 6.658652631547288e-06, + "loss": 0.1777, + "step": 22761 + }, + { + "epoch": 62.02179836512261, + "grad_norm": 9.910497665405273, + "learning_rate": 6.657820871021185e-06, + "loss": 0.1206, + "step": 22762 + }, + { + "epoch": 62.02452316076294, + "grad_norm": 5.194899559020996, + "learning_rate": 6.656989136523866e-06, + "loss": 0.1064, + "step": 22763 + }, + { + "epoch": 62.02724795640327, + "grad_norm": 3.178278923034668, + "learning_rate": 6.656157428061807e-06, + "loss": 0.1294, + "step": 22764 + }, + { + "epoch": 62.0299727520436, + "grad_norm": 4.71618127822876, + "learning_rate": 6.655325745641488e-06, + "loss": 0.1202, + "step": 22765 + }, + { + "epoch": 62.032697547683924, + "grad_norm": 6.225197792053223, + "learning_rate": 6.654494089269381e-06, + "loss": 0.2833, + "step": 22766 + }, + { + "epoch": 62.03542234332425, + "grad_norm": 3.802011489868164, + "learning_rate": 6.6536624589519705e-06, + "loss": 0.0608, + "step": 22767 + }, + { + "epoch": 62.038147138964575, + "grad_norm": 3.725999116897583, + "learning_rate": 6.652830854695726e-06, + "loss": 0.0752, + "step": 22768 + }, + { + "epoch": 62.0408719346049, + "grad_norm": 3.6398305892944336, + "learning_rate": 6.651999276507129e-06, + "loss": 0.4103, + "step": 22769 + }, + { + "epoch": 62.043596730245234, + "grad_norm": 3.8327982425689697, + "learning_rate": 6.651167724392653e-06, + "loss": 0.15, + "step": 22770 + }, + { + "epoch": 62.04632152588556, + "grad_norm": 3.733111619949341, + "learning_rate": 6.650336198358776e-06, + "loss": 0.1134, + "step": 22771 + }, + { + "epoch": 62.049046321525886, + "grad_norm": 5.347125053405762, + "learning_rate": 6.649504698411968e-06, + "loss": 0.0584, + "step": 22772 + }, + { + "epoch": 62.05177111716621, + "grad_norm": 3.4746041297912598, + "learning_rate": 6.648673224558713e-06, + "loss": 0.117, + "step": 22773 + }, + { + "epoch": 62.05449591280654, + "grad_norm": 3.1897616386413574, + "learning_rate": 6.647841776805485e-06, + "loss": 0.1207, + "step": 22774 + }, + { + "epoch": 62.05722070844686, + "grad_norm": 4.475643157958984, + "learning_rate": 6.647010355158754e-06, + "loss": 0.1592, + "step": 22775 + }, + { + "epoch": 62.059945504087196, + "grad_norm": 3.1270174980163574, + "learning_rate": 6.646178959625002e-06, + "loss": 0.1147, + "step": 22776 + }, + { + "epoch": 62.06267029972752, + "grad_norm": 2.9499459266662598, + "learning_rate": 6.6453475902106975e-06, + "loss": 0.1028, + "step": 22777 + }, + { + "epoch": 62.06539509536785, + "grad_norm": 3.9508938789367676, + "learning_rate": 6.644516246922321e-06, + "loss": 0.0623, + "step": 22778 + }, + { + "epoch": 62.06811989100817, + "grad_norm": 3.2466988563537598, + "learning_rate": 6.643684929766341e-06, + "loss": 0.0425, + "step": 22779 + }, + { + "epoch": 62.0708446866485, + "grad_norm": 2.71771240234375, + "learning_rate": 6.642853638749236e-06, + "loss": 0.0589, + "step": 22780 + }, + { + "epoch": 62.073569482288825, + "grad_norm": 3.7683777809143066, + "learning_rate": 6.642022373877479e-06, + "loss": 0.0885, + "step": 22781 + }, + { + "epoch": 62.07629427792916, + "grad_norm": 4.404494762420654, + "learning_rate": 6.641191135157542e-06, + "loss": 0.1542, + "step": 22782 + }, + { + "epoch": 62.079019073569484, + "grad_norm": 4.745907306671143, + "learning_rate": 6.640359922595902e-06, + "loss": 0.1162, + "step": 22783 + }, + { + "epoch": 62.08174386920981, + "grad_norm": 3.791114568710327, + "learning_rate": 6.6395287361990305e-06, + "loss": 0.0473, + "step": 22784 + }, + { + "epoch": 62.084468664850135, + "grad_norm": 4.590917587280273, + "learning_rate": 6.638697575973402e-06, + "loss": 0.1544, + "step": 22785 + }, + { + "epoch": 62.08719346049046, + "grad_norm": 3.7019877433776855, + "learning_rate": 6.637866441925487e-06, + "loss": 0.0684, + "step": 22786 + }, + { + "epoch": 62.08991825613079, + "grad_norm": 3.172245740890503, + "learning_rate": 6.637035334061761e-06, + "loss": 0.0663, + "step": 22787 + }, + { + "epoch": 62.09264305177112, + "grad_norm": 3.8884174823760986, + "learning_rate": 6.636204252388694e-06, + "loss": 0.0614, + "step": 22788 + }, + { + "epoch": 62.095367847411445, + "grad_norm": 3.3587937355041504, + "learning_rate": 6.6353731969127625e-06, + "loss": 0.0681, + "step": 22789 + }, + { + "epoch": 62.09809264305177, + "grad_norm": 3.02647066116333, + "learning_rate": 6.634542167640432e-06, + "loss": 0.0498, + "step": 22790 + }, + { + "epoch": 62.1008174386921, + "grad_norm": 3.483935594558716, + "learning_rate": 6.63371116457818e-06, + "loss": 0.1736, + "step": 22791 + }, + { + "epoch": 62.10354223433242, + "grad_norm": 3.6119918823242188, + "learning_rate": 6.63288018773248e-06, + "loss": 0.074, + "step": 22792 + }, + { + "epoch": 62.10626702997275, + "grad_norm": 4.372816562652588, + "learning_rate": 6.632049237109799e-06, + "loss": 0.0492, + "step": 22793 + }, + { + "epoch": 62.10899182561308, + "grad_norm": 3.2949540615081787, + "learning_rate": 6.6312183127166115e-06, + "loss": 0.2069, + "step": 22794 + }, + { + "epoch": 62.11171662125341, + "grad_norm": 5.566655158996582, + "learning_rate": 6.630387414559386e-06, + "loss": 0.0888, + "step": 22795 + }, + { + "epoch": 62.11444141689373, + "grad_norm": 3.3440206050872803, + "learning_rate": 6.629556542644597e-06, + "loss": 0.1294, + "step": 22796 + }, + { + "epoch": 62.11716621253406, + "grad_norm": 3.6065633296966553, + "learning_rate": 6.628725696978711e-06, + "loss": 0.0712, + "step": 22797 + }, + { + "epoch": 62.119891008174385, + "grad_norm": 3.9488348960876465, + "learning_rate": 6.627894877568202e-06, + "loss": 0.1127, + "step": 22798 + }, + { + "epoch": 62.12261580381471, + "grad_norm": 4.37799072265625, + "learning_rate": 6.6270640844195365e-06, + "loss": 0.1417, + "step": 22799 + }, + { + "epoch": 62.12534059945504, + "grad_norm": 4.148244857788086, + "learning_rate": 6.626233317539191e-06, + "loss": 0.162, + "step": 22800 + }, + { + "epoch": 62.12806539509537, + "grad_norm": 3.745007276535034, + "learning_rate": 6.6254025769336295e-06, + "loss": 0.0533, + "step": 22801 + }, + { + "epoch": 62.130790190735695, + "grad_norm": 5.023813724517822, + "learning_rate": 6.624571862609326e-06, + "loss": 0.181, + "step": 22802 + }, + { + "epoch": 62.13351498637602, + "grad_norm": 3.1756930351257324, + "learning_rate": 6.623741174572746e-06, + "loss": 0.0804, + "step": 22803 + }, + { + "epoch": 62.13623978201635, + "grad_norm": 3.4608798027038574, + "learning_rate": 6.622910512830363e-06, + "loss": 0.0426, + "step": 22804 + }, + { + "epoch": 62.13896457765667, + "grad_norm": 3.84564208984375, + "learning_rate": 6.622079877388643e-06, + "loss": 0.0689, + "step": 22805 + }, + { + "epoch": 62.141689373297005, + "grad_norm": 3.2299728393554688, + "learning_rate": 6.6212492682540555e-06, + "loss": 0.1371, + "step": 22806 + }, + { + "epoch": 62.14441416893733, + "grad_norm": 3.502675771713257, + "learning_rate": 6.620418685433068e-06, + "loss": 0.2039, + "step": 22807 + }, + { + "epoch": 62.14713896457766, + "grad_norm": 2.6872618198394775, + "learning_rate": 6.619588128932155e-06, + "loss": 0.2084, + "step": 22808 + }, + { + "epoch": 62.14986376021798, + "grad_norm": 3.869669198989868, + "learning_rate": 6.618757598757779e-06, + "loss": 0.078, + "step": 22809 + }, + { + "epoch": 62.15258855585831, + "grad_norm": 4.502622604370117, + "learning_rate": 6.617927094916412e-06, + "loss": 0.1044, + "step": 22810 + }, + { + "epoch": 62.155313351498634, + "grad_norm": 2.8535523414611816, + "learning_rate": 6.617096617414518e-06, + "loss": 0.0967, + "step": 22811 + }, + { + "epoch": 62.15803814713897, + "grad_norm": 3.1820380687713623, + "learning_rate": 6.616266166258568e-06, + "loss": 0.2063, + "step": 22812 + }, + { + "epoch": 62.16076294277929, + "grad_norm": 3.9617884159088135, + "learning_rate": 6.615435741455026e-06, + "loss": 0.0825, + "step": 22813 + }, + { + "epoch": 62.16348773841962, + "grad_norm": 4.588679790496826, + "learning_rate": 6.614605343010365e-06, + "loss": 0.1096, + "step": 22814 + }, + { + "epoch": 62.166212534059945, + "grad_norm": 4.685179233551025, + "learning_rate": 6.6137749709310465e-06, + "loss": 0.1026, + "step": 22815 + }, + { + "epoch": 62.16893732970027, + "grad_norm": 3.87353777885437, + "learning_rate": 6.612944625223541e-06, + "loss": 0.1091, + "step": 22816 + }, + { + "epoch": 62.171662125340596, + "grad_norm": 4.411993980407715, + "learning_rate": 6.61211430589431e-06, + "loss": 0.0944, + "step": 22817 + }, + { + "epoch": 62.17438692098093, + "grad_norm": 3.567234992980957, + "learning_rate": 6.611284012949828e-06, + "loss": 0.1051, + "step": 22818 + }, + { + "epoch": 62.177111716621255, + "grad_norm": 3.051919460296631, + "learning_rate": 6.610453746396555e-06, + "loss": 0.1047, + "step": 22819 + }, + { + "epoch": 62.17983651226158, + "grad_norm": 2.727727174758911, + "learning_rate": 6.609623506240961e-06, + "loss": 0.1108, + "step": 22820 + }, + { + "epoch": 62.182561307901906, + "grad_norm": 4.26987886428833, + "learning_rate": 6.608793292489506e-06, + "loss": 0.121, + "step": 22821 + }, + { + "epoch": 62.18528610354223, + "grad_norm": 3.376009702682495, + "learning_rate": 6.607963105148664e-06, + "loss": 0.0849, + "step": 22822 + }, + { + "epoch": 62.18801089918256, + "grad_norm": 3.40041446685791, + "learning_rate": 6.607132944224893e-06, + "loss": 0.1266, + "step": 22823 + }, + { + "epoch": 62.19073569482289, + "grad_norm": 3.012694835662842, + "learning_rate": 6.6063028097246605e-06, + "loss": 0.0609, + "step": 22824 + }, + { + "epoch": 62.19346049046322, + "grad_norm": 2.8245034217834473, + "learning_rate": 6.605472701654434e-06, + "loss": 0.0454, + "step": 22825 + }, + { + "epoch": 62.19618528610354, + "grad_norm": 3.4797093868255615, + "learning_rate": 6.604642620020678e-06, + "loss": 0.0927, + "step": 22826 + }, + { + "epoch": 62.19891008174387, + "grad_norm": 6.359492778778076, + "learning_rate": 6.603812564829855e-06, + "loss": 0.0571, + "step": 22827 + }, + { + "epoch": 62.201634877384194, + "grad_norm": 3.569110870361328, + "learning_rate": 6.602982536088431e-06, + "loss": 0.1096, + "step": 22828 + }, + { + "epoch": 62.20435967302452, + "grad_norm": 5.001374244689941, + "learning_rate": 6.60215253380287e-06, + "loss": 0.1512, + "step": 22829 + }, + { + "epoch": 62.20708446866485, + "grad_norm": 2.981616973876953, + "learning_rate": 6.601322557979636e-06, + "loss": 0.1859, + "step": 22830 + }, + { + "epoch": 62.20980926430518, + "grad_norm": 3.294882297515869, + "learning_rate": 6.600492608625191e-06, + "loss": 0.0759, + "step": 22831 + }, + { + "epoch": 62.212534059945504, + "grad_norm": 4.741713523864746, + "learning_rate": 6.599662685746002e-06, + "loss": 0.0959, + "step": 22832 + }, + { + "epoch": 62.21525885558583, + "grad_norm": 4.462095260620117, + "learning_rate": 6.598832789348529e-06, + "loss": 0.1026, + "step": 22833 + }, + { + "epoch": 62.217983651226156, + "grad_norm": 4.4329962730407715, + "learning_rate": 6.598002919439239e-06, + "loss": 0.1621, + "step": 22834 + }, + { + "epoch": 62.22070844686648, + "grad_norm": 3.6745359897613525, + "learning_rate": 6.59717307602459e-06, + "loss": 0.1032, + "step": 22835 + }, + { + "epoch": 62.223433242506815, + "grad_norm": 4.1733784675598145, + "learning_rate": 6.59634325911105e-06, + "loss": 0.1479, + "step": 22836 + }, + { + "epoch": 62.22615803814714, + "grad_norm": 2.0391476154327393, + "learning_rate": 6.595513468705077e-06, + "loss": 0.0373, + "step": 22837 + }, + { + "epoch": 62.228882833787466, + "grad_norm": 14.953900337219238, + "learning_rate": 6.594683704813137e-06, + "loss": 0.2215, + "step": 22838 + }, + { + "epoch": 62.23160762942779, + "grad_norm": 3.2969255447387695, + "learning_rate": 6.5938539674416905e-06, + "loss": 0.1065, + "step": 22839 + }, + { + "epoch": 62.23433242506812, + "grad_norm": 3.650846242904663, + "learning_rate": 6.5930242565972e-06, + "loss": 0.0568, + "step": 22840 + }, + { + "epoch": 62.237057220708444, + "grad_norm": 3.5891788005828857, + "learning_rate": 6.592194572286124e-06, + "loss": 0.0856, + "step": 22841 + }, + { + "epoch": 62.23978201634878, + "grad_norm": 3.088629961013794, + "learning_rate": 6.591364914514927e-06, + "loss": 0.0868, + "step": 22842 + }, + { + "epoch": 62.2425068119891, + "grad_norm": 3.256484031677246, + "learning_rate": 6.590535283290074e-06, + "loss": 0.1134, + "step": 22843 + }, + { + "epoch": 62.24523160762943, + "grad_norm": 3.364840030670166, + "learning_rate": 6.58970567861802e-06, + "loss": 0.0648, + "step": 22844 + }, + { + "epoch": 62.247956403269754, + "grad_norm": 3.455981731414795, + "learning_rate": 6.5888761005052304e-06, + "loss": 0.1585, + "step": 22845 + }, + { + "epoch": 62.25068119891008, + "grad_norm": 3.8239667415618896, + "learning_rate": 6.588046548958162e-06, + "loss": 0.1382, + "step": 22846 + }, + { + "epoch": 62.253405994550405, + "grad_norm": 4.428664207458496, + "learning_rate": 6.587217023983278e-06, + "loss": 0.1051, + "step": 22847 + }, + { + "epoch": 62.25613079019074, + "grad_norm": 3.8833417892456055, + "learning_rate": 6.586387525587039e-06, + "loss": 0.0665, + "step": 22848 + }, + { + "epoch": 62.258855585831064, + "grad_norm": 4.516501426696777, + "learning_rate": 6.585558053775902e-06, + "loss": 0.1367, + "step": 22849 + }, + { + "epoch": 62.26158038147139, + "grad_norm": 3.3930704593658447, + "learning_rate": 6.584728608556332e-06, + "loss": 0.3072, + "step": 22850 + }, + { + "epoch": 62.264305177111716, + "grad_norm": 3.414585828781128, + "learning_rate": 6.583899189934784e-06, + "loss": 0.1806, + "step": 22851 + }, + { + "epoch": 62.26702997275204, + "grad_norm": 3.077812433242798, + "learning_rate": 6.58306979791772e-06, + "loss": 0.1024, + "step": 22852 + }, + { + "epoch": 62.26975476839237, + "grad_norm": 3.2056987285614014, + "learning_rate": 6.5822404325115964e-06, + "loss": 0.1084, + "step": 22853 + }, + { + "epoch": 62.2724795640327, + "grad_norm": 3.5665276050567627, + "learning_rate": 6.581411093722876e-06, + "loss": 0.106, + "step": 22854 + }, + { + "epoch": 62.275204359673026, + "grad_norm": 4.732414245605469, + "learning_rate": 6.580581781558015e-06, + "loss": 0.0642, + "step": 22855 + }, + { + "epoch": 62.27792915531335, + "grad_norm": 2.251091957092285, + "learning_rate": 6.579752496023475e-06, + "loss": 0.0789, + "step": 22856 + }, + { + "epoch": 62.28065395095368, + "grad_norm": 3.588737964630127, + "learning_rate": 6.578923237125709e-06, + "loss": 0.0486, + "step": 22857 + }, + { + "epoch": 62.283378746594, + "grad_norm": 3.733673334121704, + "learning_rate": 6.578094004871178e-06, + "loss": 0.0958, + "step": 22858 + }, + { + "epoch": 62.28610354223433, + "grad_norm": 3.861920118331909, + "learning_rate": 6.577264799266345e-06, + "loss": 0.0709, + "step": 22859 + }, + { + "epoch": 62.28882833787466, + "grad_norm": 3.939540386199951, + "learning_rate": 6.5764356203176605e-06, + "loss": 0.1253, + "step": 22860 + }, + { + "epoch": 62.29155313351499, + "grad_norm": 8.028321266174316, + "learning_rate": 6.575606468031589e-06, + "loss": 0.0796, + "step": 22861 + }, + { + "epoch": 62.294277929155314, + "grad_norm": 2.7306878566741943, + "learning_rate": 6.57477734241458e-06, + "loss": 0.0484, + "step": 22862 + }, + { + "epoch": 62.29700272479564, + "grad_norm": 3.1638236045837402, + "learning_rate": 6.573948243473098e-06, + "loss": 0.0798, + "step": 22863 + }, + { + "epoch": 62.299727520435965, + "grad_norm": 2.6454055309295654, + "learning_rate": 6.5731191712135954e-06, + "loss": 0.0588, + "step": 22864 + }, + { + "epoch": 62.30245231607629, + "grad_norm": 3.520888090133667, + "learning_rate": 6.572290125642531e-06, + "loss": 0.1743, + "step": 22865 + }, + { + "epoch": 62.305177111716624, + "grad_norm": 3.0653371810913086, + "learning_rate": 6.571461106766359e-06, + "loss": 0.0354, + "step": 22866 + }, + { + "epoch": 62.30790190735695, + "grad_norm": 3.277329683303833, + "learning_rate": 6.570632114591541e-06, + "loss": 0.0808, + "step": 22867 + }, + { + "epoch": 62.310626702997276, + "grad_norm": 3.780304193496704, + "learning_rate": 6.569803149124526e-06, + "loss": 0.1052, + "step": 22868 + }, + { + "epoch": 62.3133514986376, + "grad_norm": 5.893295764923096, + "learning_rate": 6.568974210371775e-06, + "loss": 0.0695, + "step": 22869 + }, + { + "epoch": 62.31607629427793, + "grad_norm": 3.770939826965332, + "learning_rate": 6.568145298339743e-06, + "loss": 0.2501, + "step": 22870 + }, + { + "epoch": 62.31880108991825, + "grad_norm": 5.348854064941406, + "learning_rate": 6.567316413034884e-06, + "loss": 0.1459, + "step": 22871 + }, + { + "epoch": 62.321525885558586, + "grad_norm": 4.396578311920166, + "learning_rate": 6.566487554463657e-06, + "loss": 0.0785, + "step": 22872 + }, + { + "epoch": 62.32425068119891, + "grad_norm": 3.6802093982696533, + "learning_rate": 6.5656587226325105e-06, + "loss": 0.0627, + "step": 22873 + }, + { + "epoch": 62.32697547683924, + "grad_norm": 6.617048740386963, + "learning_rate": 6.564829917547907e-06, + "loss": 0.0515, + "step": 22874 + }, + { + "epoch": 62.32970027247956, + "grad_norm": 2.9462718963623047, + "learning_rate": 6.564001139216294e-06, + "loss": 0.0632, + "step": 22875 + }, + { + "epoch": 62.33242506811989, + "grad_norm": 2.8858888149261475, + "learning_rate": 6.563172387644129e-06, + "loss": 0.0726, + "step": 22876 + }, + { + "epoch": 62.335149863760215, + "grad_norm": 4.954010963439941, + "learning_rate": 6.56234366283787e-06, + "loss": 0.1487, + "step": 22877 + }, + { + "epoch": 62.33787465940055, + "grad_norm": 3.1028778553009033, + "learning_rate": 6.561514964803966e-06, + "loss": 0.0567, + "step": 22878 + }, + { + "epoch": 62.34059945504087, + "grad_norm": 3.4563522338867188, + "learning_rate": 6.560686293548875e-06, + "loss": 0.0522, + "step": 22879 + }, + { + "epoch": 62.3433242506812, + "grad_norm": 4.651001930236816, + "learning_rate": 6.5598576490790465e-06, + "loss": 0.0906, + "step": 22880 + }, + { + "epoch": 62.346049046321525, + "grad_norm": 3.897664785385132, + "learning_rate": 6.559029031400937e-06, + "loss": 0.1486, + "step": 22881 + }, + { + "epoch": 62.34877384196185, + "grad_norm": 4.379997253417969, + "learning_rate": 6.558200440520999e-06, + "loss": 0.0798, + "step": 22882 + }, + { + "epoch": 62.35149863760218, + "grad_norm": 3.9950928688049316, + "learning_rate": 6.557371876445684e-06, + "loss": 0.0663, + "step": 22883 + }, + { + "epoch": 62.35422343324251, + "grad_norm": 4.069232940673828, + "learning_rate": 6.556543339181447e-06, + "loss": 0.1113, + "step": 22884 + }, + { + "epoch": 62.356948228882835, + "grad_norm": 3.1827847957611084, + "learning_rate": 6.555714828734739e-06, + "loss": 0.158, + "step": 22885 + }, + { + "epoch": 62.35967302452316, + "grad_norm": 5.421937942504883, + "learning_rate": 6.554886345112013e-06, + "loss": 0.1692, + "step": 22886 + }, + { + "epoch": 62.36239782016349, + "grad_norm": 7.863237380981445, + "learning_rate": 6.554057888319723e-06, + "loss": 0.0802, + "step": 22887 + }, + { + "epoch": 62.36512261580381, + "grad_norm": 3.065836191177368, + "learning_rate": 6.553229458364317e-06, + "loss": 0.062, + "step": 22888 + }, + { + "epoch": 62.36784741144414, + "grad_norm": 2.846912384033203, + "learning_rate": 6.552401055252251e-06, + "loss": 0.1029, + "step": 22889 + }, + { + "epoch": 62.37057220708447, + "grad_norm": 3.9938836097717285, + "learning_rate": 6.551572678989973e-06, + "loss": 0.0571, + "step": 22890 + }, + { + "epoch": 62.3732970027248, + "grad_norm": 3.762964963912964, + "learning_rate": 6.550744329583934e-06, + "loss": 0.1132, + "step": 22891 + }, + { + "epoch": 62.37602179836512, + "grad_norm": 2.934399127960205, + "learning_rate": 6.5499160070405906e-06, + "loss": 0.1613, + "step": 22892 + }, + { + "epoch": 62.37874659400545, + "grad_norm": 5.411092281341553, + "learning_rate": 6.549087711366386e-06, + "loss": 0.2198, + "step": 22893 + }, + { + "epoch": 62.381471389645775, + "grad_norm": 3.6235530376434326, + "learning_rate": 6.548259442567778e-06, + "loss": 0.2015, + "step": 22894 + }, + { + "epoch": 62.3841961852861, + "grad_norm": 3.070939302444458, + "learning_rate": 6.547431200651217e-06, + "loss": 0.0508, + "step": 22895 + }, + { + "epoch": 62.38692098092643, + "grad_norm": 3.4948794841766357, + "learning_rate": 6.546602985623147e-06, + "loss": 0.067, + "step": 22896 + }, + { + "epoch": 62.38964577656676, + "grad_norm": 3.767698287963867, + "learning_rate": 6.545774797490025e-06, + "loss": 0.084, + "step": 22897 + }, + { + "epoch": 62.392370572207085, + "grad_norm": 2.9165124893188477, + "learning_rate": 6.544946636258295e-06, + "loss": 0.076, + "step": 22898 + }, + { + "epoch": 62.39509536784741, + "grad_norm": 4.044775485992432, + "learning_rate": 6.544118501934411e-06, + "loss": 0.067, + "step": 22899 + }, + { + "epoch": 62.39782016348774, + "grad_norm": 4.254181385040283, + "learning_rate": 6.543290394524819e-06, + "loss": 0.1345, + "step": 22900 + }, + { + "epoch": 62.40054495912806, + "grad_norm": 4.1424174308776855, + "learning_rate": 6.542462314035973e-06, + "loss": 0.0813, + "step": 22901 + }, + { + "epoch": 62.403269754768395, + "grad_norm": 3.561481237411499, + "learning_rate": 6.541634260474317e-06, + "loss": 0.161, + "step": 22902 + }, + { + "epoch": 62.40599455040872, + "grad_norm": 4.19312047958374, + "learning_rate": 6.540806233846304e-06, + "loss": 0.1083, + "step": 22903 + }, + { + "epoch": 62.40871934604905, + "grad_norm": 3.018279552459717, + "learning_rate": 6.539978234158379e-06, + "loss": 0.1363, + "step": 22904 + }, + { + "epoch": 62.41144414168937, + "grad_norm": 3.0838325023651123, + "learning_rate": 6.539150261416993e-06, + "loss": 0.148, + "step": 22905 + }, + { + "epoch": 62.4141689373297, + "grad_norm": 4.2507195472717285, + "learning_rate": 6.538322315628593e-06, + "loss": 0.1253, + "step": 22906 + }, + { + "epoch": 62.416893732970024, + "grad_norm": 3.0164480209350586, + "learning_rate": 6.537494396799629e-06, + "loss": 0.1134, + "step": 22907 + }, + { + "epoch": 62.41961852861036, + "grad_norm": 3.5077004432678223, + "learning_rate": 6.536666504936544e-06, + "loss": 0.068, + "step": 22908 + }, + { + "epoch": 62.42234332425068, + "grad_norm": 3.6945509910583496, + "learning_rate": 6.53583864004579e-06, + "loss": 0.1392, + "step": 22909 + }, + { + "epoch": 62.42506811989101, + "grad_norm": 3.732836961746216, + "learning_rate": 6.53501080213381e-06, + "loss": 0.1401, + "step": 22910 + }, + { + "epoch": 62.427792915531334, + "grad_norm": 4.5331525802612305, + "learning_rate": 6.534182991207059e-06, + "loss": 0.0895, + "step": 22911 + }, + { + "epoch": 62.43051771117166, + "grad_norm": 2.5722134113311768, + "learning_rate": 6.533355207271976e-06, + "loss": 0.0633, + "step": 22912 + }, + { + "epoch": 62.433242506811986, + "grad_norm": 4.173740863800049, + "learning_rate": 6.532527450335016e-06, + "loss": 0.1205, + "step": 22913 + }, + { + "epoch": 62.43596730245232, + "grad_norm": 4.303950786590576, + "learning_rate": 6.531699720402616e-06, + "loss": 0.0599, + "step": 22914 + }, + { + "epoch": 62.438692098092645, + "grad_norm": 4.381292343139648, + "learning_rate": 6.530872017481232e-06, + "loss": 0.1366, + "step": 22915 + }, + { + "epoch": 62.44141689373297, + "grad_norm": 4.8696699142456055, + "learning_rate": 6.5300443415772995e-06, + "loss": 0.0825, + "step": 22916 + }, + { + "epoch": 62.444141689373296, + "grad_norm": 4.519044399261475, + "learning_rate": 6.529216692697273e-06, + "loss": 0.0635, + "step": 22917 + }, + { + "epoch": 62.44686648501362, + "grad_norm": 3.354917287826538, + "learning_rate": 6.528389070847594e-06, + "loss": 0.1498, + "step": 22918 + }, + { + "epoch": 62.44959128065395, + "grad_norm": 2.6892342567443848, + "learning_rate": 6.527561476034712e-06, + "loss": 0.0421, + "step": 22919 + }, + { + "epoch": 62.45231607629428, + "grad_norm": 11.079471588134766, + "learning_rate": 6.526733908265066e-06, + "loss": 0.1292, + "step": 22920 + }, + { + "epoch": 62.45504087193461, + "grad_norm": 3.2886509895324707, + "learning_rate": 6.525906367545108e-06, + "loss": 0.1325, + "step": 22921 + }, + { + "epoch": 62.45776566757493, + "grad_norm": 5.297695159912109, + "learning_rate": 6.525078853881275e-06, + "loss": 0.0459, + "step": 22922 + }, + { + "epoch": 62.46049046321526, + "grad_norm": 5.968097686767578, + "learning_rate": 6.524251367280019e-06, + "loss": 0.0914, + "step": 22923 + }, + { + "epoch": 62.463215258855584, + "grad_norm": 3.63021183013916, + "learning_rate": 6.5234239077477815e-06, + "loss": 0.1216, + "step": 22924 + }, + { + "epoch": 62.46594005449591, + "grad_norm": 7.625444412231445, + "learning_rate": 6.522596475291005e-06, + "loss": 0.2645, + "step": 22925 + }, + { + "epoch": 62.46866485013624, + "grad_norm": 2.5148627758026123, + "learning_rate": 6.521769069916136e-06, + "loss": 0.0398, + "step": 22926 + }, + { + "epoch": 62.47138964577657, + "grad_norm": 3.4624040126800537, + "learning_rate": 6.520941691629615e-06, + "loss": 0.0617, + "step": 22927 + }, + { + "epoch": 62.474114441416894, + "grad_norm": 4.036266803741455, + "learning_rate": 6.520114340437892e-06, + "loss": 0.1025, + "step": 22928 + }, + { + "epoch": 62.47683923705722, + "grad_norm": 4.457673072814941, + "learning_rate": 6.5192870163474045e-06, + "loss": 0.1141, + "step": 22929 + }, + { + "epoch": 62.479564032697546, + "grad_norm": 3.806377649307251, + "learning_rate": 6.518459719364601e-06, + "loss": 0.2224, + "step": 22930 + }, + { + "epoch": 62.48228882833787, + "grad_norm": 3.7779488563537598, + "learning_rate": 6.517632449495916e-06, + "loss": 0.0782, + "step": 22931 + }, + { + "epoch": 62.485013623978205, + "grad_norm": 3.29911732673645, + "learning_rate": 6.516805206747803e-06, + "loss": 0.0529, + "step": 22932 + }, + { + "epoch": 62.48773841961853, + "grad_norm": 3.861456871032715, + "learning_rate": 6.515977991126694e-06, + "loss": 0.1291, + "step": 22933 + }, + { + "epoch": 62.490463215258856, + "grad_norm": 2.820650815963745, + "learning_rate": 6.515150802639037e-06, + "loss": 0.1041, + "step": 22934 + }, + { + "epoch": 62.49318801089918, + "grad_norm": 3.721628427505493, + "learning_rate": 6.514323641291276e-06, + "loss": 0.072, + "step": 22935 + }, + { + "epoch": 62.49591280653951, + "grad_norm": 5.200292587280273, + "learning_rate": 6.5134965070898496e-06, + "loss": 0.165, + "step": 22936 + }, + { + "epoch": 62.49863760217983, + "grad_norm": 5.09596061706543, + "learning_rate": 6.512669400041201e-06, + "loss": 0.1449, + "step": 22937 + }, + { + "epoch": 62.50136239782017, + "grad_norm": 4.042686462402344, + "learning_rate": 6.5118423201517665e-06, + "loss": 0.1748, + "step": 22938 + }, + { + "epoch": 62.50408719346049, + "grad_norm": 3.972289562225342, + "learning_rate": 6.511015267427997e-06, + "loss": 0.0756, + "step": 22939 + }, + { + "epoch": 62.50681198910082, + "grad_norm": 3.087763547897339, + "learning_rate": 6.510188241876325e-06, + "loss": 0.0502, + "step": 22940 + }, + { + "epoch": 62.509536784741144, + "grad_norm": 3.365104913711548, + "learning_rate": 6.509361243503196e-06, + "loss": 0.1303, + "step": 22941 + }, + { + "epoch": 62.51226158038147, + "grad_norm": 2.906590700149536, + "learning_rate": 6.508534272315048e-06, + "loss": 0.1028, + "step": 22942 + }, + { + "epoch": 62.514986376021795, + "grad_norm": 3.973233938217163, + "learning_rate": 6.507707328318326e-06, + "loss": 0.0884, + "step": 22943 + }, + { + "epoch": 62.51771117166213, + "grad_norm": 2.7279627323150635, + "learning_rate": 6.50688041151946e-06, + "loss": 0.0567, + "step": 22944 + }, + { + "epoch": 62.520435967302454, + "grad_norm": 3.1076507568359375, + "learning_rate": 6.506053521924902e-06, + "loss": 0.1277, + "step": 22945 + }, + { + "epoch": 62.52316076294278, + "grad_norm": 2.818887710571289, + "learning_rate": 6.5052266595410874e-06, + "loss": 0.0497, + "step": 22946 + }, + { + "epoch": 62.525885558583106, + "grad_norm": 3.5251336097717285, + "learning_rate": 6.504399824374453e-06, + "loss": 0.1078, + "step": 22947 + }, + { + "epoch": 62.52861035422343, + "grad_norm": 4.230286121368408, + "learning_rate": 6.503573016431442e-06, + "loss": 0.1738, + "step": 22948 + }, + { + "epoch": 62.53133514986376, + "grad_norm": 5.084421634674072, + "learning_rate": 6.502746235718491e-06, + "loss": 0.0744, + "step": 22949 + }, + { + "epoch": 62.53405994550409, + "grad_norm": 4.893348693847656, + "learning_rate": 6.50191948224204e-06, + "loss": 0.2584, + "step": 22950 + }, + { + "epoch": 62.536784741144416, + "grad_norm": 2.828664779663086, + "learning_rate": 6.501092756008527e-06, + "loss": 0.0339, + "step": 22951 + }, + { + "epoch": 62.53950953678474, + "grad_norm": 3.1087496280670166, + "learning_rate": 6.500266057024392e-06, + "loss": 0.0791, + "step": 22952 + }, + { + "epoch": 62.54223433242507, + "grad_norm": 4.159045219421387, + "learning_rate": 6.499439385296071e-06, + "loss": 0.0734, + "step": 22953 + }, + { + "epoch": 62.54495912806539, + "grad_norm": 4.612759113311768, + "learning_rate": 6.498612740830006e-06, + "loss": 0.1996, + "step": 22954 + }, + { + "epoch": 62.54768392370572, + "grad_norm": 3.0963053703308105, + "learning_rate": 6.497786123632628e-06, + "loss": 0.2474, + "step": 22955 + }, + { + "epoch": 62.55040871934605, + "grad_norm": 3.6551713943481445, + "learning_rate": 6.4969595337103806e-06, + "loss": 0.1128, + "step": 22956 + }, + { + "epoch": 62.55313351498638, + "grad_norm": 4.4289469718933105, + "learning_rate": 6.496132971069702e-06, + "loss": 0.099, + "step": 22957 + }, + { + "epoch": 62.555858310626704, + "grad_norm": 4.449501991271973, + "learning_rate": 6.495306435717024e-06, + "loss": 0.1284, + "step": 22958 + }, + { + "epoch": 62.55858310626703, + "grad_norm": 3.4457151889801025, + "learning_rate": 6.49447992765879e-06, + "loss": 0.071, + "step": 22959 + }, + { + "epoch": 62.561307901907355, + "grad_norm": 3.6617636680603027, + "learning_rate": 6.49365344690143e-06, + "loss": 0.1488, + "step": 22960 + }, + { + "epoch": 62.56403269754768, + "grad_norm": 4.430767059326172, + "learning_rate": 6.492826993451386e-06, + "loss": 0.0816, + "step": 22961 + }, + { + "epoch": 62.566757493188014, + "grad_norm": 2.1721184253692627, + "learning_rate": 6.49200056731509e-06, + "loss": 0.049, + "step": 22962 + }, + { + "epoch": 62.56948228882834, + "grad_norm": 3.556936740875244, + "learning_rate": 6.491174168498981e-06, + "loss": 0.0695, + "step": 22963 + }, + { + "epoch": 62.572207084468666, + "grad_norm": 2.796623468399048, + "learning_rate": 6.490347797009498e-06, + "loss": 0.1317, + "step": 22964 + }, + { + "epoch": 62.57493188010899, + "grad_norm": 3.142650842666626, + "learning_rate": 6.489521452853071e-06, + "loss": 0.0619, + "step": 22965 + }, + { + "epoch": 62.57765667574932, + "grad_norm": 3.462892532348633, + "learning_rate": 6.488695136036141e-06, + "loss": 0.1504, + "step": 22966 + }, + { + "epoch": 62.58038147138964, + "grad_norm": 3.852605104446411, + "learning_rate": 6.487868846565136e-06, + "loss": 0.0701, + "step": 22967 + }, + { + "epoch": 62.583106267029976, + "grad_norm": 3.334852933883667, + "learning_rate": 6.487042584446499e-06, + "loss": 0.1001, + "step": 22968 + }, + { + "epoch": 62.5858310626703, + "grad_norm": 3.1268060207366943, + "learning_rate": 6.486216349686658e-06, + "loss": 0.0504, + "step": 22969 + }, + { + "epoch": 62.58855585831063, + "grad_norm": 3.4463112354278564, + "learning_rate": 6.485390142292054e-06, + "loss": 0.1764, + "step": 22970 + }, + { + "epoch": 62.59128065395095, + "grad_norm": 3.072113275527954, + "learning_rate": 6.484563962269117e-06, + "loss": 0.2094, + "step": 22971 + }, + { + "epoch": 62.59400544959128, + "grad_norm": 3.998873710632324, + "learning_rate": 6.483737809624284e-06, + "loss": 0.0854, + "step": 22972 + }, + { + "epoch": 62.596730245231605, + "grad_norm": 5.751617431640625, + "learning_rate": 6.482911684363985e-06, + "loss": 0.0551, + "step": 22973 + }, + { + "epoch": 62.59945504087194, + "grad_norm": 4.150777339935303, + "learning_rate": 6.48208558649466e-06, + "loss": 0.1185, + "step": 22974 + }, + { + "epoch": 62.60217983651226, + "grad_norm": 3.205233335494995, + "learning_rate": 6.481259516022735e-06, + "loss": 0.0503, + "step": 22975 + }, + { + "epoch": 62.60490463215259, + "grad_norm": 2.293523073196411, + "learning_rate": 6.480433472954653e-06, + "loss": 0.0456, + "step": 22976 + }, + { + "epoch": 62.607629427792915, + "grad_norm": 5.082372188568115, + "learning_rate": 6.479607457296837e-06, + "loss": 0.1792, + "step": 22977 + }, + { + "epoch": 62.61035422343324, + "grad_norm": 3.6771934032440186, + "learning_rate": 6.4787814690557264e-06, + "loss": 0.066, + "step": 22978 + }, + { + "epoch": 62.61307901907357, + "grad_norm": 5.0433125495910645, + "learning_rate": 6.47795550823775e-06, + "loss": 0.1291, + "step": 22979 + }, + { + "epoch": 62.6158038147139, + "grad_norm": 4.6060638427734375, + "learning_rate": 6.4771295748493455e-06, + "loss": 0.1177, + "step": 22980 + }, + { + "epoch": 62.618528610354225, + "grad_norm": 4.242333889007568, + "learning_rate": 6.476303668896941e-06, + "loss": 0.165, + "step": 22981 + }, + { + "epoch": 62.62125340599455, + "grad_norm": 3.4630861282348633, + "learning_rate": 6.475477790386974e-06, + "loss": 0.0747, + "step": 22982 + }, + { + "epoch": 62.62397820163488, + "grad_norm": 4.103496551513672, + "learning_rate": 6.474651939325869e-06, + "loss": 0.0476, + "step": 22983 + }, + { + "epoch": 62.6267029972752, + "grad_norm": 3.7876334190368652, + "learning_rate": 6.473826115720063e-06, + "loss": 0.0741, + "step": 22984 + }, + { + "epoch": 62.62942779291553, + "grad_norm": 3.482868194580078, + "learning_rate": 6.473000319575985e-06, + "loss": 0.0423, + "step": 22985 + }, + { + "epoch": 62.63215258855586, + "grad_norm": 3.449143648147583, + "learning_rate": 6.472174550900068e-06, + "loss": 0.1145, + "step": 22986 + }, + { + "epoch": 62.63487738419619, + "grad_norm": 3.775345802307129, + "learning_rate": 6.471348809698741e-06, + "loss": 0.0668, + "step": 22987 + }, + { + "epoch": 62.63760217983651, + "grad_norm": 4.094781875610352, + "learning_rate": 6.470523095978436e-06, + "loss": 0.0812, + "step": 22988 + }, + { + "epoch": 62.64032697547684, + "grad_norm": 3.8218133449554443, + "learning_rate": 6.469697409745583e-06, + "loss": 0.0597, + "step": 22989 + }, + { + "epoch": 62.643051771117165, + "grad_norm": 3.766822338104248, + "learning_rate": 6.468871751006614e-06, + "loss": 0.1651, + "step": 22990 + }, + { + "epoch": 62.64577656675749, + "grad_norm": 4.768446445465088, + "learning_rate": 6.468046119767956e-06, + "loss": 0.0915, + "step": 22991 + }, + { + "epoch": 62.64850136239782, + "grad_norm": 4.536155700683594, + "learning_rate": 6.4672205160360455e-06, + "loss": 0.09, + "step": 22992 + }, + { + "epoch": 62.65122615803815, + "grad_norm": 2.9946510791778564, + "learning_rate": 6.466394939817305e-06, + "loss": 0.0805, + "step": 22993 + }, + { + "epoch": 62.653950953678475, + "grad_norm": 5.23456335067749, + "learning_rate": 6.465569391118167e-06, + "loss": 0.0767, + "step": 22994 + }, + { + "epoch": 62.6566757493188, + "grad_norm": 4.049919605255127, + "learning_rate": 6.464743869945061e-06, + "loss": 0.1955, + "step": 22995 + }, + { + "epoch": 62.65940054495913, + "grad_norm": 3.183833599090576, + "learning_rate": 6.4639183763044124e-06, + "loss": 0.0743, + "step": 22996 + }, + { + "epoch": 62.66212534059945, + "grad_norm": 2.2236080169677734, + "learning_rate": 6.463092910202656e-06, + "loss": 0.0352, + "step": 22997 + }, + { + "epoch": 62.664850136239785, + "grad_norm": 4.320413112640381, + "learning_rate": 6.462267471646221e-06, + "loss": 0.0835, + "step": 22998 + }, + { + "epoch": 62.66757493188011, + "grad_norm": 4.502333641052246, + "learning_rate": 6.461442060641531e-06, + "loss": 0.0905, + "step": 22999 + }, + { + "epoch": 62.67029972752044, + "grad_norm": 3.6087913513183594, + "learning_rate": 6.460616677195017e-06, + "loss": 0.2139, + "step": 23000 + }, + { + "epoch": 62.67302452316076, + "grad_norm": 3.9240729808807373, + "learning_rate": 6.4597913213131054e-06, + "loss": 0.151, + "step": 23001 + }, + { + "epoch": 62.67574931880109, + "grad_norm": 3.8604400157928467, + "learning_rate": 6.458965993002228e-06, + "loss": 0.1207, + "step": 23002 + }, + { + "epoch": 62.678474114441414, + "grad_norm": 3.887859344482422, + "learning_rate": 6.458140692268806e-06, + "loss": 0.1225, + "step": 23003 + }, + { + "epoch": 62.68119891008175, + "grad_norm": 3.3446779251098633, + "learning_rate": 6.457315419119273e-06, + "loss": 0.1642, + "step": 23004 + }, + { + "epoch": 62.68392370572207, + "grad_norm": 3.9583802223205566, + "learning_rate": 6.45649017356005e-06, + "loss": 0.052, + "step": 23005 + }, + { + "epoch": 62.6866485013624, + "grad_norm": 4.6864142417907715, + "learning_rate": 6.4556649555975715e-06, + "loss": 0.0983, + "step": 23006 + }, + { + "epoch": 62.689373297002724, + "grad_norm": 4.684879779815674, + "learning_rate": 6.454839765238259e-06, + "loss": 0.1146, + "step": 23007 + }, + { + "epoch": 62.69209809264305, + "grad_norm": 1.921517014503479, + "learning_rate": 6.45401460248854e-06, + "loss": 0.0321, + "step": 23008 + }, + { + "epoch": 62.694822888283376, + "grad_norm": 3.720921754837036, + "learning_rate": 6.45318946735484e-06, + "loss": 0.0698, + "step": 23009 + }, + { + "epoch": 62.69754768392371, + "grad_norm": 5.4707512855529785, + "learning_rate": 6.452364359843588e-06, + "loss": 0.1797, + "step": 23010 + }, + { + "epoch": 62.700272479564035, + "grad_norm": 6.212604522705078, + "learning_rate": 6.451539279961206e-06, + "loss": 0.1189, + "step": 23011 + }, + { + "epoch": 62.70299727520436, + "grad_norm": 3.161020517349243, + "learning_rate": 6.450714227714126e-06, + "loss": 0.0461, + "step": 23012 + }, + { + "epoch": 62.705722070844686, + "grad_norm": 4.240825176239014, + "learning_rate": 6.449889203108762e-06, + "loss": 0.0928, + "step": 23013 + }, + { + "epoch": 62.70844686648501, + "grad_norm": 3.6804215908050537, + "learning_rate": 6.449064206151551e-06, + "loss": 0.0814, + "step": 23014 + }, + { + "epoch": 62.71117166212534, + "grad_norm": 3.9061172008514404, + "learning_rate": 6.448239236848914e-06, + "loss": 0.0518, + "step": 23015 + }, + { + "epoch": 62.71389645776567, + "grad_norm": 3.953368663787842, + "learning_rate": 6.447414295207275e-06, + "loss": 0.0742, + "step": 23016 + }, + { + "epoch": 62.716621253406, + "grad_norm": 3.946296215057373, + "learning_rate": 6.446589381233062e-06, + "loss": 0.1001, + "step": 23017 + }, + { + "epoch": 62.71934604904632, + "grad_norm": 2.48675799369812, + "learning_rate": 6.445764494932691e-06, + "loss": 0.0501, + "step": 23018 + }, + { + "epoch": 62.72207084468665, + "grad_norm": 5.315413475036621, + "learning_rate": 6.444939636312597e-06, + "loss": 0.0797, + "step": 23019 + }, + { + "epoch": 62.724795640326974, + "grad_norm": 3.369425058364868, + "learning_rate": 6.4441148053791956e-06, + "loss": 0.1928, + "step": 23020 + }, + { + "epoch": 62.7275204359673, + "grad_norm": 5.1165900230407715, + "learning_rate": 6.443290002138913e-06, + "loss": 0.1932, + "step": 23021 + }, + { + "epoch": 62.73024523160763, + "grad_norm": 3.6062586307525635, + "learning_rate": 6.442465226598177e-06, + "loss": 0.0462, + "step": 23022 + }, + { + "epoch": 62.73297002724796, + "grad_norm": 4.3308186531066895, + "learning_rate": 6.4416404787634045e-06, + "loss": 0.0815, + "step": 23023 + }, + { + "epoch": 62.735694822888284, + "grad_norm": 4.880808353424072, + "learning_rate": 6.440815758641023e-06, + "loss": 0.0867, + "step": 23024 + }, + { + "epoch": 62.73841961852861, + "grad_norm": 4.942392349243164, + "learning_rate": 6.439991066237452e-06, + "loss": 0.0578, + "step": 23025 + }, + { + "epoch": 62.741144414168936, + "grad_norm": 7.794327735900879, + "learning_rate": 6.4391664015591185e-06, + "loss": 0.1435, + "step": 23026 + }, + { + "epoch": 62.74386920980926, + "grad_norm": 5.124037265777588, + "learning_rate": 6.438341764612439e-06, + "loss": 0.0851, + "step": 23027 + }, + { + "epoch": 62.746594005449595, + "grad_norm": 3.0087430477142334, + "learning_rate": 6.437517155403843e-06, + "loss": 0.0451, + "step": 23028 + }, + { + "epoch": 62.74931880108992, + "grad_norm": 3.278937339782715, + "learning_rate": 6.4366925739397456e-06, + "loss": 0.0645, + "step": 23029 + }, + { + "epoch": 62.752043596730246, + "grad_norm": 4.432502746582031, + "learning_rate": 6.4358680202265696e-06, + "loss": 0.0653, + "step": 23030 + }, + { + "epoch": 62.75476839237057, + "grad_norm": 3.406248092651367, + "learning_rate": 6.435043494270743e-06, + "loss": 0.0725, + "step": 23031 + }, + { + "epoch": 62.7574931880109, + "grad_norm": 3.52441143989563, + "learning_rate": 6.434218996078683e-06, + "loss": 0.1595, + "step": 23032 + }, + { + "epoch": 62.76021798365122, + "grad_norm": 4.138480186462402, + "learning_rate": 6.43339452565681e-06, + "loss": 0.0607, + "step": 23033 + }, + { + "epoch": 62.762942779291556, + "grad_norm": 2.9758920669555664, + "learning_rate": 6.432570083011544e-06, + "loss": 0.028, + "step": 23034 + }, + { + "epoch": 62.76566757493188, + "grad_norm": 1.8794962167739868, + "learning_rate": 6.43174566814931e-06, + "loss": 0.0844, + "step": 23035 + }, + { + "epoch": 62.76839237057221, + "grad_norm": 3.843134880065918, + "learning_rate": 6.4309212810765245e-06, + "loss": 0.0503, + "step": 23036 + }, + { + "epoch": 62.771117166212534, + "grad_norm": 2.8406097888946533, + "learning_rate": 6.43009692179961e-06, + "loss": 0.0443, + "step": 23037 + }, + { + "epoch": 62.77384196185286, + "grad_norm": 3.2359085083007812, + "learning_rate": 6.429272590324984e-06, + "loss": 0.048, + "step": 23038 + }, + { + "epoch": 62.776566757493185, + "grad_norm": 4.195863246917725, + "learning_rate": 6.428448286659071e-06, + "loss": 0.1102, + "step": 23039 + }, + { + "epoch": 62.77929155313352, + "grad_norm": 4.652376651763916, + "learning_rate": 6.427624010808284e-06, + "loss": 0.0817, + "step": 23040 + }, + { + "epoch": 62.782016348773844, + "grad_norm": 4.894301414489746, + "learning_rate": 6.42679976277905e-06, + "loss": 0.1194, + "step": 23041 + }, + { + "epoch": 62.78474114441417, + "grad_norm": 3.5861191749572754, + "learning_rate": 6.425975542577783e-06, + "loss": 0.0572, + "step": 23042 + }, + { + "epoch": 62.787465940054496, + "grad_norm": 3.2628448009490967, + "learning_rate": 6.425151350210901e-06, + "loss": 0.1383, + "step": 23043 + }, + { + "epoch": 62.79019073569482, + "grad_norm": 3.143688678741455, + "learning_rate": 6.424327185684829e-06, + "loss": 0.0881, + "step": 23044 + }, + { + "epoch": 62.79291553133515, + "grad_norm": 3.5223324298858643, + "learning_rate": 6.423503049005979e-06, + "loss": 0.1007, + "step": 23045 + }, + { + "epoch": 62.79564032697548, + "grad_norm": 3.900768518447876, + "learning_rate": 6.422678940180775e-06, + "loss": 0.0517, + "step": 23046 + }, + { + "epoch": 62.798365122615806, + "grad_norm": 3.8422086238861084, + "learning_rate": 6.42185485921563e-06, + "loss": 0.2194, + "step": 23047 + }, + { + "epoch": 62.80108991825613, + "grad_norm": 11.169679641723633, + "learning_rate": 6.421030806116961e-06, + "loss": 0.0797, + "step": 23048 + }, + { + "epoch": 62.80381471389646, + "grad_norm": 2.756113052368164, + "learning_rate": 6.420206780891194e-06, + "loss": 0.1232, + "step": 23049 + }, + { + "epoch": 62.80653950953678, + "grad_norm": 4.002607822418213, + "learning_rate": 6.419382783544739e-06, + "loss": 0.0707, + "step": 23050 + }, + { + "epoch": 62.80926430517711, + "grad_norm": 2.948599100112915, + "learning_rate": 6.4185588140840195e-06, + "loss": 0.05, + "step": 23051 + }, + { + "epoch": 62.81198910081744, + "grad_norm": 2.4843387603759766, + "learning_rate": 6.417734872515444e-06, + "loss": 0.1476, + "step": 23052 + }, + { + "epoch": 62.81471389645777, + "grad_norm": 4.173250675201416, + "learning_rate": 6.416910958845437e-06, + "loss": 0.0786, + "step": 23053 + }, + { + "epoch": 62.817438692098094, + "grad_norm": 3.032074213027954, + "learning_rate": 6.41608707308041e-06, + "loss": 0.0606, + "step": 23054 + }, + { + "epoch": 62.82016348773842, + "grad_norm": 3.3955652713775635, + "learning_rate": 6.415263215226785e-06, + "loss": 0.0556, + "step": 23055 + }, + { + "epoch": 62.822888283378745, + "grad_norm": 4.590451717376709, + "learning_rate": 6.414439385290971e-06, + "loss": 0.1345, + "step": 23056 + }, + { + "epoch": 62.82561307901907, + "grad_norm": 3.456740379333496, + "learning_rate": 6.41361558327939e-06, + "loss": 0.1016, + "step": 23057 + }, + { + "epoch": 62.828337874659404, + "grad_norm": 3.6677567958831787, + "learning_rate": 6.412791809198453e-06, + "loss": 0.2228, + "step": 23058 + }, + { + "epoch": 62.83106267029973, + "grad_norm": 3.0606536865234375, + "learning_rate": 6.411968063054581e-06, + "loss": 0.1989, + "step": 23059 + }, + { + "epoch": 62.833787465940055, + "grad_norm": 3.7640984058380127, + "learning_rate": 6.411144344854183e-06, + "loss": 0.0694, + "step": 23060 + }, + { + "epoch": 62.83651226158038, + "grad_norm": 4.457794666290283, + "learning_rate": 6.410320654603681e-06, + "loss": 0.1596, + "step": 23061 + }, + { + "epoch": 62.83923705722071, + "grad_norm": 3.6370296478271484, + "learning_rate": 6.409496992309483e-06, + "loss": 0.0636, + "step": 23062 + }, + { + "epoch": 62.84196185286103, + "grad_norm": 3.8966104984283447, + "learning_rate": 6.408673357978009e-06, + "loss": 0.1126, + "step": 23063 + }, + { + "epoch": 62.844686648501366, + "grad_norm": 2.9331953525543213, + "learning_rate": 6.407849751615669e-06, + "loss": 0.0573, + "step": 23064 + }, + { + "epoch": 62.84741144414169, + "grad_norm": 4.1566643714904785, + "learning_rate": 6.407026173228878e-06, + "loss": 0.2003, + "step": 23065 + }, + { + "epoch": 62.85013623978202, + "grad_norm": 3.167177438735962, + "learning_rate": 6.406202622824054e-06, + "loss": 0.1327, + "step": 23066 + }, + { + "epoch": 62.85286103542234, + "grad_norm": 3.376971960067749, + "learning_rate": 6.40537910040761e-06, + "loss": 0.0528, + "step": 23067 + }, + { + "epoch": 62.85558583106267, + "grad_norm": 4.459584712982178, + "learning_rate": 6.404555605985956e-06, + "loss": 0.13, + "step": 23068 + }, + { + "epoch": 62.858310626702995, + "grad_norm": 2.184400796890259, + "learning_rate": 6.403732139565508e-06, + "loss": 0.1063, + "step": 23069 + }, + { + "epoch": 62.86103542234333, + "grad_norm": 3.7576041221618652, + "learning_rate": 6.402908701152677e-06, + "loss": 0.0779, + "step": 23070 + }, + { + "epoch": 62.86376021798365, + "grad_norm": 2.7387702465057373, + "learning_rate": 6.40208529075388e-06, + "loss": 0.0501, + "step": 23071 + }, + { + "epoch": 62.86648501362398, + "grad_norm": 3.7353484630584717, + "learning_rate": 6.401261908375525e-06, + "loss": 0.106, + "step": 23072 + }, + { + "epoch": 62.869209809264305, + "grad_norm": 3.082329750061035, + "learning_rate": 6.4004385540240266e-06, + "loss": 0.1467, + "step": 23073 + }, + { + "epoch": 62.87193460490463, + "grad_norm": 3.7303121089935303, + "learning_rate": 6.399615227705797e-06, + "loss": 0.1449, + "step": 23074 + }, + { + "epoch": 62.87465940054496, + "grad_norm": 4.027122497558594, + "learning_rate": 6.398791929427248e-06, + "loss": 0.1382, + "step": 23075 + }, + { + "epoch": 62.87738419618529, + "grad_norm": 6.679190158843994, + "learning_rate": 6.397968659194792e-06, + "loss": 0.0637, + "step": 23076 + }, + { + "epoch": 62.880108991825615, + "grad_norm": 3.6560263633728027, + "learning_rate": 6.397145417014841e-06, + "loss": 0.2501, + "step": 23077 + }, + { + "epoch": 62.88283378746594, + "grad_norm": 3.46293044090271, + "learning_rate": 6.3963222028938035e-06, + "loss": 0.1211, + "step": 23078 + }, + { + "epoch": 62.88555858310627, + "grad_norm": 3.248948097229004, + "learning_rate": 6.395499016838095e-06, + "loss": 0.1566, + "step": 23079 + }, + { + "epoch": 62.88828337874659, + "grad_norm": 3.2963860034942627, + "learning_rate": 6.394675858854121e-06, + "loss": 0.0635, + "step": 23080 + }, + { + "epoch": 62.89100817438692, + "grad_norm": 2.887035608291626, + "learning_rate": 6.393852728948299e-06, + "loss": 0.0419, + "step": 23081 + }, + { + "epoch": 62.89373297002725, + "grad_norm": 3.3246560096740723, + "learning_rate": 6.393029627127031e-06, + "loss": 0.1175, + "step": 23082 + }, + { + "epoch": 62.89645776566758, + "grad_norm": 3.9478142261505127, + "learning_rate": 6.392206553396734e-06, + "loss": 0.1017, + "step": 23083 + }, + { + "epoch": 62.8991825613079, + "grad_norm": 3.3078768253326416, + "learning_rate": 6.391383507763816e-06, + "loss": 0.0651, + "step": 23084 + }, + { + "epoch": 62.90190735694823, + "grad_norm": 2.7478339672088623, + "learning_rate": 6.39056049023469e-06, + "loss": 0.0435, + "step": 23085 + }, + { + "epoch": 62.904632152588555, + "grad_norm": 2.965304374694824, + "learning_rate": 6.3897375008157606e-06, + "loss": 0.0603, + "step": 23086 + }, + { + "epoch": 62.90735694822888, + "grad_norm": 3.521054744720459, + "learning_rate": 6.388914539513441e-06, + "loss": 0.0816, + "step": 23087 + }, + { + "epoch": 62.91008174386921, + "grad_norm": 3.507844924926758, + "learning_rate": 6.388091606334137e-06, + "loss": 0.257, + "step": 23088 + }, + { + "epoch": 62.91280653950954, + "grad_norm": 3.3088457584381104, + "learning_rate": 6.387268701284261e-06, + "loss": 0.1144, + "step": 23089 + }, + { + "epoch": 62.915531335149865, + "grad_norm": 3.2807881832122803, + "learning_rate": 6.386445824370218e-06, + "loss": 0.0795, + "step": 23090 + }, + { + "epoch": 62.91825613079019, + "grad_norm": 2.9147677421569824, + "learning_rate": 6.385622975598422e-06, + "loss": 0.0522, + "step": 23091 + }, + { + "epoch": 62.920980926430516, + "grad_norm": 2.9333882331848145, + "learning_rate": 6.384800154975274e-06, + "loss": 0.1078, + "step": 23092 + }, + { + "epoch": 62.92370572207084, + "grad_norm": 5.346883773803711, + "learning_rate": 6.38397736250719e-06, + "loss": 0.1202, + "step": 23093 + }, + { + "epoch": 62.926430517711175, + "grad_norm": 3.9388911724090576, + "learning_rate": 6.38315459820057e-06, + "loss": 0.0678, + "step": 23094 + }, + { + "epoch": 62.9291553133515, + "grad_norm": 3.2417473793029785, + "learning_rate": 6.382331862061828e-06, + "loss": 0.2092, + "step": 23095 + }, + { + "epoch": 62.93188010899183, + "grad_norm": 4.299763202667236, + "learning_rate": 6.381509154097367e-06, + "loss": 0.2748, + "step": 23096 + }, + { + "epoch": 62.93460490463215, + "grad_norm": 3.4272220134735107, + "learning_rate": 6.3806864743136e-06, + "loss": 0.1067, + "step": 23097 + }, + { + "epoch": 62.93732970027248, + "grad_norm": 2.880706310272217, + "learning_rate": 6.379863822716926e-06, + "loss": 0.0938, + "step": 23098 + }, + { + "epoch": 62.940054495912804, + "grad_norm": 3.2244069576263428, + "learning_rate": 6.379041199313756e-06, + "loss": 0.0526, + "step": 23099 + }, + { + "epoch": 62.94277929155314, + "grad_norm": 3.6588704586029053, + "learning_rate": 6.378218604110499e-06, + "loss": 0.1616, + "step": 23100 + }, + { + "epoch": 62.94550408719346, + "grad_norm": 3.856618642807007, + "learning_rate": 6.377396037113557e-06, + "loss": 0.1594, + "step": 23101 + }, + { + "epoch": 62.94822888283379, + "grad_norm": 2.894587516784668, + "learning_rate": 6.376573498329341e-06, + "loss": 0.0425, + "step": 23102 + }, + { + "epoch": 62.950953678474114, + "grad_norm": 3.4893734455108643, + "learning_rate": 6.375750987764251e-06, + "loss": 0.0518, + "step": 23103 + }, + { + "epoch": 62.95367847411444, + "grad_norm": 3.840693950653076, + "learning_rate": 6.374928505424698e-06, + "loss": 0.0658, + "step": 23104 + }, + { + "epoch": 62.956403269754766, + "grad_norm": 4.003078937530518, + "learning_rate": 6.374106051317084e-06, + "loss": 0.1181, + "step": 23105 + }, + { + "epoch": 62.95912806539509, + "grad_norm": 3.1735715866088867, + "learning_rate": 6.373283625447817e-06, + "loss": 0.0516, + "step": 23106 + }, + { + "epoch": 62.961852861035425, + "grad_norm": 2.5085859298706055, + "learning_rate": 6.372461227823297e-06, + "loss": 0.0466, + "step": 23107 + }, + { + "epoch": 62.96457765667575, + "grad_norm": 2.9543776512145996, + "learning_rate": 6.371638858449933e-06, + "loss": 0.0694, + "step": 23108 + }, + { + "epoch": 62.967302452316076, + "grad_norm": 2.8159821033477783, + "learning_rate": 6.370816517334132e-06, + "loss": 0.0855, + "step": 23109 + }, + { + "epoch": 62.9700272479564, + "grad_norm": 2.9434163570404053, + "learning_rate": 6.369994204482293e-06, + "loss": 0.0479, + "step": 23110 + }, + { + "epoch": 62.97275204359673, + "grad_norm": 3.5817837715148926, + "learning_rate": 6.369171919900823e-06, + "loss": 0.0796, + "step": 23111 + }, + { + "epoch": 62.97547683923706, + "grad_norm": 4.305360317230225, + "learning_rate": 6.368349663596123e-06, + "loss": 0.0885, + "step": 23112 + }, + { + "epoch": 62.97820163487739, + "grad_norm": 2.948730707168579, + "learning_rate": 6.367527435574602e-06, + "loss": 0.1264, + "step": 23113 + }, + { + "epoch": 62.98092643051771, + "grad_norm": 3.276205539703369, + "learning_rate": 6.366705235842658e-06, + "loss": 0.0605, + "step": 23114 + }, + { + "epoch": 62.98365122615804, + "grad_norm": 3.5483663082122803, + "learning_rate": 6.365883064406699e-06, + "loss": 0.0799, + "step": 23115 + }, + { + "epoch": 62.986376021798364, + "grad_norm": 3.094501495361328, + "learning_rate": 6.365060921273121e-06, + "loss": 0.0563, + "step": 23116 + }, + { + "epoch": 62.98910081743869, + "grad_norm": 3.6306135654449463, + "learning_rate": 6.364238806448335e-06, + "loss": 0.0665, + "step": 23117 + }, + { + "epoch": 62.991825613079016, + "grad_norm": 4.325113296508789, + "learning_rate": 6.3634167199387405e-06, + "loss": 0.1833, + "step": 23118 + }, + { + "epoch": 62.99455040871935, + "grad_norm": 4.262590408325195, + "learning_rate": 6.362594661750739e-06, + "loss": 0.2229, + "step": 23119 + }, + { + "epoch": 62.997275204359674, + "grad_norm": 4.426522731781006, + "learning_rate": 6.361772631890735e-06, + "loss": 0.0679, + "step": 23120 + }, + { + "epoch": 63.0, + "grad_norm": 3.957909345626831, + "learning_rate": 6.360950630365126e-06, + "loss": 0.0765, + "step": 23121 + }, + { + "epoch": 63.002724795640326, + "grad_norm": 2.1313045024871826, + "learning_rate": 6.360128657180318e-06, + "loss": 0.1728, + "step": 23122 + }, + { + "epoch": 63.00544959128065, + "grad_norm": 4.392509937286377, + "learning_rate": 6.3593067123427096e-06, + "loss": 0.128, + "step": 23123 + }, + { + "epoch": 63.00817438692098, + "grad_norm": 2.8958847522735596, + "learning_rate": 6.358484795858704e-06, + "loss": 0.0489, + "step": 23124 + }, + { + "epoch": 63.01089918256131, + "grad_norm": 3.2617640495300293, + "learning_rate": 6.357662907734701e-06, + "loss": 0.079, + "step": 23125 + }, + { + "epoch": 63.013623978201636, + "grad_norm": 3.2560315132141113, + "learning_rate": 6.356841047977104e-06, + "loss": 0.1265, + "step": 23126 + }, + { + "epoch": 63.01634877384196, + "grad_norm": 3.201209783554077, + "learning_rate": 6.35601921659231e-06, + "loss": 0.0574, + "step": 23127 + }, + { + "epoch": 63.01907356948229, + "grad_norm": 3.6940200328826904, + "learning_rate": 6.355197413586722e-06, + "loss": 0.0563, + "step": 23128 + }, + { + "epoch": 63.02179836512261, + "grad_norm": 3.270508050918579, + "learning_rate": 6.354375638966739e-06, + "loss": 0.0326, + "step": 23129 + }, + { + "epoch": 63.02452316076294, + "grad_norm": 4.936068534851074, + "learning_rate": 6.35355389273876e-06, + "loss": 0.0716, + "step": 23130 + }, + { + "epoch": 63.02724795640327, + "grad_norm": 4.696451187133789, + "learning_rate": 6.352732174909187e-06, + "loss": 0.11, + "step": 23131 + }, + { + "epoch": 63.0299727520436, + "grad_norm": 4.848161697387695, + "learning_rate": 6.351910485484417e-06, + "loss": 0.1006, + "step": 23132 + }, + { + "epoch": 63.032697547683924, + "grad_norm": 4.534578800201416, + "learning_rate": 6.351088824470853e-06, + "loss": 0.0653, + "step": 23133 + }, + { + "epoch": 63.03542234332425, + "grad_norm": 3.329862117767334, + "learning_rate": 6.3502671918748886e-06, + "loss": 0.2054, + "step": 23134 + }, + { + "epoch": 63.038147138964575, + "grad_norm": 2.6438238620758057, + "learning_rate": 6.349445587702927e-06, + "loss": 0.0395, + "step": 23135 + }, + { + "epoch": 63.0408719346049, + "grad_norm": 3.2166786193847656, + "learning_rate": 6.348624011961368e-06, + "loss": 0.0499, + "step": 23136 + }, + { + "epoch": 63.043596730245234, + "grad_norm": 3.3035888671875, + "learning_rate": 6.347802464656605e-06, + "loss": 0.2443, + "step": 23137 + }, + { + "epoch": 63.04632152588556, + "grad_norm": 2.5024590492248535, + "learning_rate": 6.3469809457950406e-06, + "loss": 0.0414, + "step": 23138 + }, + { + "epoch": 63.049046321525886, + "grad_norm": 4.230470657348633, + "learning_rate": 6.346159455383069e-06, + "loss": 0.0729, + "step": 23139 + }, + { + "epoch": 63.05177111716621, + "grad_norm": 3.702749013900757, + "learning_rate": 6.3453379934270945e-06, + "loss": 0.0662, + "step": 23140 + }, + { + "epoch": 63.05449591280654, + "grad_norm": 3.2805144786834717, + "learning_rate": 6.3445165599335044e-06, + "loss": 0.067, + "step": 23141 + }, + { + "epoch": 63.05722070844686, + "grad_norm": 3.6586036682128906, + "learning_rate": 6.343695154908707e-06, + "loss": 0.0644, + "step": 23142 + }, + { + "epoch": 63.059945504087196, + "grad_norm": 3.8456904888153076, + "learning_rate": 6.34287377835909e-06, + "loss": 0.0516, + "step": 23143 + }, + { + "epoch": 63.06267029972752, + "grad_norm": 3.517930746078491, + "learning_rate": 6.342052430291057e-06, + "loss": 0.0473, + "step": 23144 + }, + { + "epoch": 63.06539509536785, + "grad_norm": 2.3302736282348633, + "learning_rate": 6.341231110710999e-06, + "loss": 0.0396, + "step": 23145 + }, + { + "epoch": 63.06811989100817, + "grad_norm": 2.6586661338806152, + "learning_rate": 6.340409819625319e-06, + "loss": 0.0737, + "step": 23146 + }, + { + "epoch": 63.0708446866485, + "grad_norm": 3.8887076377868652, + "learning_rate": 6.339588557040406e-06, + "loss": 0.0706, + "step": 23147 + }, + { + "epoch": 63.073569482288825, + "grad_norm": 3.4590799808502197, + "learning_rate": 6.338767322962662e-06, + "loss": 0.084, + "step": 23148 + }, + { + "epoch": 63.07629427792916, + "grad_norm": 3.049461841583252, + "learning_rate": 6.337946117398479e-06, + "loss": 0.1283, + "step": 23149 + }, + { + "epoch": 63.079019073569484, + "grad_norm": 4.627965927124023, + "learning_rate": 6.3371249403542556e-06, + "loss": 0.0628, + "step": 23150 + }, + { + "epoch": 63.08174386920981, + "grad_norm": 6.178308486938477, + "learning_rate": 6.336303791836379e-06, + "loss": 0.0555, + "step": 23151 + }, + { + "epoch": 63.084468664850135, + "grad_norm": 3.0092344284057617, + "learning_rate": 6.335482671851256e-06, + "loss": 0.0935, + "step": 23152 + }, + { + "epoch": 63.08719346049046, + "grad_norm": 4.038009166717529, + "learning_rate": 6.334661580405274e-06, + "loss": 0.1331, + "step": 23153 + }, + { + "epoch": 63.08991825613079, + "grad_norm": 4.0561089515686035, + "learning_rate": 6.333840517504832e-06, + "loss": 0.0791, + "step": 23154 + }, + { + "epoch": 63.09264305177112, + "grad_norm": 3.6039934158325195, + "learning_rate": 6.333019483156322e-06, + "loss": 0.0545, + "step": 23155 + }, + { + "epoch": 63.095367847411445, + "grad_norm": 5.1222758293151855, + "learning_rate": 6.332198477366138e-06, + "loss": 0.1295, + "step": 23156 + }, + { + "epoch": 63.09809264305177, + "grad_norm": 3.006937026977539, + "learning_rate": 6.331377500140672e-06, + "loss": 0.1013, + "step": 23157 + }, + { + "epoch": 63.1008174386921, + "grad_norm": 2.899261474609375, + "learning_rate": 6.330556551486324e-06, + "loss": 0.0502, + "step": 23158 + }, + { + "epoch": 63.10354223433242, + "grad_norm": 2.8537375926971436, + "learning_rate": 6.329735631409479e-06, + "loss": 0.093, + "step": 23159 + }, + { + "epoch": 63.10626702997275, + "grad_norm": 5.385002613067627, + "learning_rate": 6.328914739916539e-06, + "loss": 0.1324, + "step": 23160 + }, + { + "epoch": 63.10899182561308, + "grad_norm": 3.247054100036621, + "learning_rate": 6.328093877013888e-06, + "loss": 0.0566, + "step": 23161 + }, + { + "epoch": 63.11171662125341, + "grad_norm": 4.962833404541016, + "learning_rate": 6.327273042707929e-06, + "loss": 0.0938, + "step": 23162 + }, + { + "epoch": 63.11444141689373, + "grad_norm": 3.9605371952056885, + "learning_rate": 6.3264522370050455e-06, + "loss": 0.1092, + "step": 23163 + }, + { + "epoch": 63.11716621253406, + "grad_norm": 5.63825798034668, + "learning_rate": 6.325631459911635e-06, + "loss": 0.1948, + "step": 23164 + }, + { + "epoch": 63.119891008174385, + "grad_norm": 8.609911918640137, + "learning_rate": 6.324810711434089e-06, + "loss": 0.0495, + "step": 23165 + }, + { + "epoch": 63.12261580381471, + "grad_norm": 2.54370379447937, + "learning_rate": 6.3239899915787985e-06, + "loss": 0.1144, + "step": 23166 + }, + { + "epoch": 63.12534059945504, + "grad_norm": 3.7156083583831787, + "learning_rate": 6.323169300352155e-06, + "loss": 0.0787, + "step": 23167 + }, + { + "epoch": 63.12806539509537, + "grad_norm": 2.9712140560150146, + "learning_rate": 6.322348637760547e-06, + "loss": 0.083, + "step": 23168 + }, + { + "epoch": 63.130790190735695, + "grad_norm": 3.4311819076538086, + "learning_rate": 6.321528003810375e-06, + "loss": 0.0789, + "step": 23169 + }, + { + "epoch": 63.13351498637602, + "grad_norm": 4.052380084991455, + "learning_rate": 6.320707398508021e-06, + "loss": 0.2009, + "step": 23170 + }, + { + "epoch": 63.13623978201635, + "grad_norm": 3.0860378742218018, + "learning_rate": 6.3198868218598805e-06, + "loss": 0.0515, + "step": 23171 + }, + { + "epoch": 63.13896457765667, + "grad_norm": 3.465501070022583, + "learning_rate": 6.319066273872345e-06, + "loss": 0.0596, + "step": 23172 + }, + { + "epoch": 63.141689373297005, + "grad_norm": 2.6912052631378174, + "learning_rate": 6.318245754551802e-06, + "loss": 0.1229, + "step": 23173 + }, + { + "epoch": 63.14441416893733, + "grad_norm": 4.115647792816162, + "learning_rate": 6.317425263904643e-06, + "loss": 0.288, + "step": 23174 + }, + { + "epoch": 63.14713896457766, + "grad_norm": 3.4655401706695557, + "learning_rate": 6.316604801937256e-06, + "loss": 0.1119, + "step": 23175 + }, + { + "epoch": 63.14986376021798, + "grad_norm": 3.3207101821899414, + "learning_rate": 6.315784368656034e-06, + "loss": 0.1297, + "step": 23176 + }, + { + "epoch": 63.15258855585831, + "grad_norm": 3.8398549556732178, + "learning_rate": 6.314963964067362e-06, + "loss": 0.1018, + "step": 23177 + }, + { + "epoch": 63.155313351498634, + "grad_norm": 2.4407057762145996, + "learning_rate": 6.314143588177636e-06, + "loss": 0.0443, + "step": 23178 + }, + { + "epoch": 63.15803814713897, + "grad_norm": 3.8973379135131836, + "learning_rate": 6.313323240993237e-06, + "loss": 0.1692, + "step": 23179 + }, + { + "epoch": 63.16076294277929, + "grad_norm": 3.2764265537261963, + "learning_rate": 6.312502922520562e-06, + "loss": 0.0479, + "step": 23180 + }, + { + "epoch": 63.16348773841962, + "grad_norm": 3.1338770389556885, + "learning_rate": 6.311682632765992e-06, + "loss": 0.0828, + "step": 23181 + }, + { + "epoch": 63.166212534059945, + "grad_norm": 3.19219708442688, + "learning_rate": 6.310862371735922e-06, + "loss": 0.1193, + "step": 23182 + }, + { + "epoch": 63.16893732970027, + "grad_norm": 2.779780626296997, + "learning_rate": 6.310042139436734e-06, + "loss": 0.0954, + "step": 23183 + }, + { + "epoch": 63.171662125340596, + "grad_norm": 2.7828152179718018, + "learning_rate": 6.309221935874822e-06, + "loss": 0.159, + "step": 23184 + }, + { + "epoch": 63.17438692098093, + "grad_norm": 4.583054542541504, + "learning_rate": 6.308401761056566e-06, + "loss": 0.1784, + "step": 23185 + }, + { + "epoch": 63.177111716621255, + "grad_norm": 4.487547874450684, + "learning_rate": 6.30758161498836e-06, + "loss": 0.056, + "step": 23186 + }, + { + "epoch": 63.17983651226158, + "grad_norm": 2.659743309020996, + "learning_rate": 6.306761497676594e-06, + "loss": 0.0419, + "step": 23187 + }, + { + "epoch": 63.182561307901906, + "grad_norm": 3.0457241535186768, + "learning_rate": 6.305941409127646e-06, + "loss": 0.155, + "step": 23188 + }, + { + "epoch": 63.18528610354223, + "grad_norm": 3.6640207767486572, + "learning_rate": 6.305121349347911e-06, + "loss": 0.1206, + "step": 23189 + }, + { + "epoch": 63.18801089918256, + "grad_norm": 4.56561803817749, + "learning_rate": 6.304301318343768e-06, + "loss": 0.0968, + "step": 23190 + }, + { + "epoch": 63.19073569482289, + "grad_norm": 2.028547763824463, + "learning_rate": 6.303481316121611e-06, + "loss": 0.0346, + "step": 23191 + }, + { + "epoch": 63.19346049046322, + "grad_norm": 2.4169869422912598, + "learning_rate": 6.302661342687822e-06, + "loss": 0.1654, + "step": 23192 + }, + { + "epoch": 63.19618528610354, + "grad_norm": 2.399566888809204, + "learning_rate": 6.3018413980487865e-06, + "loss": 0.0388, + "step": 23193 + }, + { + "epoch": 63.19891008174387, + "grad_norm": 3.032816171646118, + "learning_rate": 6.301021482210889e-06, + "loss": 0.1188, + "step": 23194 + }, + { + "epoch": 63.201634877384194, + "grad_norm": 2.597745895385742, + "learning_rate": 6.30020159518052e-06, + "loss": 0.0819, + "step": 23195 + }, + { + "epoch": 63.20435967302452, + "grad_norm": 4.5145440101623535, + "learning_rate": 6.2993817369640616e-06, + "loss": 0.0866, + "step": 23196 + }, + { + "epoch": 63.20708446866485, + "grad_norm": 2.7119181156158447, + "learning_rate": 6.2985619075678985e-06, + "loss": 0.113, + "step": 23197 + }, + { + "epoch": 63.20980926430518, + "grad_norm": 3.1414027214050293, + "learning_rate": 6.297742106998417e-06, + "loss": 0.0728, + "step": 23198 + }, + { + "epoch": 63.212534059945504, + "grad_norm": 3.252021312713623, + "learning_rate": 6.296922335262e-06, + "loss": 0.0826, + "step": 23199 + }, + { + "epoch": 63.21525885558583, + "grad_norm": 4.101782321929932, + "learning_rate": 6.296102592365035e-06, + "loss": 0.0869, + "step": 23200 + }, + { + "epoch": 63.217983651226156, + "grad_norm": 3.352304697036743, + "learning_rate": 6.2952828783139e-06, + "loss": 0.0724, + "step": 23201 + }, + { + "epoch": 63.22070844686648, + "grad_norm": 3.0583438873291016, + "learning_rate": 6.294463193114982e-06, + "loss": 0.1035, + "step": 23202 + }, + { + "epoch": 63.223433242506815, + "grad_norm": 2.796839714050293, + "learning_rate": 6.293643536774668e-06, + "loss": 0.0969, + "step": 23203 + }, + { + "epoch": 63.22615803814714, + "grad_norm": 4.15037727355957, + "learning_rate": 6.292823909299338e-06, + "loss": 0.1032, + "step": 23204 + }, + { + "epoch": 63.228882833787466, + "grad_norm": 2.8994171619415283, + "learning_rate": 6.2920043106953774e-06, + "loss": 0.0624, + "step": 23205 + }, + { + "epoch": 63.23160762942779, + "grad_norm": 2.9009017944335938, + "learning_rate": 6.291184740969168e-06, + "loss": 0.044, + "step": 23206 + }, + { + "epoch": 63.23433242506812, + "grad_norm": 3.7608728408813477, + "learning_rate": 6.290365200127091e-06, + "loss": 0.0563, + "step": 23207 + }, + { + "epoch": 63.237057220708444, + "grad_norm": 3.7963707447052, + "learning_rate": 6.289545688175531e-06, + "loss": 0.1759, + "step": 23208 + }, + { + "epoch": 63.23978201634878, + "grad_norm": 7.580491065979004, + "learning_rate": 6.2887262051208704e-06, + "loss": 0.1625, + "step": 23209 + }, + { + "epoch": 63.2425068119891, + "grad_norm": 3.113636016845703, + "learning_rate": 6.28790675096949e-06, + "loss": 0.0569, + "step": 23210 + }, + { + "epoch": 63.24523160762943, + "grad_norm": 4.224898338317871, + "learning_rate": 6.287087325727774e-06, + "loss": 0.0839, + "step": 23211 + }, + { + "epoch": 63.247956403269754, + "grad_norm": 3.5268211364746094, + "learning_rate": 6.286267929402099e-06, + "loss": 0.0683, + "step": 23212 + }, + { + "epoch": 63.25068119891008, + "grad_norm": 3.5836639404296875, + "learning_rate": 6.285448561998853e-06, + "loss": 0.0988, + "step": 23213 + }, + { + "epoch": 63.253405994550405, + "grad_norm": 2.8314950466156006, + "learning_rate": 6.284629223524412e-06, + "loss": 0.0655, + "step": 23214 + }, + { + "epoch": 63.25613079019074, + "grad_norm": 2.798389196395874, + "learning_rate": 6.283809913985162e-06, + "loss": 0.143, + "step": 23215 + }, + { + "epoch": 63.258855585831064, + "grad_norm": 3.1230967044830322, + "learning_rate": 6.282990633387477e-06, + "loss": 0.0964, + "step": 23216 + }, + { + "epoch": 63.26158038147139, + "grad_norm": 3.065552234649658, + "learning_rate": 6.282171381737742e-06, + "loss": 0.106, + "step": 23217 + }, + { + "epoch": 63.264305177111716, + "grad_norm": 4.310557842254639, + "learning_rate": 6.281352159042338e-06, + "loss": 0.0504, + "step": 23218 + }, + { + "epoch": 63.26702997275204, + "grad_norm": 3.7876176834106445, + "learning_rate": 6.280532965307643e-06, + "loss": 0.1395, + "step": 23219 + }, + { + "epoch": 63.26975476839237, + "grad_norm": 3.4245898723602295, + "learning_rate": 6.279713800540035e-06, + "loss": 0.1101, + "step": 23220 + }, + { + "epoch": 63.2724795640327, + "grad_norm": 4.20367431640625, + "learning_rate": 6.2788946647459e-06, + "loss": 0.0961, + "step": 23221 + }, + { + "epoch": 63.275204359673026, + "grad_norm": 3.2108347415924072, + "learning_rate": 6.278075557931611e-06, + "loss": 0.0642, + "step": 23222 + }, + { + "epoch": 63.27792915531335, + "grad_norm": 6.693216800689697, + "learning_rate": 6.277256480103553e-06, + "loss": 0.1121, + "step": 23223 + }, + { + "epoch": 63.28065395095368, + "grad_norm": 3.909276247024536, + "learning_rate": 6.276437431268098e-06, + "loss": 0.0429, + "step": 23224 + }, + { + "epoch": 63.283378746594, + "grad_norm": 3.625056028366089, + "learning_rate": 6.275618411431633e-06, + "loss": 0.1419, + "step": 23225 + }, + { + "epoch": 63.28610354223433, + "grad_norm": 3.083132266998291, + "learning_rate": 6.274799420600528e-06, + "loss": 0.0598, + "step": 23226 + }, + { + "epoch": 63.28882833787466, + "grad_norm": 3.109088897705078, + "learning_rate": 6.273980458781168e-06, + "loss": 0.0653, + "step": 23227 + }, + { + "epoch": 63.29155313351499, + "grad_norm": 6.317144870758057, + "learning_rate": 6.273161525979926e-06, + "loss": 0.0505, + "step": 23228 + }, + { + "epoch": 63.294277929155314, + "grad_norm": 4.329389572143555, + "learning_rate": 6.2723426222031845e-06, + "loss": 0.0939, + "step": 23229 + }, + { + "epoch": 63.29700272479564, + "grad_norm": 2.5851826667785645, + "learning_rate": 6.271523747457316e-06, + "loss": 0.0514, + "step": 23230 + }, + { + "epoch": 63.299727520435965, + "grad_norm": 2.7832398414611816, + "learning_rate": 6.270704901748703e-06, + "loss": 0.196, + "step": 23231 + }, + { + "epoch": 63.30245231607629, + "grad_norm": 3.224717378616333, + "learning_rate": 6.269886085083718e-06, + "loss": 0.0691, + "step": 23232 + }, + { + "epoch": 63.305177111716624, + "grad_norm": 2.864311933517456, + "learning_rate": 6.269067297468743e-06, + "loss": 0.056, + "step": 23233 + }, + { + "epoch": 63.30790190735695, + "grad_norm": 3.1728298664093018, + "learning_rate": 6.268248538910149e-06, + "loss": 0.1322, + "step": 23234 + }, + { + "epoch": 63.310626702997276, + "grad_norm": 3.160740852355957, + "learning_rate": 6.267429809414316e-06, + "loss": 0.0515, + "step": 23235 + }, + { + "epoch": 63.3133514986376, + "grad_norm": 2.3517680168151855, + "learning_rate": 6.266611108987619e-06, + "loss": 0.0548, + "step": 23236 + }, + { + "epoch": 63.31607629427793, + "grad_norm": 2.645186185836792, + "learning_rate": 6.265792437636433e-06, + "loss": 0.1263, + "step": 23237 + }, + { + "epoch": 63.31880108991825, + "grad_norm": 4.053886413574219, + "learning_rate": 6.264973795367136e-06, + "loss": 0.2391, + "step": 23238 + }, + { + "epoch": 63.321525885558586, + "grad_norm": 3.03579044342041, + "learning_rate": 6.264155182186105e-06, + "loss": 0.0501, + "step": 23239 + }, + { + "epoch": 63.32425068119891, + "grad_norm": 3.4309818744659424, + "learning_rate": 6.263336598099712e-06, + "loss": 0.0423, + "step": 23240 + }, + { + "epoch": 63.32697547683924, + "grad_norm": 4.73743200302124, + "learning_rate": 6.262518043114336e-06, + "loss": 0.1231, + "step": 23241 + }, + { + "epoch": 63.32970027247956, + "grad_norm": 4.359729290008545, + "learning_rate": 6.261699517236346e-06, + "loss": 0.0983, + "step": 23242 + }, + { + "epoch": 63.33242506811989, + "grad_norm": 4.368567943572998, + "learning_rate": 6.260881020472122e-06, + "loss": 0.1999, + "step": 23243 + }, + { + "epoch": 63.335149863760215, + "grad_norm": 4.852414608001709, + "learning_rate": 6.260062552828035e-06, + "loss": 0.0729, + "step": 23244 + }, + { + "epoch": 63.33787465940055, + "grad_norm": 3.412858724594116, + "learning_rate": 6.259244114310461e-06, + "loss": 0.0379, + "step": 23245 + }, + { + "epoch": 63.34059945504087, + "grad_norm": 2.490328550338745, + "learning_rate": 6.2584257049257724e-06, + "loss": 0.0409, + "step": 23246 + }, + { + "epoch": 63.3433242506812, + "grad_norm": 2.6413326263427734, + "learning_rate": 6.257607324680346e-06, + "loss": 0.0684, + "step": 23247 + }, + { + "epoch": 63.346049046321525, + "grad_norm": 3.239886999130249, + "learning_rate": 6.25678897358055e-06, + "loss": 0.0564, + "step": 23248 + }, + { + "epoch": 63.34877384196185, + "grad_norm": 8.035508155822754, + "learning_rate": 6.255970651632764e-06, + "loss": 0.1955, + "step": 23249 + }, + { + "epoch": 63.35149863760218, + "grad_norm": 3.526515245437622, + "learning_rate": 6.255152358843357e-06, + "loss": 0.0843, + "step": 23250 + }, + { + "epoch": 63.35422343324251, + "grad_norm": 3.029080629348755, + "learning_rate": 6.254334095218704e-06, + "loss": 0.2116, + "step": 23251 + }, + { + "epoch": 63.356948228882835, + "grad_norm": 3.12518572807312, + "learning_rate": 6.253515860765175e-06, + "loss": 0.1754, + "step": 23252 + }, + { + "epoch": 63.35967302452316, + "grad_norm": 4.568018913269043, + "learning_rate": 6.252697655489145e-06, + "loss": 0.1433, + "step": 23253 + }, + { + "epoch": 63.36239782016349, + "grad_norm": 5.089962959289551, + "learning_rate": 6.2518794793969815e-06, + "loss": 0.0689, + "step": 23254 + }, + { + "epoch": 63.36512261580381, + "grad_norm": 3.837120771408081, + "learning_rate": 6.251061332495062e-06, + "loss": 0.1469, + "step": 23255 + }, + { + "epoch": 63.36784741144414, + "grad_norm": 3.126713752746582, + "learning_rate": 6.2502432147897584e-06, + "loss": 0.0976, + "step": 23256 + }, + { + "epoch": 63.37057220708447, + "grad_norm": 2.7455477714538574, + "learning_rate": 6.249425126287439e-06, + "loss": 0.0451, + "step": 23257 + }, + { + "epoch": 63.3732970027248, + "grad_norm": 3.298961877822876, + "learning_rate": 6.248607066994473e-06, + "loss": 0.1045, + "step": 23258 + }, + { + "epoch": 63.37602179836512, + "grad_norm": 3.4833261966705322, + "learning_rate": 6.247789036917238e-06, + "loss": 0.0773, + "step": 23259 + }, + { + "epoch": 63.37874659400545, + "grad_norm": 3.407968044281006, + "learning_rate": 6.246971036062099e-06, + "loss": 0.0694, + "step": 23260 + }, + { + "epoch": 63.381471389645775, + "grad_norm": 3.166114568710327, + "learning_rate": 6.246153064435432e-06, + "loss": 0.0649, + "step": 23261 + }, + { + "epoch": 63.3841961852861, + "grad_norm": 3.347496271133423, + "learning_rate": 6.245335122043601e-06, + "loss": 0.0461, + "step": 23262 + }, + { + "epoch": 63.38692098092643, + "grad_norm": 2.5239617824554443, + "learning_rate": 6.244517208892982e-06, + "loss": 0.0366, + "step": 23263 + }, + { + "epoch": 63.38964577656676, + "grad_norm": 5.172435760498047, + "learning_rate": 6.243699324989941e-06, + "loss": 0.1966, + "step": 23264 + }, + { + "epoch": 63.392370572207085, + "grad_norm": 3.0878472328186035, + "learning_rate": 6.242881470340848e-06, + "loss": 0.1901, + "step": 23265 + }, + { + "epoch": 63.39509536784741, + "grad_norm": 3.729919910430908, + "learning_rate": 6.242063644952072e-06, + "loss": 0.214, + "step": 23266 + }, + { + "epoch": 63.39782016348774, + "grad_norm": 3.1580615043640137, + "learning_rate": 6.241245848829986e-06, + "loss": 0.1801, + "step": 23267 + }, + { + "epoch": 63.40054495912806, + "grad_norm": 4.145963191986084, + "learning_rate": 6.240428081980955e-06, + "loss": 0.0921, + "step": 23268 + }, + { + "epoch": 63.403269754768395, + "grad_norm": 4.048202037811279, + "learning_rate": 6.239610344411351e-06, + "loss": 0.1434, + "step": 23269 + }, + { + "epoch": 63.40599455040872, + "grad_norm": 3.7490174770355225, + "learning_rate": 6.238792636127537e-06, + "loss": 0.0401, + "step": 23270 + }, + { + "epoch": 63.40871934604905, + "grad_norm": 3.656370162963867, + "learning_rate": 6.2379749571358835e-06, + "loss": 0.1079, + "step": 23271 + }, + { + "epoch": 63.41144414168937, + "grad_norm": 2.9822680950164795, + "learning_rate": 6.237157307442765e-06, + "loss": 0.0524, + "step": 23272 + }, + { + "epoch": 63.4141689373297, + "grad_norm": 3.4221558570861816, + "learning_rate": 6.2363396870545425e-06, + "loss": 0.0777, + "step": 23273 + }, + { + "epoch": 63.416893732970024, + "grad_norm": 3.2517075538635254, + "learning_rate": 6.235522095977586e-06, + "loss": 0.043, + "step": 23274 + }, + { + "epoch": 63.41961852861036, + "grad_norm": 4.3678388595581055, + "learning_rate": 6.234704534218261e-06, + "loss": 0.0559, + "step": 23275 + }, + { + "epoch": 63.42234332425068, + "grad_norm": 2.94924259185791, + "learning_rate": 6.233887001782937e-06, + "loss": 0.0751, + "step": 23276 + }, + { + "epoch": 63.42506811989101, + "grad_norm": 3.8434195518493652, + "learning_rate": 6.233069498677979e-06, + "loss": 0.1142, + "step": 23277 + }, + { + "epoch": 63.427792915531334, + "grad_norm": 4.644426345825195, + "learning_rate": 6.232252024909755e-06, + "loss": 0.1899, + "step": 23278 + }, + { + "epoch": 63.43051771117166, + "grad_norm": 3.1543736457824707, + "learning_rate": 6.231434580484631e-06, + "loss": 0.117, + "step": 23279 + }, + { + "epoch": 63.433242506811986, + "grad_norm": 11.50169563293457, + "learning_rate": 6.230617165408974e-06, + "loss": 0.0844, + "step": 23280 + }, + { + "epoch": 63.43596730245232, + "grad_norm": 2.459075450897217, + "learning_rate": 6.229799779689147e-06, + "loss": 0.1937, + "step": 23281 + }, + { + "epoch": 63.438692098092645, + "grad_norm": 3.03531813621521, + "learning_rate": 6.228982423331519e-06, + "loss": 0.0462, + "step": 23282 + }, + { + "epoch": 63.44141689373297, + "grad_norm": 4.1016364097595215, + "learning_rate": 6.228165096342456e-06, + "loss": 0.1717, + "step": 23283 + }, + { + "epoch": 63.444141689373296, + "grad_norm": 3.0312306880950928, + "learning_rate": 6.227347798728319e-06, + "loss": 0.0757, + "step": 23284 + }, + { + "epoch": 63.44686648501362, + "grad_norm": 3.6765177249908447, + "learning_rate": 6.2265305304954796e-06, + "loss": 0.0562, + "step": 23285 + }, + { + "epoch": 63.44959128065395, + "grad_norm": 4.016444206237793, + "learning_rate": 6.225713291650295e-06, + "loss": 0.0948, + "step": 23286 + }, + { + "epoch": 63.45231607629428, + "grad_norm": 2.561192750930786, + "learning_rate": 6.224896082199137e-06, + "loss": 0.0612, + "step": 23287 + }, + { + "epoch": 63.45504087193461, + "grad_norm": 4.448768615722656, + "learning_rate": 6.224078902148365e-06, + "loss": 0.1659, + "step": 23288 + }, + { + "epoch": 63.45776566757493, + "grad_norm": 3.9424736499786377, + "learning_rate": 6.223261751504343e-06, + "loss": 0.0883, + "step": 23289 + }, + { + "epoch": 63.46049046321526, + "grad_norm": 2.7465972900390625, + "learning_rate": 6.222444630273439e-06, + "loss": 0.1047, + "step": 23290 + }, + { + "epoch": 63.463215258855584, + "grad_norm": 3.563305139541626, + "learning_rate": 6.221627538462015e-06, + "loss": 0.1321, + "step": 23291 + }, + { + "epoch": 63.46594005449591, + "grad_norm": 2.556574583053589, + "learning_rate": 6.2208104760764355e-06, + "loss": 0.0486, + "step": 23292 + }, + { + "epoch": 63.46866485013624, + "grad_norm": 3.7904469966888428, + "learning_rate": 6.21999344312306e-06, + "loss": 0.2267, + "step": 23293 + }, + { + "epoch": 63.47138964577657, + "grad_norm": 3.538381576538086, + "learning_rate": 6.219176439608256e-06, + "loss": 0.0865, + "step": 23294 + }, + { + "epoch": 63.474114441416894, + "grad_norm": 5.882189750671387, + "learning_rate": 6.218359465538383e-06, + "loss": 0.1995, + "step": 23295 + }, + { + "epoch": 63.47683923705722, + "grad_norm": 4.156144142150879, + "learning_rate": 6.217542520919806e-06, + "loss": 0.1735, + "step": 23296 + }, + { + "epoch": 63.479564032697546, + "grad_norm": 3.2747654914855957, + "learning_rate": 6.2167256057588845e-06, + "loss": 0.2048, + "step": 23297 + }, + { + "epoch": 63.48228882833787, + "grad_norm": 4.409388065338135, + "learning_rate": 6.215908720061983e-06, + "loss": 0.1567, + "step": 23298 + }, + { + "epoch": 63.485013623978205, + "grad_norm": 3.5134851932525635, + "learning_rate": 6.2150918638354614e-06, + "loss": 0.0733, + "step": 23299 + }, + { + "epoch": 63.48773841961853, + "grad_norm": 2.8112776279449463, + "learning_rate": 6.214275037085685e-06, + "loss": 0.0524, + "step": 23300 + }, + { + "epoch": 63.490463215258856, + "grad_norm": 2.8188395500183105, + "learning_rate": 6.21345823981901e-06, + "loss": 0.1395, + "step": 23301 + }, + { + "epoch": 63.49318801089918, + "grad_norm": 3.1712307929992676, + "learning_rate": 6.212641472041803e-06, + "loss": 0.047, + "step": 23302 + }, + { + "epoch": 63.49591280653951, + "grad_norm": 6.838955879211426, + "learning_rate": 6.211824733760421e-06, + "loss": 0.1084, + "step": 23303 + }, + { + "epoch": 63.49863760217983, + "grad_norm": 9.094196319580078, + "learning_rate": 6.211008024981224e-06, + "loss": 0.0401, + "step": 23304 + }, + { + "epoch": 63.50136239782017, + "grad_norm": 3.0622928142547607, + "learning_rate": 6.210191345710579e-06, + "loss": 0.0586, + "step": 23305 + }, + { + "epoch": 63.50408719346049, + "grad_norm": 2.8008289337158203, + "learning_rate": 6.209374695954835e-06, + "loss": 0.0498, + "step": 23306 + }, + { + "epoch": 63.50681198910082, + "grad_norm": 3.7828431129455566, + "learning_rate": 6.208558075720363e-06, + "loss": 0.1245, + "step": 23307 + }, + { + "epoch": 63.509536784741144, + "grad_norm": 2.386240243911743, + "learning_rate": 6.20774148501352e-06, + "loss": 0.0478, + "step": 23308 + }, + { + "epoch": 63.51226158038147, + "grad_norm": 3.705430030822754, + "learning_rate": 6.206924923840663e-06, + "loss": 0.0741, + "step": 23309 + }, + { + "epoch": 63.514986376021795, + "grad_norm": 4.189337253570557, + "learning_rate": 6.206108392208153e-06, + "loss": 0.1043, + "step": 23310 + }, + { + "epoch": 63.51771117166213, + "grad_norm": 5.269558906555176, + "learning_rate": 6.205291890122348e-06, + "loss": 0.1404, + "step": 23311 + }, + { + "epoch": 63.520435967302454, + "grad_norm": 2.9411356449127197, + "learning_rate": 6.204475417589609e-06, + "loss": 0.0504, + "step": 23312 + }, + { + "epoch": 63.52316076294278, + "grad_norm": 4.213926792144775, + "learning_rate": 6.203658974616291e-06, + "loss": 0.1546, + "step": 23313 + }, + { + "epoch": 63.525885558583106, + "grad_norm": 3.6228363513946533, + "learning_rate": 6.202842561208759e-06, + "loss": 0.0669, + "step": 23314 + }, + { + "epoch": 63.52861035422343, + "grad_norm": 3.2594707012176514, + "learning_rate": 6.2020261773733624e-06, + "loss": 0.1955, + "step": 23315 + }, + { + "epoch": 63.53133514986376, + "grad_norm": 4.12902307510376, + "learning_rate": 6.201209823116466e-06, + "loss": 0.1094, + "step": 23316 + }, + { + "epoch": 63.53405994550409, + "grad_norm": 4.914697647094727, + "learning_rate": 6.200393498444424e-06, + "loss": 0.0828, + "step": 23317 + }, + { + "epoch": 63.536784741144416, + "grad_norm": 3.1628105640411377, + "learning_rate": 6.199577203363597e-06, + "loss": 0.0857, + "step": 23318 + }, + { + "epoch": 63.53950953678474, + "grad_norm": 3.894613742828369, + "learning_rate": 6.198760937880339e-06, + "loss": 0.1076, + "step": 23319 + }, + { + "epoch": 63.54223433242507, + "grad_norm": 7.148128032684326, + "learning_rate": 6.197944702001009e-06, + "loss": 0.106, + "step": 23320 + }, + { + "epoch": 63.54495912806539, + "grad_norm": 2.830425977706909, + "learning_rate": 6.197128495731964e-06, + "loss": 0.089, + "step": 23321 + }, + { + "epoch": 63.54768392370572, + "grad_norm": 3.2133290767669678, + "learning_rate": 6.196312319079558e-06, + "loss": 0.0776, + "step": 23322 + }, + { + "epoch": 63.55040871934605, + "grad_norm": 2.6843209266662598, + "learning_rate": 6.195496172050146e-06, + "loss": 0.1461, + "step": 23323 + }, + { + "epoch": 63.55313351498638, + "grad_norm": 3.6621501445770264, + "learning_rate": 6.194680054650093e-06, + "loss": 0.0686, + "step": 23324 + }, + { + "epoch": 63.555858310626704, + "grad_norm": 3.502528667449951, + "learning_rate": 6.193863966885746e-06, + "loss": 0.0671, + "step": 23325 + }, + { + "epoch": 63.55858310626703, + "grad_norm": 3.7787718772888184, + "learning_rate": 6.193047908763468e-06, + "loss": 0.1247, + "step": 23326 + }, + { + "epoch": 63.561307901907355, + "grad_norm": 4.0733137130737305, + "learning_rate": 6.192231880289605e-06, + "loss": 0.1937, + "step": 23327 + }, + { + "epoch": 63.56403269754768, + "grad_norm": 4.627094745635986, + "learning_rate": 6.191415881470523e-06, + "loss": 0.1104, + "step": 23328 + }, + { + "epoch": 63.566757493188014, + "grad_norm": 4.041052341461182, + "learning_rate": 6.190599912312567e-06, + "loss": 0.0751, + "step": 23329 + }, + { + "epoch": 63.56948228882834, + "grad_norm": 4.6674089431762695, + "learning_rate": 6.189783972822101e-06, + "loss": 0.2169, + "step": 23330 + }, + { + "epoch": 63.572207084468666, + "grad_norm": 3.0642614364624023, + "learning_rate": 6.18896806300547e-06, + "loss": 0.1121, + "step": 23331 + }, + { + "epoch": 63.57493188010899, + "grad_norm": 2.9342877864837646, + "learning_rate": 6.188152182869037e-06, + "loss": 0.052, + "step": 23332 + }, + { + "epoch": 63.57765667574932, + "grad_norm": 7.390470027923584, + "learning_rate": 6.187336332419149e-06, + "loss": 0.0707, + "step": 23333 + }, + { + "epoch": 63.58038147138964, + "grad_norm": 3.899533271789551, + "learning_rate": 6.186520511662167e-06, + "loss": 0.0682, + "step": 23334 + }, + { + "epoch": 63.583106267029976, + "grad_norm": 2.7589640617370605, + "learning_rate": 6.185704720604435e-06, + "loss": 0.0457, + "step": 23335 + }, + { + "epoch": 63.5858310626703, + "grad_norm": 4.35020637512207, + "learning_rate": 6.184888959252317e-06, + "loss": 0.0815, + "step": 23336 + }, + { + "epoch": 63.58855585831063, + "grad_norm": 3.891713857650757, + "learning_rate": 6.184073227612158e-06, + "loss": 0.0616, + "step": 23337 + }, + { + "epoch": 63.59128065395095, + "grad_norm": 3.372689962387085, + "learning_rate": 6.183257525690316e-06, + "loss": 0.1289, + "step": 23338 + }, + { + "epoch": 63.59400544959128, + "grad_norm": 4.840092182159424, + "learning_rate": 6.182441853493139e-06, + "loss": 0.0915, + "step": 23339 + }, + { + "epoch": 63.596730245231605, + "grad_norm": 3.8786606788635254, + "learning_rate": 6.181626211026979e-06, + "loss": 0.1452, + "step": 23340 + }, + { + "epoch": 63.59945504087194, + "grad_norm": 4.334212779998779, + "learning_rate": 6.180810598298197e-06, + "loss": 0.1316, + "step": 23341 + }, + { + "epoch": 63.60217983651226, + "grad_norm": 3.7547287940979004, + "learning_rate": 6.179995015313136e-06, + "loss": 0.0625, + "step": 23342 + }, + { + "epoch": 63.60490463215259, + "grad_norm": 3.1574583053588867, + "learning_rate": 6.1791794620781535e-06, + "loss": 0.0625, + "step": 23343 + }, + { + "epoch": 63.607629427792915, + "grad_norm": 3.161449670791626, + "learning_rate": 6.178363938599596e-06, + "loss": 0.1815, + "step": 23344 + }, + { + "epoch": 63.61035422343324, + "grad_norm": 3.764359712600708, + "learning_rate": 6.1775484448838184e-06, + "loss": 0.0677, + "step": 23345 + }, + { + "epoch": 63.61307901907357, + "grad_norm": 2.69553804397583, + "learning_rate": 6.176732980937171e-06, + "loss": 0.0426, + "step": 23346 + }, + { + "epoch": 63.6158038147139, + "grad_norm": 2.6529035568237305, + "learning_rate": 6.175917546766003e-06, + "loss": 0.0488, + "step": 23347 + }, + { + "epoch": 63.618528610354225, + "grad_norm": 3.1602330207824707, + "learning_rate": 6.175102142376668e-06, + "loss": 0.1056, + "step": 23348 + }, + { + "epoch": 63.62125340599455, + "grad_norm": 3.942868947982788, + "learning_rate": 6.1742867677755115e-06, + "loss": 0.089, + "step": 23349 + }, + { + "epoch": 63.62397820163488, + "grad_norm": 3.5963327884674072, + "learning_rate": 6.173471422968889e-06, + "loss": 0.1397, + "step": 23350 + }, + { + "epoch": 63.6267029972752, + "grad_norm": 3.471452474594116, + "learning_rate": 6.172656107963146e-06, + "loss": 0.0894, + "step": 23351 + }, + { + "epoch": 63.62942779291553, + "grad_norm": 3.224921464920044, + "learning_rate": 6.171840822764636e-06, + "loss": 0.077, + "step": 23352 + }, + { + "epoch": 63.63215258855586, + "grad_norm": 4.43481969833374, + "learning_rate": 6.1710255673797045e-06, + "loss": 0.1299, + "step": 23353 + }, + { + "epoch": 63.63487738419619, + "grad_norm": 3.6068527698516846, + "learning_rate": 6.170210341814705e-06, + "loss": 0.0552, + "step": 23354 + }, + { + "epoch": 63.63760217983651, + "grad_norm": 3.184776782989502, + "learning_rate": 6.169395146075982e-06, + "loss": 0.1718, + "step": 23355 + }, + { + "epoch": 63.64032697547684, + "grad_norm": 3.762660026550293, + "learning_rate": 6.168579980169889e-06, + "loss": 0.1105, + "step": 23356 + }, + { + "epoch": 63.643051771117165, + "grad_norm": 3.6248199939727783, + "learning_rate": 6.167764844102766e-06, + "loss": 0.0953, + "step": 23357 + }, + { + "epoch": 63.64577656675749, + "grad_norm": 3.9380240440368652, + "learning_rate": 6.16694973788097e-06, + "loss": 0.1276, + "step": 23358 + }, + { + "epoch": 63.64850136239782, + "grad_norm": 3.3067786693573, + "learning_rate": 6.166134661510848e-06, + "loss": 0.2126, + "step": 23359 + }, + { + "epoch": 63.65122615803815, + "grad_norm": 3.041841506958008, + "learning_rate": 6.165319614998744e-06, + "loss": 0.0539, + "step": 23360 + }, + { + "epoch": 63.653950953678475, + "grad_norm": 3.897139549255371, + "learning_rate": 6.164504598351009e-06, + "loss": 0.0902, + "step": 23361 + }, + { + "epoch": 63.6566757493188, + "grad_norm": 4.920825004577637, + "learning_rate": 6.1636896115739864e-06, + "loss": 0.119, + "step": 23362 + }, + { + "epoch": 63.65940054495913, + "grad_norm": 5.995110511779785, + "learning_rate": 6.1628746546740295e-06, + "loss": 0.12, + "step": 23363 + }, + { + "epoch": 63.66212534059945, + "grad_norm": 2.7097299098968506, + "learning_rate": 6.162059727657477e-06, + "loss": 0.0461, + "step": 23364 + }, + { + "epoch": 63.664850136239785, + "grad_norm": 3.5396687984466553, + "learning_rate": 6.161244830530684e-06, + "loss": 0.0666, + "step": 23365 + }, + { + "epoch": 63.66757493188011, + "grad_norm": 3.118617057800293, + "learning_rate": 6.1604299632999885e-06, + "loss": 0.076, + "step": 23366 + }, + { + "epoch": 63.67029972752044, + "grad_norm": 2.875271797180176, + "learning_rate": 6.159615125971743e-06, + "loss": 0.0653, + "step": 23367 + }, + { + "epoch": 63.67302452316076, + "grad_norm": 3.1477246284484863, + "learning_rate": 6.158800318552292e-06, + "loss": 0.052, + "step": 23368 + }, + { + "epoch": 63.67574931880109, + "grad_norm": 2.3785343170166016, + "learning_rate": 6.157985541047979e-06, + "loss": 0.0805, + "step": 23369 + }, + { + "epoch": 63.678474114441414, + "grad_norm": 3.3399782180786133, + "learning_rate": 6.157170793465153e-06, + "loss": 0.0467, + "step": 23370 + }, + { + "epoch": 63.68119891008175, + "grad_norm": 3.1951773166656494, + "learning_rate": 6.156356075810154e-06, + "loss": 0.0588, + "step": 23371 + }, + { + "epoch": 63.68392370572207, + "grad_norm": 4.3294291496276855, + "learning_rate": 6.155541388089332e-06, + "loss": 0.0572, + "step": 23372 + }, + { + "epoch": 63.6866485013624, + "grad_norm": 3.3137307167053223, + "learning_rate": 6.15472673030903e-06, + "loss": 0.1471, + "step": 23373 + }, + { + "epoch": 63.689373297002724, + "grad_norm": 4.323788642883301, + "learning_rate": 6.1539121024755935e-06, + "loss": 0.0858, + "step": 23374 + }, + { + "epoch": 63.69209809264305, + "grad_norm": 8.91159439086914, + "learning_rate": 6.153097504595362e-06, + "loss": 0.1609, + "step": 23375 + }, + { + "epoch": 63.694822888283376, + "grad_norm": 3.2635562419891357, + "learning_rate": 6.152282936674685e-06, + "loss": 0.0982, + "step": 23376 + }, + { + "epoch": 63.69754768392371, + "grad_norm": 6.164497375488281, + "learning_rate": 6.151468398719906e-06, + "loss": 0.0945, + "step": 23377 + }, + { + "epoch": 63.700272479564035, + "grad_norm": 3.8145058155059814, + "learning_rate": 6.1506538907373655e-06, + "loss": 0.1023, + "step": 23378 + }, + { + "epoch": 63.70299727520436, + "grad_norm": 8.545085906982422, + "learning_rate": 6.149839412733411e-06, + "loss": 0.1553, + "step": 23379 + }, + { + "epoch": 63.705722070844686, + "grad_norm": 3.8043572902679443, + "learning_rate": 6.149024964714382e-06, + "loss": 0.0795, + "step": 23380 + }, + { + "epoch": 63.70844686648501, + "grad_norm": 5.421295642852783, + "learning_rate": 6.148210546686624e-06, + "loss": 0.1608, + "step": 23381 + }, + { + "epoch": 63.71117166212534, + "grad_norm": 4.151515007019043, + "learning_rate": 6.1473961586564756e-06, + "loss": 0.1208, + "step": 23382 + }, + { + "epoch": 63.71389645776567, + "grad_norm": 3.885204553604126, + "learning_rate": 6.146581800630285e-06, + "loss": 0.05, + "step": 23383 + }, + { + "epoch": 63.716621253406, + "grad_norm": 5.078805923461914, + "learning_rate": 6.145767472614389e-06, + "loss": 0.0525, + "step": 23384 + }, + { + "epoch": 63.71934604904632, + "grad_norm": 13.722284317016602, + "learning_rate": 6.144953174615133e-06, + "loss": 0.1069, + "step": 23385 + }, + { + "epoch": 63.72207084468665, + "grad_norm": 2.9433112144470215, + "learning_rate": 6.1441389066388565e-06, + "loss": 0.0536, + "step": 23386 + }, + { + "epoch": 63.724795640326974, + "grad_norm": 5.2005934715271, + "learning_rate": 6.143324668691904e-06, + "loss": 0.0922, + "step": 23387 + }, + { + "epoch": 63.7275204359673, + "grad_norm": 32.43373107910156, + "learning_rate": 6.142510460780613e-06, + "loss": 0.1307, + "step": 23388 + }, + { + "epoch": 63.73024523160763, + "grad_norm": 3.6497414112091064, + "learning_rate": 6.141696282911328e-06, + "loss": 0.1544, + "step": 23389 + }, + { + "epoch": 63.73297002724796, + "grad_norm": 2.5020391941070557, + "learning_rate": 6.140882135090387e-06, + "loss": 0.0819, + "step": 23390 + }, + { + "epoch": 63.735694822888284, + "grad_norm": 10.11089038848877, + "learning_rate": 6.14006801732413e-06, + "loss": 0.1541, + "step": 23391 + }, + { + "epoch": 63.73841961852861, + "grad_norm": 5.140850067138672, + "learning_rate": 6.139253929618898e-06, + "loss": 0.1014, + "step": 23392 + }, + { + "epoch": 63.741144414168936, + "grad_norm": 3.9001197814941406, + "learning_rate": 6.138439871981037e-06, + "loss": 0.075, + "step": 23393 + }, + { + "epoch": 63.74386920980926, + "grad_norm": 3.613224744796753, + "learning_rate": 6.137625844416879e-06, + "loss": 0.0802, + "step": 23394 + }, + { + "epoch": 63.746594005449595, + "grad_norm": 4.303200721740723, + "learning_rate": 6.136811846932769e-06, + "loss": 0.2148, + "step": 23395 + }, + { + "epoch": 63.74931880108992, + "grad_norm": 3.9668211936950684, + "learning_rate": 6.135997879535042e-06, + "loss": 0.1465, + "step": 23396 + }, + { + "epoch": 63.752043596730246, + "grad_norm": 6.469911098480225, + "learning_rate": 6.135183942230041e-06, + "loss": 0.0962, + "step": 23397 + }, + { + "epoch": 63.75476839237057, + "grad_norm": 2.9736506938934326, + "learning_rate": 6.1343700350241005e-06, + "loss": 0.1374, + "step": 23398 + }, + { + "epoch": 63.7574931880109, + "grad_norm": 4.08699369430542, + "learning_rate": 6.133556157923565e-06, + "loss": 0.2162, + "step": 23399 + }, + { + "epoch": 63.76021798365122, + "grad_norm": 10.112793922424316, + "learning_rate": 6.132742310934767e-06, + "loss": 0.1232, + "step": 23400 + }, + { + "epoch": 63.762942779291556, + "grad_norm": 2.8908116817474365, + "learning_rate": 6.131928494064049e-06, + "loss": 0.063, + "step": 23401 + }, + { + "epoch": 63.76566757493188, + "grad_norm": 3.213243007659912, + "learning_rate": 6.1311147073177455e-06, + "loss": 0.0645, + "step": 23402 + }, + { + "epoch": 63.76839237057221, + "grad_norm": 3.9643075466156006, + "learning_rate": 6.1303009507021995e-06, + "loss": 0.071, + "step": 23403 + }, + { + "epoch": 63.771117166212534, + "grad_norm": 4.139108180999756, + "learning_rate": 6.129487224223741e-06, + "loss": 0.0958, + "step": 23404 + }, + { + "epoch": 63.77384196185286, + "grad_norm": 2.657076835632324, + "learning_rate": 6.128673527888715e-06, + "loss": 0.1464, + "step": 23405 + }, + { + "epoch": 63.776566757493185, + "grad_norm": 4.322707176208496, + "learning_rate": 6.127859861703453e-06, + "loss": 0.0725, + "step": 23406 + }, + { + "epoch": 63.77929155313352, + "grad_norm": 4.337071418762207, + "learning_rate": 6.127046225674294e-06, + "loss": 0.0573, + "step": 23407 + }, + { + "epoch": 63.782016348773844, + "grad_norm": 3.0265305042266846, + "learning_rate": 6.126232619807575e-06, + "loss": 0.089, + "step": 23408 + }, + { + "epoch": 63.78474114441417, + "grad_norm": 4.078360080718994, + "learning_rate": 6.125419044109629e-06, + "loss": 0.1439, + "step": 23409 + }, + { + "epoch": 63.787465940054496, + "grad_norm": 3.665076971054077, + "learning_rate": 6.124605498586796e-06, + "loss": 0.0772, + "step": 23410 + }, + { + "epoch": 63.79019073569482, + "grad_norm": 3.631455183029175, + "learning_rate": 6.123791983245411e-06, + "loss": 0.2251, + "step": 23411 + }, + { + "epoch": 63.79291553133515, + "grad_norm": 4.092085838317871, + "learning_rate": 6.122978498091809e-06, + "loss": 0.1069, + "step": 23412 + }, + { + "epoch": 63.79564032697548, + "grad_norm": 3.549079656600952, + "learning_rate": 6.1221650431323285e-06, + "loss": 0.0529, + "step": 23413 + }, + { + "epoch": 63.798365122615806, + "grad_norm": 4.666623592376709, + "learning_rate": 6.121351618373299e-06, + "loss": 0.1635, + "step": 23414 + }, + { + "epoch": 63.80108991825613, + "grad_norm": 4.067806243896484, + "learning_rate": 6.12053822382106e-06, + "loss": 0.1598, + "step": 23415 + }, + { + "epoch": 63.80381471389646, + "grad_norm": 3.807265520095825, + "learning_rate": 6.119724859481943e-06, + "loss": 0.2297, + "step": 23416 + }, + { + "epoch": 63.80653950953678, + "grad_norm": 5.882267951965332, + "learning_rate": 6.1189115253622855e-06, + "loss": 0.0705, + "step": 23417 + }, + { + "epoch": 63.80926430517711, + "grad_norm": 4.377636909484863, + "learning_rate": 6.118098221468418e-06, + "loss": 0.0788, + "step": 23418 + }, + { + "epoch": 63.81198910081744, + "grad_norm": 4.685329914093018, + "learning_rate": 6.117284947806679e-06, + "loss": 0.1384, + "step": 23419 + }, + { + "epoch": 63.81471389645777, + "grad_norm": 3.047091007232666, + "learning_rate": 6.116471704383397e-06, + "loss": 0.0516, + "step": 23420 + }, + { + "epoch": 63.817438692098094, + "grad_norm": 5.363067626953125, + "learning_rate": 6.1156584912049126e-06, + "loss": 0.1065, + "step": 23421 + }, + { + "epoch": 63.82016348773842, + "grad_norm": 4.223793983459473, + "learning_rate": 6.114845308277551e-06, + "loss": 0.1137, + "step": 23422 + }, + { + "epoch": 63.822888283378745, + "grad_norm": 8.914681434631348, + "learning_rate": 6.114032155607651e-06, + "loss": 0.0651, + "step": 23423 + }, + { + "epoch": 63.82561307901907, + "grad_norm": 4.6169586181640625, + "learning_rate": 6.113219033201543e-06, + "loss": 0.0403, + "step": 23424 + }, + { + "epoch": 63.828337874659404, + "grad_norm": 4.677670955657959, + "learning_rate": 6.11240594106556e-06, + "loss": 0.1227, + "step": 23425 + }, + { + "epoch": 63.83106267029973, + "grad_norm": 4.268988132476807, + "learning_rate": 6.111592879206032e-06, + "loss": 0.0742, + "step": 23426 + }, + { + "epoch": 63.833787465940055, + "grad_norm": 3.756197690963745, + "learning_rate": 6.110779847629295e-06, + "loss": 0.1008, + "step": 23427 + }, + { + "epoch": 63.83651226158038, + "grad_norm": 3.9022650718688965, + "learning_rate": 6.109966846341681e-06, + "loss": 0.1418, + "step": 23428 + }, + { + "epoch": 63.83923705722071, + "grad_norm": 4.158533096313477, + "learning_rate": 6.109153875349518e-06, + "loss": 0.1343, + "step": 23429 + }, + { + "epoch": 63.84196185286103, + "grad_norm": 3.451460838317871, + "learning_rate": 6.1083409346591425e-06, + "loss": 0.1802, + "step": 23430 + }, + { + "epoch": 63.844686648501366, + "grad_norm": 2.8260531425476074, + "learning_rate": 6.1075280242768785e-06, + "loss": 0.0645, + "step": 23431 + }, + { + "epoch": 63.84741144414169, + "grad_norm": 3.1926558017730713, + "learning_rate": 6.106715144209063e-06, + "loss": 0.0895, + "step": 23432 + }, + { + "epoch": 63.85013623978202, + "grad_norm": 2.9613037109375, + "learning_rate": 6.105902294462026e-06, + "loss": 0.0688, + "step": 23433 + }, + { + "epoch": 63.85286103542234, + "grad_norm": 2.9341928958892822, + "learning_rate": 6.105089475042094e-06, + "loss": 0.0531, + "step": 23434 + }, + { + "epoch": 63.85558583106267, + "grad_norm": 3.9897468090057373, + "learning_rate": 6.104276685955603e-06, + "loss": 0.1707, + "step": 23435 + }, + { + "epoch": 63.858310626702995, + "grad_norm": 2.8880317211151123, + "learning_rate": 6.103463927208877e-06, + "loss": 0.1079, + "step": 23436 + }, + { + "epoch": 63.86103542234333, + "grad_norm": 3.641231060028076, + "learning_rate": 6.10265119880825e-06, + "loss": 0.0816, + "step": 23437 + }, + { + "epoch": 63.86376021798365, + "grad_norm": 4.001800537109375, + "learning_rate": 6.101838500760049e-06, + "loss": 0.1587, + "step": 23438 + }, + { + "epoch": 63.86648501362398, + "grad_norm": 3.740647554397583, + "learning_rate": 6.101025833070607e-06, + "loss": 0.0818, + "step": 23439 + }, + { + "epoch": 63.869209809264305, + "grad_norm": 3.308682441711426, + "learning_rate": 6.100213195746246e-06, + "loss": 0.0719, + "step": 23440 + }, + { + "epoch": 63.87193460490463, + "grad_norm": 3.250107765197754, + "learning_rate": 6.099400588793303e-06, + "loss": 0.2026, + "step": 23441 + }, + { + "epoch": 63.87465940054496, + "grad_norm": 3.7879693508148193, + "learning_rate": 6.0985880122181e-06, + "loss": 0.247, + "step": 23442 + }, + { + "epoch": 63.87738419618529, + "grad_norm": 4.270380020141602, + "learning_rate": 6.097775466026966e-06, + "loss": 0.186, + "step": 23443 + }, + { + "epoch": 63.880108991825615, + "grad_norm": 6.7312164306640625, + "learning_rate": 6.096962950226235e-06, + "loss": 0.059, + "step": 23444 + }, + { + "epoch": 63.88283378746594, + "grad_norm": 4.286167621612549, + "learning_rate": 6.096150464822229e-06, + "loss": 0.1302, + "step": 23445 + }, + { + "epoch": 63.88555858310627, + "grad_norm": 3.4437525272369385, + "learning_rate": 6.095338009821279e-06, + "loss": 0.0749, + "step": 23446 + }, + { + "epoch": 63.88828337874659, + "grad_norm": 3.741774559020996, + "learning_rate": 6.09452558522971e-06, + "loss": 0.0961, + "step": 23447 + }, + { + "epoch": 63.89100817438692, + "grad_norm": 4.192138195037842, + "learning_rate": 6.093713191053852e-06, + "loss": 0.1778, + "step": 23448 + }, + { + "epoch": 63.89373297002725, + "grad_norm": 4.225839614868164, + "learning_rate": 6.092900827300028e-06, + "loss": 0.0554, + "step": 23449 + }, + { + "epoch": 63.89645776566758, + "grad_norm": 2.9316306114196777, + "learning_rate": 6.0920884939745675e-06, + "loss": 0.0339, + "step": 23450 + }, + { + "epoch": 63.8991825613079, + "grad_norm": 4.158364295959473, + "learning_rate": 6.091276191083795e-06, + "loss": 0.1724, + "step": 23451 + }, + { + "epoch": 63.90190735694823, + "grad_norm": 2.9727489948272705, + "learning_rate": 6.090463918634039e-06, + "loss": 0.0573, + "step": 23452 + }, + { + "epoch": 63.904632152588555, + "grad_norm": 2.535248279571533, + "learning_rate": 6.089651676631623e-06, + "loss": 0.0386, + "step": 23453 + }, + { + "epoch": 63.90735694822888, + "grad_norm": 3.114696502685547, + "learning_rate": 6.088839465082873e-06, + "loss": 0.3108, + "step": 23454 + }, + { + "epoch": 63.91008174386921, + "grad_norm": 2.4612932205200195, + "learning_rate": 6.088027283994118e-06, + "loss": 0.0494, + "step": 23455 + }, + { + "epoch": 63.91280653950954, + "grad_norm": 2.5667924880981445, + "learning_rate": 6.087215133371678e-06, + "loss": 0.0502, + "step": 23456 + }, + { + "epoch": 63.915531335149865, + "grad_norm": 4.460409164428711, + "learning_rate": 6.086403013221883e-06, + "loss": 0.0899, + "step": 23457 + }, + { + "epoch": 63.91825613079019, + "grad_norm": 3.584872245788574, + "learning_rate": 6.085590923551053e-06, + "loss": 0.1044, + "step": 23458 + }, + { + "epoch": 63.920980926430516, + "grad_norm": 3.301926374435425, + "learning_rate": 6.084778864365517e-06, + "loss": 0.104, + "step": 23459 + }, + { + "epoch": 63.92370572207084, + "grad_norm": 3.8156473636627197, + "learning_rate": 6.083966835671595e-06, + "loss": 0.1698, + "step": 23460 + }, + { + "epoch": 63.926430517711175, + "grad_norm": 3.2632346153259277, + "learning_rate": 6.083154837475613e-06, + "loss": 0.0506, + "step": 23461 + }, + { + "epoch": 63.9291553133515, + "grad_norm": 2.7662084102630615, + "learning_rate": 6.082342869783897e-06, + "loss": 0.1222, + "step": 23462 + }, + { + "epoch": 63.93188010899183, + "grad_norm": 3.916504383087158, + "learning_rate": 6.081530932602768e-06, + "loss": 0.0466, + "step": 23463 + }, + { + "epoch": 63.93460490463215, + "grad_norm": 3.228099822998047, + "learning_rate": 6.0807190259385506e-06, + "loss": 0.0453, + "step": 23464 + }, + { + "epoch": 63.93732970027248, + "grad_norm": 2.837225914001465, + "learning_rate": 6.079907149797567e-06, + "loss": 0.0531, + "step": 23465 + }, + { + "epoch": 63.940054495912804, + "grad_norm": 5.713571071624756, + "learning_rate": 6.079095304186141e-06, + "loss": 0.152, + "step": 23466 + }, + { + "epoch": 63.94277929155314, + "grad_norm": 5.183123588562012, + "learning_rate": 6.078283489110593e-06, + "loss": 0.0838, + "step": 23467 + }, + { + "epoch": 63.94550408719346, + "grad_norm": 4.887022972106934, + "learning_rate": 6.077471704577249e-06, + "loss": 0.0654, + "step": 23468 + }, + { + "epoch": 63.94822888283379, + "grad_norm": 3.4347918033599854, + "learning_rate": 6.076659950592427e-06, + "loss": 0.0449, + "step": 23469 + }, + { + "epoch": 63.950953678474114, + "grad_norm": 3.740933656692505, + "learning_rate": 6.075848227162453e-06, + "loss": 0.0723, + "step": 23470 + }, + { + "epoch": 63.95367847411444, + "grad_norm": 4.064043998718262, + "learning_rate": 6.075036534293646e-06, + "loss": 0.095, + "step": 23471 + }, + { + "epoch": 63.956403269754766, + "grad_norm": 4.198511600494385, + "learning_rate": 6.074224871992329e-06, + "loss": 0.0793, + "step": 23472 + }, + { + "epoch": 63.95912806539509, + "grad_norm": 2.671219825744629, + "learning_rate": 6.0734132402648205e-06, + "loss": 0.22, + "step": 23473 + }, + { + "epoch": 63.961852861035425, + "grad_norm": 3.583232879638672, + "learning_rate": 6.0726016391174435e-06, + "loss": 0.1097, + "step": 23474 + }, + { + "epoch": 63.96457765667575, + "grad_norm": 4.212375640869141, + "learning_rate": 6.071790068556519e-06, + "loss": 0.0852, + "step": 23475 + }, + { + "epoch": 63.967302452316076, + "grad_norm": 3.3939666748046875, + "learning_rate": 6.070978528588369e-06, + "loss": 0.2639, + "step": 23476 + }, + { + "epoch": 63.9700272479564, + "grad_norm": 3.3759117126464844, + "learning_rate": 6.0701670192193085e-06, + "loss": 0.0426, + "step": 23477 + }, + { + "epoch": 63.97275204359673, + "grad_norm": 4.86347770690918, + "learning_rate": 6.06935554045566e-06, + "loss": 0.1106, + "step": 23478 + }, + { + "epoch": 63.97547683923706, + "grad_norm": 4.830080032348633, + "learning_rate": 6.068544092303744e-06, + "loss": 0.0797, + "step": 23479 + }, + { + "epoch": 63.97820163487739, + "grad_norm": 3.3038806915283203, + "learning_rate": 6.067732674769884e-06, + "loss": 0.0478, + "step": 23480 + }, + { + "epoch": 63.98092643051771, + "grad_norm": 3.3870160579681396, + "learning_rate": 6.0669212878603925e-06, + "loss": 0.047, + "step": 23481 + }, + { + "epoch": 63.98365122615804, + "grad_norm": 3.249441623687744, + "learning_rate": 6.066109931581594e-06, + "loss": 0.1047, + "step": 23482 + }, + { + "epoch": 63.986376021798364, + "grad_norm": 3.0960967540740967, + "learning_rate": 6.065298605939803e-06, + "loss": 0.0614, + "step": 23483 + }, + { + "epoch": 63.98910081743869, + "grad_norm": 4.144088268280029, + "learning_rate": 6.064487310941341e-06, + "loss": 0.1204, + "step": 23484 + }, + { + "epoch": 63.991825613079016, + "grad_norm": 3.5295004844665527, + "learning_rate": 6.063676046592523e-06, + "loss": 0.0812, + "step": 23485 + }, + { + "epoch": 63.99455040871935, + "grad_norm": 4.128300666809082, + "learning_rate": 6.062864812899672e-06, + "loss": 0.0623, + "step": 23486 + }, + { + "epoch": 63.997275204359674, + "grad_norm": 4.500547409057617, + "learning_rate": 6.0620536098690995e-06, + "loss": 0.1733, + "step": 23487 + }, + { + "epoch": 64.0, + "grad_norm": 2.8028404712677, + "learning_rate": 6.061242437507131e-06, + "loss": 0.097, + "step": 23488 + }, + { + "epoch": 64.00272479564033, + "grad_norm": 3.697244644165039, + "learning_rate": 6.0604312958200754e-06, + "loss": 0.1127, + "step": 23489 + }, + { + "epoch": 64.00544959128065, + "grad_norm": 2.81890869140625, + "learning_rate": 6.059620184814258e-06, + "loss": 0.0508, + "step": 23490 + }, + { + "epoch": 64.00817438692098, + "grad_norm": 4.149252414703369, + "learning_rate": 6.058809104495988e-06, + "loss": 0.1435, + "step": 23491 + }, + { + "epoch": 64.0108991825613, + "grad_norm": 4.215442657470703, + "learning_rate": 6.05799805487159e-06, + "loss": 0.1213, + "step": 23492 + }, + { + "epoch": 64.01362397820164, + "grad_norm": 5.0310845375061035, + "learning_rate": 6.057187035947373e-06, + "loss": 0.0664, + "step": 23493 + }, + { + "epoch": 64.01634877384195, + "grad_norm": 4.0117316246032715, + "learning_rate": 6.056376047729658e-06, + "loss": 0.057, + "step": 23494 + }, + { + "epoch": 64.01907356948229, + "grad_norm": 4.201609134674072, + "learning_rate": 6.055565090224756e-06, + "loss": 0.0598, + "step": 23495 + }, + { + "epoch": 64.02179836512262, + "grad_norm": 2.948737382888794, + "learning_rate": 6.054754163438989e-06, + "loss": 0.1505, + "step": 23496 + }, + { + "epoch": 64.02452316076294, + "grad_norm": 3.196985960006714, + "learning_rate": 6.053943267378668e-06, + "loss": 0.0358, + "step": 23497 + }, + { + "epoch": 64.02724795640327, + "grad_norm": 3.8606789112091064, + "learning_rate": 6.053132402050112e-06, + "loss": 0.1597, + "step": 23498 + }, + { + "epoch": 64.02997275204359, + "grad_norm": 2.8317203521728516, + "learning_rate": 6.052321567459634e-06, + "loss": 0.0381, + "step": 23499 + }, + { + "epoch": 64.03269754768392, + "grad_norm": 3.4053215980529785, + "learning_rate": 6.051510763613548e-06, + "loss": 0.1608, + "step": 23500 + }, + { + "epoch": 64.03542234332426, + "grad_norm": 2.6956491470336914, + "learning_rate": 6.0506999905181696e-06, + "loss": 0.066, + "step": 23501 + }, + { + "epoch": 64.03814713896458, + "grad_norm": 3.694140672683716, + "learning_rate": 6.049889248179812e-06, + "loss": 0.0862, + "step": 23502 + }, + { + "epoch": 64.04087193460491, + "grad_norm": 4.136013031005859, + "learning_rate": 6.049078536604789e-06, + "loss": 0.0517, + "step": 23503 + }, + { + "epoch": 64.04359673024523, + "grad_norm": 3.58744215965271, + "learning_rate": 6.048267855799417e-06, + "loss": 0.1088, + "step": 23504 + }, + { + "epoch": 64.04632152588556, + "grad_norm": 5.858720302581787, + "learning_rate": 6.047457205770006e-06, + "loss": 0.1104, + "step": 23505 + }, + { + "epoch": 64.04904632152588, + "grad_norm": 4.341165542602539, + "learning_rate": 6.046646586522873e-06, + "loss": 0.0937, + "step": 23506 + }, + { + "epoch": 64.05177111716621, + "grad_norm": 3.494215250015259, + "learning_rate": 6.045835998064326e-06, + "loss": 0.0948, + "step": 23507 + }, + { + "epoch": 64.05449591280654, + "grad_norm": 4.5636444091796875, + "learning_rate": 6.045025440400684e-06, + "loss": 0.0909, + "step": 23508 + }, + { + "epoch": 64.05722070844686, + "grad_norm": 3.3840458393096924, + "learning_rate": 6.044214913538255e-06, + "loss": 0.0815, + "step": 23509 + }, + { + "epoch": 64.0599455040872, + "grad_norm": 4.306269645690918, + "learning_rate": 6.043404417483356e-06, + "loss": 0.0694, + "step": 23510 + }, + { + "epoch": 64.06267029972751, + "grad_norm": 4.181427478790283, + "learning_rate": 6.0425939522422926e-06, + "loss": 0.0867, + "step": 23511 + }, + { + "epoch": 64.06539509536785, + "grad_norm": 4.496644496917725, + "learning_rate": 6.041783517821378e-06, + "loss": 0.0971, + "step": 23512 + }, + { + "epoch": 64.06811989100818, + "grad_norm": 2.958178997039795, + "learning_rate": 6.040973114226929e-06, + "loss": 0.0444, + "step": 23513 + }, + { + "epoch": 64.0708446866485, + "grad_norm": 2.571974277496338, + "learning_rate": 6.0401627414652545e-06, + "loss": 0.2193, + "step": 23514 + }, + { + "epoch": 64.07356948228883, + "grad_norm": 4.502200603485107, + "learning_rate": 6.039352399542665e-06, + "loss": 0.0657, + "step": 23515 + }, + { + "epoch": 64.07629427792915, + "grad_norm": 3.3185508251190186, + "learning_rate": 6.03854208846547e-06, + "loss": 0.0551, + "step": 23516 + }, + { + "epoch": 64.07901907356948, + "grad_norm": 3.644416093826294, + "learning_rate": 6.037731808239984e-06, + "loss": 0.0602, + "step": 23517 + }, + { + "epoch": 64.0817438692098, + "grad_norm": 3.460526466369629, + "learning_rate": 6.036921558872513e-06, + "loss": 0.0653, + "step": 23518 + }, + { + "epoch": 64.08446866485014, + "grad_norm": 4.2937703132629395, + "learning_rate": 6.03611134036937e-06, + "loss": 0.2086, + "step": 23519 + }, + { + "epoch": 64.08719346049047, + "grad_norm": 3.382347822189331, + "learning_rate": 6.035301152736866e-06, + "loss": 0.0655, + "step": 23520 + }, + { + "epoch": 64.08991825613079, + "grad_norm": 4.8122053146362305, + "learning_rate": 6.0344909959813055e-06, + "loss": 0.134, + "step": 23521 + }, + { + "epoch": 64.09264305177112, + "grad_norm": 8.842113494873047, + "learning_rate": 6.033680870109005e-06, + "loss": 0.0767, + "step": 23522 + }, + { + "epoch": 64.09536784741144, + "grad_norm": 4.6074628829956055, + "learning_rate": 6.032870775126268e-06, + "loss": 0.0574, + "step": 23523 + }, + { + "epoch": 64.09809264305177, + "grad_norm": 2.9115238189697266, + "learning_rate": 6.032060711039408e-06, + "loss": 0.0374, + "step": 23524 + }, + { + "epoch": 64.1008174386921, + "grad_norm": 4.844232082366943, + "learning_rate": 6.03125067785473e-06, + "loss": 0.1889, + "step": 23525 + }, + { + "epoch": 64.10354223433242, + "grad_norm": 3.5602612495422363, + "learning_rate": 6.030440675578544e-06, + "loss": 0.2008, + "step": 23526 + }, + { + "epoch": 64.10626702997276, + "grad_norm": 11.935846328735352, + "learning_rate": 6.0296307042171575e-06, + "loss": 0.1966, + "step": 23527 + }, + { + "epoch": 64.10899182561307, + "grad_norm": 3.367767572402954, + "learning_rate": 6.0288207637768815e-06, + "loss": 0.0498, + "step": 23528 + }, + { + "epoch": 64.11171662125341, + "grad_norm": 4.081257343292236, + "learning_rate": 6.028010854264017e-06, + "loss": 0.113, + "step": 23529 + }, + { + "epoch": 64.11444141689373, + "grad_norm": 3.3737878799438477, + "learning_rate": 6.027200975684879e-06, + "loss": 0.075, + "step": 23530 + }, + { + "epoch": 64.11716621253406, + "grad_norm": 3.344336748123169, + "learning_rate": 6.026391128045773e-06, + "loss": 0.1097, + "step": 23531 + }, + { + "epoch": 64.11989100817439, + "grad_norm": 4.564388751983643, + "learning_rate": 6.0255813113530036e-06, + "loss": 0.1994, + "step": 23532 + }, + { + "epoch": 64.12261580381471, + "grad_norm": 5.7605085372924805, + "learning_rate": 6.02477152561288e-06, + "loss": 0.0787, + "step": 23533 + }, + { + "epoch": 64.12534059945504, + "grad_norm": 4.184399604797363, + "learning_rate": 6.023961770831708e-06, + "loss": 0.2097, + "step": 23534 + }, + { + "epoch": 64.12806539509536, + "grad_norm": 4.196770668029785, + "learning_rate": 6.023152047015794e-06, + "loss": 0.0756, + "step": 23535 + }, + { + "epoch": 64.1307901907357, + "grad_norm": 4.043728351593018, + "learning_rate": 6.022342354171442e-06, + "loss": 0.1195, + "step": 23536 + }, + { + "epoch": 64.13351498637603, + "grad_norm": 3.506322145462036, + "learning_rate": 6.021532692304962e-06, + "loss": 0.0915, + "step": 23537 + }, + { + "epoch": 64.13623978201635, + "grad_norm": 3.506742477416992, + "learning_rate": 6.020723061422655e-06, + "loss": 0.0478, + "step": 23538 + }, + { + "epoch": 64.13896457765668, + "grad_norm": 3.656735420227051, + "learning_rate": 6.019913461530831e-06, + "loss": 0.0684, + "step": 23539 + }, + { + "epoch": 64.141689373297, + "grad_norm": 4.760861873626709, + "learning_rate": 6.019103892635791e-06, + "loss": 0.2306, + "step": 23540 + }, + { + "epoch": 64.14441416893733, + "grad_norm": 9.18626880645752, + "learning_rate": 6.018294354743842e-06, + "loss": 0.1383, + "step": 23541 + }, + { + "epoch": 64.14713896457765, + "grad_norm": 4.248356819152832, + "learning_rate": 6.01748484786129e-06, + "loss": 0.0574, + "step": 23542 + }, + { + "epoch": 64.14986376021798, + "grad_norm": 8.526737213134766, + "learning_rate": 6.016675371994436e-06, + "loss": 0.0503, + "step": 23543 + }, + { + "epoch": 64.15258855585832, + "grad_norm": 4.397159099578857, + "learning_rate": 6.015865927149588e-06, + "loss": 0.0593, + "step": 23544 + }, + { + "epoch": 64.15531335149863, + "grad_norm": 4.602883338928223, + "learning_rate": 6.015056513333046e-06, + "loss": 0.0727, + "step": 23545 + }, + { + "epoch": 64.15803814713897, + "grad_norm": 4.110457420349121, + "learning_rate": 6.014247130551117e-06, + "loss": 0.1262, + "step": 23546 + }, + { + "epoch": 64.16076294277929, + "grad_norm": 5.497186183929443, + "learning_rate": 6.013437778810101e-06, + "loss": 0.1247, + "step": 23547 + }, + { + "epoch": 64.16348773841962, + "grad_norm": 3.1408705711364746, + "learning_rate": 6.012628458116303e-06, + "loss": 0.0833, + "step": 23548 + }, + { + "epoch": 64.16621253405995, + "grad_norm": 3.999343156814575, + "learning_rate": 6.011819168476028e-06, + "loss": 0.2633, + "step": 23549 + }, + { + "epoch": 64.16893732970027, + "grad_norm": 3.464352607727051, + "learning_rate": 6.011009909895576e-06, + "loss": 0.0944, + "step": 23550 + }, + { + "epoch": 64.1716621253406, + "grad_norm": 2.916966438293457, + "learning_rate": 6.010200682381253e-06, + "loss": 0.0702, + "step": 23551 + }, + { + "epoch": 64.17438692098092, + "grad_norm": 4.517367362976074, + "learning_rate": 6.009391485939355e-06, + "loss": 0.0854, + "step": 23552 + }, + { + "epoch": 64.17711171662125, + "grad_norm": 3.6340513229370117, + "learning_rate": 6.008582320576191e-06, + "loss": 0.0675, + "step": 23553 + }, + { + "epoch": 64.17983651226157, + "grad_norm": 3.23189377784729, + "learning_rate": 6.0077731862980584e-06, + "loss": 0.0867, + "step": 23554 + }, + { + "epoch": 64.1825613079019, + "grad_norm": 5.061977863311768, + "learning_rate": 6.00696408311126e-06, + "loss": 0.0566, + "step": 23555 + }, + { + "epoch": 64.18528610354224, + "grad_norm": 4.160363674163818, + "learning_rate": 6.0061550110220954e-06, + "loss": 0.1581, + "step": 23556 + }, + { + "epoch": 64.18801089918256, + "grad_norm": 2.9718129634857178, + "learning_rate": 6.005345970036868e-06, + "loss": 0.0473, + "step": 23557 + }, + { + "epoch": 64.19073569482289, + "grad_norm": 3.0926907062530518, + "learning_rate": 6.004536960161877e-06, + "loss": 0.1364, + "step": 23558 + }, + { + "epoch": 64.19346049046321, + "grad_norm": 3.834367036819458, + "learning_rate": 6.003727981403427e-06, + "loss": 0.0651, + "step": 23559 + }, + { + "epoch": 64.19618528610354, + "grad_norm": 3.2685959339141846, + "learning_rate": 6.0029190337678104e-06, + "loss": 0.0539, + "step": 23560 + }, + { + "epoch": 64.19891008174388, + "grad_norm": 4.632725715637207, + "learning_rate": 6.002110117261334e-06, + "loss": 0.3755, + "step": 23561 + }, + { + "epoch": 64.2016348773842, + "grad_norm": 2.591708183288574, + "learning_rate": 6.001301231890293e-06, + "loss": 0.044, + "step": 23562 + }, + { + "epoch": 64.20435967302453, + "grad_norm": 4.842454433441162, + "learning_rate": 6.0004923776609925e-06, + "loss": 0.1532, + "step": 23563 + }, + { + "epoch": 64.20708446866485, + "grad_norm": 4.658775806427002, + "learning_rate": 5.999683554579723e-06, + "loss": 0.0782, + "step": 23564 + }, + { + "epoch": 64.20980926430518, + "grad_norm": 5.350197792053223, + "learning_rate": 5.998874762652793e-06, + "loss": 0.1631, + "step": 23565 + }, + { + "epoch": 64.2125340599455, + "grad_norm": 5.568068027496338, + "learning_rate": 5.998066001886498e-06, + "loss": 0.1451, + "step": 23566 + }, + { + "epoch": 64.21525885558583, + "grad_norm": 5.235050678253174, + "learning_rate": 5.997257272287136e-06, + "loss": 0.0705, + "step": 23567 + }, + { + "epoch": 64.21798365122616, + "grad_norm": 2.4079315662384033, + "learning_rate": 5.9964485738610045e-06, + "loss": 0.1124, + "step": 23568 + }, + { + "epoch": 64.22070844686648, + "grad_norm": 4.350709438323975, + "learning_rate": 5.995639906614406e-06, + "loss": 0.0596, + "step": 23569 + }, + { + "epoch": 64.22343324250681, + "grad_norm": 2.903782606124878, + "learning_rate": 5.994831270553632e-06, + "loss": 0.0631, + "step": 23570 + }, + { + "epoch": 64.22615803814713, + "grad_norm": 2.8252782821655273, + "learning_rate": 5.994022665684985e-06, + "loss": 0.0819, + "step": 23571 + }, + { + "epoch": 64.22888283378747, + "grad_norm": 3.7527451515197754, + "learning_rate": 5.993214092014758e-06, + "loss": 0.073, + "step": 23572 + }, + { + "epoch": 64.2316076294278, + "grad_norm": 2.4014880657196045, + "learning_rate": 5.992405549549253e-06, + "loss": 0.0374, + "step": 23573 + }, + { + "epoch": 64.23433242506812, + "grad_norm": 3.990499258041382, + "learning_rate": 5.991597038294763e-06, + "loss": 0.0882, + "step": 23574 + }, + { + "epoch": 64.23705722070845, + "grad_norm": 3.87880277633667, + "learning_rate": 5.9907885582575875e-06, + "loss": 0.1614, + "step": 23575 + }, + { + "epoch": 64.23978201634877, + "grad_norm": 15.022882461547852, + "learning_rate": 5.989980109444021e-06, + "loss": 0.114, + "step": 23576 + }, + { + "epoch": 64.2425068119891, + "grad_norm": 7.59397029876709, + "learning_rate": 5.98917169186036e-06, + "loss": 0.1435, + "step": 23577 + }, + { + "epoch": 64.24523160762942, + "grad_norm": 3.6357462406158447, + "learning_rate": 5.988363305512901e-06, + "loss": 0.0959, + "step": 23578 + }, + { + "epoch": 64.24795640326975, + "grad_norm": 3.291400194168091, + "learning_rate": 5.987554950407941e-06, + "loss": 0.0752, + "step": 23579 + }, + { + "epoch": 64.25068119891009, + "grad_norm": 3.1410319805145264, + "learning_rate": 5.986746626551772e-06, + "loss": 0.0426, + "step": 23580 + }, + { + "epoch": 64.2534059945504, + "grad_norm": 3.742543935775757, + "learning_rate": 5.985938333950689e-06, + "loss": 0.0794, + "step": 23581 + }, + { + "epoch": 64.25613079019074, + "grad_norm": 4.182135105133057, + "learning_rate": 5.985130072610993e-06, + "loss": 0.171, + "step": 23582 + }, + { + "epoch": 64.25885558583106, + "grad_norm": 3.4071569442749023, + "learning_rate": 5.984321842538973e-06, + "loss": 0.0514, + "step": 23583 + }, + { + "epoch": 64.26158038147139, + "grad_norm": 4.205199241638184, + "learning_rate": 5.9835136437409235e-06, + "loss": 0.151, + "step": 23584 + }, + { + "epoch": 64.26430517711172, + "grad_norm": 3.668665885925293, + "learning_rate": 5.982705476223145e-06, + "loss": 0.0614, + "step": 23585 + }, + { + "epoch": 64.26702997275204, + "grad_norm": 4.014118194580078, + "learning_rate": 5.981897339991923e-06, + "loss": 0.0442, + "step": 23586 + }, + { + "epoch": 64.26975476839237, + "grad_norm": 4.413239002227783, + "learning_rate": 5.981089235053559e-06, + "loss": 0.0809, + "step": 23587 + }, + { + "epoch": 64.2724795640327, + "grad_norm": 3.7972803115844727, + "learning_rate": 5.980281161414339e-06, + "loss": 0.0749, + "step": 23588 + }, + { + "epoch": 64.27520435967303, + "grad_norm": 2.0995733737945557, + "learning_rate": 5.9794731190805635e-06, + "loss": 0.1192, + "step": 23589 + }, + { + "epoch": 64.27792915531334, + "grad_norm": 2.1572067737579346, + "learning_rate": 5.978665108058519e-06, + "loss": 0.1144, + "step": 23590 + }, + { + "epoch": 64.28065395095368, + "grad_norm": 3.133448362350464, + "learning_rate": 5.977857128354503e-06, + "loss": 0.0576, + "step": 23591 + }, + { + "epoch": 64.28337874659401, + "grad_norm": 3.8053882122039795, + "learning_rate": 5.977049179974804e-06, + "loss": 0.1044, + "step": 23592 + }, + { + "epoch": 64.28610354223433, + "grad_norm": 3.0806984901428223, + "learning_rate": 5.976241262925719e-06, + "loss": 0.0541, + "step": 23593 + }, + { + "epoch": 64.28882833787466, + "grad_norm": 3.3876729011535645, + "learning_rate": 5.975433377213537e-06, + "loss": 0.075, + "step": 23594 + }, + { + "epoch": 64.29155313351498, + "grad_norm": 3.0282328128814697, + "learning_rate": 5.974625522844551e-06, + "loss": 0.1608, + "step": 23595 + }, + { + "epoch": 64.29427792915531, + "grad_norm": 3.436739444732666, + "learning_rate": 5.9738176998250484e-06, + "loss": 0.1862, + "step": 23596 + }, + { + "epoch": 64.29700272479565, + "grad_norm": 3.1355998516082764, + "learning_rate": 5.973009908161328e-06, + "loss": 0.0927, + "step": 23597 + }, + { + "epoch": 64.29972752043597, + "grad_norm": 3.6452877521514893, + "learning_rate": 5.972202147859671e-06, + "loss": 0.0777, + "step": 23598 + }, + { + "epoch": 64.3024523160763, + "grad_norm": 3.05553936958313, + "learning_rate": 5.971394418926379e-06, + "loss": 0.1025, + "step": 23599 + }, + { + "epoch": 64.30517711171662, + "grad_norm": 4.310255527496338, + "learning_rate": 5.970586721367737e-06, + "loss": 0.1987, + "step": 23600 + }, + { + "epoch": 64.30790190735695, + "grad_norm": 3.7769877910614014, + "learning_rate": 5.969779055190035e-06, + "loss": 0.0601, + "step": 23601 + }, + { + "epoch": 64.31062670299727, + "grad_norm": 3.2985124588012695, + "learning_rate": 5.968971420399565e-06, + "loss": 0.054, + "step": 23602 + }, + { + "epoch": 64.3133514986376, + "grad_norm": 2.882575750350952, + "learning_rate": 5.968163817002616e-06, + "loss": 0.0957, + "step": 23603 + }, + { + "epoch": 64.31607629427793, + "grad_norm": 3.0860962867736816, + "learning_rate": 5.967356245005478e-06, + "loss": 0.0546, + "step": 23604 + }, + { + "epoch": 64.31880108991825, + "grad_norm": 2.7559969425201416, + "learning_rate": 5.966548704414436e-06, + "loss": 0.0598, + "step": 23605 + }, + { + "epoch": 64.32152588555859, + "grad_norm": 3.6411938667297363, + "learning_rate": 5.965741195235786e-06, + "loss": 0.0511, + "step": 23606 + }, + { + "epoch": 64.3242506811989, + "grad_norm": 3.7164576053619385, + "learning_rate": 5.964933717475814e-06, + "loss": 0.1375, + "step": 23607 + }, + { + "epoch": 64.32697547683924, + "grad_norm": 2.882533073425293, + "learning_rate": 5.964126271140807e-06, + "loss": 0.1998, + "step": 23608 + }, + { + "epoch": 64.32970027247957, + "grad_norm": 4.589282512664795, + "learning_rate": 5.963318856237057e-06, + "loss": 0.194, + "step": 23609 + }, + { + "epoch": 64.33242506811989, + "grad_norm": 3.3938426971435547, + "learning_rate": 5.962511472770847e-06, + "loss": 0.0724, + "step": 23610 + }, + { + "epoch": 64.33514986376022, + "grad_norm": 4.910046100616455, + "learning_rate": 5.96170412074847e-06, + "loss": 0.1615, + "step": 23611 + }, + { + "epoch": 64.33787465940054, + "grad_norm": 4.328702449798584, + "learning_rate": 5.96089680017621e-06, + "loss": 0.1349, + "step": 23612 + }, + { + "epoch": 64.34059945504087, + "grad_norm": 3.49149751663208, + "learning_rate": 5.960089511060357e-06, + "loss": 0.3481, + "step": 23613 + }, + { + "epoch": 64.34332425068119, + "grad_norm": 3.5896120071411133, + "learning_rate": 5.959282253407195e-06, + "loss": 0.1556, + "step": 23614 + }, + { + "epoch": 64.34604904632153, + "grad_norm": 3.272707939147949, + "learning_rate": 5.958475027223009e-06, + "loss": 0.0618, + "step": 23615 + }, + { + "epoch": 64.34877384196186, + "grad_norm": 2.840674877166748, + "learning_rate": 5.9576678325140956e-06, + "loss": 0.0625, + "step": 23616 + }, + { + "epoch": 64.35149863760218, + "grad_norm": 5.62224817276001, + "learning_rate": 5.9568606692867325e-06, + "loss": 0.0908, + "step": 23617 + }, + { + "epoch": 64.35422343324251, + "grad_norm": 4.2583417892456055, + "learning_rate": 5.95605353754721e-06, + "loss": 0.1116, + "step": 23618 + }, + { + "epoch": 64.35694822888283, + "grad_norm": 2.7511730194091797, + "learning_rate": 5.955246437301811e-06, + "loss": 0.302, + "step": 23619 + }, + { + "epoch": 64.35967302452316, + "grad_norm": 4.065578937530518, + "learning_rate": 5.954439368556826e-06, + "loss": 0.0696, + "step": 23620 + }, + { + "epoch": 64.3623978201635, + "grad_norm": 3.425901412963867, + "learning_rate": 5.953632331318533e-06, + "loss": 0.0741, + "step": 23621 + }, + { + "epoch": 64.36512261580381, + "grad_norm": 3.6608924865722656, + "learning_rate": 5.952825325593223e-06, + "loss": 0.066, + "step": 23622 + }, + { + "epoch": 64.36784741144415, + "grad_norm": 3.296431541442871, + "learning_rate": 5.952018351387178e-06, + "loss": 0.1276, + "step": 23623 + }, + { + "epoch": 64.37057220708446, + "grad_norm": 3.9703187942504883, + "learning_rate": 5.951211408706685e-06, + "loss": 0.0704, + "step": 23624 + }, + { + "epoch": 64.3732970027248, + "grad_norm": 3.351677417755127, + "learning_rate": 5.9504044975580265e-06, + "loss": 0.1034, + "step": 23625 + }, + { + "epoch": 64.37602179836512, + "grad_norm": 4.483058452606201, + "learning_rate": 5.9495976179474876e-06, + "loss": 0.049, + "step": 23626 + }, + { + "epoch": 64.37874659400545, + "grad_norm": 2.7362608909606934, + "learning_rate": 5.948790769881352e-06, + "loss": 0.1589, + "step": 23627 + }, + { + "epoch": 64.38147138964578, + "grad_norm": 2.8398773670196533, + "learning_rate": 5.947983953365902e-06, + "loss": 0.0986, + "step": 23628 + }, + { + "epoch": 64.3841961852861, + "grad_norm": 11.262439727783203, + "learning_rate": 5.947177168407425e-06, + "loss": 0.0562, + "step": 23629 + }, + { + "epoch": 64.38692098092643, + "grad_norm": 5.799773693084717, + "learning_rate": 5.9463704150122e-06, + "loss": 0.1101, + "step": 23630 + }, + { + "epoch": 64.38964577656675, + "grad_norm": 4.184062957763672, + "learning_rate": 5.945563693186514e-06, + "loss": 0.1407, + "step": 23631 + }, + { + "epoch": 64.39237057220708, + "grad_norm": 3.3891074657440186, + "learning_rate": 5.9447570029366456e-06, + "loss": 0.128, + "step": 23632 + }, + { + "epoch": 64.39509536784742, + "grad_norm": 4.880205154418945, + "learning_rate": 5.943950344268876e-06, + "loss": 0.2385, + "step": 23633 + }, + { + "epoch": 64.39782016348774, + "grad_norm": 2.8757264614105225, + "learning_rate": 5.943143717189495e-06, + "loss": 0.0491, + "step": 23634 + }, + { + "epoch": 64.40054495912807, + "grad_norm": 3.768073797225952, + "learning_rate": 5.942337121704779e-06, + "loss": 0.2386, + "step": 23635 + }, + { + "epoch": 64.40326975476839, + "grad_norm": 3.859701156616211, + "learning_rate": 5.941530557821012e-06, + "loss": 0.2186, + "step": 23636 + }, + { + "epoch": 64.40599455040872, + "grad_norm": 2.6606013774871826, + "learning_rate": 5.940724025544473e-06, + "loss": 0.0503, + "step": 23637 + }, + { + "epoch": 64.40871934604904, + "grad_norm": 2.6012561321258545, + "learning_rate": 5.939917524881446e-06, + "loss": 0.0692, + "step": 23638 + }, + { + "epoch": 64.41144414168937, + "grad_norm": 3.684028387069702, + "learning_rate": 5.939111055838209e-06, + "loss": 0.1585, + "step": 23639 + }, + { + "epoch": 64.4141689373297, + "grad_norm": 4.496323585510254, + "learning_rate": 5.9383046184210465e-06, + "loss": 0.1435, + "step": 23640 + }, + { + "epoch": 64.41689373297002, + "grad_norm": 4.281190395355225, + "learning_rate": 5.937498212636235e-06, + "loss": 0.1141, + "step": 23641 + }, + { + "epoch": 64.41961852861036, + "grad_norm": 3.095984935760498, + "learning_rate": 5.936691838490058e-06, + "loss": 0.1678, + "step": 23642 + }, + { + "epoch": 64.42234332425068, + "grad_norm": 4.5127129554748535, + "learning_rate": 5.935885495988794e-06, + "loss": 0.0855, + "step": 23643 + }, + { + "epoch": 64.42506811989101, + "grad_norm": 2.6886441707611084, + "learning_rate": 5.935079185138722e-06, + "loss": 0.0443, + "step": 23644 + }, + { + "epoch": 64.42779291553134, + "grad_norm": 3.247974395751953, + "learning_rate": 5.934272905946123e-06, + "loss": 0.0949, + "step": 23645 + }, + { + "epoch": 64.43051771117166, + "grad_norm": 3.4779772758483887, + "learning_rate": 5.933466658417277e-06, + "loss": 0.0816, + "step": 23646 + }, + { + "epoch": 64.433242506812, + "grad_norm": 4.464017868041992, + "learning_rate": 5.932660442558459e-06, + "loss": 0.0907, + "step": 23647 + }, + { + "epoch": 64.43596730245231, + "grad_norm": 4.169822692871094, + "learning_rate": 5.931854258375953e-06, + "loss": 0.1062, + "step": 23648 + }, + { + "epoch": 64.43869209809264, + "grad_norm": 2.2529373168945312, + "learning_rate": 5.931048105876034e-06, + "loss": 0.0909, + "step": 23649 + }, + { + "epoch": 64.44141689373296, + "grad_norm": 5.601505279541016, + "learning_rate": 5.930241985064978e-06, + "loss": 0.1398, + "step": 23650 + }, + { + "epoch": 64.4441416893733, + "grad_norm": 3.7766969203948975, + "learning_rate": 5.92943589594907e-06, + "loss": 0.0856, + "step": 23651 + }, + { + "epoch": 64.44686648501363, + "grad_norm": 8.199073791503906, + "learning_rate": 5.928629838534586e-06, + "loss": 0.1029, + "step": 23652 + }, + { + "epoch": 64.44959128065395, + "grad_norm": 4.182126998901367, + "learning_rate": 5.9278238128277975e-06, + "loss": 0.0928, + "step": 23653 + }, + { + "epoch": 64.45231607629428, + "grad_norm": 5.7247443199157715, + "learning_rate": 5.92701781883499e-06, + "loss": 0.0868, + "step": 23654 + }, + { + "epoch": 64.4550408719346, + "grad_norm": 4.4931206703186035, + "learning_rate": 5.926211856562434e-06, + "loss": 0.0469, + "step": 23655 + }, + { + "epoch": 64.45776566757493, + "grad_norm": 3.3259570598602295, + "learning_rate": 5.925405926016412e-06, + "loss": 0.0708, + "step": 23656 + }, + { + "epoch": 64.46049046321527, + "grad_norm": 3.7143845558166504, + "learning_rate": 5.924600027203194e-06, + "loss": 0.0705, + "step": 23657 + }, + { + "epoch": 64.46321525885558, + "grad_norm": 4.819847583770752, + "learning_rate": 5.923794160129064e-06, + "loss": 0.0793, + "step": 23658 + }, + { + "epoch": 64.46594005449592, + "grad_norm": 3.607992649078369, + "learning_rate": 5.92298832480029e-06, + "loss": 0.055, + "step": 23659 + }, + { + "epoch": 64.46866485013624, + "grad_norm": 4.808532238006592, + "learning_rate": 5.9221825212231545e-06, + "loss": 0.1354, + "step": 23660 + }, + { + "epoch": 64.47138964577657, + "grad_norm": 5.646035671234131, + "learning_rate": 5.921376749403928e-06, + "loss": 0.168, + "step": 23661 + }, + { + "epoch": 64.47411444141689, + "grad_norm": 3.122415781021118, + "learning_rate": 5.92057100934889e-06, + "loss": 0.0751, + "step": 23662 + }, + { + "epoch": 64.47683923705722, + "grad_norm": 3.0227866172790527, + "learning_rate": 5.919765301064311e-06, + "loss": 0.0569, + "step": 23663 + }, + { + "epoch": 64.47956403269755, + "grad_norm": 3.958361864089966, + "learning_rate": 5.9189596245564715e-06, + "loss": 0.0974, + "step": 23664 + }, + { + "epoch": 64.48228882833787, + "grad_norm": 2.760798215866089, + "learning_rate": 5.918153979831641e-06, + "loss": 0.0459, + "step": 23665 + }, + { + "epoch": 64.4850136239782, + "grad_norm": 4.043485164642334, + "learning_rate": 5.917348366896099e-06, + "loss": 0.0965, + "step": 23666 + }, + { + "epoch": 64.48773841961852, + "grad_norm": 3.1446847915649414, + "learning_rate": 5.9165427857561096e-06, + "loss": 0.0407, + "step": 23667 + }, + { + "epoch": 64.49046321525886, + "grad_norm": 2.5701584815979004, + "learning_rate": 5.915737236417957e-06, + "loss": 0.049, + "step": 23668 + }, + { + "epoch": 64.49318801089919, + "grad_norm": 6.109796047210693, + "learning_rate": 5.914931718887915e-06, + "loss": 0.1148, + "step": 23669 + }, + { + "epoch": 64.49591280653951, + "grad_norm": 3.7845213413238525, + "learning_rate": 5.9141262331722505e-06, + "loss": 0.0693, + "step": 23670 + }, + { + "epoch": 64.49863760217984, + "grad_norm": 2.7459239959716797, + "learning_rate": 5.913320779277239e-06, + "loss": 0.0453, + "step": 23671 + }, + { + "epoch": 64.50136239782016, + "grad_norm": 3.674323320388794, + "learning_rate": 5.912515357209154e-06, + "loss": 0.0809, + "step": 23672 + }, + { + "epoch": 64.50408719346049, + "grad_norm": 13.672555923461914, + "learning_rate": 5.911709966974269e-06, + "loss": 0.1282, + "step": 23673 + }, + { + "epoch": 64.50681198910081, + "grad_norm": 4.414234638214111, + "learning_rate": 5.910904608578855e-06, + "loss": 0.083, + "step": 23674 + }, + { + "epoch": 64.50953678474114, + "grad_norm": 3.071168899536133, + "learning_rate": 5.910099282029182e-06, + "loss": 0.1563, + "step": 23675 + }, + { + "epoch": 64.51226158038148, + "grad_norm": 3.6425254344940186, + "learning_rate": 5.909293987331528e-06, + "loss": 0.1284, + "step": 23676 + }, + { + "epoch": 64.5149863760218, + "grad_norm": 4.040872097015381, + "learning_rate": 5.908488724492157e-06, + "loss": 0.0854, + "step": 23677 + }, + { + "epoch": 64.51771117166213, + "grad_norm": 3.6724729537963867, + "learning_rate": 5.907683493517348e-06, + "loss": 0.1106, + "step": 23678 + }, + { + "epoch": 64.52043596730245, + "grad_norm": 4.090834140777588, + "learning_rate": 5.906878294413365e-06, + "loss": 0.1218, + "step": 23679 + }, + { + "epoch": 64.52316076294278, + "grad_norm": 3.1486189365386963, + "learning_rate": 5.906073127186485e-06, + "loss": 0.0427, + "step": 23680 + }, + { + "epoch": 64.52588555858311, + "grad_norm": 3.0365872383117676, + "learning_rate": 5.905267991842972e-06, + "loss": 0.0673, + "step": 23681 + }, + { + "epoch": 64.52861035422343, + "grad_norm": 5.883402347564697, + "learning_rate": 5.904462888389104e-06, + "loss": 0.1758, + "step": 23682 + }, + { + "epoch": 64.53133514986376, + "grad_norm": 4.505124092102051, + "learning_rate": 5.903657816831143e-06, + "loss": 0.0527, + "step": 23683 + }, + { + "epoch": 64.53405994550408, + "grad_norm": 4.534233570098877, + "learning_rate": 5.902852777175363e-06, + "loss": 0.1013, + "step": 23684 + }, + { + "epoch": 64.53678474114442, + "grad_norm": 3.4307634830474854, + "learning_rate": 5.9020477694280375e-06, + "loss": 0.0566, + "step": 23685 + }, + { + "epoch": 64.53950953678473, + "grad_norm": 3.6816563606262207, + "learning_rate": 5.9012427935954295e-06, + "loss": 0.1486, + "step": 23686 + }, + { + "epoch": 64.54223433242507, + "grad_norm": 4.910661220550537, + "learning_rate": 5.900437849683813e-06, + "loss": 0.0868, + "step": 23687 + }, + { + "epoch": 64.5449591280654, + "grad_norm": 4.9586310386657715, + "learning_rate": 5.899632937699453e-06, + "loss": 0.0842, + "step": 23688 + }, + { + "epoch": 64.54768392370572, + "grad_norm": 5.120810508728027, + "learning_rate": 5.89882805764862e-06, + "loss": 0.0779, + "step": 23689 + }, + { + "epoch": 64.55040871934605, + "grad_norm": 3.6106836795806885, + "learning_rate": 5.898023209537582e-06, + "loss": 0.1112, + "step": 23690 + }, + { + "epoch": 64.55313351498637, + "grad_norm": 4.148248672485352, + "learning_rate": 5.897218393372609e-06, + "loss": 0.0957, + "step": 23691 + }, + { + "epoch": 64.5558583106267, + "grad_norm": 6.041697025299072, + "learning_rate": 5.896413609159964e-06, + "loss": 0.0736, + "step": 23692 + }, + { + "epoch": 64.55858310626704, + "grad_norm": 5.618400573730469, + "learning_rate": 5.8956088569059185e-06, + "loss": 0.0865, + "step": 23693 + }, + { + "epoch": 64.56130790190736, + "grad_norm": 3.0874156951904297, + "learning_rate": 5.89480413661674e-06, + "loss": 0.0391, + "step": 23694 + }, + { + "epoch": 64.56403269754769, + "grad_norm": 3.1987128257751465, + "learning_rate": 5.893999448298695e-06, + "loss": 0.149, + "step": 23695 + }, + { + "epoch": 64.566757493188, + "grad_norm": 3.7000083923339844, + "learning_rate": 5.893194791958051e-06, + "loss": 0.059, + "step": 23696 + }, + { + "epoch": 64.56948228882834, + "grad_norm": 3.5692005157470703, + "learning_rate": 5.892390167601072e-06, + "loss": 0.0889, + "step": 23697 + }, + { + "epoch": 64.57220708446866, + "grad_norm": 4.626175403594971, + "learning_rate": 5.891585575234028e-06, + "loss": 0.0917, + "step": 23698 + }, + { + "epoch": 64.57493188010899, + "grad_norm": 3.606637477874756, + "learning_rate": 5.89078101486318e-06, + "loss": 0.0576, + "step": 23699 + }, + { + "epoch": 64.57765667574932, + "grad_norm": 3.872769355773926, + "learning_rate": 5.889976486494802e-06, + "loss": 0.0773, + "step": 23700 + }, + { + "epoch": 64.58038147138964, + "grad_norm": 2.6828160285949707, + "learning_rate": 5.889171990135149e-06, + "loss": 0.0369, + "step": 23701 + }, + { + "epoch": 64.58310626702998, + "grad_norm": 4.715063095092773, + "learning_rate": 5.8883675257904936e-06, + "loss": 0.0663, + "step": 23702 + }, + { + "epoch": 64.5858310626703, + "grad_norm": 4.230589389801025, + "learning_rate": 5.887563093467103e-06, + "loss": 0.1712, + "step": 23703 + }, + { + "epoch": 64.58855585831063, + "grad_norm": 3.561528444290161, + "learning_rate": 5.886758693171236e-06, + "loss": 0.0678, + "step": 23704 + }, + { + "epoch": 64.59128065395096, + "grad_norm": 2.2918155193328857, + "learning_rate": 5.885954324909162e-06, + "loss": 0.0359, + "step": 23705 + }, + { + "epoch": 64.59400544959128, + "grad_norm": 3.7067036628723145, + "learning_rate": 5.885149988687141e-06, + "loss": 0.1517, + "step": 23706 + }, + { + "epoch": 64.59673024523161, + "grad_norm": 3.9828476905822754, + "learning_rate": 5.8843456845114426e-06, + "loss": 0.0573, + "step": 23707 + }, + { + "epoch": 64.59945504087193, + "grad_norm": 2.729644775390625, + "learning_rate": 5.883541412388325e-06, + "loss": 0.0392, + "step": 23708 + }, + { + "epoch": 64.60217983651226, + "grad_norm": 3.2439920902252197, + "learning_rate": 5.8827371723240555e-06, + "loss": 0.0729, + "step": 23709 + }, + { + "epoch": 64.60490463215258, + "grad_norm": 2.972121000289917, + "learning_rate": 5.881932964324895e-06, + "loss": 0.0569, + "step": 23710 + }, + { + "epoch": 64.60762942779292, + "grad_norm": 3.8448119163513184, + "learning_rate": 5.88112878839711e-06, + "loss": 0.0483, + "step": 23711 + }, + { + "epoch": 64.61035422343325, + "grad_norm": 3.6391313076019287, + "learning_rate": 5.88032464454696e-06, + "loss": 0.0694, + "step": 23712 + }, + { + "epoch": 64.61307901907357, + "grad_norm": 7.126327037811279, + "learning_rate": 5.879520532780709e-06, + "loss": 0.1552, + "step": 23713 + }, + { + "epoch": 64.6158038147139, + "grad_norm": 2.7950947284698486, + "learning_rate": 5.87871645310462e-06, + "loss": 0.0911, + "step": 23714 + }, + { + "epoch": 64.61852861035422, + "grad_norm": 2.5468971729278564, + "learning_rate": 5.877912405524954e-06, + "loss": 0.0395, + "step": 23715 + }, + { + "epoch": 64.62125340599455, + "grad_norm": 4.573666095733643, + "learning_rate": 5.8771083900479744e-06, + "loss": 0.1448, + "step": 23716 + }, + { + "epoch": 64.62397820163488, + "grad_norm": 3.492250680923462, + "learning_rate": 5.876304406679941e-06, + "loss": 0.0556, + "step": 23717 + }, + { + "epoch": 64.6267029972752, + "grad_norm": 12.995576858520508, + "learning_rate": 5.875500455427119e-06, + "loss": 0.1026, + "step": 23718 + }, + { + "epoch": 64.62942779291554, + "grad_norm": 3.482884168624878, + "learning_rate": 5.874696536295761e-06, + "loss": 0.0827, + "step": 23719 + }, + { + "epoch": 64.63215258855585, + "grad_norm": 3.9052515029907227, + "learning_rate": 5.873892649292136e-06, + "loss": 0.0709, + "step": 23720 + }, + { + "epoch": 64.63487738419619, + "grad_norm": 2.956522226333618, + "learning_rate": 5.873088794422505e-06, + "loss": 0.0453, + "step": 23721 + }, + { + "epoch": 64.6376021798365, + "grad_norm": 3.4227848052978516, + "learning_rate": 5.872284971693123e-06, + "loss": 0.061, + "step": 23722 + }, + { + "epoch": 64.64032697547684, + "grad_norm": 2.823970317840576, + "learning_rate": 5.871481181110255e-06, + "loss": 0.0748, + "step": 23723 + }, + { + "epoch": 64.64305177111717, + "grad_norm": 3.349766731262207, + "learning_rate": 5.870677422680156e-06, + "loss": 0.0453, + "step": 23724 + }, + { + "epoch": 64.64577656675749, + "grad_norm": 4.023482799530029, + "learning_rate": 5.8698736964090904e-06, + "loss": 0.096, + "step": 23725 + }, + { + "epoch": 64.64850136239782, + "grad_norm": 3.8858907222747803, + "learning_rate": 5.8690700023033145e-06, + "loss": 0.1997, + "step": 23726 + }, + { + "epoch": 64.65122615803814, + "grad_norm": 3.495682954788208, + "learning_rate": 5.86826634036909e-06, + "loss": 0.0511, + "step": 23727 + }, + { + "epoch": 64.65395095367847, + "grad_norm": 4.163297176361084, + "learning_rate": 5.867462710612672e-06, + "loss": 0.0771, + "step": 23728 + }, + { + "epoch": 64.65667574931881, + "grad_norm": 3.787161111831665, + "learning_rate": 5.866659113040324e-06, + "loss": 0.2429, + "step": 23729 + }, + { + "epoch": 64.65940054495913, + "grad_norm": 4.401248455047607, + "learning_rate": 5.8658555476582994e-06, + "loss": 0.1871, + "step": 23730 + }, + { + "epoch": 64.66212534059946, + "grad_norm": 3.2518022060394287, + "learning_rate": 5.865052014472861e-06, + "loss": 0.0604, + "step": 23731 + }, + { + "epoch": 64.66485013623978, + "grad_norm": 3.5951952934265137, + "learning_rate": 5.8642485134902625e-06, + "loss": 0.0658, + "step": 23732 + }, + { + "epoch": 64.66757493188011, + "grad_norm": 2.5962295532226562, + "learning_rate": 5.863445044716764e-06, + "loss": 0.0431, + "step": 23733 + }, + { + "epoch": 64.67029972752043, + "grad_norm": 2.7388525009155273, + "learning_rate": 5.862641608158623e-06, + "loss": 0.0415, + "step": 23734 + }, + { + "epoch": 64.67302452316076, + "grad_norm": 2.9878427982330322, + "learning_rate": 5.861838203822096e-06, + "loss": 0.0564, + "step": 23735 + }, + { + "epoch": 64.6757493188011, + "grad_norm": 3.394355297088623, + "learning_rate": 5.861034831713435e-06, + "loss": 0.0978, + "step": 23736 + }, + { + "epoch": 64.67847411444141, + "grad_norm": 2.9823338985443115, + "learning_rate": 5.860231491838906e-06, + "loss": 0.084, + "step": 23737 + }, + { + "epoch": 64.68119891008175, + "grad_norm": 2.810248851776123, + "learning_rate": 5.859428184204761e-06, + "loss": 0.2109, + "step": 23738 + }, + { + "epoch": 64.68392370572207, + "grad_norm": 3.4153311252593994, + "learning_rate": 5.858624908817257e-06, + "loss": 0.092, + "step": 23739 + }, + { + "epoch": 64.6866485013624, + "grad_norm": 4.189194679260254, + "learning_rate": 5.857821665682646e-06, + "loss": 0.1303, + "step": 23740 + }, + { + "epoch": 64.68937329700273, + "grad_norm": 3.2839243412017822, + "learning_rate": 5.857018454807189e-06, + "loss": 0.041, + "step": 23741 + }, + { + "epoch": 64.69209809264305, + "grad_norm": 4.326436996459961, + "learning_rate": 5.856215276197137e-06, + "loss": 0.1038, + "step": 23742 + }, + { + "epoch": 64.69482288828338, + "grad_norm": 4.688022613525391, + "learning_rate": 5.855412129858749e-06, + "loss": 0.1052, + "step": 23743 + }, + { + "epoch": 64.6975476839237, + "grad_norm": 3.6603691577911377, + "learning_rate": 5.854609015798277e-06, + "loss": 0.0609, + "step": 23744 + }, + { + "epoch": 64.70027247956403, + "grad_norm": 3.4955921173095703, + "learning_rate": 5.8538059340219774e-06, + "loss": 0.0596, + "step": 23745 + }, + { + "epoch": 64.70299727520435, + "grad_norm": 3.845290184020996, + "learning_rate": 5.853002884536103e-06, + "loss": 0.0873, + "step": 23746 + }, + { + "epoch": 64.70572207084469, + "grad_norm": 3.763108968734741, + "learning_rate": 5.852199867346909e-06, + "loss": 0.1474, + "step": 23747 + }, + { + "epoch": 64.70844686648502, + "grad_norm": 4.986370086669922, + "learning_rate": 5.851396882460648e-06, + "loss": 0.2225, + "step": 23748 + }, + { + "epoch": 64.71117166212534, + "grad_norm": 3.1233103275299072, + "learning_rate": 5.850593929883577e-06, + "loss": 0.076, + "step": 23749 + }, + { + "epoch": 64.71389645776567, + "grad_norm": 4.560542583465576, + "learning_rate": 5.8497910096219435e-06, + "loss": 0.1405, + "step": 23750 + }, + { + "epoch": 64.71662125340599, + "grad_norm": 3.0604021549224854, + "learning_rate": 5.848988121682006e-06, + "loss": 0.0767, + "step": 23751 + }, + { + "epoch": 64.71934604904632, + "grad_norm": 23.736257553100586, + "learning_rate": 5.848185266070016e-06, + "loss": 0.1333, + "step": 23752 + }, + { + "epoch": 64.72207084468666, + "grad_norm": 4.732005596160889, + "learning_rate": 5.847382442792222e-06, + "loss": 0.0737, + "step": 23753 + }, + { + "epoch": 64.72479564032697, + "grad_norm": 3.6705281734466553, + "learning_rate": 5.8465796518548824e-06, + "loss": 0.0856, + "step": 23754 + }, + { + "epoch": 64.7275204359673, + "grad_norm": 3.666384220123291, + "learning_rate": 5.845776893264247e-06, + "loss": 0.1425, + "step": 23755 + }, + { + "epoch": 64.73024523160763, + "grad_norm": 4.7612175941467285, + "learning_rate": 5.844974167026567e-06, + "loss": 0.1459, + "step": 23756 + }, + { + "epoch": 64.73297002724796, + "grad_norm": 3.4738609790802, + "learning_rate": 5.8441714731480944e-06, + "loss": 0.2016, + "step": 23757 + }, + { + "epoch": 64.73569482288828, + "grad_norm": 4.037792682647705, + "learning_rate": 5.843368811635081e-06, + "loss": 0.0613, + "step": 23758 + }, + { + "epoch": 64.73841961852861, + "grad_norm": 3.863607406616211, + "learning_rate": 5.842566182493779e-06, + "loss": 0.1571, + "step": 23759 + }, + { + "epoch": 64.74114441416894, + "grad_norm": 3.6390492916107178, + "learning_rate": 5.8417635857304355e-06, + "loss": 0.2208, + "step": 23760 + }, + { + "epoch": 64.74386920980926, + "grad_norm": 2.9504313468933105, + "learning_rate": 5.840961021351305e-06, + "loss": 0.1737, + "step": 23761 + }, + { + "epoch": 64.7465940054496, + "grad_norm": 4.13885498046875, + "learning_rate": 5.840158489362635e-06, + "loss": 0.0879, + "step": 23762 + }, + { + "epoch": 64.74931880108991, + "grad_norm": 3.5123114585876465, + "learning_rate": 5.839355989770678e-06, + "loss": 0.0843, + "step": 23763 + }, + { + "epoch": 64.75204359673025, + "grad_norm": 3.2950191497802734, + "learning_rate": 5.8385535225816805e-06, + "loss": 0.0929, + "step": 23764 + }, + { + "epoch": 64.75476839237058, + "grad_norm": 3.906742572784424, + "learning_rate": 5.8377510878018975e-06, + "loss": 0.0736, + "step": 23765 + }, + { + "epoch": 64.7574931880109, + "grad_norm": 2.814589500427246, + "learning_rate": 5.836948685437573e-06, + "loss": 0.0522, + "step": 23766 + }, + { + "epoch": 64.76021798365123, + "grad_norm": 12.155994415283203, + "learning_rate": 5.836146315494956e-06, + "loss": 0.0752, + "step": 23767 + }, + { + "epoch": 64.76294277929155, + "grad_norm": 3.8262643814086914, + "learning_rate": 5.835343977980301e-06, + "loss": 0.1724, + "step": 23768 + }, + { + "epoch": 64.76566757493188, + "grad_norm": 5.280486106872559, + "learning_rate": 5.834541672899852e-06, + "loss": 0.1184, + "step": 23769 + }, + { + "epoch": 64.7683923705722, + "grad_norm": 5.157360076904297, + "learning_rate": 5.8337394002598565e-06, + "loss": 0.0717, + "step": 23770 + }, + { + "epoch": 64.77111716621253, + "grad_norm": 2.7944915294647217, + "learning_rate": 5.832937160066567e-06, + "loss": 0.1283, + "step": 23771 + }, + { + "epoch": 64.77384196185287, + "grad_norm": 4.003580570220947, + "learning_rate": 5.832134952326225e-06, + "loss": 0.0931, + "step": 23772 + }, + { + "epoch": 64.77656675749319, + "grad_norm": 5.369149208068848, + "learning_rate": 5.831332777045087e-06, + "loss": 0.0656, + "step": 23773 + }, + { + "epoch": 64.77929155313352, + "grad_norm": 4.331752777099609, + "learning_rate": 5.830530634229393e-06, + "loss": 0.0937, + "step": 23774 + }, + { + "epoch": 64.78201634877384, + "grad_norm": 4.510578155517578, + "learning_rate": 5.829728523885394e-06, + "loss": 0.2126, + "step": 23775 + }, + { + "epoch": 64.78474114441417, + "grad_norm": 3.1642606258392334, + "learning_rate": 5.82892644601933e-06, + "loss": 0.0441, + "step": 23776 + }, + { + "epoch": 64.7874659400545, + "grad_norm": 3.814603805541992, + "learning_rate": 5.828124400637456e-06, + "loss": 0.0558, + "step": 23777 + }, + { + "epoch": 64.79019073569482, + "grad_norm": 3.7792811393737793, + "learning_rate": 5.827322387746018e-06, + "loss": 0.1459, + "step": 23778 + }, + { + "epoch": 64.79291553133515, + "grad_norm": 2.392956256866455, + "learning_rate": 5.826520407351252e-06, + "loss": 0.0369, + "step": 23779 + }, + { + "epoch": 64.79564032697547, + "grad_norm": 4.206678867340088, + "learning_rate": 5.8257184594594155e-06, + "loss": 0.0805, + "step": 23780 + }, + { + "epoch": 64.7983651226158, + "grad_norm": 3.7099359035491943, + "learning_rate": 5.824916544076749e-06, + "loss": 0.0595, + "step": 23781 + }, + { + "epoch": 64.80108991825612, + "grad_norm": 3.81819486618042, + "learning_rate": 5.824114661209498e-06, + "loss": 0.1998, + "step": 23782 + }, + { + "epoch": 64.80381471389646, + "grad_norm": 2.6584384441375732, + "learning_rate": 5.823312810863904e-06, + "loss": 0.0494, + "step": 23783 + }, + { + "epoch": 64.80653950953679, + "grad_norm": 5.343811511993408, + "learning_rate": 5.82251099304622e-06, + "loss": 0.0862, + "step": 23784 + }, + { + "epoch": 64.80926430517711, + "grad_norm": 3.189709424972534, + "learning_rate": 5.821709207762684e-06, + "loss": 0.0693, + "step": 23785 + }, + { + "epoch": 64.81198910081744, + "grad_norm": 4.335069179534912, + "learning_rate": 5.8209074550195445e-06, + "loss": 0.0996, + "step": 23786 + }, + { + "epoch": 64.81471389645776, + "grad_norm": 2.99347186088562, + "learning_rate": 5.8201057348230384e-06, + "loss": 0.1596, + "step": 23787 + }, + { + "epoch": 64.8174386920981, + "grad_norm": 3.288522243499756, + "learning_rate": 5.819304047179415e-06, + "loss": 0.1391, + "step": 23788 + }, + { + "epoch": 64.82016348773843, + "grad_norm": 5.136707305908203, + "learning_rate": 5.81850239209492e-06, + "loss": 0.0824, + "step": 23789 + }, + { + "epoch": 64.82288828337875, + "grad_norm": 3.021090030670166, + "learning_rate": 5.8177007695757935e-06, + "loss": 0.0393, + "step": 23790 + }, + { + "epoch": 64.82561307901908, + "grad_norm": 3.8290157318115234, + "learning_rate": 5.816899179628279e-06, + "loss": 0.0666, + "step": 23791 + }, + { + "epoch": 64.8283378746594, + "grad_norm": 2.9695990085601807, + "learning_rate": 5.816097622258616e-06, + "loss": 0.0864, + "step": 23792 + }, + { + "epoch": 64.83106267029973, + "grad_norm": 3.0893306732177734, + "learning_rate": 5.815296097473053e-06, + "loss": 0.0979, + "step": 23793 + }, + { + "epoch": 64.83378746594005, + "grad_norm": 5.386440277099609, + "learning_rate": 5.814494605277831e-06, + "loss": 0.1461, + "step": 23794 + }, + { + "epoch": 64.83651226158038, + "grad_norm": 3.264275074005127, + "learning_rate": 5.813693145679189e-06, + "loss": 0.048, + "step": 23795 + }, + { + "epoch": 64.83923705722071, + "grad_norm": 6.261340141296387, + "learning_rate": 5.8128917186833655e-06, + "loss": 0.1283, + "step": 23796 + }, + { + "epoch": 64.84196185286103, + "grad_norm": 3.908447027206421, + "learning_rate": 5.812090324296611e-06, + "loss": 0.0849, + "step": 23797 + }, + { + "epoch": 64.84468664850137, + "grad_norm": 4.705367565155029, + "learning_rate": 5.811288962525163e-06, + "loss": 0.0543, + "step": 23798 + }, + { + "epoch": 64.84741144414168, + "grad_norm": 4.353753566741943, + "learning_rate": 5.810487633375261e-06, + "loss": 0.077, + "step": 23799 + }, + { + "epoch": 64.85013623978202, + "grad_norm": 3.5391647815704346, + "learning_rate": 5.8096863368531435e-06, + "loss": 0.0938, + "step": 23800 + }, + { + "epoch": 64.85286103542235, + "grad_norm": 3.7956371307373047, + "learning_rate": 5.808885072965057e-06, + "loss": 0.0657, + "step": 23801 + }, + { + "epoch": 64.85558583106267, + "grad_norm": 3.606250762939453, + "learning_rate": 5.808083841717238e-06, + "loss": 0.0892, + "step": 23802 + }, + { + "epoch": 64.858310626703, + "grad_norm": 4.2467546463012695, + "learning_rate": 5.807282643115924e-06, + "loss": 0.0761, + "step": 23803 + }, + { + "epoch": 64.86103542234332, + "grad_norm": 3.940117359161377, + "learning_rate": 5.8064814771673625e-06, + "loss": 0.0849, + "step": 23804 + }, + { + "epoch": 64.86376021798365, + "grad_norm": 3.2259116172790527, + "learning_rate": 5.805680343877783e-06, + "loss": 0.146, + "step": 23805 + }, + { + "epoch": 64.86648501362397, + "grad_norm": 3.804685592651367, + "learning_rate": 5.804879243253435e-06, + "loss": 0.0772, + "step": 23806 + }, + { + "epoch": 64.8692098092643, + "grad_norm": 4.051899433135986, + "learning_rate": 5.804078175300551e-06, + "loss": 0.0817, + "step": 23807 + }, + { + "epoch": 64.87193460490464, + "grad_norm": 2.5785562992095947, + "learning_rate": 5.80327714002537e-06, + "loss": 0.1555, + "step": 23808 + }, + { + "epoch": 64.87465940054496, + "grad_norm": 3.2376959323883057, + "learning_rate": 5.802476137434132e-06, + "loss": 0.0874, + "step": 23809 + }, + { + "epoch": 64.87738419618529, + "grad_norm": 3.2956013679504395, + "learning_rate": 5.801675167533078e-06, + "loss": 0.0406, + "step": 23810 + }, + { + "epoch": 64.88010899182561, + "grad_norm": 3.075345277786255, + "learning_rate": 5.80087423032844e-06, + "loss": 0.035, + "step": 23811 + }, + { + "epoch": 64.88283378746594, + "grad_norm": 4.006364822387695, + "learning_rate": 5.800073325826456e-06, + "loss": 0.2162, + "step": 23812 + }, + { + "epoch": 64.88555858310627, + "grad_norm": 4.077402114868164, + "learning_rate": 5.799272454033369e-06, + "loss": 0.0608, + "step": 23813 + }, + { + "epoch": 64.88828337874659, + "grad_norm": 4.445973873138428, + "learning_rate": 5.7984716149554136e-06, + "loss": 0.1193, + "step": 23814 + }, + { + "epoch": 64.89100817438693, + "grad_norm": 4.7350358963012695, + "learning_rate": 5.797670808598826e-06, + "loss": 0.0419, + "step": 23815 + }, + { + "epoch": 64.89373297002724, + "grad_norm": 4.542581558227539, + "learning_rate": 5.796870034969837e-06, + "loss": 0.058, + "step": 23816 + }, + { + "epoch": 64.89645776566758, + "grad_norm": 3.4470760822296143, + "learning_rate": 5.796069294074696e-06, + "loss": 0.1338, + "step": 23817 + }, + { + "epoch": 64.8991825613079, + "grad_norm": 6.367007255554199, + "learning_rate": 5.795268585919629e-06, + "loss": 0.0696, + "step": 23818 + }, + { + "epoch": 64.90190735694823, + "grad_norm": 4.687518119812012, + "learning_rate": 5.794467910510877e-06, + "loss": 0.0515, + "step": 23819 + }, + { + "epoch": 64.90463215258856, + "grad_norm": 3.0287528038024902, + "learning_rate": 5.793667267854668e-06, + "loss": 0.1559, + "step": 23820 + }, + { + "epoch": 64.90735694822888, + "grad_norm": 4.91618537902832, + "learning_rate": 5.792866657957248e-06, + "loss": 0.1055, + "step": 23821 + }, + { + "epoch": 64.91008174386921, + "grad_norm": 4.167760372161865, + "learning_rate": 5.792066080824843e-06, + "loss": 0.1429, + "step": 23822 + }, + { + "epoch": 64.91280653950953, + "grad_norm": 5.756951808929443, + "learning_rate": 5.791265536463696e-06, + "loss": 0.1086, + "step": 23823 + }, + { + "epoch": 64.91553133514986, + "grad_norm": 3.9203407764434814, + "learning_rate": 5.790465024880033e-06, + "loss": 0.2407, + "step": 23824 + }, + { + "epoch": 64.9182561307902, + "grad_norm": 3.6706271171569824, + "learning_rate": 5.7896645460800986e-06, + "loss": 0.0792, + "step": 23825 + }, + { + "epoch": 64.92098092643052, + "grad_norm": 2.9809834957122803, + "learning_rate": 5.7888641000701195e-06, + "loss": 0.0855, + "step": 23826 + }, + { + "epoch": 64.92370572207085, + "grad_norm": 2.1346495151519775, + "learning_rate": 5.788063686856331e-06, + "loss": 0.0711, + "step": 23827 + }, + { + "epoch": 64.92643051771117, + "grad_norm": 3.736856460571289, + "learning_rate": 5.7872633064449635e-06, + "loss": 0.1116, + "step": 23828 + }, + { + "epoch": 64.9291553133515, + "grad_norm": 3.1223020553588867, + "learning_rate": 5.786462958842258e-06, + "loss": 0.1157, + "step": 23829 + }, + { + "epoch": 64.93188010899182, + "grad_norm": 3.967301368713379, + "learning_rate": 5.785662644054444e-06, + "loss": 0.0643, + "step": 23830 + }, + { + "epoch": 64.93460490463215, + "grad_norm": 2.076726198196411, + "learning_rate": 5.784862362087752e-06, + "loss": 0.0399, + "step": 23831 + }, + { + "epoch": 64.93732970027249, + "grad_norm": 3.1352274417877197, + "learning_rate": 5.7840621129484135e-06, + "loss": 0.137, + "step": 23832 + }, + { + "epoch": 64.9400544959128, + "grad_norm": 3.6743693351745605, + "learning_rate": 5.783261896642667e-06, + "loss": 0.0588, + "step": 23833 + }, + { + "epoch": 64.94277929155314, + "grad_norm": 3.836276054382324, + "learning_rate": 5.7824617131767415e-06, + "loss": 0.1027, + "step": 23834 + }, + { + "epoch": 64.94550408719346, + "grad_norm": 3.9120116233825684, + "learning_rate": 5.7816615625568684e-06, + "loss": 0.1289, + "step": 23835 + }, + { + "epoch": 64.94822888283379, + "grad_norm": 3.290968894958496, + "learning_rate": 5.780861444789275e-06, + "loss": 0.1574, + "step": 23836 + }, + { + "epoch": 64.95095367847412, + "grad_norm": 4.4691338539123535, + "learning_rate": 5.780061359880201e-06, + "loss": 0.0539, + "step": 23837 + }, + { + "epoch": 64.95367847411444, + "grad_norm": 3.319869041442871, + "learning_rate": 5.779261307835873e-06, + "loss": 0.1171, + "step": 23838 + }, + { + "epoch": 64.95640326975477, + "grad_norm": 3.370058298110962, + "learning_rate": 5.778461288662519e-06, + "loss": 0.0974, + "step": 23839 + }, + { + "epoch": 64.95912806539509, + "grad_norm": 3.132575035095215, + "learning_rate": 5.777661302366375e-06, + "loss": 0.041, + "step": 23840 + }, + { + "epoch": 64.96185286103542, + "grad_norm": 3.5255424976348877, + "learning_rate": 5.7768613489536664e-06, + "loss": 0.2366, + "step": 23841 + }, + { + "epoch": 64.96457765667574, + "grad_norm": 6.005019664764404, + "learning_rate": 5.776061428430631e-06, + "loss": 0.0631, + "step": 23842 + }, + { + "epoch": 64.96730245231608, + "grad_norm": 3.278092384338379, + "learning_rate": 5.77526154080349e-06, + "loss": 0.055, + "step": 23843 + }, + { + "epoch": 64.97002724795641, + "grad_norm": 4.543281555175781, + "learning_rate": 5.774461686078474e-06, + "loss": 0.0932, + "step": 23844 + }, + { + "epoch": 64.97275204359673, + "grad_norm": 3.6716113090515137, + "learning_rate": 5.773661864261818e-06, + "loss": 0.0464, + "step": 23845 + }, + { + "epoch": 64.97547683923706, + "grad_norm": 4.8436408042907715, + "learning_rate": 5.772862075359748e-06, + "loss": 0.0997, + "step": 23846 + }, + { + "epoch": 64.97820163487738, + "grad_norm": 6.906503200531006, + "learning_rate": 5.772062319378491e-06, + "loss": 0.0867, + "step": 23847 + }, + { + "epoch": 64.98092643051771, + "grad_norm": 3.953674077987671, + "learning_rate": 5.771262596324273e-06, + "loss": 0.2447, + "step": 23848 + }, + { + "epoch": 64.98365122615803, + "grad_norm": 4.3087687492370605, + "learning_rate": 5.77046290620333e-06, + "loss": 0.0432, + "step": 23849 + }, + { + "epoch": 64.98637602179836, + "grad_norm": 3.8011410236358643, + "learning_rate": 5.7696632490218865e-06, + "loss": 0.1285, + "step": 23850 + }, + { + "epoch": 64.9891008174387, + "grad_norm": 2.6955769062042236, + "learning_rate": 5.768863624786167e-06, + "loss": 0.0968, + "step": 23851 + }, + { + "epoch": 64.99182561307902, + "grad_norm": 3.028332233428955, + "learning_rate": 5.768064033502401e-06, + "loss": 0.2483, + "step": 23852 + }, + { + "epoch": 64.99455040871935, + "grad_norm": 3.8396477699279785, + "learning_rate": 5.767264475176817e-06, + "loss": 0.0473, + "step": 23853 + }, + { + "epoch": 64.99727520435967, + "grad_norm": 7.509429454803467, + "learning_rate": 5.766464949815642e-06, + "loss": 0.0472, + "step": 23854 + }, + { + "epoch": 65.0, + "grad_norm": 4.404361248016357, + "learning_rate": 5.765665457425102e-06, + "loss": 0.1461, + "step": 23855 + }, + { + "epoch": 65.00272479564033, + "grad_norm": 3.704347610473633, + "learning_rate": 5.76486599801142e-06, + "loss": 0.1096, + "step": 23856 + }, + { + "epoch": 65.00544959128065, + "grad_norm": 3.681830644607544, + "learning_rate": 5.7640665715808244e-06, + "loss": 0.0545, + "step": 23857 + }, + { + "epoch": 65.00817438692098, + "grad_norm": 2.457608461380005, + "learning_rate": 5.763267178139544e-06, + "loss": 0.0389, + "step": 23858 + }, + { + "epoch": 65.0108991825613, + "grad_norm": 4.0209221839904785, + "learning_rate": 5.7624678176938055e-06, + "loss": 0.0727, + "step": 23859 + }, + { + "epoch": 65.01362397820164, + "grad_norm": 4.337145805358887, + "learning_rate": 5.76166849024983e-06, + "loss": 0.0531, + "step": 23860 + }, + { + "epoch": 65.01634877384195, + "grad_norm": 3.689896821975708, + "learning_rate": 5.760869195813841e-06, + "loss": 0.0878, + "step": 23861 + }, + { + "epoch": 65.01907356948229, + "grad_norm": 2.472669839859009, + "learning_rate": 5.760069934392068e-06, + "loss": 0.0407, + "step": 23862 + }, + { + "epoch": 65.02179836512262, + "grad_norm": 2.7535672187805176, + "learning_rate": 5.759270705990736e-06, + "loss": 0.1648, + "step": 23863 + }, + { + "epoch": 65.02452316076294, + "grad_norm": 3.401129722595215, + "learning_rate": 5.758471510616066e-06, + "loss": 0.0941, + "step": 23864 + }, + { + "epoch": 65.02724795640327, + "grad_norm": 3.3423852920532227, + "learning_rate": 5.75767234827428e-06, + "loss": 0.1656, + "step": 23865 + }, + { + "epoch": 65.02997275204359, + "grad_norm": 8.871487617492676, + "learning_rate": 5.756873218971609e-06, + "loss": 0.1037, + "step": 23866 + }, + { + "epoch": 65.03269754768392, + "grad_norm": 3.4835875034332275, + "learning_rate": 5.756074122714272e-06, + "loss": 0.0955, + "step": 23867 + }, + { + "epoch": 65.03542234332426, + "grad_norm": 4.024458408355713, + "learning_rate": 5.755275059508492e-06, + "loss": 0.1101, + "step": 23868 + }, + { + "epoch": 65.03814713896458, + "grad_norm": 6.285836219787598, + "learning_rate": 5.754476029360494e-06, + "loss": 0.0603, + "step": 23869 + }, + { + "epoch": 65.04087193460491, + "grad_norm": 2.6335160732269287, + "learning_rate": 5.753677032276501e-06, + "loss": 0.027, + "step": 23870 + }, + { + "epoch": 65.04359673024523, + "grad_norm": 7.402361869812012, + "learning_rate": 5.752878068262735e-06, + "loss": 0.0817, + "step": 23871 + }, + { + "epoch": 65.04632152588556, + "grad_norm": 3.73759388923645, + "learning_rate": 5.7520791373254135e-06, + "loss": 0.2076, + "step": 23872 + }, + { + "epoch": 65.04904632152588, + "grad_norm": 4.1924967765808105, + "learning_rate": 5.751280239470768e-06, + "loss": 0.1566, + "step": 23873 + }, + { + "epoch": 65.05177111716621, + "grad_norm": 3.7623181343078613, + "learning_rate": 5.750481374705011e-06, + "loss": 0.0936, + "step": 23874 + }, + { + "epoch": 65.05449591280654, + "grad_norm": 3.846261978149414, + "learning_rate": 5.749682543034371e-06, + "loss": 0.0799, + "step": 23875 + }, + { + "epoch": 65.05722070844686, + "grad_norm": 3.157371997833252, + "learning_rate": 5.748883744465067e-06, + "loss": 0.0922, + "step": 23876 + }, + { + "epoch": 65.0599455040872, + "grad_norm": 3.514310836791992, + "learning_rate": 5.748084979003317e-06, + "loss": 0.0944, + "step": 23877 + }, + { + "epoch": 65.06267029972751, + "grad_norm": 3.686051607131958, + "learning_rate": 5.7472862466553455e-06, + "loss": 0.0584, + "step": 23878 + }, + { + "epoch": 65.06539509536785, + "grad_norm": 3.2389907836914062, + "learning_rate": 5.746487547427375e-06, + "loss": 0.031, + "step": 23879 + }, + { + "epoch": 65.06811989100818, + "grad_norm": 4.23587703704834, + "learning_rate": 5.74568888132562e-06, + "loss": 0.0866, + "step": 23880 + }, + { + "epoch": 65.0708446866485, + "grad_norm": 3.1292333602905273, + "learning_rate": 5.744890248356301e-06, + "loss": 0.1782, + "step": 23881 + }, + { + "epoch": 65.07356948228883, + "grad_norm": 6.11333703994751, + "learning_rate": 5.744091648525642e-06, + "loss": 0.1356, + "step": 23882 + }, + { + "epoch": 65.07629427792915, + "grad_norm": 3.8605904579162598, + "learning_rate": 5.743293081839862e-06, + "loss": 0.1539, + "step": 23883 + }, + { + "epoch": 65.07901907356948, + "grad_norm": 3.3380041122436523, + "learning_rate": 5.742494548305177e-06, + "loss": 0.0656, + "step": 23884 + }, + { + "epoch": 65.0817438692098, + "grad_norm": 2.9059176445007324, + "learning_rate": 5.741696047927805e-06, + "loss": 0.1074, + "step": 23885 + }, + { + "epoch": 65.08446866485014, + "grad_norm": 4.149163246154785, + "learning_rate": 5.74089758071397e-06, + "loss": 0.1008, + "step": 23886 + }, + { + "epoch": 65.08719346049047, + "grad_norm": 5.573852062225342, + "learning_rate": 5.740099146669888e-06, + "loss": 0.1068, + "step": 23887 + }, + { + "epoch": 65.08991825613079, + "grad_norm": 2.9669737815856934, + "learning_rate": 5.739300745801777e-06, + "loss": 0.0586, + "step": 23888 + }, + { + "epoch": 65.09264305177112, + "grad_norm": 5.7165207862854, + "learning_rate": 5.73850237811585e-06, + "loss": 0.1362, + "step": 23889 + }, + { + "epoch": 65.09536784741144, + "grad_norm": 3.295400619506836, + "learning_rate": 5.737704043618333e-06, + "loss": 0.1248, + "step": 23890 + }, + { + "epoch": 65.09809264305177, + "grad_norm": 3.5518786907196045, + "learning_rate": 5.7369057423154376e-06, + "loss": 0.1259, + "step": 23891 + }, + { + "epoch": 65.1008174386921, + "grad_norm": 3.840667486190796, + "learning_rate": 5.736107474213385e-06, + "loss": 0.0872, + "step": 23892 + }, + { + "epoch": 65.10354223433242, + "grad_norm": 2.7150371074676514, + "learning_rate": 5.735309239318387e-06, + "loss": 0.0492, + "step": 23893 + }, + { + "epoch": 65.10626702997276, + "grad_norm": 4.040241718292236, + "learning_rate": 5.734511037636667e-06, + "loss": 0.102, + "step": 23894 + }, + { + "epoch": 65.10899182561307, + "grad_norm": 3.0391008853912354, + "learning_rate": 5.7337128691744395e-06, + "loss": 0.1093, + "step": 23895 + }, + { + "epoch": 65.11171662125341, + "grad_norm": 3.4439523220062256, + "learning_rate": 5.732914733937917e-06, + "loss": 0.1107, + "step": 23896 + }, + { + "epoch": 65.11444141689373, + "grad_norm": 2.2255547046661377, + "learning_rate": 5.732116631933313e-06, + "loss": 0.064, + "step": 23897 + }, + { + "epoch": 65.11716621253406, + "grad_norm": 2.6797420978546143, + "learning_rate": 5.731318563166852e-06, + "loss": 0.1443, + "step": 23898 + }, + { + "epoch": 65.11989100817439, + "grad_norm": 2.8840904235839844, + "learning_rate": 5.7305205276447454e-06, + "loss": 0.0928, + "step": 23899 + }, + { + "epoch": 65.12261580381471, + "grad_norm": 5.082234859466553, + "learning_rate": 5.729722525373206e-06, + "loss": 0.1268, + "step": 23900 + }, + { + "epoch": 65.12534059945504, + "grad_norm": 4.612484931945801, + "learning_rate": 5.728924556358446e-06, + "loss": 0.1005, + "step": 23901 + }, + { + "epoch": 65.12806539509536, + "grad_norm": 7.932746410369873, + "learning_rate": 5.72812662060669e-06, + "loss": 0.0973, + "step": 23902 + }, + { + "epoch": 65.1307901907357, + "grad_norm": 3.5816659927368164, + "learning_rate": 5.727328718124146e-06, + "loss": 0.0798, + "step": 23903 + }, + { + "epoch": 65.13351498637603, + "grad_norm": 4.132866382598877, + "learning_rate": 5.726530848917027e-06, + "loss": 0.0699, + "step": 23904 + }, + { + "epoch": 65.13623978201635, + "grad_norm": 3.856076240539551, + "learning_rate": 5.725733012991545e-06, + "loss": 0.1263, + "step": 23905 + }, + { + "epoch": 65.13896457765668, + "grad_norm": 2.9017820358276367, + "learning_rate": 5.724935210353921e-06, + "loss": 0.0398, + "step": 23906 + }, + { + "epoch": 65.141689373297, + "grad_norm": 4.9340362548828125, + "learning_rate": 5.724137441010363e-06, + "loss": 0.0603, + "step": 23907 + }, + { + "epoch": 65.14441416893733, + "grad_norm": 3.251796245574951, + "learning_rate": 5.723339704967081e-06, + "loss": 0.1711, + "step": 23908 + }, + { + "epoch": 65.14713896457765, + "grad_norm": 3.3560702800750732, + "learning_rate": 5.722542002230293e-06, + "loss": 0.0489, + "step": 23909 + }, + { + "epoch": 65.14986376021798, + "grad_norm": 2.926656723022461, + "learning_rate": 5.721744332806214e-06, + "loss": 0.1059, + "step": 23910 + }, + { + "epoch": 65.15258855585832, + "grad_norm": 3.202542781829834, + "learning_rate": 5.720946696701053e-06, + "loss": 0.0916, + "step": 23911 + }, + { + "epoch": 65.15531335149863, + "grad_norm": 2.3384954929351807, + "learning_rate": 5.720149093921019e-06, + "loss": 0.0805, + "step": 23912 + }, + { + "epoch": 65.15803814713897, + "grad_norm": 3.166487693786621, + "learning_rate": 5.719351524472326e-06, + "loss": 0.0754, + "step": 23913 + }, + { + "epoch": 65.16076294277929, + "grad_norm": 3.3758294582366943, + "learning_rate": 5.718553988361186e-06, + "loss": 0.0535, + "step": 23914 + }, + { + "epoch": 65.16348773841962, + "grad_norm": 3.6121857166290283, + "learning_rate": 5.717756485593811e-06, + "loss": 0.1576, + "step": 23915 + }, + { + "epoch": 65.16621253405995, + "grad_norm": 3.9699673652648926, + "learning_rate": 5.71695901617641e-06, + "loss": 0.1821, + "step": 23916 + }, + { + "epoch": 65.16893732970027, + "grad_norm": 5.422703266143799, + "learning_rate": 5.716161580115192e-06, + "loss": 0.0867, + "step": 23917 + }, + { + "epoch": 65.1716621253406, + "grad_norm": 3.7113823890686035, + "learning_rate": 5.715364177416371e-06, + "loss": 0.074, + "step": 23918 + }, + { + "epoch": 65.17438692098092, + "grad_norm": 3.7007954120635986, + "learning_rate": 5.714566808086159e-06, + "loss": 0.06, + "step": 23919 + }, + { + "epoch": 65.17711171662125, + "grad_norm": 2.973315954208374, + "learning_rate": 5.713769472130761e-06, + "loss": 0.0549, + "step": 23920 + }, + { + "epoch": 65.17983651226157, + "grad_norm": 3.80631685256958, + "learning_rate": 5.712972169556384e-06, + "loss": 0.1644, + "step": 23921 + }, + { + "epoch": 65.1825613079019, + "grad_norm": 3.6280059814453125, + "learning_rate": 5.712174900369247e-06, + "loss": 0.0815, + "step": 23922 + }, + { + "epoch": 65.18528610354224, + "grad_norm": 3.664151191711426, + "learning_rate": 5.7113776645755525e-06, + "loss": 0.0644, + "step": 23923 + }, + { + "epoch": 65.18801089918256, + "grad_norm": 3.0507638454437256, + "learning_rate": 5.710580462181512e-06, + "loss": 0.0471, + "step": 23924 + }, + { + "epoch": 65.19073569482289, + "grad_norm": 3.5027029514312744, + "learning_rate": 5.709783293193329e-06, + "loss": 0.0435, + "step": 23925 + }, + { + "epoch": 65.19346049046321, + "grad_norm": 3.2568349838256836, + "learning_rate": 5.708986157617215e-06, + "loss": 0.1404, + "step": 23926 + }, + { + "epoch": 65.19618528610354, + "grad_norm": 3.2480835914611816, + "learning_rate": 5.708189055459382e-06, + "loss": 0.1218, + "step": 23927 + }, + { + "epoch": 65.19891008174388, + "grad_norm": 3.107895612716675, + "learning_rate": 5.707391986726035e-06, + "loss": 0.1223, + "step": 23928 + }, + { + "epoch": 65.2016348773842, + "grad_norm": 3.600494146347046, + "learning_rate": 5.706594951423381e-06, + "loss": 0.1503, + "step": 23929 + }, + { + "epoch": 65.20435967302453, + "grad_norm": 2.3023030757904053, + "learning_rate": 5.705797949557624e-06, + "loss": 0.0413, + "step": 23930 + }, + { + "epoch": 65.20708446866485, + "grad_norm": 5.529454231262207, + "learning_rate": 5.705000981134979e-06, + "loss": 0.1598, + "step": 23931 + }, + { + "epoch": 65.20980926430518, + "grad_norm": 3.8024990558624268, + "learning_rate": 5.704204046161647e-06, + "loss": 0.0639, + "step": 23932 + }, + { + "epoch": 65.2125340599455, + "grad_norm": 2.6368520259857178, + "learning_rate": 5.703407144643831e-06, + "loss": 0.0415, + "step": 23933 + }, + { + "epoch": 65.21525885558583, + "grad_norm": 3.5451037883758545, + "learning_rate": 5.702610276587747e-06, + "loss": 0.0826, + "step": 23934 + }, + { + "epoch": 65.21798365122616, + "grad_norm": 3.3370540142059326, + "learning_rate": 5.701813441999596e-06, + "loss": 0.1027, + "step": 23935 + }, + { + "epoch": 65.22070844686648, + "grad_norm": 3.4198203086853027, + "learning_rate": 5.701016640885582e-06, + "loss": 0.1539, + "step": 23936 + }, + { + "epoch": 65.22343324250681, + "grad_norm": 2.761240243911743, + "learning_rate": 5.700219873251909e-06, + "loss": 0.0561, + "step": 23937 + }, + { + "epoch": 65.22615803814713, + "grad_norm": 3.3922760486602783, + "learning_rate": 5.699423139104789e-06, + "loss": 0.058, + "step": 23938 + }, + { + "epoch": 65.22888283378747, + "grad_norm": 4.2228875160217285, + "learning_rate": 5.698626438450423e-06, + "loss": 0.0668, + "step": 23939 + }, + { + "epoch": 65.2316076294278, + "grad_norm": 2.832742691040039, + "learning_rate": 5.697829771295017e-06, + "loss": 0.0572, + "step": 23940 + }, + { + "epoch": 65.23433242506812, + "grad_norm": 3.4886770248413086, + "learning_rate": 5.69703313764477e-06, + "loss": 0.1091, + "step": 23941 + }, + { + "epoch": 65.23705722070845, + "grad_norm": 3.390244722366333, + "learning_rate": 5.69623653750589e-06, + "loss": 0.0806, + "step": 23942 + }, + { + "epoch": 65.23978201634877, + "grad_norm": 2.5988874435424805, + "learning_rate": 5.695439970884585e-06, + "loss": 0.0569, + "step": 23943 + }, + { + "epoch": 65.2425068119891, + "grad_norm": 3.5327260494232178, + "learning_rate": 5.694643437787055e-06, + "loss": 0.0625, + "step": 23944 + }, + { + "epoch": 65.24523160762942, + "grad_norm": 3.5905511379241943, + "learning_rate": 5.693846938219505e-06, + "loss": 0.1286, + "step": 23945 + }, + { + "epoch": 65.24795640326975, + "grad_norm": 3.403218984603882, + "learning_rate": 5.693050472188131e-06, + "loss": 0.2239, + "step": 23946 + }, + { + "epoch": 65.25068119891009, + "grad_norm": 5.678621768951416, + "learning_rate": 5.692254039699146e-06, + "loss": 0.0844, + "step": 23947 + }, + { + "epoch": 65.2534059945504, + "grad_norm": 4.893455505371094, + "learning_rate": 5.691457640758746e-06, + "loss": 0.1923, + "step": 23948 + }, + { + "epoch": 65.25613079019074, + "grad_norm": 4.162020683288574, + "learning_rate": 5.690661275373137e-06, + "loss": 0.0803, + "step": 23949 + }, + { + "epoch": 65.25885558583106, + "grad_norm": 3.102487564086914, + "learning_rate": 5.689864943548514e-06, + "loss": 0.1249, + "step": 23950 + }, + { + "epoch": 65.26158038147139, + "grad_norm": 4.126766681671143, + "learning_rate": 5.68906864529109e-06, + "loss": 0.0503, + "step": 23951 + }, + { + "epoch": 65.26430517711172, + "grad_norm": 3.4668099880218506, + "learning_rate": 5.688272380607058e-06, + "loss": 0.0627, + "step": 23952 + }, + { + "epoch": 65.26702997275204, + "grad_norm": 4.390965938568115, + "learning_rate": 5.68747614950262e-06, + "loss": 0.1044, + "step": 23953 + }, + { + "epoch": 65.26975476839237, + "grad_norm": 3.341416597366333, + "learning_rate": 5.686679951983982e-06, + "loss": 0.2101, + "step": 23954 + }, + { + "epoch": 65.2724795640327, + "grad_norm": 3.0021090507507324, + "learning_rate": 5.6858837880573426e-06, + "loss": 0.1412, + "step": 23955 + }, + { + "epoch": 65.27520435967303, + "grad_norm": 3.424797534942627, + "learning_rate": 5.685087657728902e-06, + "loss": 0.0528, + "step": 23956 + }, + { + "epoch": 65.27792915531334, + "grad_norm": 5.805532932281494, + "learning_rate": 5.6842915610048545e-06, + "loss": 0.0576, + "step": 23957 + }, + { + "epoch": 65.28065395095368, + "grad_norm": 3.436185836791992, + "learning_rate": 5.683495497891409e-06, + "loss": 0.0781, + "step": 23958 + }, + { + "epoch": 65.28337874659401, + "grad_norm": 3.735299825668335, + "learning_rate": 5.682699468394763e-06, + "loss": 0.0649, + "step": 23959 + }, + { + "epoch": 65.28610354223433, + "grad_norm": 5.107840061187744, + "learning_rate": 5.6819034725211096e-06, + "loss": 0.0715, + "step": 23960 + }, + { + "epoch": 65.28882833787466, + "grad_norm": 3.0492615699768066, + "learning_rate": 5.681107510276658e-06, + "loss": 0.0492, + "step": 23961 + }, + { + "epoch": 65.29155313351498, + "grad_norm": 2.9003193378448486, + "learning_rate": 5.680311581667597e-06, + "loss": 0.0675, + "step": 23962 + }, + { + "epoch": 65.29427792915531, + "grad_norm": 4.069297790527344, + "learning_rate": 5.6795156867001345e-06, + "loss": 0.0813, + "step": 23963 + }, + { + "epoch": 65.29700272479565, + "grad_norm": 6.263089179992676, + "learning_rate": 5.678719825380466e-06, + "loss": 0.0683, + "step": 23964 + }, + { + "epoch": 65.29972752043597, + "grad_norm": 2.939884662628174, + "learning_rate": 5.677923997714787e-06, + "loss": 0.1354, + "step": 23965 + }, + { + "epoch": 65.3024523160763, + "grad_norm": 15.638578414916992, + "learning_rate": 5.677128203709294e-06, + "loss": 0.081, + "step": 23966 + }, + { + "epoch": 65.30517711171662, + "grad_norm": 3.349811315536499, + "learning_rate": 5.676332443370189e-06, + "loss": 0.2152, + "step": 23967 + }, + { + "epoch": 65.30790190735695, + "grad_norm": 2.394726037979126, + "learning_rate": 5.675536716703671e-06, + "loss": 0.0341, + "step": 23968 + }, + { + "epoch": 65.31062670299727, + "grad_norm": 5.335820198059082, + "learning_rate": 5.674741023715933e-06, + "loss": 0.1909, + "step": 23969 + }, + { + "epoch": 65.3133514986376, + "grad_norm": 3.1315112113952637, + "learning_rate": 5.673945364413167e-06, + "loss": 0.0595, + "step": 23970 + }, + { + "epoch": 65.31607629427793, + "grad_norm": 3.580753803253174, + "learning_rate": 5.67314973880158e-06, + "loss": 0.0642, + "step": 23971 + }, + { + "epoch": 65.31880108991825, + "grad_norm": 3.06107759475708, + "learning_rate": 5.672354146887364e-06, + "loss": 0.1235, + "step": 23972 + }, + { + "epoch": 65.32152588555859, + "grad_norm": 3.051346778869629, + "learning_rate": 5.671558588676715e-06, + "loss": 0.0778, + "step": 23973 + }, + { + "epoch": 65.3242506811989, + "grad_norm": 4.6618781089782715, + "learning_rate": 5.6707630641758235e-06, + "loss": 0.057, + "step": 23974 + }, + { + "epoch": 65.32697547683924, + "grad_norm": 3.14992094039917, + "learning_rate": 5.6699675733908955e-06, + "loss": 0.1994, + "step": 23975 + }, + { + "epoch": 65.32970027247957, + "grad_norm": 5.335004806518555, + "learning_rate": 5.6691721163281185e-06, + "loss": 0.11, + "step": 23976 + }, + { + "epoch": 65.33242506811989, + "grad_norm": 3.9652626514434814, + "learning_rate": 5.668376692993687e-06, + "loss": 0.0529, + "step": 23977 + }, + { + "epoch": 65.33514986376022, + "grad_norm": 2.6379270553588867, + "learning_rate": 5.6675813033937985e-06, + "loss": 0.0925, + "step": 23978 + }, + { + "epoch": 65.33787465940054, + "grad_norm": 3.380904197692871, + "learning_rate": 5.666785947534651e-06, + "loss": 0.0937, + "step": 23979 + }, + { + "epoch": 65.34059945504087, + "grad_norm": 2.9610610008239746, + "learning_rate": 5.6659906254224355e-06, + "loss": 0.0366, + "step": 23980 + }, + { + "epoch": 65.34332425068119, + "grad_norm": 4.081940174102783, + "learning_rate": 5.665195337063345e-06, + "loss": 0.0642, + "step": 23981 + }, + { + "epoch": 65.34604904632153, + "grad_norm": 3.9273087978363037, + "learning_rate": 5.664400082463569e-06, + "loss": 0.2661, + "step": 23982 + }, + { + "epoch": 65.34877384196186, + "grad_norm": 4.0738115310668945, + "learning_rate": 5.663604861629311e-06, + "loss": 0.0475, + "step": 23983 + }, + { + "epoch": 65.35149863760218, + "grad_norm": 2.5269320011138916, + "learning_rate": 5.662809674566759e-06, + "loss": 0.0425, + "step": 23984 + }, + { + "epoch": 65.35422343324251, + "grad_norm": 3.172858238220215, + "learning_rate": 5.662014521282104e-06, + "loss": 0.1479, + "step": 23985 + }, + { + "epoch": 65.35694822888283, + "grad_norm": 3.7630107402801514, + "learning_rate": 5.661219401781537e-06, + "loss": 0.1608, + "step": 23986 + }, + { + "epoch": 65.35967302452316, + "grad_norm": 2.8426389694213867, + "learning_rate": 5.660424316071258e-06, + "loss": 0.0597, + "step": 23987 + }, + { + "epoch": 65.3623978201635, + "grad_norm": 3.6083157062530518, + "learning_rate": 5.6596292641574535e-06, + "loss": 0.077, + "step": 23988 + }, + { + "epoch": 65.36512261580381, + "grad_norm": 3.9012110233306885, + "learning_rate": 5.658834246046319e-06, + "loss": 0.077, + "step": 23989 + }, + { + "epoch": 65.36784741144415, + "grad_norm": 5.432197570800781, + "learning_rate": 5.658039261744037e-06, + "loss": 0.0528, + "step": 23990 + }, + { + "epoch": 65.37057220708446, + "grad_norm": 4.274069786071777, + "learning_rate": 5.657244311256811e-06, + "loss": 0.0567, + "step": 23991 + }, + { + "epoch": 65.3732970027248, + "grad_norm": 2.6049606800079346, + "learning_rate": 5.656449394590826e-06, + "loss": 0.0566, + "step": 23992 + }, + { + "epoch": 65.37602179836512, + "grad_norm": 3.093290328979492, + "learning_rate": 5.655654511752274e-06, + "loss": 0.0436, + "step": 23993 + }, + { + "epoch": 65.37874659400545, + "grad_norm": 5.726058483123779, + "learning_rate": 5.654859662747337e-06, + "loss": 0.0719, + "step": 23994 + }, + { + "epoch": 65.38147138964578, + "grad_norm": 4.21392822265625, + "learning_rate": 5.6540648475822215e-06, + "loss": 0.1087, + "step": 23995 + }, + { + "epoch": 65.3841961852861, + "grad_norm": 7.224810600280762, + "learning_rate": 5.653270066263108e-06, + "loss": 0.2051, + "step": 23996 + }, + { + "epoch": 65.38692098092643, + "grad_norm": 2.78900408744812, + "learning_rate": 5.6524753187961865e-06, + "loss": 0.0409, + "step": 23997 + }, + { + "epoch": 65.38964577656675, + "grad_norm": 2.8519763946533203, + "learning_rate": 5.6516806051876435e-06, + "loss": 0.2213, + "step": 23998 + }, + { + "epoch": 65.39237057220708, + "grad_norm": 2.725651502609253, + "learning_rate": 5.650885925443678e-06, + "loss": 0.1322, + "step": 23999 + }, + { + "epoch": 65.39509536784742, + "grad_norm": 2.827827215194702, + "learning_rate": 5.650091279570471e-06, + "loss": 0.0543, + "step": 24000 + }, + { + "epoch": 65.39782016348774, + "grad_norm": 3.800290584564209, + "learning_rate": 5.649296667574215e-06, + "loss": 0.0997, + "step": 24001 + }, + { + "epoch": 65.40054495912807, + "grad_norm": 2.7473745346069336, + "learning_rate": 5.6485020894610905e-06, + "loss": 0.0733, + "step": 24002 + }, + { + "epoch": 65.40326975476839, + "grad_norm": 3.0474374294281006, + "learning_rate": 5.647707545237298e-06, + "loss": 0.0391, + "step": 24003 + }, + { + "epoch": 65.40599455040872, + "grad_norm": 2.3979551792144775, + "learning_rate": 5.646913034909016e-06, + "loss": 0.0303, + "step": 24004 + }, + { + "epoch": 65.40871934604904, + "grad_norm": 5.561906814575195, + "learning_rate": 5.646118558482438e-06, + "loss": 0.0617, + "step": 24005 + }, + { + "epoch": 65.41144414168937, + "grad_norm": 4.902659893035889, + "learning_rate": 5.645324115963742e-06, + "loss": 0.0445, + "step": 24006 + }, + { + "epoch": 65.4141689373297, + "grad_norm": 3.7582004070281982, + "learning_rate": 5.644529707359128e-06, + "loss": 0.1675, + "step": 24007 + }, + { + "epoch": 65.41689373297002, + "grad_norm": 2.687662124633789, + "learning_rate": 5.643735332674776e-06, + "loss": 0.0862, + "step": 24008 + }, + { + "epoch": 65.41961852861036, + "grad_norm": 7.281131744384766, + "learning_rate": 5.6429409919168724e-06, + "loss": 0.1605, + "step": 24009 + }, + { + "epoch": 65.42234332425068, + "grad_norm": 4.193109035491943, + "learning_rate": 5.6421466850915986e-06, + "loss": 0.115, + "step": 24010 + }, + { + "epoch": 65.42506811989101, + "grad_norm": 2.208326578140259, + "learning_rate": 5.641352412205148e-06, + "loss": 0.1176, + "step": 24011 + }, + { + "epoch": 65.42779291553134, + "grad_norm": 2.9011576175689697, + "learning_rate": 5.640558173263708e-06, + "loss": 0.0433, + "step": 24012 + }, + { + "epoch": 65.43051771117166, + "grad_norm": 3.144461154937744, + "learning_rate": 5.6397639682734616e-06, + "loss": 0.115, + "step": 24013 + }, + { + "epoch": 65.433242506812, + "grad_norm": 8.688531875610352, + "learning_rate": 5.638969797240592e-06, + "loss": 0.1619, + "step": 24014 + }, + { + "epoch": 65.43596730245231, + "grad_norm": 3.3656513690948486, + "learning_rate": 5.638175660171281e-06, + "loss": 0.0642, + "step": 24015 + }, + { + "epoch": 65.43869209809264, + "grad_norm": 3.899275302886963, + "learning_rate": 5.637381557071724e-06, + "loss": 0.1298, + "step": 24016 + }, + { + "epoch": 65.44141689373296, + "grad_norm": 3.7607948780059814, + "learning_rate": 5.636587487948096e-06, + "loss": 0.153, + "step": 24017 + }, + { + "epoch": 65.4441416893733, + "grad_norm": 3.140089750289917, + "learning_rate": 5.635793452806582e-06, + "loss": 0.106, + "step": 24018 + }, + { + "epoch": 65.44686648501363, + "grad_norm": 3.5234313011169434, + "learning_rate": 5.634999451653372e-06, + "loss": 0.0493, + "step": 24019 + }, + { + "epoch": 65.44959128065395, + "grad_norm": 3.7180094718933105, + "learning_rate": 5.6342054844946446e-06, + "loss": 0.0855, + "step": 24020 + }, + { + "epoch": 65.45231607629428, + "grad_norm": 2.1237192153930664, + "learning_rate": 5.633411551336585e-06, + "loss": 0.0274, + "step": 24021 + }, + { + "epoch": 65.4550408719346, + "grad_norm": 5.453552722930908, + "learning_rate": 5.6326176521853725e-06, + "loss": 0.1127, + "step": 24022 + }, + { + "epoch": 65.45776566757493, + "grad_norm": 4.5644965171813965, + "learning_rate": 5.631823787047196e-06, + "loss": 0.0522, + "step": 24023 + }, + { + "epoch": 65.46049046321527, + "grad_norm": 4.731208801269531, + "learning_rate": 5.631029955928236e-06, + "loss": 0.0849, + "step": 24024 + }, + { + "epoch": 65.46321525885558, + "grad_norm": 3.8543739318847656, + "learning_rate": 5.630236158834675e-06, + "loss": 0.0694, + "step": 24025 + }, + { + "epoch": 65.46594005449592, + "grad_norm": 6.913013935089111, + "learning_rate": 5.629442395772688e-06, + "loss": 0.0746, + "step": 24026 + }, + { + "epoch": 65.46866485013624, + "grad_norm": 3.2953193187713623, + "learning_rate": 5.628648666748467e-06, + "loss": 0.0407, + "step": 24027 + }, + { + "epoch": 65.47138964577657, + "grad_norm": 5.9116411209106445, + "learning_rate": 5.627854971768187e-06, + "loss": 0.0566, + "step": 24028 + }, + { + "epoch": 65.47411444141689, + "grad_norm": 2.8418362140655518, + "learning_rate": 5.627061310838035e-06, + "loss": 0.0636, + "step": 24029 + }, + { + "epoch": 65.47683923705722, + "grad_norm": 3.1597983837127686, + "learning_rate": 5.626267683964188e-06, + "loss": 0.2027, + "step": 24030 + }, + { + "epoch": 65.47956403269755, + "grad_norm": 4.115743637084961, + "learning_rate": 5.625474091152825e-06, + "loss": 0.0791, + "step": 24031 + }, + { + "epoch": 65.48228882833787, + "grad_norm": 2.599477767944336, + "learning_rate": 5.624680532410134e-06, + "loss": 0.0422, + "step": 24032 + }, + { + "epoch": 65.4850136239782, + "grad_norm": 3.156306028366089, + "learning_rate": 5.623887007742288e-06, + "loss": 0.0869, + "step": 24033 + }, + { + "epoch": 65.48773841961852, + "grad_norm": 3.8809096813201904, + "learning_rate": 5.623093517155469e-06, + "loss": 0.083, + "step": 24034 + }, + { + "epoch": 65.49046321525886, + "grad_norm": 3.6313915252685547, + "learning_rate": 5.622300060655854e-06, + "loss": 0.0614, + "step": 24035 + }, + { + "epoch": 65.49318801089919, + "grad_norm": 4.227549076080322, + "learning_rate": 5.62150663824963e-06, + "loss": 0.1316, + "step": 24036 + }, + { + "epoch": 65.49591280653951, + "grad_norm": 2.85221529006958, + "learning_rate": 5.620713249942968e-06, + "loss": 0.0393, + "step": 24037 + }, + { + "epoch": 65.49863760217984, + "grad_norm": 9.981179237365723, + "learning_rate": 5.619919895742054e-06, + "loss": 0.1113, + "step": 24038 + }, + { + "epoch": 65.50136239782016, + "grad_norm": 2.98490309715271, + "learning_rate": 5.619126575653058e-06, + "loss": 0.0444, + "step": 24039 + }, + { + "epoch": 65.50408719346049, + "grad_norm": 3.901944875717163, + "learning_rate": 5.618333289682165e-06, + "loss": 0.1477, + "step": 24040 + }, + { + "epoch": 65.50681198910081, + "grad_norm": 3.7826104164123535, + "learning_rate": 5.617540037835553e-06, + "loss": 0.115, + "step": 24041 + }, + { + "epoch": 65.50953678474114, + "grad_norm": 3.9240939617156982, + "learning_rate": 5.616746820119394e-06, + "loss": 0.0512, + "step": 24042 + }, + { + "epoch": 65.51226158038148, + "grad_norm": 3.282703399658203, + "learning_rate": 5.615953636539875e-06, + "loss": 0.0468, + "step": 24043 + }, + { + "epoch": 65.5149863760218, + "grad_norm": 3.200434446334839, + "learning_rate": 5.6151604871031665e-06, + "loss": 0.0706, + "step": 24044 + }, + { + "epoch": 65.51771117166213, + "grad_norm": 2.988568067550659, + "learning_rate": 5.6143673718154466e-06, + "loss": 0.1459, + "step": 24045 + }, + { + "epoch": 65.52043596730245, + "grad_norm": 3.289043426513672, + "learning_rate": 5.6135742906828894e-06, + "loss": 0.0495, + "step": 24046 + }, + { + "epoch": 65.52316076294278, + "grad_norm": 3.8344788551330566, + "learning_rate": 5.612781243711673e-06, + "loss": 0.0881, + "step": 24047 + }, + { + "epoch": 65.52588555858311, + "grad_norm": 3.664890766143799, + "learning_rate": 5.611988230907981e-06, + "loss": 0.0843, + "step": 24048 + }, + { + "epoch": 65.52861035422343, + "grad_norm": 3.223095417022705, + "learning_rate": 5.611195252277983e-06, + "loss": 0.0946, + "step": 24049 + }, + { + "epoch": 65.53133514986376, + "grad_norm": 3.1708548069000244, + "learning_rate": 5.610402307827855e-06, + "loss": 0.1086, + "step": 24050 + }, + { + "epoch": 65.53405994550408, + "grad_norm": 4.720671653747559, + "learning_rate": 5.609609397563768e-06, + "loss": 0.1158, + "step": 24051 + }, + { + "epoch": 65.53678474114442, + "grad_norm": 3.3979437351226807, + "learning_rate": 5.6088165214919064e-06, + "loss": 0.1681, + "step": 24052 + }, + { + "epoch": 65.53950953678473, + "grad_norm": 2.8669590950012207, + "learning_rate": 5.6080236796184395e-06, + "loss": 0.0421, + "step": 24053 + }, + { + "epoch": 65.54223433242507, + "grad_norm": 3.282972574234009, + "learning_rate": 5.607230871949543e-06, + "loss": 0.0595, + "step": 24054 + }, + { + "epoch": 65.5449591280654, + "grad_norm": 5.365381240844727, + "learning_rate": 5.606438098491388e-06, + "loss": 0.2275, + "step": 24055 + }, + { + "epoch": 65.54768392370572, + "grad_norm": 4.928396224975586, + "learning_rate": 5.605645359250155e-06, + "loss": 0.3508, + "step": 24056 + }, + { + "epoch": 65.55040871934605, + "grad_norm": 2.4006850719451904, + "learning_rate": 5.604852654232015e-06, + "loss": 0.042, + "step": 24057 + }, + { + "epoch": 65.55313351498637, + "grad_norm": 3.378596544265747, + "learning_rate": 5.604059983443139e-06, + "loss": 0.0603, + "step": 24058 + }, + { + "epoch": 65.5558583106267, + "grad_norm": 3.948317527770996, + "learning_rate": 5.6032673468897015e-06, + "loss": 0.1374, + "step": 24059 + }, + { + "epoch": 65.55858310626704, + "grad_norm": 3.6100611686706543, + "learning_rate": 5.602474744577879e-06, + "loss": 0.1618, + "step": 24060 + }, + { + "epoch": 65.56130790190736, + "grad_norm": 3.3356940746307373, + "learning_rate": 5.6016821765138405e-06, + "loss": 0.1528, + "step": 24061 + }, + { + "epoch": 65.56403269754769, + "grad_norm": 3.4731838703155518, + "learning_rate": 5.600889642703758e-06, + "loss": 0.0455, + "step": 24062 + }, + { + "epoch": 65.566757493188, + "grad_norm": 3.523421287536621, + "learning_rate": 5.6000971431538045e-06, + "loss": 0.063, + "step": 24063 + }, + { + "epoch": 65.56948228882834, + "grad_norm": 2.8029582500457764, + "learning_rate": 5.599304677870157e-06, + "loss": 0.0412, + "step": 24064 + }, + { + "epoch": 65.57220708446866, + "grad_norm": 3.948566198348999, + "learning_rate": 5.598512246858982e-06, + "loss": 0.0912, + "step": 24065 + }, + { + "epoch": 65.57493188010899, + "grad_norm": 3.1863033771514893, + "learning_rate": 5.5977198501264514e-06, + "loss": 0.1724, + "step": 24066 + }, + { + "epoch": 65.57765667574932, + "grad_norm": 3.802523374557495, + "learning_rate": 5.5969274876787334e-06, + "loss": 0.0417, + "step": 24067 + }, + { + "epoch": 65.58038147138964, + "grad_norm": 3.8693065643310547, + "learning_rate": 5.5961351595220084e-06, + "loss": 0.0874, + "step": 24068 + }, + { + "epoch": 65.58310626702998, + "grad_norm": 2.525731325149536, + "learning_rate": 5.595342865662439e-06, + "loss": 0.0332, + "step": 24069 + }, + { + "epoch": 65.5858310626703, + "grad_norm": 2.4688730239868164, + "learning_rate": 5.594550606106198e-06, + "loss": 0.0323, + "step": 24070 + }, + { + "epoch": 65.58855585831063, + "grad_norm": 3.272493362426758, + "learning_rate": 5.593758380859452e-06, + "loss": 0.053, + "step": 24071 + }, + { + "epoch": 65.59128065395096, + "grad_norm": 3.4990341663360596, + "learning_rate": 5.5929661899283775e-06, + "loss": 0.1053, + "step": 24072 + }, + { + "epoch": 65.59400544959128, + "grad_norm": 4.865126609802246, + "learning_rate": 5.59217403331914e-06, + "loss": 0.1447, + "step": 24073 + }, + { + "epoch": 65.59673024523161, + "grad_norm": 3.6281673908233643, + "learning_rate": 5.5913819110379095e-06, + "loss": 0.275, + "step": 24074 + }, + { + "epoch": 65.59945504087193, + "grad_norm": 2.552403211593628, + "learning_rate": 5.5905898230908506e-06, + "loss": 0.0828, + "step": 24075 + }, + { + "epoch": 65.60217983651226, + "grad_norm": 3.726198434829712, + "learning_rate": 5.5897977694841396e-06, + "loss": 0.0527, + "step": 24076 + }, + { + "epoch": 65.60490463215258, + "grad_norm": 3.713240623474121, + "learning_rate": 5.589005750223944e-06, + "loss": 0.0471, + "step": 24077 + }, + { + "epoch": 65.60762942779292, + "grad_norm": 3.081360101699829, + "learning_rate": 5.588213765316427e-06, + "loss": 0.0417, + "step": 24078 + }, + { + "epoch": 65.61035422343325, + "grad_norm": 4.682824611663818, + "learning_rate": 5.587421814767757e-06, + "loss": 0.1321, + "step": 24079 + }, + { + "epoch": 65.61307901907357, + "grad_norm": 7.3144402503967285, + "learning_rate": 5.586629898584103e-06, + "loss": 0.103, + "step": 24080 + }, + { + "epoch": 65.6158038147139, + "grad_norm": 3.2913010120391846, + "learning_rate": 5.5858380167716375e-06, + "loss": 0.1756, + "step": 24081 + }, + { + "epoch": 65.61852861035422, + "grad_norm": 3.0218420028686523, + "learning_rate": 5.585046169336524e-06, + "loss": 0.0964, + "step": 24082 + }, + { + "epoch": 65.62125340599455, + "grad_norm": 3.8760106563568115, + "learning_rate": 5.584254356284924e-06, + "loss": 0.1442, + "step": 24083 + }, + { + "epoch": 65.62397820163488, + "grad_norm": 3.4273133277893066, + "learning_rate": 5.583462577623013e-06, + "loss": 0.056, + "step": 24084 + }, + { + "epoch": 65.6267029972752, + "grad_norm": 3.849010705947876, + "learning_rate": 5.5826708333569536e-06, + "loss": 0.0884, + "step": 24085 + }, + { + "epoch": 65.62942779291554, + "grad_norm": 4.020907878875732, + "learning_rate": 5.58187912349291e-06, + "loss": 0.079, + "step": 24086 + }, + { + "epoch": 65.63215258855585, + "grad_norm": 3.489081382751465, + "learning_rate": 5.581087448037048e-06, + "loss": 0.1209, + "step": 24087 + }, + { + "epoch": 65.63487738419619, + "grad_norm": 3.759430170059204, + "learning_rate": 5.580295806995538e-06, + "loss": 0.1076, + "step": 24088 + }, + { + "epoch": 65.6376021798365, + "grad_norm": 5.0124192237854, + "learning_rate": 5.5795042003745416e-06, + "loss": 0.0612, + "step": 24089 + }, + { + "epoch": 65.64032697547684, + "grad_norm": 3.5506246089935303, + "learning_rate": 5.578712628180225e-06, + "loss": 0.0413, + "step": 24090 + }, + { + "epoch": 65.64305177111717, + "grad_norm": 4.744014263153076, + "learning_rate": 5.577921090418747e-06, + "loss": 0.0588, + "step": 24091 + }, + { + "epoch": 65.64577656675749, + "grad_norm": 5.604671478271484, + "learning_rate": 5.577129587096282e-06, + "loss": 0.148, + "step": 24092 + }, + { + "epoch": 65.64850136239782, + "grad_norm": 3.916191816329956, + "learning_rate": 5.576338118218989e-06, + "loss": 0.1333, + "step": 24093 + }, + { + "epoch": 65.65122615803814, + "grad_norm": 3.4078290462493896, + "learning_rate": 5.575546683793034e-06, + "loss": 0.1086, + "step": 24094 + }, + { + "epoch": 65.65395095367847, + "grad_norm": 3.0936272144317627, + "learning_rate": 5.574755283824573e-06, + "loss": 0.3191, + "step": 24095 + }, + { + "epoch": 65.65667574931881, + "grad_norm": 3.2433664798736572, + "learning_rate": 5.5739639183197805e-06, + "loss": 0.0491, + "step": 24096 + }, + { + "epoch": 65.65940054495913, + "grad_norm": 3.436826705932617, + "learning_rate": 5.57317258728481e-06, + "loss": 0.0872, + "step": 24097 + }, + { + "epoch": 65.66212534059946, + "grad_norm": 3.36426043510437, + "learning_rate": 5.572381290725833e-06, + "loss": 0.0732, + "step": 24098 + }, + { + "epoch": 65.66485013623978, + "grad_norm": 3.7712724208831787, + "learning_rate": 5.571590028649008e-06, + "loss": 0.0706, + "step": 24099 + }, + { + "epoch": 65.66757493188011, + "grad_norm": 2.650465726852417, + "learning_rate": 5.570798801060493e-06, + "loss": 0.0863, + "step": 24100 + }, + { + "epoch": 65.67029972752043, + "grad_norm": 3.8432295322418213, + "learning_rate": 5.570007607966459e-06, + "loss": 0.1962, + "step": 24101 + }, + { + "epoch": 65.67302452316076, + "grad_norm": 3.3361594676971436, + "learning_rate": 5.569216449373063e-06, + "loss": 0.0664, + "step": 24102 + }, + { + "epoch": 65.6757493188011, + "grad_norm": 2.96706485748291, + "learning_rate": 5.568425325286466e-06, + "loss": 0.0439, + "step": 24103 + }, + { + "epoch": 65.67847411444141, + "grad_norm": 4.701183795928955, + "learning_rate": 5.567634235712827e-06, + "loss": 0.0799, + "step": 24104 + }, + { + "epoch": 65.68119891008175, + "grad_norm": 2.7475826740264893, + "learning_rate": 5.566843180658313e-06, + "loss": 0.0347, + "step": 24105 + }, + { + "epoch": 65.68392370572207, + "grad_norm": 3.762141227722168, + "learning_rate": 5.566052160129083e-06, + "loss": 0.0479, + "step": 24106 + }, + { + "epoch": 65.6866485013624, + "grad_norm": 4.1154465675354, + "learning_rate": 5.565261174131291e-06, + "loss": 0.084, + "step": 24107 + }, + { + "epoch": 65.68937329700273, + "grad_norm": 2.481872320175171, + "learning_rate": 5.5644702226711055e-06, + "loss": 0.0817, + "step": 24108 + }, + { + "epoch": 65.69209809264305, + "grad_norm": 4.318648338317871, + "learning_rate": 5.563679305754685e-06, + "loss": 0.1184, + "step": 24109 + }, + { + "epoch": 65.69482288828338, + "grad_norm": 4.170182704925537, + "learning_rate": 5.5628884233881865e-06, + "loss": 0.1345, + "step": 24110 + }, + { + "epoch": 65.6975476839237, + "grad_norm": 3.049823522567749, + "learning_rate": 5.562097575577765e-06, + "loss": 0.0576, + "step": 24111 + }, + { + "epoch": 65.70027247956403, + "grad_norm": 3.304457664489746, + "learning_rate": 5.56130676232959e-06, + "loss": 0.1247, + "step": 24112 + }, + { + "epoch": 65.70299727520435, + "grad_norm": 2.9516074657440186, + "learning_rate": 5.5605159836498145e-06, + "loss": 0.0471, + "step": 24113 + }, + { + "epoch": 65.70572207084469, + "grad_norm": 2.629530906677246, + "learning_rate": 5.559725239544595e-06, + "loss": 0.0428, + "step": 24114 + }, + { + "epoch": 65.70844686648502, + "grad_norm": 3.6818525791168213, + "learning_rate": 5.558934530020095e-06, + "loss": 0.08, + "step": 24115 + }, + { + "epoch": 65.71117166212534, + "grad_norm": 6.104763507843018, + "learning_rate": 5.558143855082466e-06, + "loss": 0.1501, + "step": 24116 + }, + { + "epoch": 65.71389645776567, + "grad_norm": 3.2225263118743896, + "learning_rate": 5.557353214737875e-06, + "loss": 0.0893, + "step": 24117 + }, + { + "epoch": 65.71662125340599, + "grad_norm": 6.144196510314941, + "learning_rate": 5.556562608992473e-06, + "loss": 0.2236, + "step": 24118 + }, + { + "epoch": 65.71934604904632, + "grad_norm": 2.8399598598480225, + "learning_rate": 5.555772037852418e-06, + "loss": 0.0458, + "step": 24119 + }, + { + "epoch": 65.72207084468666, + "grad_norm": 3.0409440994262695, + "learning_rate": 5.554981501323864e-06, + "loss": 0.0571, + "step": 24120 + }, + { + "epoch": 65.72479564032697, + "grad_norm": 3.4222543239593506, + "learning_rate": 5.554190999412975e-06, + "loss": 0.0918, + "step": 24121 + }, + { + "epoch": 65.7275204359673, + "grad_norm": 3.6440134048461914, + "learning_rate": 5.553400532125903e-06, + "loss": 0.1618, + "step": 24122 + }, + { + "epoch": 65.73024523160763, + "grad_norm": 4.814828872680664, + "learning_rate": 5.552610099468805e-06, + "loss": 0.1118, + "step": 24123 + }, + { + "epoch": 65.73297002724796, + "grad_norm": 3.9907937049865723, + "learning_rate": 5.551819701447832e-06, + "loss": 0.1719, + "step": 24124 + }, + { + "epoch": 65.73569482288828, + "grad_norm": 3.5386910438537598, + "learning_rate": 5.5510293380691494e-06, + "loss": 0.1005, + "step": 24125 + }, + { + "epoch": 65.73841961852861, + "grad_norm": 3.8201828002929688, + "learning_rate": 5.550239009338905e-06, + "loss": 0.0532, + "step": 24126 + }, + { + "epoch": 65.74114441416894, + "grad_norm": 3.731848955154419, + "learning_rate": 5.549448715263252e-06, + "loss": 0.1585, + "step": 24127 + }, + { + "epoch": 65.74386920980926, + "grad_norm": 4.082111358642578, + "learning_rate": 5.548658455848355e-06, + "loss": 0.1388, + "step": 24128 + }, + { + "epoch": 65.7465940054496, + "grad_norm": 2.539555072784424, + "learning_rate": 5.547868231100362e-06, + "loss": 0.1853, + "step": 24129 + }, + { + "epoch": 65.74931880108991, + "grad_norm": 2.4366369247436523, + "learning_rate": 5.547078041025429e-06, + "loss": 0.0285, + "step": 24130 + }, + { + "epoch": 65.75204359673025, + "grad_norm": 8.254321098327637, + "learning_rate": 5.546287885629702e-06, + "loss": 0.0883, + "step": 24131 + }, + { + "epoch": 65.75476839237058, + "grad_norm": 3.6452460289001465, + "learning_rate": 5.545497764919345e-06, + "loss": 0.0628, + "step": 24132 + }, + { + "epoch": 65.7574931880109, + "grad_norm": 4.926702976226807, + "learning_rate": 5.544707678900509e-06, + "loss": 0.0799, + "step": 24133 + }, + { + "epoch": 65.76021798365123, + "grad_norm": 5.784377098083496, + "learning_rate": 5.543917627579347e-06, + "loss": 0.2102, + "step": 24134 + }, + { + "epoch": 65.76294277929155, + "grad_norm": 3.480914831161499, + "learning_rate": 5.543127610962012e-06, + "loss": 0.0499, + "step": 24135 + }, + { + "epoch": 65.76566757493188, + "grad_norm": 3.3300530910491943, + "learning_rate": 5.5423376290546526e-06, + "loss": 0.0835, + "step": 24136 + }, + { + "epoch": 65.7683923705722, + "grad_norm": 2.075978994369507, + "learning_rate": 5.541547681863426e-06, + "loss": 0.0348, + "step": 24137 + }, + { + "epoch": 65.77111716621253, + "grad_norm": 3.2094852924346924, + "learning_rate": 5.5407577693944835e-06, + "loss": 0.1015, + "step": 24138 + }, + { + "epoch": 65.77384196185287, + "grad_norm": 2.8756561279296875, + "learning_rate": 5.539967891653976e-06, + "loss": 0.0686, + "step": 24139 + }, + { + "epoch": 65.77656675749319, + "grad_norm": 2.7848398685455322, + "learning_rate": 5.539178048648051e-06, + "loss": 0.086, + "step": 24140 + }, + { + "epoch": 65.77929155313352, + "grad_norm": 4.2184014320373535, + "learning_rate": 5.538388240382868e-06, + "loss": 0.0904, + "step": 24141 + }, + { + "epoch": 65.78201634877384, + "grad_norm": 3.6957924365997314, + "learning_rate": 5.537598466864574e-06, + "loss": 0.1328, + "step": 24142 + }, + { + "epoch": 65.78474114441417, + "grad_norm": 3.270751714706421, + "learning_rate": 5.536808728099318e-06, + "loss": 0.0708, + "step": 24143 + }, + { + "epoch": 65.7874659400545, + "grad_norm": 3.877631425857544, + "learning_rate": 5.536019024093251e-06, + "loss": 0.0816, + "step": 24144 + }, + { + "epoch": 65.79019073569482, + "grad_norm": 2.9125187397003174, + "learning_rate": 5.535229354852525e-06, + "loss": 0.0552, + "step": 24145 + }, + { + "epoch": 65.79291553133515, + "grad_norm": 3.9231040477752686, + "learning_rate": 5.534439720383291e-06, + "loss": 0.1446, + "step": 24146 + }, + { + "epoch": 65.79564032697547, + "grad_norm": 5.722751617431641, + "learning_rate": 5.533650120691696e-06, + "loss": 0.0868, + "step": 24147 + }, + { + "epoch": 65.7983651226158, + "grad_norm": 4.944255352020264, + "learning_rate": 5.532860555783885e-06, + "loss": 0.0679, + "step": 24148 + }, + { + "epoch": 65.80108991825612, + "grad_norm": 2.7896859645843506, + "learning_rate": 5.5320710256660146e-06, + "loss": 0.0466, + "step": 24149 + }, + { + "epoch": 65.80381471389646, + "grad_norm": 4.166999816894531, + "learning_rate": 5.531281530344235e-06, + "loss": 0.0665, + "step": 24150 + }, + { + "epoch": 65.80653950953679, + "grad_norm": 3.6034128665924072, + "learning_rate": 5.530492069824689e-06, + "loss": 0.1082, + "step": 24151 + }, + { + "epoch": 65.80926430517711, + "grad_norm": 3.5304007530212402, + "learning_rate": 5.529702644113524e-06, + "loss": 0.1821, + "step": 24152 + }, + { + "epoch": 65.81198910081744, + "grad_norm": 3.4963839054107666, + "learning_rate": 5.528913253216896e-06, + "loss": 0.0515, + "step": 24153 + }, + { + "epoch": 65.81471389645776, + "grad_norm": 3.477022409439087, + "learning_rate": 5.528123897140946e-06, + "loss": 0.1316, + "step": 24154 + }, + { + "epoch": 65.8174386920981, + "grad_norm": 5.340469837188721, + "learning_rate": 5.5273345758918225e-06, + "loss": 0.214, + "step": 24155 + }, + { + "epoch": 65.82016348773843, + "grad_norm": 3.8314285278320312, + "learning_rate": 5.526545289475671e-06, + "loss": 0.1361, + "step": 24156 + }, + { + "epoch": 65.82288828337875, + "grad_norm": 4.120553970336914, + "learning_rate": 5.525756037898645e-06, + "loss": 0.1485, + "step": 24157 + }, + { + "epoch": 65.82561307901908, + "grad_norm": 3.0257270336151123, + "learning_rate": 5.524966821166886e-06, + "loss": 0.1318, + "step": 24158 + }, + { + "epoch": 65.8283378746594, + "grad_norm": 4.530957221984863, + "learning_rate": 5.524177639286543e-06, + "loss": 0.1526, + "step": 24159 + }, + { + "epoch": 65.83106267029973, + "grad_norm": 3.710131883621216, + "learning_rate": 5.523388492263755e-06, + "loss": 0.0539, + "step": 24160 + }, + { + "epoch": 65.83378746594005, + "grad_norm": 5.359655857086182, + "learning_rate": 5.522599380104677e-06, + "loss": 0.0565, + "step": 24161 + }, + { + "epoch": 65.83651226158038, + "grad_norm": 4.823092937469482, + "learning_rate": 5.521810302815453e-06, + "loss": 0.0942, + "step": 24162 + }, + { + "epoch": 65.83923705722071, + "grad_norm": 4.227487564086914, + "learning_rate": 5.521021260402224e-06, + "loss": 0.0418, + "step": 24163 + }, + { + "epoch": 65.84196185286103, + "grad_norm": 2.779810905456543, + "learning_rate": 5.520232252871134e-06, + "loss": 0.0756, + "step": 24164 + }, + { + "epoch": 65.84468664850137, + "grad_norm": 3.6005938053131104, + "learning_rate": 5.519443280228335e-06, + "loss": 0.0895, + "step": 24165 + }, + { + "epoch": 65.84741144414168, + "grad_norm": 2.7258284091949463, + "learning_rate": 5.5186543424799636e-06, + "loss": 0.152, + "step": 24166 + }, + { + "epoch": 65.85013623978202, + "grad_norm": 4.038546562194824, + "learning_rate": 5.517865439632173e-06, + "loss": 0.1054, + "step": 24167 + }, + { + "epoch": 65.85286103542235, + "grad_norm": 2.302922248840332, + "learning_rate": 5.517076571691096e-06, + "loss": 0.08, + "step": 24168 + }, + { + "epoch": 65.85558583106267, + "grad_norm": 3.5228846073150635, + "learning_rate": 5.516287738662887e-06, + "loss": 0.0398, + "step": 24169 + }, + { + "epoch": 65.858310626703, + "grad_norm": 2.2264459133148193, + "learning_rate": 5.515498940553685e-06, + "loss": 0.0675, + "step": 24170 + }, + { + "epoch": 65.86103542234332, + "grad_norm": 3.608992576599121, + "learning_rate": 5.514710177369634e-06, + "loss": 0.0973, + "step": 24171 + }, + { + "epoch": 65.86376021798365, + "grad_norm": 2.6364173889160156, + "learning_rate": 5.513921449116871e-06, + "loss": 0.0377, + "step": 24172 + }, + { + "epoch": 65.86648501362397, + "grad_norm": 3.437800645828247, + "learning_rate": 5.5131327558015466e-06, + "loss": 0.0947, + "step": 24173 + }, + { + "epoch": 65.8692098092643, + "grad_norm": 3.5913867950439453, + "learning_rate": 5.512344097429801e-06, + "loss": 0.1357, + "step": 24174 + }, + { + "epoch": 65.87193460490464, + "grad_norm": 6.768052577972412, + "learning_rate": 5.511555474007775e-06, + "loss": 0.1138, + "step": 24175 + }, + { + "epoch": 65.87465940054496, + "grad_norm": 3.4739911556243896, + "learning_rate": 5.510766885541606e-06, + "loss": 0.0492, + "step": 24176 + }, + { + "epoch": 65.87738419618529, + "grad_norm": 4.011838912963867, + "learning_rate": 5.509978332037444e-06, + "loss": 0.1477, + "step": 24177 + }, + { + "epoch": 65.88010899182561, + "grad_norm": 4.0436692237854, + "learning_rate": 5.509189813501427e-06, + "loss": 0.0764, + "step": 24178 + }, + { + "epoch": 65.88283378746594, + "grad_norm": 3.490626335144043, + "learning_rate": 5.508401329939695e-06, + "loss": 0.0556, + "step": 24179 + }, + { + "epoch": 65.88555858310627, + "grad_norm": 4.4941487312316895, + "learning_rate": 5.507612881358384e-06, + "loss": 0.2727, + "step": 24180 + }, + { + "epoch": 65.88828337874659, + "grad_norm": 7.636957168579102, + "learning_rate": 5.506824467763645e-06, + "loss": 0.0851, + "step": 24181 + }, + { + "epoch": 65.89100817438693, + "grad_norm": 3.2159922122955322, + "learning_rate": 5.506036089161611e-06, + "loss": 0.0683, + "step": 24182 + }, + { + "epoch": 65.89373297002724, + "grad_norm": 3.8589589595794678, + "learning_rate": 5.505247745558419e-06, + "loss": 0.0811, + "step": 24183 + }, + { + "epoch": 65.89645776566758, + "grad_norm": 3.433084726333618, + "learning_rate": 5.504459436960218e-06, + "loss": 0.0632, + "step": 24184 + }, + { + "epoch": 65.8991825613079, + "grad_norm": 3.2560300827026367, + "learning_rate": 5.5036711633731375e-06, + "loss": 0.06, + "step": 24185 + }, + { + "epoch": 65.90190735694823, + "grad_norm": 3.7079596519470215, + "learning_rate": 5.502882924803326e-06, + "loss": 0.0864, + "step": 24186 + }, + { + "epoch": 65.90463215258856, + "grad_norm": 3.2791967391967773, + "learning_rate": 5.502094721256916e-06, + "loss": 0.0716, + "step": 24187 + }, + { + "epoch": 65.90735694822888, + "grad_norm": 3.8873748779296875, + "learning_rate": 5.501306552740049e-06, + "loss": 0.0429, + "step": 24188 + }, + { + "epoch": 65.91008174386921, + "grad_norm": 3.6260781288146973, + "learning_rate": 5.500518419258858e-06, + "loss": 0.1358, + "step": 24189 + }, + { + "epoch": 65.91280653950953, + "grad_norm": 3.118328332901001, + "learning_rate": 5.499730320819487e-06, + "loss": 0.0476, + "step": 24190 + }, + { + "epoch": 65.91553133514986, + "grad_norm": 2.7150537967681885, + "learning_rate": 5.498942257428073e-06, + "loss": 0.0793, + "step": 24191 + }, + { + "epoch": 65.9182561307902, + "grad_norm": 3.9062442779541016, + "learning_rate": 5.498154229090748e-06, + "loss": 0.0791, + "step": 24192 + }, + { + "epoch": 65.92098092643052, + "grad_norm": 3.698467493057251, + "learning_rate": 5.497366235813656e-06, + "loss": 0.1608, + "step": 24193 + }, + { + "epoch": 65.92370572207085, + "grad_norm": 4.635098457336426, + "learning_rate": 5.496578277602931e-06, + "loss": 0.0595, + "step": 24194 + }, + { + "epoch": 65.92643051771117, + "grad_norm": 3.7649402618408203, + "learning_rate": 5.49579035446471e-06, + "loss": 0.1043, + "step": 24195 + }, + { + "epoch": 65.9291553133515, + "grad_norm": 2.6555700302124023, + "learning_rate": 5.495002466405124e-06, + "loss": 0.0343, + "step": 24196 + }, + { + "epoch": 65.93188010899182, + "grad_norm": 4.743636131286621, + "learning_rate": 5.4942146134303175e-06, + "loss": 0.0989, + "step": 24197 + }, + { + "epoch": 65.93460490463215, + "grad_norm": 2.9609110355377197, + "learning_rate": 5.493426795546424e-06, + "loss": 0.1368, + "step": 24198 + }, + { + "epoch": 65.93732970027249, + "grad_norm": 2.9740395545959473, + "learning_rate": 5.492639012759576e-06, + "loss": 0.1373, + "step": 24199 + }, + { + "epoch": 65.9400544959128, + "grad_norm": 4.133841514587402, + "learning_rate": 5.491851265075907e-06, + "loss": 0.0728, + "step": 24200 + }, + { + "epoch": 65.94277929155314, + "grad_norm": 3.930466651916504, + "learning_rate": 5.491063552501557e-06, + "loss": 0.1177, + "step": 24201 + }, + { + "epoch": 65.94550408719346, + "grad_norm": 3.093852996826172, + "learning_rate": 5.4902758750426596e-06, + "loss": 0.1674, + "step": 24202 + }, + { + "epoch": 65.94822888283379, + "grad_norm": 9.726191520690918, + "learning_rate": 5.489488232705351e-06, + "loss": 0.0435, + "step": 24203 + }, + { + "epoch": 65.95095367847412, + "grad_norm": 3.5312047004699707, + "learning_rate": 5.488700625495762e-06, + "loss": 0.1013, + "step": 24204 + }, + { + "epoch": 65.95367847411444, + "grad_norm": 3.8236422538757324, + "learning_rate": 5.487913053420023e-06, + "loss": 0.0735, + "step": 24205 + }, + { + "epoch": 65.95640326975477, + "grad_norm": 4.338160037994385, + "learning_rate": 5.487125516484276e-06, + "loss": 0.1414, + "step": 24206 + }, + { + "epoch": 65.95912806539509, + "grad_norm": 2.083596706390381, + "learning_rate": 5.486338014694651e-06, + "loss": 0.0296, + "step": 24207 + }, + { + "epoch": 65.96185286103542, + "grad_norm": 2.7186203002929688, + "learning_rate": 5.485550548057279e-06, + "loss": 0.0425, + "step": 24208 + }, + { + "epoch": 65.96457765667574, + "grad_norm": 4.528669834136963, + "learning_rate": 5.4847631165782914e-06, + "loss": 0.0521, + "step": 24209 + }, + { + "epoch": 65.96730245231608, + "grad_norm": 2.236259698867798, + "learning_rate": 5.483975720263827e-06, + "loss": 0.0689, + "step": 24210 + }, + { + "epoch": 65.97002724795641, + "grad_norm": 5.090316295623779, + "learning_rate": 5.4831883591200145e-06, + "loss": 0.1475, + "step": 24211 + }, + { + "epoch": 65.97275204359673, + "grad_norm": 3.0475664138793945, + "learning_rate": 5.482401033152984e-06, + "loss": 0.1759, + "step": 24212 + }, + { + "epoch": 65.97547683923706, + "grad_norm": 5.212029457092285, + "learning_rate": 5.481613742368868e-06, + "loss": 0.2215, + "step": 24213 + }, + { + "epoch": 65.97820163487738, + "grad_norm": 3.1095752716064453, + "learning_rate": 5.4808264867738e-06, + "loss": 0.0509, + "step": 24214 + }, + { + "epoch": 65.98092643051771, + "grad_norm": 3.6840479373931885, + "learning_rate": 5.480039266373911e-06, + "loss": 0.0353, + "step": 24215 + }, + { + "epoch": 65.98365122615803, + "grad_norm": 2.972705841064453, + "learning_rate": 5.479252081175326e-06, + "loss": 0.1874, + "step": 24216 + }, + { + "epoch": 65.98637602179836, + "grad_norm": 3.9125068187713623, + "learning_rate": 5.478464931184186e-06, + "loss": 0.0907, + "step": 24217 + }, + { + "epoch": 65.9891008174387, + "grad_norm": 3.8430469036102295, + "learning_rate": 5.477677816406611e-06, + "loss": 0.1185, + "step": 24218 + }, + { + "epoch": 65.99182561307902, + "grad_norm": 13.997435569763184, + "learning_rate": 5.4768907368487375e-06, + "loss": 0.0862, + "step": 24219 + }, + { + "epoch": 65.99455040871935, + "grad_norm": 5.113949775695801, + "learning_rate": 5.4761036925166946e-06, + "loss": 0.1009, + "step": 24220 + }, + { + "epoch": 65.99727520435967, + "grad_norm": 2.952927589416504, + "learning_rate": 5.475316683416607e-06, + "loss": 0.0448, + "step": 24221 + }, + { + "epoch": 66.0, + "grad_norm": 2.908334493637085, + "learning_rate": 5.4745297095546125e-06, + "loss": 0.1382, + "step": 24222 + }, + { + "epoch": 66.00272479564033, + "grad_norm": 4.744135856628418, + "learning_rate": 5.4737427709368326e-06, + "loss": 0.067, + "step": 24223 + }, + { + "epoch": 66.00544959128065, + "grad_norm": 3.928037166595459, + "learning_rate": 5.472955867569399e-06, + "loss": 0.0739, + "step": 24224 + }, + { + "epoch": 66.00817438692098, + "grad_norm": 4.2218427658081055, + "learning_rate": 5.472168999458436e-06, + "loss": 0.1286, + "step": 24225 + }, + { + "epoch": 66.0108991825613, + "grad_norm": 3.494382381439209, + "learning_rate": 5.4713821666100794e-06, + "loss": 0.0475, + "step": 24226 + }, + { + "epoch": 66.01362397820164, + "grad_norm": 3.000708818435669, + "learning_rate": 5.470595369030453e-06, + "loss": 0.0377, + "step": 24227 + }, + { + "epoch": 66.01634877384195, + "grad_norm": 3.6476948261260986, + "learning_rate": 5.4698086067256826e-06, + "loss": 0.0524, + "step": 24228 + }, + { + "epoch": 66.01907356948229, + "grad_norm": 3.2138516902923584, + "learning_rate": 5.469021879701895e-06, + "loss": 0.1095, + "step": 24229 + }, + { + "epoch": 66.02179836512262, + "grad_norm": 2.9181294441223145, + "learning_rate": 5.468235187965221e-06, + "loss": 0.0985, + "step": 24230 + }, + { + "epoch": 66.02452316076294, + "grad_norm": 2.7947864532470703, + "learning_rate": 5.467448531521786e-06, + "loss": 0.1065, + "step": 24231 + }, + { + "epoch": 66.02724795640327, + "grad_norm": 3.4363908767700195, + "learning_rate": 5.466661910377717e-06, + "loss": 0.0713, + "step": 24232 + }, + { + "epoch": 66.02997275204359, + "grad_norm": 5.255629539489746, + "learning_rate": 5.465875324539134e-06, + "loss": 0.2178, + "step": 24233 + }, + { + "epoch": 66.03269754768392, + "grad_norm": 2.9164540767669678, + "learning_rate": 5.465088774012172e-06, + "loss": 0.0578, + "step": 24234 + }, + { + "epoch": 66.03542234332426, + "grad_norm": 2.8132989406585693, + "learning_rate": 5.464302258802949e-06, + "loss": 0.0379, + "step": 24235 + }, + { + "epoch": 66.03814713896458, + "grad_norm": 3.0949575901031494, + "learning_rate": 5.463515778917598e-06, + "loss": 0.0759, + "step": 24236 + }, + { + "epoch": 66.04087193460491, + "grad_norm": 4.194434642791748, + "learning_rate": 5.462729334362238e-06, + "loss": 0.1513, + "step": 24237 + }, + { + "epoch": 66.04359673024523, + "grad_norm": 7.156740188598633, + "learning_rate": 5.461942925142998e-06, + "loss": 0.1032, + "step": 24238 + }, + { + "epoch": 66.04632152588556, + "grad_norm": 3.326951742172241, + "learning_rate": 5.4611565512660005e-06, + "loss": 0.0777, + "step": 24239 + }, + { + "epoch": 66.04904632152588, + "grad_norm": 4.344686508178711, + "learning_rate": 5.46037021273737e-06, + "loss": 0.0969, + "step": 24240 + }, + { + "epoch": 66.05177111716621, + "grad_norm": 3.5357677936553955, + "learning_rate": 5.459583909563226e-06, + "loss": 0.0591, + "step": 24241 + }, + { + "epoch": 66.05449591280654, + "grad_norm": 5.435465335845947, + "learning_rate": 5.4587976417497e-06, + "loss": 0.182, + "step": 24242 + }, + { + "epoch": 66.05722070844686, + "grad_norm": 2.5353848934173584, + "learning_rate": 5.458011409302913e-06, + "loss": 0.0453, + "step": 24243 + }, + { + "epoch": 66.0599455040872, + "grad_norm": 4.735696315765381, + "learning_rate": 5.457225212228987e-06, + "loss": 0.0537, + "step": 24244 + }, + { + "epoch": 66.06267029972751, + "grad_norm": 3.0745997428894043, + "learning_rate": 5.456439050534039e-06, + "loss": 0.0733, + "step": 24245 + }, + { + "epoch": 66.06539509536785, + "grad_norm": 3.17090106010437, + "learning_rate": 5.455652924224203e-06, + "loss": 0.1197, + "step": 24246 + }, + { + "epoch": 66.06811989100818, + "grad_norm": 3.086277961730957, + "learning_rate": 5.4548668333055954e-06, + "loss": 0.0427, + "step": 24247 + }, + { + "epoch": 66.0708446866485, + "grad_norm": 3.164388418197632, + "learning_rate": 5.454080777784338e-06, + "loss": 0.1118, + "step": 24248 + }, + { + "epoch": 66.07356948228883, + "grad_norm": 3.5116429328918457, + "learning_rate": 5.453294757666549e-06, + "loss": 0.0553, + "step": 24249 + }, + { + "epoch": 66.07629427792915, + "grad_norm": 2.788637638092041, + "learning_rate": 5.45250877295836e-06, + "loss": 0.0515, + "step": 24250 + }, + { + "epoch": 66.07901907356948, + "grad_norm": 2.9801645278930664, + "learning_rate": 5.451722823665885e-06, + "loss": 0.1824, + "step": 24251 + }, + { + "epoch": 66.0817438692098, + "grad_norm": 2.963919162750244, + "learning_rate": 5.4509369097952425e-06, + "loss": 0.111, + "step": 24252 + }, + { + "epoch": 66.08446866485014, + "grad_norm": 3.0374701023101807, + "learning_rate": 5.45015103135256e-06, + "loss": 0.0937, + "step": 24253 + }, + { + "epoch": 66.08719346049047, + "grad_norm": 3.2187795639038086, + "learning_rate": 5.449365188343952e-06, + "loss": 0.1229, + "step": 24254 + }, + { + "epoch": 66.08991825613079, + "grad_norm": 2.594090461730957, + "learning_rate": 5.448579380775545e-06, + "loss": 0.0431, + "step": 24255 + }, + { + "epoch": 66.09264305177112, + "grad_norm": 4.707623481750488, + "learning_rate": 5.447793608653456e-06, + "loss": 0.049, + "step": 24256 + }, + { + "epoch": 66.09536784741144, + "grad_norm": 3.289013385772705, + "learning_rate": 5.447007871983799e-06, + "loss": 0.0673, + "step": 24257 + }, + { + "epoch": 66.09809264305177, + "grad_norm": 3.820110321044922, + "learning_rate": 5.446222170772703e-06, + "loss": 0.053, + "step": 24258 + }, + { + "epoch": 66.1008174386921, + "grad_norm": 2.688070774078369, + "learning_rate": 5.44543650502628e-06, + "loss": 0.0321, + "step": 24259 + }, + { + "epoch": 66.10354223433242, + "grad_norm": 3.359084129333496, + "learning_rate": 5.444650874750654e-06, + "loss": 0.1136, + "step": 24260 + }, + { + "epoch": 66.10626702997276, + "grad_norm": 2.812195062637329, + "learning_rate": 5.443865279951934e-06, + "loss": 0.0778, + "step": 24261 + }, + { + "epoch": 66.10899182561307, + "grad_norm": 2.4813084602355957, + "learning_rate": 5.443079720636251e-06, + "loss": 0.1395, + "step": 24262 + }, + { + "epoch": 66.11171662125341, + "grad_norm": 4.899084568023682, + "learning_rate": 5.4422941968097145e-06, + "loss": 0.0998, + "step": 24263 + }, + { + "epoch": 66.11444141689373, + "grad_norm": 2.6284587383270264, + "learning_rate": 5.441508708478444e-06, + "loss": 0.1984, + "step": 24264 + }, + { + "epoch": 66.11716621253406, + "grad_norm": 3.3272786140441895, + "learning_rate": 5.440723255648553e-06, + "loss": 0.0589, + "step": 24265 + }, + { + "epoch": 66.11989100817439, + "grad_norm": 2.6776010990142822, + "learning_rate": 5.439937838326168e-06, + "loss": 0.0539, + "step": 24266 + }, + { + "epoch": 66.12261580381471, + "grad_norm": 2.8808488845825195, + "learning_rate": 5.439152456517398e-06, + "loss": 0.083, + "step": 24267 + }, + { + "epoch": 66.12534059945504, + "grad_norm": 2.9243571758270264, + "learning_rate": 5.438367110228364e-06, + "loss": 0.0718, + "step": 24268 + }, + { + "epoch": 66.12806539509536, + "grad_norm": 2.8457818031311035, + "learning_rate": 5.437581799465174e-06, + "loss": 0.1266, + "step": 24269 + }, + { + "epoch": 66.1307901907357, + "grad_norm": 3.4168143272399902, + "learning_rate": 5.436796524233953e-06, + "loss": 0.1344, + "step": 24270 + }, + { + "epoch": 66.13351498637603, + "grad_norm": 4.4502482414245605, + "learning_rate": 5.436011284540816e-06, + "loss": 0.0456, + "step": 24271 + }, + { + "epoch": 66.13623978201635, + "grad_norm": 3.203949451446533, + "learning_rate": 5.435226080391876e-06, + "loss": 0.1046, + "step": 24272 + }, + { + "epoch": 66.13896457765668, + "grad_norm": 5.92611026763916, + "learning_rate": 5.43444091179325e-06, + "loss": 0.0545, + "step": 24273 + }, + { + "epoch": 66.141689373297, + "grad_norm": 2.4659831523895264, + "learning_rate": 5.433655778751046e-06, + "loss": 0.1484, + "step": 24274 + }, + { + "epoch": 66.14441416893733, + "grad_norm": 2.714594841003418, + "learning_rate": 5.432870681271387e-06, + "loss": 0.1633, + "step": 24275 + }, + { + "epoch": 66.14713896457765, + "grad_norm": 5.0077056884765625, + "learning_rate": 5.432085619360385e-06, + "loss": 0.1349, + "step": 24276 + }, + { + "epoch": 66.14986376021798, + "grad_norm": 3.6828205585479736, + "learning_rate": 5.431300593024154e-06, + "loss": 0.0866, + "step": 24277 + }, + { + "epoch": 66.15258855585832, + "grad_norm": 3.1793949604034424, + "learning_rate": 5.430515602268802e-06, + "loss": 0.104, + "step": 24278 + }, + { + "epoch": 66.15531335149863, + "grad_norm": 3.393775701522827, + "learning_rate": 5.429730647100452e-06, + "loss": 0.185, + "step": 24279 + }, + { + "epoch": 66.15803814713897, + "grad_norm": 2.9456627368927, + "learning_rate": 5.428945727525212e-06, + "loss": 0.0303, + "step": 24280 + }, + { + "epoch": 66.16076294277929, + "grad_norm": 7.299849510192871, + "learning_rate": 5.428160843549192e-06, + "loss": 0.1888, + "step": 24281 + }, + { + "epoch": 66.16348773841962, + "grad_norm": 3.188413143157959, + "learning_rate": 5.427375995178512e-06, + "loss": 0.0408, + "step": 24282 + }, + { + "epoch": 66.16621253405995, + "grad_norm": 3.6501407623291016, + "learning_rate": 5.426591182419281e-06, + "loss": 0.2349, + "step": 24283 + }, + { + "epoch": 66.16893732970027, + "grad_norm": 4.452661514282227, + "learning_rate": 5.425806405277609e-06, + "loss": 0.2183, + "step": 24284 + }, + { + "epoch": 66.1716621253406, + "grad_norm": 3.6181628704071045, + "learning_rate": 5.425021663759607e-06, + "loss": 0.0525, + "step": 24285 + }, + { + "epoch": 66.17438692098092, + "grad_norm": 3.887105703353882, + "learning_rate": 5.424236957871389e-06, + "loss": 0.1238, + "step": 24286 + }, + { + "epoch": 66.17711171662125, + "grad_norm": 2.744150161743164, + "learning_rate": 5.423452287619071e-06, + "loss": 0.0421, + "step": 24287 + }, + { + "epoch": 66.17983651226157, + "grad_norm": 5.4936981201171875, + "learning_rate": 5.4226676530087575e-06, + "loss": 0.0257, + "step": 24288 + }, + { + "epoch": 66.1825613079019, + "grad_norm": 2.7765650749206543, + "learning_rate": 5.421883054046562e-06, + "loss": 0.0715, + "step": 24289 + }, + { + "epoch": 66.18528610354224, + "grad_norm": 3.0034921169281006, + "learning_rate": 5.42109849073859e-06, + "loss": 0.0443, + "step": 24290 + }, + { + "epoch": 66.18801089918256, + "grad_norm": 2.518137216567993, + "learning_rate": 5.42031396309096e-06, + "loss": 0.116, + "step": 24291 + }, + { + "epoch": 66.19073569482289, + "grad_norm": 2.664363145828247, + "learning_rate": 5.4195294711097766e-06, + "loss": 0.0469, + "step": 24292 + }, + { + "epoch": 66.19346049046321, + "grad_norm": 2.527747631072998, + "learning_rate": 5.41874501480115e-06, + "loss": 0.0589, + "step": 24293 + }, + { + "epoch": 66.19618528610354, + "grad_norm": 4.242908954620361, + "learning_rate": 5.417960594171187e-06, + "loss": 0.0872, + "step": 24294 + }, + { + "epoch": 66.19891008174388, + "grad_norm": 2.8034889698028564, + "learning_rate": 5.417176209226003e-06, + "loss": 0.0412, + "step": 24295 + }, + { + "epoch": 66.2016348773842, + "grad_norm": 2.995678663253784, + "learning_rate": 5.4163918599717015e-06, + "loss": 0.0459, + "step": 24296 + }, + { + "epoch": 66.20435967302453, + "grad_norm": 2.9752919673919678, + "learning_rate": 5.415607546414394e-06, + "loss": 0.1032, + "step": 24297 + }, + { + "epoch": 66.20708446866485, + "grad_norm": 3.64369535446167, + "learning_rate": 5.414823268560184e-06, + "loss": 0.1894, + "step": 24298 + }, + { + "epoch": 66.20980926430518, + "grad_norm": 6.802177906036377, + "learning_rate": 5.414039026415187e-06, + "loss": 0.0524, + "step": 24299 + }, + { + "epoch": 66.2125340599455, + "grad_norm": 3.8642148971557617, + "learning_rate": 5.413254819985505e-06, + "loss": 0.0839, + "step": 24300 + }, + { + "epoch": 66.21525885558583, + "grad_norm": 3.5432136058807373, + "learning_rate": 5.412470649277244e-06, + "loss": 0.0668, + "step": 24301 + }, + { + "epoch": 66.21798365122616, + "grad_norm": 2.77707839012146, + "learning_rate": 5.411686514296517e-06, + "loss": 0.0738, + "step": 24302 + }, + { + "epoch": 66.22070844686648, + "grad_norm": 2.6112751960754395, + "learning_rate": 5.410902415049428e-06, + "loss": 0.0455, + "step": 24303 + }, + { + "epoch": 66.22343324250681, + "grad_norm": 2.9880340099334717, + "learning_rate": 5.410118351542079e-06, + "loss": 0.089, + "step": 24304 + }, + { + "epoch": 66.22615803814713, + "grad_norm": 4.272844314575195, + "learning_rate": 5.409334323780586e-06, + "loss": 0.0798, + "step": 24305 + }, + { + "epoch": 66.22888283378747, + "grad_norm": 3.6603877544403076, + "learning_rate": 5.408550331771045e-06, + "loss": 0.2148, + "step": 24306 + }, + { + "epoch": 66.2316076294278, + "grad_norm": 2.74448561668396, + "learning_rate": 5.40776637551957e-06, + "loss": 0.0391, + "step": 24307 + }, + { + "epoch": 66.23433242506812, + "grad_norm": 13.26368522644043, + "learning_rate": 5.4069824550322614e-06, + "loss": 0.1095, + "step": 24308 + }, + { + "epoch": 66.23705722070845, + "grad_norm": 3.366335391998291, + "learning_rate": 5.406198570315227e-06, + "loss": 0.073, + "step": 24309 + }, + { + "epoch": 66.23978201634877, + "grad_norm": 3.413801431655884, + "learning_rate": 5.405414721374567e-06, + "loss": 0.0339, + "step": 24310 + }, + { + "epoch": 66.2425068119891, + "grad_norm": 3.139404535293579, + "learning_rate": 5.404630908216391e-06, + "loss": 0.109, + "step": 24311 + }, + { + "epoch": 66.24523160762942, + "grad_norm": 3.3953793048858643, + "learning_rate": 5.4038471308468046e-06, + "loss": 0.0455, + "step": 24312 + }, + { + "epoch": 66.24795640326975, + "grad_norm": 4.085725784301758, + "learning_rate": 5.403063389271906e-06, + "loss": 0.1498, + "step": 24313 + }, + { + "epoch": 66.25068119891009, + "grad_norm": 3.603846311569214, + "learning_rate": 5.4022796834978e-06, + "loss": 0.1901, + "step": 24314 + }, + { + "epoch": 66.2534059945504, + "grad_norm": 3.5509657859802246, + "learning_rate": 5.401496013530594e-06, + "loss": 0.138, + "step": 24315 + }, + { + "epoch": 66.25613079019074, + "grad_norm": 3.6874115467071533, + "learning_rate": 5.400712379376389e-06, + "loss": 0.1103, + "step": 24316 + }, + { + "epoch": 66.25885558583106, + "grad_norm": 3.6496448516845703, + "learning_rate": 5.399928781041289e-06, + "loss": 0.1321, + "step": 24317 + }, + { + "epoch": 66.26158038147139, + "grad_norm": 3.424882650375366, + "learning_rate": 5.399145218531392e-06, + "loss": 0.0404, + "step": 24318 + }, + { + "epoch": 66.26430517711172, + "grad_norm": 2.8604648113250732, + "learning_rate": 5.398361691852807e-06, + "loss": 0.0482, + "step": 24319 + }, + { + "epoch": 66.26702997275204, + "grad_norm": 3.9597084522247314, + "learning_rate": 5.397578201011633e-06, + "loss": 0.2066, + "step": 24320 + }, + { + "epoch": 66.26975476839237, + "grad_norm": 3.7965893745422363, + "learning_rate": 5.396794746013969e-06, + "loss": 0.1034, + "step": 24321 + }, + { + "epoch": 66.2724795640327, + "grad_norm": 2.308955192565918, + "learning_rate": 5.396011326865918e-06, + "loss": 0.0803, + "step": 24322 + }, + { + "epoch": 66.27520435967303, + "grad_norm": 3.434704303741455, + "learning_rate": 5.395227943573588e-06, + "loss": 0.0408, + "step": 24323 + }, + { + "epoch": 66.27792915531334, + "grad_norm": 12.772610664367676, + "learning_rate": 5.394444596143074e-06, + "loss": 0.0785, + "step": 24324 + }, + { + "epoch": 66.28065395095368, + "grad_norm": 4.06698751449585, + "learning_rate": 5.393661284580476e-06, + "loss": 0.2114, + "step": 24325 + }, + { + "epoch": 66.28337874659401, + "grad_norm": 4.142553806304932, + "learning_rate": 5.392878008891893e-06, + "loss": 0.0809, + "step": 24326 + }, + { + "epoch": 66.28610354223433, + "grad_norm": 4.444906711578369, + "learning_rate": 5.3920947690834315e-06, + "loss": 0.2025, + "step": 24327 + }, + { + "epoch": 66.28882833787466, + "grad_norm": 4.779823303222656, + "learning_rate": 5.391311565161188e-06, + "loss": 0.0845, + "step": 24328 + }, + { + "epoch": 66.29155313351498, + "grad_norm": 3.2991936206817627, + "learning_rate": 5.39052839713126e-06, + "loss": 0.2644, + "step": 24329 + }, + { + "epoch": 66.29427792915531, + "grad_norm": 6.251668453216553, + "learning_rate": 5.389745264999746e-06, + "loss": 0.0719, + "step": 24330 + }, + { + "epoch": 66.29700272479565, + "grad_norm": 2.9856066703796387, + "learning_rate": 5.388962168772751e-06, + "loss": 0.0553, + "step": 24331 + }, + { + "epoch": 66.29972752043597, + "grad_norm": 6.136131286621094, + "learning_rate": 5.388179108456371e-06, + "loss": 0.1126, + "step": 24332 + }, + { + "epoch": 66.3024523160763, + "grad_norm": 3.4155325889587402, + "learning_rate": 5.387396084056704e-06, + "loss": 0.1678, + "step": 24333 + }, + { + "epoch": 66.30517711171662, + "grad_norm": 2.889922618865967, + "learning_rate": 5.386613095579842e-06, + "loss": 0.0481, + "step": 24334 + }, + { + "epoch": 66.30790190735695, + "grad_norm": 2.9885833263397217, + "learning_rate": 5.385830143031894e-06, + "loss": 0.0802, + "step": 24335 + }, + { + "epoch": 66.31062670299727, + "grad_norm": 3.7668232917785645, + "learning_rate": 5.385047226418953e-06, + "loss": 0.0485, + "step": 24336 + }, + { + "epoch": 66.3133514986376, + "grad_norm": 2.5551421642303467, + "learning_rate": 5.384264345747114e-06, + "loss": 0.0465, + "step": 24337 + }, + { + "epoch": 66.31607629427793, + "grad_norm": 2.507850408554077, + "learning_rate": 5.383481501022472e-06, + "loss": 0.034, + "step": 24338 + }, + { + "epoch": 66.31880108991825, + "grad_norm": 4.48660945892334, + "learning_rate": 5.382698692251128e-06, + "loss": 0.052, + "step": 24339 + }, + { + "epoch": 66.32152588555859, + "grad_norm": 3.4189884662628174, + "learning_rate": 5.381915919439182e-06, + "loss": 0.2075, + "step": 24340 + }, + { + "epoch": 66.3242506811989, + "grad_norm": 3.596912384033203, + "learning_rate": 5.381133182592726e-06, + "loss": 0.0506, + "step": 24341 + }, + { + "epoch": 66.32697547683924, + "grad_norm": 2.990658760070801, + "learning_rate": 5.380350481717853e-06, + "loss": 0.1349, + "step": 24342 + }, + { + "epoch": 66.32970027247957, + "grad_norm": 3.235776901245117, + "learning_rate": 5.379567816820664e-06, + "loss": 0.0529, + "step": 24343 + }, + { + "epoch": 66.33242506811989, + "grad_norm": 5.018767356872559, + "learning_rate": 5.378785187907254e-06, + "loss": 0.1797, + "step": 24344 + }, + { + "epoch": 66.33514986376022, + "grad_norm": 2.745403528213501, + "learning_rate": 5.378002594983715e-06, + "loss": 0.034, + "step": 24345 + }, + { + "epoch": 66.33787465940054, + "grad_norm": 3.718411684036255, + "learning_rate": 5.377220038056139e-06, + "loss": 0.0623, + "step": 24346 + }, + { + "epoch": 66.34059945504087, + "grad_norm": 2.6147892475128174, + "learning_rate": 5.376437517130629e-06, + "loss": 0.0675, + "step": 24347 + }, + { + "epoch": 66.34332425068119, + "grad_norm": 3.535597324371338, + "learning_rate": 5.375655032213275e-06, + "loss": 0.1465, + "step": 24348 + }, + { + "epoch": 66.34604904632153, + "grad_norm": 3.055279493331909, + "learning_rate": 5.374872583310171e-06, + "loss": 0.127, + "step": 24349 + }, + { + "epoch": 66.34877384196186, + "grad_norm": 3.0705902576446533, + "learning_rate": 5.3740901704274065e-06, + "loss": 0.1877, + "step": 24350 + }, + { + "epoch": 66.35149863760218, + "grad_norm": 3.3683879375457764, + "learning_rate": 5.373307793571081e-06, + "loss": 0.1183, + "step": 24351 + }, + { + "epoch": 66.35422343324251, + "grad_norm": 3.221919059753418, + "learning_rate": 5.372525452747288e-06, + "loss": 0.0942, + "step": 24352 + }, + { + "epoch": 66.35694822888283, + "grad_norm": 3.9317526817321777, + "learning_rate": 5.3717431479621164e-06, + "loss": 0.1732, + "step": 24353 + }, + { + "epoch": 66.35967302452316, + "grad_norm": 4.337979793548584, + "learning_rate": 5.370960879221656e-06, + "loss": 0.038, + "step": 24354 + }, + { + "epoch": 66.3623978201635, + "grad_norm": 3.9914824962615967, + "learning_rate": 5.370178646532004e-06, + "loss": 0.0724, + "step": 24355 + }, + { + "epoch": 66.36512261580381, + "grad_norm": 3.8431718349456787, + "learning_rate": 5.369396449899256e-06, + "loss": 0.1155, + "step": 24356 + }, + { + "epoch": 66.36784741144415, + "grad_norm": 4.0201239585876465, + "learning_rate": 5.368614289329499e-06, + "loss": 0.0864, + "step": 24357 + }, + { + "epoch": 66.37057220708446, + "grad_norm": 8.328060150146484, + "learning_rate": 5.367832164828823e-06, + "loss": 0.1455, + "step": 24358 + }, + { + "epoch": 66.3732970027248, + "grad_norm": 3.160085678100586, + "learning_rate": 5.367050076403319e-06, + "loss": 0.0564, + "step": 24359 + }, + { + "epoch": 66.37602179836512, + "grad_norm": 2.751584529876709, + "learning_rate": 5.366268024059085e-06, + "loss": 0.0621, + "step": 24360 + }, + { + "epoch": 66.37874659400545, + "grad_norm": 3.876132011413574, + "learning_rate": 5.365486007802206e-06, + "loss": 0.0941, + "step": 24361 + }, + { + "epoch": 66.38147138964578, + "grad_norm": 2.637402057647705, + "learning_rate": 5.3647040276387695e-06, + "loss": 0.133, + "step": 24362 + }, + { + "epoch": 66.3841961852861, + "grad_norm": 3.3070435523986816, + "learning_rate": 5.363922083574869e-06, + "loss": 0.0534, + "step": 24363 + }, + { + "epoch": 66.38692098092643, + "grad_norm": 6.5956830978393555, + "learning_rate": 5.363140175616596e-06, + "loss": 0.1527, + "step": 24364 + }, + { + "epoch": 66.38964577656675, + "grad_norm": 3.4426121711730957, + "learning_rate": 5.362358303770039e-06, + "loss": 0.1852, + "step": 24365 + }, + { + "epoch": 66.39237057220708, + "grad_norm": 4.032536029815674, + "learning_rate": 5.36157646804128e-06, + "loss": 0.0495, + "step": 24366 + }, + { + "epoch": 66.39509536784742, + "grad_norm": 3.3472368717193604, + "learning_rate": 5.360794668436421e-06, + "loss": 0.1474, + "step": 24367 + }, + { + "epoch": 66.39782016348774, + "grad_norm": 6.354490756988525, + "learning_rate": 5.360012904961542e-06, + "loss": 0.0648, + "step": 24368 + }, + { + "epoch": 66.40054495912807, + "grad_norm": 3.3422086238861084, + "learning_rate": 5.359231177622735e-06, + "loss": 0.1479, + "step": 24369 + }, + { + "epoch": 66.40326975476839, + "grad_norm": 4.014708042144775, + "learning_rate": 5.358449486426081e-06, + "loss": 0.0974, + "step": 24370 + }, + { + "epoch": 66.40599455040872, + "grad_norm": 2.181469678878784, + "learning_rate": 5.357667831377676e-06, + "loss": 0.0366, + "step": 24371 + }, + { + "epoch": 66.40871934604904, + "grad_norm": 6.039536952972412, + "learning_rate": 5.356886212483603e-06, + "loss": 0.3392, + "step": 24372 + }, + { + "epoch": 66.41144414168937, + "grad_norm": 3.6809701919555664, + "learning_rate": 5.356104629749952e-06, + "loss": 0.1699, + "step": 24373 + }, + { + "epoch": 66.4141689373297, + "grad_norm": 4.135191440582275, + "learning_rate": 5.355323083182811e-06, + "loss": 0.1575, + "step": 24374 + }, + { + "epoch": 66.41689373297002, + "grad_norm": 2.894618272781372, + "learning_rate": 5.354541572788259e-06, + "loss": 0.0403, + "step": 24375 + }, + { + "epoch": 66.41961852861036, + "grad_norm": 3.449108123779297, + "learning_rate": 5.353760098572393e-06, + "loss": 0.0643, + "step": 24376 + }, + { + "epoch": 66.42234332425068, + "grad_norm": 5.413773059844971, + "learning_rate": 5.3529786605412925e-06, + "loss": 0.133, + "step": 24377 + }, + { + "epoch": 66.42506811989101, + "grad_norm": 2.243168592453003, + "learning_rate": 5.352197258701044e-06, + "loss": 0.0437, + "step": 24378 + }, + { + "epoch": 66.42779291553134, + "grad_norm": 4.364460468292236, + "learning_rate": 5.351415893057732e-06, + "loss": 0.1098, + "step": 24379 + }, + { + "epoch": 66.43051771117166, + "grad_norm": 2.627695083618164, + "learning_rate": 5.350634563617445e-06, + "loss": 0.041, + "step": 24380 + }, + { + "epoch": 66.433242506812, + "grad_norm": 7.7000627517700195, + "learning_rate": 5.3498532703862685e-06, + "loss": 0.1024, + "step": 24381 + }, + { + "epoch": 66.43596730245231, + "grad_norm": 3.704960823059082, + "learning_rate": 5.349072013370285e-06, + "loss": 0.1359, + "step": 24382 + }, + { + "epoch": 66.43869209809264, + "grad_norm": 3.626906156539917, + "learning_rate": 5.348290792575572e-06, + "loss": 0.1797, + "step": 24383 + }, + { + "epoch": 66.44141689373296, + "grad_norm": 4.711760997772217, + "learning_rate": 5.347509608008228e-06, + "loss": 0.0528, + "step": 24384 + }, + { + "epoch": 66.4441416893733, + "grad_norm": 3.4660227298736572, + "learning_rate": 5.346728459674327e-06, + "loss": 0.1244, + "step": 24385 + }, + { + "epoch": 66.44686648501363, + "grad_norm": 3.4487414360046387, + "learning_rate": 5.3459473475799565e-06, + "loss": 0.0642, + "step": 24386 + }, + { + "epoch": 66.44959128065395, + "grad_norm": 16.17318344116211, + "learning_rate": 5.345166271731195e-06, + "loss": 0.0778, + "step": 24387 + }, + { + "epoch": 66.45231607629428, + "grad_norm": 5.871947288513184, + "learning_rate": 5.344385232134131e-06, + "loss": 0.0867, + "step": 24388 + }, + { + "epoch": 66.4550408719346, + "grad_norm": 2.7655997276306152, + "learning_rate": 5.343604228794845e-06, + "loss": 0.0538, + "step": 24389 + }, + { + "epoch": 66.45776566757493, + "grad_norm": 2.9549553394317627, + "learning_rate": 5.342823261719417e-06, + "loss": 0.0427, + "step": 24390 + }, + { + "epoch": 66.46049046321527, + "grad_norm": 2.7028307914733887, + "learning_rate": 5.34204233091393e-06, + "loss": 0.0329, + "step": 24391 + }, + { + "epoch": 66.46321525885558, + "grad_norm": 2.3739640712738037, + "learning_rate": 5.341261436384472e-06, + "loss": 0.0387, + "step": 24392 + }, + { + "epoch": 66.46594005449592, + "grad_norm": 4.051398754119873, + "learning_rate": 5.34048057813712e-06, + "loss": 0.1547, + "step": 24393 + }, + { + "epoch": 66.46866485013624, + "grad_norm": 3.3245432376861572, + "learning_rate": 5.339699756177954e-06, + "loss": 0.0516, + "step": 24394 + }, + { + "epoch": 66.47138964577657, + "grad_norm": 2.757563352584839, + "learning_rate": 5.338918970513054e-06, + "loss": 0.1485, + "step": 24395 + }, + { + "epoch": 66.47411444141689, + "grad_norm": 2.9744319915771484, + "learning_rate": 5.338138221148506e-06, + "loss": 0.0963, + "step": 24396 + }, + { + "epoch": 66.47683923705722, + "grad_norm": 4.11489200592041, + "learning_rate": 5.337357508090388e-06, + "loss": 0.0836, + "step": 24397 + }, + { + "epoch": 66.47956403269755, + "grad_norm": 3.1040594577789307, + "learning_rate": 5.336576831344781e-06, + "loss": 0.0741, + "step": 24398 + }, + { + "epoch": 66.48228882833787, + "grad_norm": 5.489741325378418, + "learning_rate": 5.335796190917758e-06, + "loss": 0.0545, + "step": 24399 + }, + { + "epoch": 66.4850136239782, + "grad_norm": 3.4695920944213867, + "learning_rate": 5.335015586815408e-06, + "loss": 0.0577, + "step": 24400 + }, + { + "epoch": 66.48773841961852, + "grad_norm": 3.547744035720825, + "learning_rate": 5.3342350190438075e-06, + "loss": 0.0754, + "step": 24401 + }, + { + "epoch": 66.49046321525886, + "grad_norm": 3.535972833633423, + "learning_rate": 5.333454487609033e-06, + "loss": 0.0663, + "step": 24402 + }, + { + "epoch": 66.49318801089919, + "grad_norm": 4.044013977050781, + "learning_rate": 5.332673992517162e-06, + "loss": 0.2245, + "step": 24403 + }, + { + "epoch": 66.49591280653951, + "grad_norm": 3.093130111694336, + "learning_rate": 5.3318935337742795e-06, + "loss": 0.0305, + "step": 24404 + }, + { + "epoch": 66.49863760217984, + "grad_norm": 3.9721336364746094, + "learning_rate": 5.331113111386459e-06, + "loss": 0.0535, + "step": 24405 + }, + { + "epoch": 66.50136239782016, + "grad_norm": 4.23530387878418, + "learning_rate": 5.330332725359781e-06, + "loss": 0.0688, + "step": 24406 + }, + { + "epoch": 66.50408719346049, + "grad_norm": 4.098939418792725, + "learning_rate": 5.329552375700313e-06, + "loss": 0.0821, + "step": 24407 + }, + { + "epoch": 66.50681198910081, + "grad_norm": 7.238304615020752, + "learning_rate": 5.328772062414147e-06, + "loss": 0.1316, + "step": 24408 + }, + { + "epoch": 66.50953678474114, + "grad_norm": 2.327904224395752, + "learning_rate": 5.327991785507356e-06, + "loss": 0.0501, + "step": 24409 + }, + { + "epoch": 66.51226158038148, + "grad_norm": 3.332578659057617, + "learning_rate": 5.327211544986013e-06, + "loss": 0.1043, + "step": 24410 + }, + { + "epoch": 66.5149863760218, + "grad_norm": 3.3954625129699707, + "learning_rate": 5.326431340856193e-06, + "loss": 0.0434, + "step": 24411 + }, + { + "epoch": 66.51771117166213, + "grad_norm": 5.331161975860596, + "learning_rate": 5.3256511731239805e-06, + "loss": 0.1002, + "step": 24412 + }, + { + "epoch": 66.52043596730245, + "grad_norm": 3.658219337463379, + "learning_rate": 5.324871041795444e-06, + "loss": 0.2241, + "step": 24413 + }, + { + "epoch": 66.52316076294278, + "grad_norm": 4.608555793762207, + "learning_rate": 5.3240909468766625e-06, + "loss": 0.1769, + "step": 24414 + }, + { + "epoch": 66.52588555858311, + "grad_norm": 4.825925827026367, + "learning_rate": 5.323310888373705e-06, + "loss": 0.1014, + "step": 24415 + }, + { + "epoch": 66.52861035422343, + "grad_norm": 2.0899970531463623, + "learning_rate": 5.322530866292658e-06, + "loss": 0.0331, + "step": 24416 + }, + { + "epoch": 66.53133514986376, + "grad_norm": 3.315011501312256, + "learning_rate": 5.321750880639589e-06, + "loss": 0.0739, + "step": 24417 + }, + { + "epoch": 66.53405994550408, + "grad_norm": 3.0963010787963867, + "learning_rate": 5.320970931420572e-06, + "loss": 0.0825, + "step": 24418 + }, + { + "epoch": 66.53678474114442, + "grad_norm": 14.82800579071045, + "learning_rate": 5.3201910186416805e-06, + "loss": 0.138, + "step": 24419 + }, + { + "epoch": 66.53950953678473, + "grad_norm": 3.478710174560547, + "learning_rate": 5.3194111423089945e-06, + "loss": 0.0681, + "step": 24420 + }, + { + "epoch": 66.54223433242507, + "grad_norm": 3.069889783859253, + "learning_rate": 5.318631302428584e-06, + "loss": 0.1064, + "step": 24421 + }, + { + "epoch": 66.5449591280654, + "grad_norm": 4.537165641784668, + "learning_rate": 5.317851499006522e-06, + "loss": 0.2001, + "step": 24422 + }, + { + "epoch": 66.54768392370572, + "grad_norm": 3.5059680938720703, + "learning_rate": 5.317071732048877e-06, + "loss": 0.1032, + "step": 24423 + }, + { + "epoch": 66.55040871934605, + "grad_norm": 2.677603244781494, + "learning_rate": 5.316292001561729e-06, + "loss": 0.0401, + "step": 24424 + }, + { + "epoch": 66.55313351498637, + "grad_norm": 2.9905624389648438, + "learning_rate": 5.315512307551149e-06, + "loss": 0.0424, + "step": 24425 + }, + { + "epoch": 66.5558583106267, + "grad_norm": 3.9608407020568848, + "learning_rate": 5.314732650023211e-06, + "loss": 0.1701, + "step": 24426 + }, + { + "epoch": 66.55858310626704, + "grad_norm": 2.984921455383301, + "learning_rate": 5.3139530289839835e-06, + "loss": 0.0934, + "step": 24427 + }, + { + "epoch": 66.56130790190736, + "grad_norm": 3.228469133377075, + "learning_rate": 5.313173444439535e-06, + "loss": 0.1571, + "step": 24428 + }, + { + "epoch": 66.56403269754769, + "grad_norm": 2.8808178901672363, + "learning_rate": 5.312393896395944e-06, + "loss": 0.1158, + "step": 24429 + }, + { + "epoch": 66.566757493188, + "grad_norm": 2.9934260845184326, + "learning_rate": 5.311614384859281e-06, + "loss": 0.0521, + "step": 24430 + }, + { + "epoch": 66.56948228882834, + "grad_norm": 2.9923391342163086, + "learning_rate": 5.310834909835607e-06, + "loss": 0.0424, + "step": 24431 + }, + { + "epoch": 66.57220708446866, + "grad_norm": 3.9207231998443604, + "learning_rate": 5.310055471331006e-06, + "loss": 0.1289, + "step": 24432 + }, + { + "epoch": 66.57493188010899, + "grad_norm": 3.5021450519561768, + "learning_rate": 5.309276069351541e-06, + "loss": 0.1068, + "step": 24433 + }, + { + "epoch": 66.57765667574932, + "grad_norm": 5.448784828186035, + "learning_rate": 5.308496703903283e-06, + "loss": 0.197, + "step": 24434 + }, + { + "epoch": 66.58038147138964, + "grad_norm": 3.25518798828125, + "learning_rate": 5.307717374992298e-06, + "loss": 0.0947, + "step": 24435 + }, + { + "epoch": 66.58310626702998, + "grad_norm": 4.407520294189453, + "learning_rate": 5.306938082624663e-06, + "loss": 0.0852, + "step": 24436 + }, + { + "epoch": 66.5858310626703, + "grad_norm": 3.608776092529297, + "learning_rate": 5.306158826806443e-06, + "loss": 0.1135, + "step": 24437 + }, + { + "epoch": 66.58855585831063, + "grad_norm": 3.587841749191284, + "learning_rate": 5.305379607543708e-06, + "loss": 0.1764, + "step": 24438 + }, + { + "epoch": 66.59128065395096, + "grad_norm": 3.5023584365844727, + "learning_rate": 5.30460042484252e-06, + "loss": 0.0544, + "step": 24439 + }, + { + "epoch": 66.59400544959128, + "grad_norm": 3.0952892303466797, + "learning_rate": 5.303821278708958e-06, + "loss": 0.047, + "step": 24440 + }, + { + "epoch": 66.59673024523161, + "grad_norm": 3.8683419227600098, + "learning_rate": 5.303042169149079e-06, + "loss": 0.1697, + "step": 24441 + }, + { + "epoch": 66.59945504087193, + "grad_norm": 3.4120495319366455, + "learning_rate": 5.302263096168963e-06, + "loss": 0.0438, + "step": 24442 + }, + { + "epoch": 66.60217983651226, + "grad_norm": 3.191737651824951, + "learning_rate": 5.301484059774668e-06, + "loss": 0.054, + "step": 24443 + }, + { + "epoch": 66.60490463215258, + "grad_norm": 4.179776191711426, + "learning_rate": 5.300705059972262e-06, + "loss": 0.1406, + "step": 24444 + }, + { + "epoch": 66.60762942779292, + "grad_norm": 4.180954933166504, + "learning_rate": 5.299926096767818e-06, + "loss": 0.0562, + "step": 24445 + }, + { + "epoch": 66.61035422343325, + "grad_norm": 2.867324113845825, + "learning_rate": 5.299147170167397e-06, + "loss": 0.0586, + "step": 24446 + }, + { + "epoch": 66.61307901907357, + "grad_norm": 3.289529323577881, + "learning_rate": 5.298368280177066e-06, + "loss": 0.0632, + "step": 24447 + }, + { + "epoch": 66.6158038147139, + "grad_norm": 2.871412992477417, + "learning_rate": 5.297589426802889e-06, + "loss": 0.1184, + "step": 24448 + }, + { + "epoch": 66.61852861035422, + "grad_norm": 3.8014256954193115, + "learning_rate": 5.296810610050937e-06, + "loss": 0.1684, + "step": 24449 + }, + { + "epoch": 66.62125340599455, + "grad_norm": 2.6733717918395996, + "learning_rate": 5.296031829927274e-06, + "loss": 0.0539, + "step": 24450 + }, + { + "epoch": 66.62397820163488, + "grad_norm": 3.6280720233917236, + "learning_rate": 5.2952530864379595e-06, + "loss": 0.0939, + "step": 24451 + }, + { + "epoch": 66.6267029972752, + "grad_norm": 3.6763455867767334, + "learning_rate": 5.294474379589065e-06, + "loss": 0.1457, + "step": 24452 + }, + { + "epoch": 66.62942779291554, + "grad_norm": 3.1730730533599854, + "learning_rate": 5.293695709386655e-06, + "loss": 0.1938, + "step": 24453 + }, + { + "epoch": 66.63215258855585, + "grad_norm": 3.2582757472991943, + "learning_rate": 5.292917075836789e-06, + "loss": 0.1068, + "step": 24454 + }, + { + "epoch": 66.63487738419619, + "grad_norm": 3.7654495239257812, + "learning_rate": 5.29213847894553e-06, + "loss": 0.0986, + "step": 24455 + }, + { + "epoch": 66.6376021798365, + "grad_norm": 3.281188488006592, + "learning_rate": 5.29135991871895e-06, + "loss": 0.1427, + "step": 24456 + }, + { + "epoch": 66.64032697547684, + "grad_norm": 2.386540651321411, + "learning_rate": 5.290581395163106e-06, + "loss": 0.0582, + "step": 24457 + }, + { + "epoch": 66.64305177111717, + "grad_norm": 2.81923246383667, + "learning_rate": 5.289802908284063e-06, + "loss": 0.0411, + "step": 24458 + }, + { + "epoch": 66.64577656675749, + "grad_norm": 4.507114410400391, + "learning_rate": 5.289024458087879e-06, + "loss": 0.2048, + "step": 24459 + }, + { + "epoch": 66.64850136239782, + "grad_norm": 2.605423927307129, + "learning_rate": 5.288246044580623e-06, + "loss": 0.1153, + "step": 24460 + }, + { + "epoch": 66.65122615803814, + "grad_norm": 3.0955703258514404, + "learning_rate": 5.287467667768357e-06, + "loss": 0.0473, + "step": 24461 + }, + { + "epoch": 66.65395095367847, + "grad_norm": 3.8462536334991455, + "learning_rate": 5.286689327657142e-06, + "loss": 0.0389, + "step": 24462 + }, + { + "epoch": 66.65667574931881, + "grad_norm": 2.484198808670044, + "learning_rate": 5.285911024253039e-06, + "loss": 0.0515, + "step": 24463 + }, + { + "epoch": 66.65940054495913, + "grad_norm": 3.103261709213257, + "learning_rate": 5.2851327575621035e-06, + "loss": 0.079, + "step": 24464 + }, + { + "epoch": 66.66212534059946, + "grad_norm": 2.198317766189575, + "learning_rate": 5.284354527590407e-06, + "loss": 0.0314, + "step": 24465 + }, + { + "epoch": 66.66485013623978, + "grad_norm": 3.7459402084350586, + "learning_rate": 5.283576334344007e-06, + "loss": 0.0921, + "step": 24466 + }, + { + "epoch": 66.66757493188011, + "grad_norm": 1.9179775714874268, + "learning_rate": 5.2827981778289625e-06, + "loss": 0.0278, + "step": 24467 + }, + { + "epoch": 66.67029972752043, + "grad_norm": 4.033474445343018, + "learning_rate": 5.2820200580513295e-06, + "loss": 0.0628, + "step": 24468 + }, + { + "epoch": 66.67302452316076, + "grad_norm": 5.211009979248047, + "learning_rate": 5.281241975017176e-06, + "loss": 0.0908, + "step": 24469 + }, + { + "epoch": 66.6757493188011, + "grad_norm": 4.247863292694092, + "learning_rate": 5.280463928732557e-06, + "loss": 0.1162, + "step": 24470 + }, + { + "epoch": 66.67847411444141, + "grad_norm": 4.005177974700928, + "learning_rate": 5.279685919203537e-06, + "loss": 0.1159, + "step": 24471 + }, + { + "epoch": 66.68119891008175, + "grad_norm": 2.956925630569458, + "learning_rate": 5.278907946436164e-06, + "loss": 0.043, + "step": 24472 + }, + { + "epoch": 66.68392370572207, + "grad_norm": 3.3972792625427246, + "learning_rate": 5.278130010436509e-06, + "loss": 0.0568, + "step": 24473 + }, + { + "epoch": 66.6866485013624, + "grad_norm": 3.1583309173583984, + "learning_rate": 5.277352111210625e-06, + "loss": 0.123, + "step": 24474 + }, + { + "epoch": 66.68937329700273, + "grad_norm": 3.8960046768188477, + "learning_rate": 5.276574248764567e-06, + "loss": 0.0637, + "step": 24475 + }, + { + "epoch": 66.69209809264305, + "grad_norm": 3.651273250579834, + "learning_rate": 5.275796423104396e-06, + "loss": 0.0694, + "step": 24476 + }, + { + "epoch": 66.69482288828338, + "grad_norm": 4.14750862121582, + "learning_rate": 5.275018634236176e-06, + "loss": 0.0897, + "step": 24477 + }, + { + "epoch": 66.6975476839237, + "grad_norm": 3.3199069499969482, + "learning_rate": 5.274240882165958e-06, + "loss": 0.1153, + "step": 24478 + }, + { + "epoch": 66.70027247956403, + "grad_norm": 6.15848970413208, + "learning_rate": 5.2734631668998e-06, + "loss": 0.1701, + "step": 24479 + }, + { + "epoch": 66.70299727520435, + "grad_norm": 4.8711771965026855, + "learning_rate": 5.272685488443754e-06, + "loss": 0.1102, + "step": 24480 + }, + { + "epoch": 66.70572207084469, + "grad_norm": 3.2478652000427246, + "learning_rate": 5.271907846803885e-06, + "loss": 0.0948, + "step": 24481 + }, + { + "epoch": 66.70844686648502, + "grad_norm": 3.449075222015381, + "learning_rate": 5.271130241986246e-06, + "loss": 0.1392, + "step": 24482 + }, + { + "epoch": 66.71117166212534, + "grad_norm": 9.120984077453613, + "learning_rate": 5.270352673996893e-06, + "loss": 0.1362, + "step": 24483 + }, + { + "epoch": 66.71389645776567, + "grad_norm": 3.307509422302246, + "learning_rate": 5.269575142841876e-06, + "loss": 0.0432, + "step": 24484 + }, + { + "epoch": 66.71662125340599, + "grad_norm": 4.888644218444824, + "learning_rate": 5.268797648527262e-06, + "loss": 0.1129, + "step": 24485 + }, + { + "epoch": 66.71934604904632, + "grad_norm": 3.402113676071167, + "learning_rate": 5.268020191059098e-06, + "loss": 0.0675, + "step": 24486 + }, + { + "epoch": 66.72207084468666, + "grad_norm": 3.7245945930480957, + "learning_rate": 5.26724277044344e-06, + "loss": 0.1126, + "step": 24487 + }, + { + "epoch": 66.72479564032697, + "grad_norm": 3.6874537467956543, + "learning_rate": 5.266465386686339e-06, + "loss": 0.1886, + "step": 24488 + }, + { + "epoch": 66.7275204359673, + "grad_norm": 2.0126962661743164, + "learning_rate": 5.2656880397938585e-06, + "loss": 0.0286, + "step": 24489 + }, + { + "epoch": 66.73024523160763, + "grad_norm": 2.6054625511169434, + "learning_rate": 5.264910729772046e-06, + "loss": 0.0982, + "step": 24490 + }, + { + "epoch": 66.73297002724796, + "grad_norm": 3.2242088317871094, + "learning_rate": 5.264133456626956e-06, + "loss": 0.0863, + "step": 24491 + }, + { + "epoch": 66.73569482288828, + "grad_norm": 4.689243316650391, + "learning_rate": 5.2633562203646395e-06, + "loss": 0.0804, + "step": 24492 + }, + { + "epoch": 66.73841961852861, + "grad_norm": 3.8238258361816406, + "learning_rate": 5.262579020991152e-06, + "loss": 0.0925, + "step": 24493 + }, + { + "epoch": 66.74114441416894, + "grad_norm": 3.351555347442627, + "learning_rate": 5.26180185851255e-06, + "loss": 0.0536, + "step": 24494 + }, + { + "epoch": 66.74386920980926, + "grad_norm": 2.875150442123413, + "learning_rate": 5.261024732934883e-06, + "loss": 0.0337, + "step": 24495 + }, + { + "epoch": 66.7465940054496, + "grad_norm": 3.38814377784729, + "learning_rate": 5.260247644264199e-06, + "loss": 0.0902, + "step": 24496 + }, + { + "epoch": 66.74931880108991, + "grad_norm": 3.024885892868042, + "learning_rate": 5.259470592506558e-06, + "loss": 0.0865, + "step": 24497 + }, + { + "epoch": 66.75204359673025, + "grad_norm": 3.5949912071228027, + "learning_rate": 5.258693577668007e-06, + "loss": 0.0386, + "step": 24498 + }, + { + "epoch": 66.75476839237058, + "grad_norm": 3.1890130043029785, + "learning_rate": 5.257916599754598e-06, + "loss": 0.067, + "step": 24499 + }, + { + "epoch": 66.7574931880109, + "grad_norm": 2.889885663986206, + "learning_rate": 5.257139658772378e-06, + "loss": 0.0655, + "step": 24500 + }, + { + "epoch": 66.76021798365123, + "grad_norm": 3.1376566886901855, + "learning_rate": 5.256362754727405e-06, + "loss": 0.0897, + "step": 24501 + }, + { + "epoch": 66.76294277929155, + "grad_norm": 3.6445372104644775, + "learning_rate": 5.255585887625727e-06, + "loss": 0.1373, + "step": 24502 + }, + { + "epoch": 66.76566757493188, + "grad_norm": 4.082334041595459, + "learning_rate": 5.254809057473393e-06, + "loss": 0.1015, + "step": 24503 + }, + { + "epoch": 66.7683923705722, + "grad_norm": 3.480103015899658, + "learning_rate": 5.25403226427645e-06, + "loss": 0.0553, + "step": 24504 + }, + { + "epoch": 66.77111716621253, + "grad_norm": 3.3684353828430176, + "learning_rate": 5.253255508040954e-06, + "loss": 0.1454, + "step": 24505 + }, + { + "epoch": 66.77384196185287, + "grad_norm": 4.273370742797852, + "learning_rate": 5.252478788772952e-06, + "loss": 0.1254, + "step": 24506 + }, + { + "epoch": 66.77656675749319, + "grad_norm": 3.679145336151123, + "learning_rate": 5.251702106478491e-06, + "loss": 0.0507, + "step": 24507 + }, + { + "epoch": 66.77929155313352, + "grad_norm": 3.5244994163513184, + "learning_rate": 5.2509254611636196e-06, + "loss": 0.0618, + "step": 24508 + }, + { + "epoch": 66.78201634877384, + "grad_norm": 3.312422037124634, + "learning_rate": 5.25014885283439e-06, + "loss": 0.0723, + "step": 24509 + }, + { + "epoch": 66.78474114441417, + "grad_norm": 3.9562501907348633, + "learning_rate": 5.249372281496845e-06, + "loss": 0.0454, + "step": 24510 + }, + { + "epoch": 66.7874659400545, + "grad_norm": 3.1592650413513184, + "learning_rate": 5.248595747157039e-06, + "loss": 0.1629, + "step": 24511 + }, + { + "epoch": 66.79019073569482, + "grad_norm": 3.199082851409912, + "learning_rate": 5.247819249821018e-06, + "loss": 0.1506, + "step": 24512 + }, + { + "epoch": 66.79291553133515, + "grad_norm": 4.939488887786865, + "learning_rate": 5.247042789494823e-06, + "loss": 0.0471, + "step": 24513 + }, + { + "epoch": 66.79564032697547, + "grad_norm": 2.8808956146240234, + "learning_rate": 5.2462663661845094e-06, + "loss": 0.165, + "step": 24514 + }, + { + "epoch": 66.7983651226158, + "grad_norm": 4.536468982696533, + "learning_rate": 5.24548997989612e-06, + "loss": 0.0878, + "step": 24515 + }, + { + "epoch": 66.80108991825612, + "grad_norm": 4.296672821044922, + "learning_rate": 5.244713630635698e-06, + "loss": 0.0772, + "step": 24516 + }, + { + "epoch": 66.80381471389646, + "grad_norm": 4.1772918701171875, + "learning_rate": 5.243937318409298e-06, + "loss": 0.0558, + "step": 24517 + }, + { + "epoch": 66.80653950953679, + "grad_norm": 4.366561412811279, + "learning_rate": 5.24316104322296e-06, + "loss": 0.137, + "step": 24518 + }, + { + "epoch": 66.80926430517711, + "grad_norm": 4.326655387878418, + "learning_rate": 5.242384805082731e-06, + "loss": 0.0469, + "step": 24519 + }, + { + "epoch": 66.81198910081744, + "grad_norm": 3.3069229125976562, + "learning_rate": 5.241608603994652e-06, + "loss": 0.1111, + "step": 24520 + }, + { + "epoch": 66.81471389645776, + "grad_norm": 2.7045812606811523, + "learning_rate": 5.240832439964776e-06, + "loss": 0.0447, + "step": 24521 + }, + { + "epoch": 66.8174386920981, + "grad_norm": 3.258586883544922, + "learning_rate": 5.240056312999145e-06, + "loss": 0.0619, + "step": 24522 + }, + { + "epoch": 66.82016348773843, + "grad_norm": 7.099562168121338, + "learning_rate": 5.2392802231037996e-06, + "loss": 0.0847, + "step": 24523 + }, + { + "epoch": 66.82288828337875, + "grad_norm": 3.2443881034851074, + "learning_rate": 5.238504170284785e-06, + "loss": 0.0578, + "step": 24524 + }, + { + "epoch": 66.82561307901908, + "grad_norm": 3.9697070121765137, + "learning_rate": 5.23772815454815e-06, + "loss": 0.0736, + "step": 24525 + }, + { + "epoch": 66.8283378746594, + "grad_norm": 3.475645065307617, + "learning_rate": 5.236952175899934e-06, + "loss": 0.1062, + "step": 24526 + }, + { + "epoch": 66.83106267029973, + "grad_norm": 2.467761993408203, + "learning_rate": 5.236176234346179e-06, + "loss": 0.0557, + "step": 24527 + }, + { + "epoch": 66.83378746594005, + "grad_norm": 3.229022264480591, + "learning_rate": 5.2354003298929325e-06, + "loss": 0.0567, + "step": 24528 + }, + { + "epoch": 66.83651226158038, + "grad_norm": 3.237917900085449, + "learning_rate": 5.234624462546232e-06, + "loss": 0.0458, + "step": 24529 + }, + { + "epoch": 66.83923705722071, + "grad_norm": 6.592916965484619, + "learning_rate": 5.2338486323121266e-06, + "loss": 0.0707, + "step": 24530 + }, + { + "epoch": 66.84196185286103, + "grad_norm": 4.381230354309082, + "learning_rate": 5.233072839196653e-06, + "loss": 0.1391, + "step": 24531 + }, + { + "epoch": 66.84468664850137, + "grad_norm": 3.1076245307922363, + "learning_rate": 5.2322970832058565e-06, + "loss": 0.1147, + "step": 24532 + }, + { + "epoch": 66.84741144414168, + "grad_norm": 4.884410858154297, + "learning_rate": 5.231521364345772e-06, + "loss": 0.0573, + "step": 24533 + }, + { + "epoch": 66.85013623978202, + "grad_norm": 2.974672317504883, + "learning_rate": 5.23074568262245e-06, + "loss": 0.0595, + "step": 24534 + }, + { + "epoch": 66.85286103542235, + "grad_norm": 4.428715705871582, + "learning_rate": 5.229970038041927e-06, + "loss": 0.0556, + "step": 24535 + }, + { + "epoch": 66.85558583106267, + "grad_norm": 3.121584892272949, + "learning_rate": 5.229194430610243e-06, + "loss": 0.0516, + "step": 24536 + }, + { + "epoch": 66.858310626703, + "grad_norm": 3.397125005722046, + "learning_rate": 5.228418860333437e-06, + "loss": 0.1241, + "step": 24537 + }, + { + "epoch": 66.86103542234332, + "grad_norm": 1.7952107191085815, + "learning_rate": 5.227643327217555e-06, + "loss": 0.028, + "step": 24538 + }, + { + "epoch": 66.86376021798365, + "grad_norm": 3.0323386192321777, + "learning_rate": 5.226867831268632e-06, + "loss": 0.0469, + "step": 24539 + }, + { + "epoch": 66.86648501362397, + "grad_norm": 2.748408317565918, + "learning_rate": 5.226092372492706e-06, + "loss": 0.195, + "step": 24540 + }, + { + "epoch": 66.8692098092643, + "grad_norm": 2.3647797107696533, + "learning_rate": 5.2253169508958225e-06, + "loss": 0.0453, + "step": 24541 + }, + { + "epoch": 66.87193460490464, + "grad_norm": 2.489013671875, + "learning_rate": 5.224541566484016e-06, + "loss": 0.1354, + "step": 24542 + }, + { + "epoch": 66.87465940054496, + "grad_norm": 3.8515937328338623, + "learning_rate": 5.223766219263327e-06, + "loss": 0.0982, + "step": 24543 + }, + { + "epoch": 66.87738419618529, + "grad_norm": 3.0182557106018066, + "learning_rate": 5.222990909239789e-06, + "loss": 0.0692, + "step": 24544 + }, + { + "epoch": 66.88010899182561, + "grad_norm": 6.353591442108154, + "learning_rate": 5.222215636419443e-06, + "loss": 0.1967, + "step": 24545 + }, + { + "epoch": 66.88283378746594, + "grad_norm": 3.788677215576172, + "learning_rate": 5.221440400808333e-06, + "loss": 0.1314, + "step": 24546 + }, + { + "epoch": 66.88555858310627, + "grad_norm": 3.978733539581299, + "learning_rate": 5.220665202412492e-06, + "loss": 0.0494, + "step": 24547 + }, + { + "epoch": 66.88828337874659, + "grad_norm": 3.4406204223632812, + "learning_rate": 5.219890041237955e-06, + "loss": 0.1857, + "step": 24548 + }, + { + "epoch": 66.89100817438693, + "grad_norm": 2.2609307765960693, + "learning_rate": 5.219114917290757e-06, + "loss": 0.0295, + "step": 24549 + }, + { + "epoch": 66.89373297002724, + "grad_norm": 3.813671112060547, + "learning_rate": 5.2183398305769424e-06, + "loss": 0.0544, + "step": 24550 + }, + { + "epoch": 66.89645776566758, + "grad_norm": 4.5922651290893555, + "learning_rate": 5.217564781102543e-06, + "loss": 0.1875, + "step": 24551 + }, + { + "epoch": 66.8991825613079, + "grad_norm": 2.906663179397583, + "learning_rate": 5.216789768873596e-06, + "loss": 0.2047, + "step": 24552 + }, + { + "epoch": 66.90190735694823, + "grad_norm": 2.953495979309082, + "learning_rate": 5.2160147938961315e-06, + "loss": 0.194, + "step": 24553 + }, + { + "epoch": 66.90463215258856, + "grad_norm": 3.020416021347046, + "learning_rate": 5.215239856176194e-06, + "loss": 0.1086, + "step": 24554 + }, + { + "epoch": 66.90735694822888, + "grad_norm": 3.5891289710998535, + "learning_rate": 5.214464955719814e-06, + "loss": 0.0599, + "step": 24555 + }, + { + "epoch": 66.91008174386921, + "grad_norm": 3.024014472961426, + "learning_rate": 5.213690092533028e-06, + "loss": 0.0953, + "step": 24556 + }, + { + "epoch": 66.91280653950953, + "grad_norm": 3.2397093772888184, + "learning_rate": 5.212915266621865e-06, + "loss": 0.0469, + "step": 24557 + }, + { + "epoch": 66.91553133514986, + "grad_norm": 3.362849712371826, + "learning_rate": 5.212140477992367e-06, + "loss": 0.0468, + "step": 24558 + }, + { + "epoch": 66.9182561307902, + "grad_norm": 3.0881080627441406, + "learning_rate": 5.2113657266505655e-06, + "loss": 0.0532, + "step": 24559 + }, + { + "epoch": 66.92098092643052, + "grad_norm": 4.1464924812316895, + "learning_rate": 5.210591012602495e-06, + "loss": 0.1187, + "step": 24560 + }, + { + "epoch": 66.92370572207085, + "grad_norm": 2.5345964431762695, + "learning_rate": 5.209816335854181e-06, + "loss": 0.0411, + "step": 24561 + }, + { + "epoch": 66.92643051771117, + "grad_norm": 3.098723888397217, + "learning_rate": 5.209041696411665e-06, + "loss": 0.0441, + "step": 24562 + }, + { + "epoch": 66.9291553133515, + "grad_norm": 2.8344247341156006, + "learning_rate": 5.208267094280981e-06, + "loss": 0.0478, + "step": 24563 + }, + { + "epoch": 66.93188010899182, + "grad_norm": 4.4746198654174805, + "learning_rate": 5.20749252946816e-06, + "loss": 0.0524, + "step": 24564 + }, + { + "epoch": 66.93460490463215, + "grad_norm": 3.8244478702545166, + "learning_rate": 5.206718001979228e-06, + "loss": 0.1104, + "step": 24565 + }, + { + "epoch": 66.93732970027249, + "grad_norm": 3.324032783508301, + "learning_rate": 5.2059435118202264e-06, + "loss": 0.0759, + "step": 24566 + }, + { + "epoch": 66.9400544959128, + "grad_norm": 3.023571729660034, + "learning_rate": 5.205169058997181e-06, + "loss": 0.0383, + "step": 24567 + }, + { + "epoch": 66.94277929155314, + "grad_norm": 4.425686359405518, + "learning_rate": 5.204394643516127e-06, + "loss": 0.2514, + "step": 24568 + }, + { + "epoch": 66.94550408719346, + "grad_norm": 3.483464479446411, + "learning_rate": 5.203620265383087e-06, + "loss": 0.0343, + "step": 24569 + }, + { + "epoch": 66.94822888283379, + "grad_norm": 2.8341145515441895, + "learning_rate": 5.202845924604103e-06, + "loss": 0.1197, + "step": 24570 + }, + { + "epoch": 66.95095367847412, + "grad_norm": 4.877206325531006, + "learning_rate": 5.2020716211852e-06, + "loss": 0.0781, + "step": 24571 + }, + { + "epoch": 66.95367847411444, + "grad_norm": 3.90977144241333, + "learning_rate": 5.201297355132411e-06, + "loss": 0.1366, + "step": 24572 + }, + { + "epoch": 66.95640326975477, + "grad_norm": 2.614654779434204, + "learning_rate": 5.200523126451757e-06, + "loss": 0.1078, + "step": 24573 + }, + { + "epoch": 66.95912806539509, + "grad_norm": 3.2511801719665527, + "learning_rate": 5.19974893514928e-06, + "loss": 0.0475, + "step": 24574 + }, + { + "epoch": 66.96185286103542, + "grad_norm": 2.8034374713897705, + "learning_rate": 5.198974781231003e-06, + "loss": 0.0693, + "step": 24575 + }, + { + "epoch": 66.96457765667574, + "grad_norm": 3.829230308532715, + "learning_rate": 5.1982006647029555e-06, + "loss": 0.1439, + "step": 24576 + }, + { + "epoch": 66.96730245231608, + "grad_norm": 4.487547397613525, + "learning_rate": 5.197426585571163e-06, + "loss": 0.0636, + "step": 24577 + }, + { + "epoch": 66.97002724795641, + "grad_norm": 2.5402772426605225, + "learning_rate": 5.196652543841663e-06, + "loss": 0.1121, + "step": 24578 + }, + { + "epoch": 66.97275204359673, + "grad_norm": 3.519968271255493, + "learning_rate": 5.195878539520474e-06, + "loss": 0.0806, + "step": 24579 + }, + { + "epoch": 66.97547683923706, + "grad_norm": 3.5499627590179443, + "learning_rate": 5.195104572613631e-06, + "loss": 0.0921, + "step": 24580 + }, + { + "epoch": 66.97820163487738, + "grad_norm": 2.5481748580932617, + "learning_rate": 5.194330643127155e-06, + "loss": 0.0316, + "step": 24581 + }, + { + "epoch": 66.98092643051771, + "grad_norm": 3.4201138019561768, + "learning_rate": 5.193556751067082e-06, + "loss": 0.0729, + "step": 24582 + }, + { + "epoch": 66.98365122615803, + "grad_norm": 3.4435765743255615, + "learning_rate": 5.192782896439434e-06, + "loss": 0.0584, + "step": 24583 + }, + { + "epoch": 66.98637602179836, + "grad_norm": 3.1900954246520996, + "learning_rate": 5.192009079250239e-06, + "loss": 0.0371, + "step": 24584 + }, + { + "epoch": 66.9891008174387, + "grad_norm": 3.2524049282073975, + "learning_rate": 5.191235299505517e-06, + "loss": 0.0588, + "step": 24585 + }, + { + "epoch": 66.99182561307902, + "grad_norm": 3.2355782985687256, + "learning_rate": 5.190461557211306e-06, + "loss": 0.0612, + "step": 24586 + }, + { + "epoch": 66.99455040871935, + "grad_norm": 2.7511208057403564, + "learning_rate": 5.189687852373624e-06, + "loss": 0.0517, + "step": 24587 + }, + { + "epoch": 66.99727520435967, + "grad_norm": 4.004414081573486, + "learning_rate": 5.188914184998497e-06, + "loss": 0.0823, + "step": 24588 + }, + { + "epoch": 67.0, + "grad_norm": 2.313328504562378, + "learning_rate": 5.18814055509195e-06, + "loss": 0.0428, + "step": 24589 + }, + { + "epoch": 67.00272479564033, + "grad_norm": 3.8177289962768555, + "learning_rate": 5.187366962660012e-06, + "loss": 0.1239, + "step": 24590 + }, + { + "epoch": 67.00544959128065, + "grad_norm": 2.535372018814087, + "learning_rate": 5.186593407708706e-06, + "loss": 0.0375, + "step": 24591 + }, + { + "epoch": 67.00817438692098, + "grad_norm": 4.38206148147583, + "learning_rate": 5.185819890244055e-06, + "loss": 0.1362, + "step": 24592 + }, + { + "epoch": 67.0108991825613, + "grad_norm": 4.015827178955078, + "learning_rate": 5.185046410272079e-06, + "loss": 0.1009, + "step": 24593 + }, + { + "epoch": 67.01362397820164, + "grad_norm": 2.929131031036377, + "learning_rate": 5.184272967798811e-06, + "loss": 0.0477, + "step": 24594 + }, + { + "epoch": 67.01634877384195, + "grad_norm": 2.9919931888580322, + "learning_rate": 5.183499562830272e-06, + "loss": 0.0428, + "step": 24595 + }, + { + "epoch": 67.01907356948229, + "grad_norm": 3.2489945888519287, + "learning_rate": 5.182726195372478e-06, + "loss": 0.1985, + "step": 24596 + }, + { + "epoch": 67.02179836512262, + "grad_norm": 4.685133934020996, + "learning_rate": 5.181952865431461e-06, + "loss": 0.1397, + "step": 24597 + }, + { + "epoch": 67.02452316076294, + "grad_norm": 4.398831367492676, + "learning_rate": 5.1811795730132365e-06, + "loss": 0.0388, + "step": 24598 + }, + { + "epoch": 67.02724795640327, + "grad_norm": 5.002074241638184, + "learning_rate": 5.180406318123834e-06, + "loss": 0.1359, + "step": 24599 + }, + { + "epoch": 67.02997275204359, + "grad_norm": 3.0800745487213135, + "learning_rate": 5.1796331007692725e-06, + "loss": 0.1064, + "step": 24600 + }, + { + "epoch": 67.03269754768392, + "grad_norm": 3.5149998664855957, + "learning_rate": 5.1788599209555726e-06, + "loss": 0.0646, + "step": 24601 + }, + { + "epoch": 67.03542234332426, + "grad_norm": 2.087890863418579, + "learning_rate": 5.1780867786887535e-06, + "loss": 0.0303, + "step": 24602 + }, + { + "epoch": 67.03814713896458, + "grad_norm": 5.657195568084717, + "learning_rate": 5.177313673974842e-06, + "loss": 0.2395, + "step": 24603 + }, + { + "epoch": 67.04087193460491, + "grad_norm": 3.764268159866333, + "learning_rate": 5.176540606819857e-06, + "loss": 0.082, + "step": 24604 + }, + { + "epoch": 67.04359673024523, + "grad_norm": 3.439305543899536, + "learning_rate": 5.175767577229815e-06, + "loss": 0.1406, + "step": 24605 + }, + { + "epoch": 67.04632152588556, + "grad_norm": 2.306802988052368, + "learning_rate": 5.174994585210744e-06, + "loss": 0.0339, + "step": 24606 + }, + { + "epoch": 67.04904632152588, + "grad_norm": 6.121353626251221, + "learning_rate": 5.174221630768659e-06, + "loss": 0.1512, + "step": 24607 + }, + { + "epoch": 67.05177111716621, + "grad_norm": 2.480057716369629, + "learning_rate": 5.1734487139095815e-06, + "loss": 0.0481, + "step": 24608 + }, + { + "epoch": 67.05449591280654, + "grad_norm": 3.2592272758483887, + "learning_rate": 5.172675834639524e-06, + "loss": 0.2128, + "step": 24609 + }, + { + "epoch": 67.05722070844686, + "grad_norm": 2.563528299331665, + "learning_rate": 5.171902992964518e-06, + "loss": 0.0392, + "step": 24610 + }, + { + "epoch": 67.0599455040872, + "grad_norm": 4.097001552581787, + "learning_rate": 5.1711301888905765e-06, + "loss": 0.1128, + "step": 24611 + }, + { + "epoch": 67.06267029972751, + "grad_norm": 6.103743553161621, + "learning_rate": 5.170357422423715e-06, + "loss": 0.1939, + "step": 24612 + }, + { + "epoch": 67.06539509536785, + "grad_norm": 3.189117908477783, + "learning_rate": 5.169584693569953e-06, + "loss": 0.2665, + "step": 24613 + }, + { + "epoch": 67.06811989100818, + "grad_norm": 5.12296724319458, + "learning_rate": 5.168812002335309e-06, + "loss": 0.1065, + "step": 24614 + }, + { + "epoch": 67.0708446866485, + "grad_norm": 2.6996898651123047, + "learning_rate": 5.168039348725806e-06, + "loss": 0.0581, + "step": 24615 + }, + { + "epoch": 67.07356948228883, + "grad_norm": 2.8209614753723145, + "learning_rate": 5.167266732747455e-06, + "loss": 0.0461, + "step": 24616 + }, + { + "epoch": 67.07629427792915, + "grad_norm": 6.042128562927246, + "learning_rate": 5.166494154406279e-06, + "loss": 0.091, + "step": 24617 + }, + { + "epoch": 67.07901907356948, + "grad_norm": 3.844276189804077, + "learning_rate": 5.165721613708283e-06, + "loss": 0.0579, + "step": 24618 + }, + { + "epoch": 67.0817438692098, + "grad_norm": 3.6185991764068604, + "learning_rate": 5.164949110659498e-06, + "loss": 0.0936, + "step": 24619 + }, + { + "epoch": 67.08446866485014, + "grad_norm": 3.4355180263519287, + "learning_rate": 5.164176645265932e-06, + "loss": 0.1002, + "step": 24620 + }, + { + "epoch": 67.08719346049047, + "grad_norm": 4.071255683898926, + "learning_rate": 5.163404217533604e-06, + "loss": 0.0682, + "step": 24621 + }, + { + "epoch": 67.08991825613079, + "grad_norm": 2.856973171234131, + "learning_rate": 5.162631827468525e-06, + "loss": 0.1088, + "step": 24622 + }, + { + "epoch": 67.09264305177112, + "grad_norm": 3.257694721221924, + "learning_rate": 5.161859475076716e-06, + "loss": 0.1017, + "step": 24623 + }, + { + "epoch": 67.09536784741144, + "grad_norm": 3.8397223949432373, + "learning_rate": 5.16108716036419e-06, + "loss": 0.0921, + "step": 24624 + }, + { + "epoch": 67.09809264305177, + "grad_norm": 3.522420644760132, + "learning_rate": 5.160314883336958e-06, + "loss": 0.1487, + "step": 24625 + }, + { + "epoch": 67.1008174386921, + "grad_norm": 3.160970687866211, + "learning_rate": 5.159542644001041e-06, + "loss": 0.1618, + "step": 24626 + }, + { + "epoch": 67.10354223433242, + "grad_norm": 2.8199210166931152, + "learning_rate": 5.158770442362451e-06, + "loss": 0.0673, + "step": 24627 + }, + { + "epoch": 67.10626702997276, + "grad_norm": 3.246110439300537, + "learning_rate": 5.1579982784272005e-06, + "loss": 0.047, + "step": 24628 + }, + { + "epoch": 67.10899182561307, + "grad_norm": 7.186903953552246, + "learning_rate": 5.1572261522013e-06, + "loss": 0.1531, + "step": 24629 + }, + { + "epoch": 67.11171662125341, + "grad_norm": 3.513388156890869, + "learning_rate": 5.15645406369077e-06, + "loss": 0.1825, + "step": 24630 + }, + { + "epoch": 67.11444141689373, + "grad_norm": 2.9456865787506104, + "learning_rate": 5.155682012901616e-06, + "loss": 0.065, + "step": 24631 + }, + { + "epoch": 67.11716621253406, + "grad_norm": 4.3389892578125, + "learning_rate": 5.1549099998398585e-06, + "loss": 0.0904, + "step": 24632 + }, + { + "epoch": 67.11989100817439, + "grad_norm": 4.458559036254883, + "learning_rate": 5.154138024511506e-06, + "loss": 0.0767, + "step": 24633 + }, + { + "epoch": 67.12261580381471, + "grad_norm": 2.301032781600952, + "learning_rate": 5.153366086922567e-06, + "loss": 0.0394, + "step": 24634 + }, + { + "epoch": 67.12534059945504, + "grad_norm": 3.2916994094848633, + "learning_rate": 5.152594187079061e-06, + "loss": 0.0484, + "step": 24635 + }, + { + "epoch": 67.12806539509536, + "grad_norm": 2.459163188934326, + "learning_rate": 5.151822324986995e-06, + "loss": 0.0345, + "step": 24636 + }, + { + "epoch": 67.1307901907357, + "grad_norm": 2.8928542137145996, + "learning_rate": 5.151050500652379e-06, + "loss": 0.0373, + "step": 24637 + }, + { + "epoch": 67.13351498637603, + "grad_norm": 3.3529112339019775, + "learning_rate": 5.150278714081224e-06, + "loss": 0.0641, + "step": 24638 + }, + { + "epoch": 67.13623978201635, + "grad_norm": 3.647813558578491, + "learning_rate": 5.149506965279545e-06, + "loss": 0.0754, + "step": 24639 + }, + { + "epoch": 67.13896457765668, + "grad_norm": 2.7385573387145996, + "learning_rate": 5.148735254253351e-06, + "loss": 0.109, + "step": 24640 + }, + { + "epoch": 67.141689373297, + "grad_norm": 7.747296333312988, + "learning_rate": 5.14796358100865e-06, + "loss": 0.0454, + "step": 24641 + }, + { + "epoch": 67.14441416893733, + "grad_norm": 2.8267595767974854, + "learning_rate": 5.1471919455514484e-06, + "loss": 0.0412, + "step": 24642 + }, + { + "epoch": 67.14713896457765, + "grad_norm": 2.8402023315429688, + "learning_rate": 5.146420347887764e-06, + "loss": 0.0709, + "step": 24643 + }, + { + "epoch": 67.14986376021798, + "grad_norm": 3.3954174518585205, + "learning_rate": 5.145648788023601e-06, + "loss": 0.1491, + "step": 24644 + }, + { + "epoch": 67.15258855585832, + "grad_norm": 3.405459403991699, + "learning_rate": 5.144877265964969e-06, + "loss": 0.0631, + "step": 24645 + }, + { + "epoch": 67.15531335149863, + "grad_norm": 4.721367835998535, + "learning_rate": 5.144105781717874e-06, + "loss": 0.1033, + "step": 24646 + }, + { + "epoch": 67.15803814713897, + "grad_norm": 3.2868051528930664, + "learning_rate": 5.14333433528833e-06, + "loss": 0.1403, + "step": 24647 + }, + { + "epoch": 67.16076294277929, + "grad_norm": 3.087031364440918, + "learning_rate": 5.142562926682338e-06, + "loss": 0.1066, + "step": 24648 + }, + { + "epoch": 67.16348773841962, + "grad_norm": 2.8686745166778564, + "learning_rate": 5.141791555905913e-06, + "loss": 0.0997, + "step": 24649 + }, + { + "epoch": 67.16621253405995, + "grad_norm": 3.295128583908081, + "learning_rate": 5.141020222965056e-06, + "loss": 0.1319, + "step": 24650 + }, + { + "epoch": 67.16893732970027, + "grad_norm": 2.890428304672241, + "learning_rate": 5.140248927865781e-06, + "loss": 0.045, + "step": 24651 + }, + { + "epoch": 67.1716621253406, + "grad_norm": 4.1570963859558105, + "learning_rate": 5.139477670614091e-06, + "loss": 0.0606, + "step": 24652 + }, + { + "epoch": 67.17438692098092, + "grad_norm": 3.9590163230895996, + "learning_rate": 5.138706451215991e-06, + "loss": 0.1766, + "step": 24653 + }, + { + "epoch": 67.17711171662125, + "grad_norm": 3.9261727333068848, + "learning_rate": 5.137935269677485e-06, + "loss": 0.0771, + "step": 24654 + }, + { + "epoch": 67.17983651226157, + "grad_norm": 2.083590030670166, + "learning_rate": 5.137164126004588e-06, + "loss": 0.0306, + "step": 24655 + }, + { + "epoch": 67.1825613079019, + "grad_norm": 3.423569440841675, + "learning_rate": 5.136393020203298e-06, + "loss": 0.1249, + "step": 24656 + }, + { + "epoch": 67.18528610354224, + "grad_norm": 2.2648110389709473, + "learning_rate": 5.1356219522796255e-06, + "loss": 0.0422, + "step": 24657 + }, + { + "epoch": 67.18801089918256, + "grad_norm": 4.222996711730957, + "learning_rate": 5.134850922239567e-06, + "loss": 0.0985, + "step": 24658 + }, + { + "epoch": 67.19073569482289, + "grad_norm": 4.955621242523193, + "learning_rate": 5.134079930089138e-06, + "loss": 0.0536, + "step": 24659 + }, + { + "epoch": 67.19346049046321, + "grad_norm": 3.551360607147217, + "learning_rate": 5.1333089758343364e-06, + "loss": 0.0671, + "step": 24660 + }, + { + "epoch": 67.19618528610354, + "grad_norm": 3.71524977684021, + "learning_rate": 5.1325380594811694e-06, + "loss": 0.1959, + "step": 24661 + }, + { + "epoch": 67.19891008174388, + "grad_norm": 3.1517035961151123, + "learning_rate": 5.131767181035634e-06, + "loss": 0.1292, + "step": 24662 + }, + { + "epoch": 67.2016348773842, + "grad_norm": 3.6539742946624756, + "learning_rate": 5.130996340503744e-06, + "loss": 0.039, + "step": 24663 + }, + { + "epoch": 67.20435967302453, + "grad_norm": 3.0689525604248047, + "learning_rate": 5.130225537891498e-06, + "loss": 0.0363, + "step": 24664 + }, + { + "epoch": 67.20708446866485, + "grad_norm": 2.8991730213165283, + "learning_rate": 5.129454773204894e-06, + "loss": 0.1223, + "step": 24665 + }, + { + "epoch": 67.20980926430518, + "grad_norm": 3.562687635421753, + "learning_rate": 5.1286840464499435e-06, + "loss": 0.1406, + "step": 24666 + }, + { + "epoch": 67.2125340599455, + "grad_norm": 3.347503423690796, + "learning_rate": 5.127913357632641e-06, + "loss": 0.0408, + "step": 24667 + }, + { + "epoch": 67.21525885558583, + "grad_norm": 3.359271287918091, + "learning_rate": 5.127142706758996e-06, + "loss": 0.0752, + "step": 24668 + }, + { + "epoch": 67.21798365122616, + "grad_norm": 6.227237224578857, + "learning_rate": 5.1263720938350085e-06, + "loss": 0.0484, + "step": 24669 + }, + { + "epoch": 67.22070844686648, + "grad_norm": 2.8463234901428223, + "learning_rate": 5.125601518866672e-06, + "loss": 0.0459, + "step": 24670 + }, + { + "epoch": 67.22343324250681, + "grad_norm": 5.320071220397949, + "learning_rate": 5.12483098186e-06, + "loss": 0.1143, + "step": 24671 + }, + { + "epoch": 67.22615803814713, + "grad_norm": 3.1932263374328613, + "learning_rate": 5.124060482820986e-06, + "loss": 0.199, + "step": 24672 + }, + { + "epoch": 67.22888283378747, + "grad_norm": 15.600347518920898, + "learning_rate": 5.123290021755634e-06, + "loss": 0.1381, + "step": 24673 + }, + { + "epoch": 67.2316076294278, + "grad_norm": 3.40120267868042, + "learning_rate": 5.122519598669935e-06, + "loss": 0.1106, + "step": 24674 + }, + { + "epoch": 67.23433242506812, + "grad_norm": 3.6226260662078857, + "learning_rate": 5.121749213569903e-06, + "loss": 0.1756, + "step": 24675 + }, + { + "epoch": 67.23705722070845, + "grad_norm": 2.6622533798217773, + "learning_rate": 5.1209788664615304e-06, + "loss": 0.043, + "step": 24676 + }, + { + "epoch": 67.23978201634877, + "grad_norm": 2.5700666904449463, + "learning_rate": 5.1202085573508175e-06, + "loss": 0.0453, + "step": 24677 + }, + { + "epoch": 67.2425068119891, + "grad_norm": 2.4242546558380127, + "learning_rate": 5.119438286243759e-06, + "loss": 0.0648, + "step": 24678 + }, + { + "epoch": 67.24523160762942, + "grad_norm": 3.5825319290161133, + "learning_rate": 5.118668053146363e-06, + "loss": 0.0793, + "step": 24679 + }, + { + "epoch": 67.24795640326975, + "grad_norm": 3.02204966545105, + "learning_rate": 5.117897858064622e-06, + "loss": 0.0814, + "step": 24680 + }, + { + "epoch": 67.25068119891009, + "grad_norm": 4.157834529876709, + "learning_rate": 5.117127701004535e-06, + "loss": 0.187, + "step": 24681 + }, + { + "epoch": 67.2534059945504, + "grad_norm": 5.315064907073975, + "learning_rate": 5.116357581972098e-06, + "loss": 0.1216, + "step": 24682 + }, + { + "epoch": 67.25613079019074, + "grad_norm": 5.192597389221191, + "learning_rate": 5.115587500973309e-06, + "loss": 0.116, + "step": 24683 + }, + { + "epoch": 67.25885558583106, + "grad_norm": 3.724283456802368, + "learning_rate": 5.114817458014172e-06, + "loss": 0.0807, + "step": 24684 + }, + { + "epoch": 67.26158038147139, + "grad_norm": 3.5205814838409424, + "learning_rate": 5.11404745310068e-06, + "loss": 0.0721, + "step": 24685 + }, + { + "epoch": 67.26430517711172, + "grad_norm": 5.1249680519104, + "learning_rate": 5.113277486238829e-06, + "loss": 0.1646, + "step": 24686 + }, + { + "epoch": 67.26702997275204, + "grad_norm": 3.207024335861206, + "learning_rate": 5.112507557434612e-06, + "loss": 0.1413, + "step": 24687 + }, + { + "epoch": 67.26975476839237, + "grad_norm": 4.9466376304626465, + "learning_rate": 5.111737666694032e-06, + "loss": 0.1088, + "step": 24688 + }, + { + "epoch": 67.2724795640327, + "grad_norm": 2.8702213764190674, + "learning_rate": 5.110967814023083e-06, + "loss": 0.0437, + "step": 24689 + }, + { + "epoch": 67.27520435967303, + "grad_norm": 3.057664394378662, + "learning_rate": 5.110197999427753e-06, + "loss": 0.0659, + "step": 24690 + }, + { + "epoch": 67.27792915531334, + "grad_norm": 2.8249452114105225, + "learning_rate": 5.10942822291405e-06, + "loss": 0.061, + "step": 24691 + }, + { + "epoch": 67.28065395095368, + "grad_norm": 3.631533622741699, + "learning_rate": 5.108658484487961e-06, + "loss": 0.1307, + "step": 24692 + }, + { + "epoch": 67.28337874659401, + "grad_norm": 3.4069125652313232, + "learning_rate": 5.107888784155484e-06, + "loss": 0.0955, + "step": 24693 + }, + { + "epoch": 67.28610354223433, + "grad_norm": 2.5948667526245117, + "learning_rate": 5.107119121922606e-06, + "loss": 0.1235, + "step": 24694 + }, + { + "epoch": 67.28882833787466, + "grad_norm": 3.14793062210083, + "learning_rate": 5.106349497795331e-06, + "loss": 0.0542, + "step": 24695 + }, + { + "epoch": 67.29155313351498, + "grad_norm": 4.083686828613281, + "learning_rate": 5.105579911779649e-06, + "loss": 0.0805, + "step": 24696 + }, + { + "epoch": 67.29427792915531, + "grad_norm": 3.630496025085449, + "learning_rate": 5.104810363881554e-06, + "loss": 0.1727, + "step": 24697 + }, + { + "epoch": 67.29700272479565, + "grad_norm": 3.330587387084961, + "learning_rate": 5.104040854107033e-06, + "loss": 0.0753, + "step": 24698 + }, + { + "epoch": 67.29972752043597, + "grad_norm": 3.055983543395996, + "learning_rate": 5.103271382462085e-06, + "loss": 0.1081, + "step": 24699 + }, + { + "epoch": 67.3024523160763, + "grad_norm": 3.5617239475250244, + "learning_rate": 5.102501948952705e-06, + "loss": 0.062, + "step": 24700 + }, + { + "epoch": 67.30517711171662, + "grad_norm": 2.897954225540161, + "learning_rate": 5.101732553584883e-06, + "loss": 0.0431, + "step": 24701 + }, + { + "epoch": 67.30790190735695, + "grad_norm": 4.210009574890137, + "learning_rate": 5.10096319636461e-06, + "loss": 0.1356, + "step": 24702 + }, + { + "epoch": 67.31062670299727, + "grad_norm": 2.9569778442382812, + "learning_rate": 5.100193877297874e-06, + "loss": 0.0798, + "step": 24703 + }, + { + "epoch": 67.3133514986376, + "grad_norm": 2.7195286750793457, + "learning_rate": 5.099424596390674e-06, + "loss": 0.0687, + "step": 24704 + }, + { + "epoch": 67.31607629427793, + "grad_norm": 3.508420944213867, + "learning_rate": 5.098655353648998e-06, + "loss": 0.1061, + "step": 24705 + }, + { + "epoch": 67.31880108991825, + "grad_norm": 4.016233444213867, + "learning_rate": 5.097886149078836e-06, + "loss": 0.1569, + "step": 24706 + }, + { + "epoch": 67.32152588555859, + "grad_norm": 3.3125321865081787, + "learning_rate": 5.097116982686175e-06, + "loss": 0.071, + "step": 24707 + }, + { + "epoch": 67.3242506811989, + "grad_norm": 2.6926913261413574, + "learning_rate": 5.0963478544770125e-06, + "loss": 0.0903, + "step": 24708 + }, + { + "epoch": 67.32697547683924, + "grad_norm": 3.0416789054870605, + "learning_rate": 5.095578764457336e-06, + "loss": 0.074, + "step": 24709 + }, + { + "epoch": 67.32970027247957, + "grad_norm": 3.1462037563323975, + "learning_rate": 5.0948097126331355e-06, + "loss": 0.0857, + "step": 24710 + }, + { + "epoch": 67.33242506811989, + "grad_norm": 2.979736804962158, + "learning_rate": 5.094040699010393e-06, + "loss": 0.0531, + "step": 24711 + }, + { + "epoch": 67.33514986376022, + "grad_norm": 4.241286277770996, + "learning_rate": 5.093271723595108e-06, + "loss": 0.1427, + "step": 24712 + }, + { + "epoch": 67.33787465940054, + "grad_norm": 3.185534715652466, + "learning_rate": 5.092502786393265e-06, + "loss": 0.1253, + "step": 24713 + }, + { + "epoch": 67.34059945504087, + "grad_norm": 3.9344115257263184, + "learning_rate": 5.091733887410849e-06, + "loss": 0.0438, + "step": 24714 + }, + { + "epoch": 67.34332425068119, + "grad_norm": 2.4539952278137207, + "learning_rate": 5.090965026653856e-06, + "loss": 0.0662, + "step": 24715 + }, + { + "epoch": 67.34604904632153, + "grad_norm": 4.353048801422119, + "learning_rate": 5.090196204128268e-06, + "loss": 0.1334, + "step": 24716 + }, + { + "epoch": 67.34877384196186, + "grad_norm": 2.635066509246826, + "learning_rate": 5.08942741984007e-06, + "loss": 0.0972, + "step": 24717 + }, + { + "epoch": 67.35149863760218, + "grad_norm": 3.0731635093688965, + "learning_rate": 5.088658673795257e-06, + "loss": 0.0495, + "step": 24718 + }, + { + "epoch": 67.35422343324251, + "grad_norm": 3.688865900039673, + "learning_rate": 5.08788996599981e-06, + "loss": 0.0424, + "step": 24719 + }, + { + "epoch": 67.35694822888283, + "grad_norm": 4.1209917068481445, + "learning_rate": 5.0871212964597205e-06, + "loss": 0.1023, + "step": 24720 + }, + { + "epoch": 67.35967302452316, + "grad_norm": 2.7736964225769043, + "learning_rate": 5.086352665180971e-06, + "loss": 0.0804, + "step": 24721 + }, + { + "epoch": 67.3623978201635, + "grad_norm": 3.80026912689209, + "learning_rate": 5.085584072169551e-06, + "loss": 0.066, + "step": 24722 + }, + { + "epoch": 67.36512261580381, + "grad_norm": 2.247812032699585, + "learning_rate": 5.08481551743144e-06, + "loss": 0.0544, + "step": 24723 + }, + { + "epoch": 67.36784741144415, + "grad_norm": 6.78448486328125, + "learning_rate": 5.0840470009726295e-06, + "loss": 0.0496, + "step": 24724 + }, + { + "epoch": 67.37057220708446, + "grad_norm": 4.081532955169678, + "learning_rate": 5.083278522799104e-06, + "loss": 0.0775, + "step": 24725 + }, + { + "epoch": 67.3732970027248, + "grad_norm": 3.0944600105285645, + "learning_rate": 5.082510082916847e-06, + "loss": 0.1056, + "step": 24726 + }, + { + "epoch": 67.37602179836512, + "grad_norm": 3.0897984504699707, + "learning_rate": 5.08174168133184e-06, + "loss": 0.0694, + "step": 24727 + }, + { + "epoch": 67.37874659400545, + "grad_norm": 2.751068115234375, + "learning_rate": 5.080973318050073e-06, + "loss": 0.051, + "step": 24728 + }, + { + "epoch": 67.38147138964578, + "grad_norm": 2.8970413208007812, + "learning_rate": 5.080204993077529e-06, + "loss": 0.0439, + "step": 24729 + }, + { + "epoch": 67.3841961852861, + "grad_norm": 3.559302806854248, + "learning_rate": 5.0794367064201885e-06, + "loss": 0.1568, + "step": 24730 + }, + { + "epoch": 67.38692098092643, + "grad_norm": 15.17588996887207, + "learning_rate": 5.078668458084035e-06, + "loss": 0.2251, + "step": 24731 + }, + { + "epoch": 67.38964577656675, + "grad_norm": 2.577274799346924, + "learning_rate": 5.077900248075055e-06, + "loss": 0.121, + "step": 24732 + }, + { + "epoch": 67.39237057220708, + "grad_norm": 5.998250961303711, + "learning_rate": 5.07713207639923e-06, + "loss": 0.1262, + "step": 24733 + }, + { + "epoch": 67.39509536784742, + "grad_norm": 3.9774091243743896, + "learning_rate": 5.0763639430625385e-06, + "loss": 0.0612, + "step": 24734 + }, + { + "epoch": 67.39782016348774, + "grad_norm": 3.52544903755188, + "learning_rate": 5.0755958480709665e-06, + "loss": 0.0651, + "step": 24735 + }, + { + "epoch": 67.40054495912807, + "grad_norm": 3.4941420555114746, + "learning_rate": 5.074827791430499e-06, + "loss": 0.0568, + "step": 24736 + }, + { + "epoch": 67.40326975476839, + "grad_norm": 2.9969611167907715, + "learning_rate": 5.0740597731471134e-06, + "loss": 0.1178, + "step": 24737 + }, + { + "epoch": 67.40599455040872, + "grad_norm": 2.392972946166992, + "learning_rate": 5.073291793226791e-06, + "loss": 0.0384, + "step": 24738 + }, + { + "epoch": 67.40871934604904, + "grad_norm": 3.2726314067840576, + "learning_rate": 5.072523851675512e-06, + "loss": 0.0531, + "step": 24739 + }, + { + "epoch": 67.41144414168937, + "grad_norm": 4.787219047546387, + "learning_rate": 5.071755948499262e-06, + "loss": 0.0365, + "step": 24740 + }, + { + "epoch": 67.4141689373297, + "grad_norm": 7.6623663902282715, + "learning_rate": 5.070988083704016e-06, + "loss": 0.167, + "step": 24741 + }, + { + "epoch": 67.41689373297002, + "grad_norm": 3.5750341415405273, + "learning_rate": 5.070220257295758e-06, + "loss": 0.1, + "step": 24742 + }, + { + "epoch": 67.41961852861036, + "grad_norm": 3.042717933654785, + "learning_rate": 5.0694524692804625e-06, + "loss": 0.0564, + "step": 24743 + }, + { + "epoch": 67.42234332425068, + "grad_norm": 3.4299728870391846, + "learning_rate": 5.068684719664116e-06, + "loss": 0.1737, + "step": 24744 + }, + { + "epoch": 67.42506811989101, + "grad_norm": 3.153731107711792, + "learning_rate": 5.067917008452693e-06, + "loss": 0.0827, + "step": 24745 + }, + { + "epoch": 67.42779291553134, + "grad_norm": 3.2509191036224365, + "learning_rate": 5.067149335652175e-06, + "loss": 0.1035, + "step": 24746 + }, + { + "epoch": 67.43051771117166, + "grad_norm": 3.6034340858459473, + "learning_rate": 5.066381701268535e-06, + "loss": 0.114, + "step": 24747 + }, + { + "epoch": 67.433242506812, + "grad_norm": 10.852611541748047, + "learning_rate": 5.065614105307759e-06, + "loss": 0.0402, + "step": 24748 + }, + { + "epoch": 67.43596730245231, + "grad_norm": 4.52252197265625, + "learning_rate": 5.064846547775821e-06, + "loss": 0.1277, + "step": 24749 + }, + { + "epoch": 67.43869209809264, + "grad_norm": 4.758501052856445, + "learning_rate": 5.0640790286787e-06, + "loss": 0.2125, + "step": 24750 + }, + { + "epoch": 67.44141689373296, + "grad_norm": 3.4215078353881836, + "learning_rate": 5.0633115480223695e-06, + "loss": 0.0479, + "step": 24751 + }, + { + "epoch": 67.4441416893733, + "grad_norm": 3.988860845565796, + "learning_rate": 5.062544105812807e-06, + "loss": 0.1015, + "step": 24752 + }, + { + "epoch": 67.44686648501363, + "grad_norm": 3.772794008255005, + "learning_rate": 5.061776702055998e-06, + "loss": 0.0599, + "step": 24753 + }, + { + "epoch": 67.44959128065395, + "grad_norm": 4.0554280281066895, + "learning_rate": 5.0610093367579135e-06, + "loss": 0.1243, + "step": 24754 + }, + { + "epoch": 67.45231607629428, + "grad_norm": 2.8715896606445312, + "learning_rate": 5.060242009924525e-06, + "loss": 0.0636, + "step": 24755 + }, + { + "epoch": 67.4550408719346, + "grad_norm": 3.2675414085388184, + "learning_rate": 5.059474721561817e-06, + "loss": 0.0614, + "step": 24756 + }, + { + "epoch": 67.45776566757493, + "grad_norm": 2.7207672595977783, + "learning_rate": 5.058707471675761e-06, + "loss": 0.0383, + "step": 24757 + }, + { + "epoch": 67.46049046321527, + "grad_norm": 3.1995835304260254, + "learning_rate": 5.0579402602723315e-06, + "loss": 0.0915, + "step": 24758 + }, + { + "epoch": 67.46321525885558, + "grad_norm": 3.2084741592407227, + "learning_rate": 5.057173087357501e-06, + "loss": 0.0684, + "step": 24759 + }, + { + "epoch": 67.46594005449592, + "grad_norm": 3.7472259998321533, + "learning_rate": 5.05640595293725e-06, + "loss": 0.1285, + "step": 24760 + }, + { + "epoch": 67.46866485013624, + "grad_norm": 3.2161805629730225, + "learning_rate": 5.055638857017551e-06, + "loss": 0.0553, + "step": 24761 + }, + { + "epoch": 67.47138964577657, + "grad_norm": 3.6380856037139893, + "learning_rate": 5.054871799604377e-06, + "loss": 0.1469, + "step": 24762 + }, + { + "epoch": 67.47411444141689, + "grad_norm": 3.3077454566955566, + "learning_rate": 5.054104780703699e-06, + "loss": 0.0768, + "step": 24763 + }, + { + "epoch": 67.47683923705722, + "grad_norm": 3.4313948154449463, + "learning_rate": 5.053337800321498e-06, + "loss": 0.1028, + "step": 24764 + }, + { + "epoch": 67.47956403269755, + "grad_norm": 2.646376132965088, + "learning_rate": 5.052570858463743e-06, + "loss": 0.0306, + "step": 24765 + }, + { + "epoch": 67.48228882833787, + "grad_norm": 3.7639083862304688, + "learning_rate": 5.051803955136406e-06, + "loss": 0.0776, + "step": 24766 + }, + { + "epoch": 67.4850136239782, + "grad_norm": 2.773786783218384, + "learning_rate": 5.051037090345457e-06, + "loss": 0.0363, + "step": 24767 + }, + { + "epoch": 67.48773841961852, + "grad_norm": 2.877821683883667, + "learning_rate": 5.050270264096873e-06, + "loss": 0.0494, + "step": 24768 + }, + { + "epoch": 67.49046321525886, + "grad_norm": 3.5250706672668457, + "learning_rate": 5.049503476396627e-06, + "loss": 0.0428, + "step": 24769 + }, + { + "epoch": 67.49318801089919, + "grad_norm": 3.0568342208862305, + "learning_rate": 5.048736727250689e-06, + "loss": 0.1221, + "step": 24770 + }, + { + "epoch": 67.49591280653951, + "grad_norm": 3.014346122741699, + "learning_rate": 5.047970016665031e-06, + "loss": 0.0739, + "step": 24771 + }, + { + "epoch": 67.49863760217984, + "grad_norm": 3.089616537094116, + "learning_rate": 5.0472033446456195e-06, + "loss": 0.1213, + "step": 24772 + }, + { + "epoch": 67.50136239782016, + "grad_norm": 3.176083564758301, + "learning_rate": 5.046436711198431e-06, + "loss": 0.0425, + "step": 24773 + }, + { + "epoch": 67.50408719346049, + "grad_norm": 3.830902576446533, + "learning_rate": 5.045670116329435e-06, + "loss": 0.0919, + "step": 24774 + }, + { + "epoch": 67.50681198910081, + "grad_norm": 3.097994565963745, + "learning_rate": 5.0449035600446005e-06, + "loss": 0.0678, + "step": 24775 + }, + { + "epoch": 67.50953678474114, + "grad_norm": 5.094249725341797, + "learning_rate": 5.044137042349895e-06, + "loss": 0.099, + "step": 24776 + }, + { + "epoch": 67.51226158038148, + "grad_norm": 3.530489921569824, + "learning_rate": 5.043370563251293e-06, + "loss": 0.207, + "step": 24777 + }, + { + "epoch": 67.5149863760218, + "grad_norm": 3.2964890003204346, + "learning_rate": 5.0426041227547616e-06, + "loss": 0.2278, + "step": 24778 + }, + { + "epoch": 67.51771117166213, + "grad_norm": 2.7340049743652344, + "learning_rate": 5.041837720866266e-06, + "loss": 0.0463, + "step": 24779 + }, + { + "epoch": 67.52043596730245, + "grad_norm": 3.1398894786834717, + "learning_rate": 5.041071357591782e-06, + "loss": 0.0496, + "step": 24780 + }, + { + "epoch": 67.52316076294278, + "grad_norm": 2.630547285079956, + "learning_rate": 5.040305032937276e-06, + "loss": 0.1534, + "step": 24781 + }, + { + "epoch": 67.52588555858311, + "grad_norm": 2.391430377960205, + "learning_rate": 5.039538746908714e-06, + "loss": 0.0404, + "step": 24782 + }, + { + "epoch": 67.52861035422343, + "grad_norm": 3.8539505004882812, + "learning_rate": 5.038772499512061e-06, + "loss": 0.2649, + "step": 24783 + }, + { + "epoch": 67.53133514986376, + "grad_norm": 3.411309003829956, + "learning_rate": 5.038006290753292e-06, + "loss": 0.0927, + "step": 24784 + }, + { + "epoch": 67.53405994550408, + "grad_norm": 3.26887845993042, + "learning_rate": 5.037240120638367e-06, + "loss": 0.1387, + "step": 24785 + }, + { + "epoch": 67.53678474114442, + "grad_norm": 3.015413999557495, + "learning_rate": 5.0364739891732584e-06, + "loss": 0.1044, + "step": 24786 + }, + { + "epoch": 67.53950953678473, + "grad_norm": 2.9222254753112793, + "learning_rate": 5.0357078963639325e-06, + "loss": 0.1054, + "step": 24787 + }, + { + "epoch": 67.54223433242507, + "grad_norm": 5.172916412353516, + "learning_rate": 5.034941842216349e-06, + "loss": 0.1323, + "step": 24788 + }, + { + "epoch": 67.5449591280654, + "grad_norm": 4.501311302185059, + "learning_rate": 5.034175826736483e-06, + "loss": 0.139, + "step": 24789 + }, + { + "epoch": 67.54768392370572, + "grad_norm": 4.1948418617248535, + "learning_rate": 5.033409849930295e-06, + "loss": 0.0798, + "step": 24790 + }, + { + "epoch": 67.55040871934605, + "grad_norm": 2.8324954509735107, + "learning_rate": 5.032643911803752e-06, + "loss": 0.1167, + "step": 24791 + }, + { + "epoch": 67.55313351498637, + "grad_norm": 8.362939834594727, + "learning_rate": 5.031878012362813e-06, + "loss": 0.087, + "step": 24792 + }, + { + "epoch": 67.5558583106267, + "grad_norm": 2.408095598220825, + "learning_rate": 5.031112151613453e-06, + "loss": 0.0604, + "step": 24793 + }, + { + "epoch": 67.55858310626704, + "grad_norm": 3.738321304321289, + "learning_rate": 5.030346329561632e-06, + "loss": 0.0899, + "step": 24794 + }, + { + "epoch": 67.56130790190736, + "grad_norm": 2.8952131271362305, + "learning_rate": 5.029580546213313e-06, + "loss": 0.0963, + "step": 24795 + }, + { + "epoch": 67.56403269754769, + "grad_norm": 3.862053632736206, + "learning_rate": 5.0288148015744576e-06, + "loss": 0.0682, + "step": 24796 + }, + { + "epoch": 67.566757493188, + "grad_norm": 3.8780133724212646, + "learning_rate": 5.028049095651036e-06, + "loss": 0.0962, + "step": 24797 + }, + { + "epoch": 67.56948228882834, + "grad_norm": 2.654364824295044, + "learning_rate": 5.027283428449008e-06, + "loss": 0.0397, + "step": 24798 + }, + { + "epoch": 67.57220708446866, + "grad_norm": 2.4831955432891846, + "learning_rate": 5.0265177999743335e-06, + "loss": 0.0322, + "step": 24799 + }, + { + "epoch": 67.57493188010899, + "grad_norm": 3.551032304763794, + "learning_rate": 5.025752210232982e-06, + "loss": 0.1826, + "step": 24800 + }, + { + "epoch": 67.57765667574932, + "grad_norm": 3.573977470397949, + "learning_rate": 5.0249866592309115e-06, + "loss": 0.0409, + "step": 24801 + }, + { + "epoch": 67.58038147138964, + "grad_norm": 2.2330880165100098, + "learning_rate": 5.024221146974084e-06, + "loss": 0.0276, + "step": 24802 + }, + { + "epoch": 67.58310626702998, + "grad_norm": 3.4516408443450928, + "learning_rate": 5.02345567346846e-06, + "loss": 0.0809, + "step": 24803 + }, + { + "epoch": 67.5858310626703, + "grad_norm": 2.8857977390289307, + "learning_rate": 5.022690238720002e-06, + "loss": 0.0433, + "step": 24804 + }, + { + "epoch": 67.58855585831063, + "grad_norm": 2.741292953491211, + "learning_rate": 5.021924842734678e-06, + "loss": 0.0724, + "step": 24805 + }, + { + "epoch": 67.59128065395096, + "grad_norm": 2.7073473930358887, + "learning_rate": 5.021159485518441e-06, + "loss": 0.0375, + "step": 24806 + }, + { + "epoch": 67.59400544959128, + "grad_norm": 5.090786457061768, + "learning_rate": 5.020394167077254e-06, + "loss": 0.1652, + "step": 24807 + }, + { + "epoch": 67.59673024523161, + "grad_norm": 3.7017996311187744, + "learning_rate": 5.019628887417073e-06, + "loss": 0.0454, + "step": 24808 + }, + { + "epoch": 67.59945504087193, + "grad_norm": 2.341773748397827, + "learning_rate": 5.0188636465438654e-06, + "loss": 0.0507, + "step": 24809 + }, + { + "epoch": 67.60217983651226, + "grad_norm": 2.2711684703826904, + "learning_rate": 5.018098444463588e-06, + "loss": 0.0479, + "step": 24810 + }, + { + "epoch": 67.60490463215258, + "grad_norm": 2.489880323410034, + "learning_rate": 5.0173332811822e-06, + "loss": 0.0304, + "step": 24811 + }, + { + "epoch": 67.60762942779292, + "grad_norm": 5.754882335662842, + "learning_rate": 5.016568156705657e-06, + "loss": 0.1992, + "step": 24812 + }, + { + "epoch": 67.61035422343325, + "grad_norm": 3.56738018989563, + "learning_rate": 5.015803071039923e-06, + "loss": 0.079, + "step": 24813 + }, + { + "epoch": 67.61307901907357, + "grad_norm": 6.180990695953369, + "learning_rate": 5.015038024190954e-06, + "loss": 0.0558, + "step": 24814 + }, + { + "epoch": 67.6158038147139, + "grad_norm": 3.8189873695373535, + "learning_rate": 5.014273016164711e-06, + "loss": 0.0851, + "step": 24815 + }, + { + "epoch": 67.61852861035422, + "grad_norm": 4.0965681076049805, + "learning_rate": 5.013508046967142e-06, + "loss": 0.1865, + "step": 24816 + }, + { + "epoch": 67.62125340599455, + "grad_norm": 3.53777813911438, + "learning_rate": 5.012743116604217e-06, + "loss": 0.0459, + "step": 24817 + }, + { + "epoch": 67.62397820163488, + "grad_norm": 3.362224817276001, + "learning_rate": 5.011978225081889e-06, + "loss": 0.069, + "step": 24818 + }, + { + "epoch": 67.6267029972752, + "grad_norm": 3.1568098068237305, + "learning_rate": 5.011213372406114e-06, + "loss": 0.0637, + "step": 24819 + }, + { + "epoch": 67.62942779291554, + "grad_norm": 2.6528587341308594, + "learning_rate": 5.010448558582841e-06, + "loss": 0.0515, + "step": 24820 + }, + { + "epoch": 67.63215258855585, + "grad_norm": 3.075692653656006, + "learning_rate": 5.00968378361804e-06, + "loss": 0.0959, + "step": 24821 + }, + { + "epoch": 67.63487738419619, + "grad_norm": 3.195258617401123, + "learning_rate": 5.008919047517663e-06, + "loss": 0.0471, + "step": 24822 + }, + { + "epoch": 67.6376021798365, + "grad_norm": 3.759169340133667, + "learning_rate": 5.008154350287663e-06, + "loss": 0.0691, + "step": 24823 + }, + { + "epoch": 67.64032697547684, + "grad_norm": 4.912634372711182, + "learning_rate": 5.007389691933992e-06, + "loss": 0.037, + "step": 24824 + }, + { + "epoch": 67.64305177111717, + "grad_norm": 3.0033481121063232, + "learning_rate": 5.006625072462615e-06, + "loss": 0.0449, + "step": 24825 + }, + { + "epoch": 67.64577656675749, + "grad_norm": 2.47558856010437, + "learning_rate": 5.005860491879479e-06, + "loss": 0.0442, + "step": 24826 + }, + { + "epoch": 67.64850136239782, + "grad_norm": 3.771505832672119, + "learning_rate": 5.005095950190541e-06, + "loss": 0.0826, + "step": 24827 + }, + { + "epoch": 67.65122615803814, + "grad_norm": 4.252354621887207, + "learning_rate": 5.004331447401754e-06, + "loss": 0.0824, + "step": 24828 + }, + { + "epoch": 67.65395095367847, + "grad_norm": 3.3859550952911377, + "learning_rate": 5.003566983519073e-06, + "loss": 0.1013, + "step": 24829 + }, + { + "epoch": 67.65667574931881, + "grad_norm": 2.417128562927246, + "learning_rate": 5.002802558548454e-06, + "loss": 0.0727, + "step": 24830 + }, + { + "epoch": 67.65940054495913, + "grad_norm": 3.090529441833496, + "learning_rate": 5.002038172495847e-06, + "loss": 0.0413, + "step": 24831 + }, + { + "epoch": 67.66212534059946, + "grad_norm": 2.4321982860565186, + "learning_rate": 5.001273825367201e-06, + "loss": 0.1191, + "step": 24832 + }, + { + "epoch": 67.66485013623978, + "grad_norm": 4.1490983963012695, + "learning_rate": 5.0005095171684794e-06, + "loss": 0.0716, + "step": 24833 + }, + { + "epoch": 67.66757493188011, + "grad_norm": 5.533572196960449, + "learning_rate": 4.999745247905627e-06, + "loss": 0.2342, + "step": 24834 + }, + { + "epoch": 67.67029972752043, + "grad_norm": 2.7488348484039307, + "learning_rate": 4.998981017584598e-06, + "loss": 0.0645, + "step": 24835 + }, + { + "epoch": 67.67302452316076, + "grad_norm": 4.481891632080078, + "learning_rate": 4.99821682621134e-06, + "loss": 0.1657, + "step": 24836 + }, + { + "epoch": 67.6757493188011, + "grad_norm": 4.825045108795166, + "learning_rate": 4.9974526737918095e-06, + "loss": 0.1055, + "step": 24837 + }, + { + "epoch": 67.67847411444141, + "grad_norm": 3.8038241863250732, + "learning_rate": 4.996688560331961e-06, + "loss": 0.1125, + "step": 24838 + }, + { + "epoch": 67.68119891008175, + "grad_norm": 4.075389862060547, + "learning_rate": 4.995924485837739e-06, + "loss": 0.1495, + "step": 24839 + }, + { + "epoch": 67.68392370572207, + "grad_norm": 2.7468202114105225, + "learning_rate": 4.995160450315093e-06, + "loss": 0.0668, + "step": 24840 + }, + { + "epoch": 67.6866485013624, + "grad_norm": 3.0879342555999756, + "learning_rate": 4.99439645376998e-06, + "loss": 0.0592, + "step": 24841 + }, + { + "epoch": 67.68937329700273, + "grad_norm": 3.7090606689453125, + "learning_rate": 4.993632496208346e-06, + "loss": 0.2208, + "step": 24842 + }, + { + "epoch": 67.69209809264305, + "grad_norm": 2.401188373565674, + "learning_rate": 4.992868577636142e-06, + "loss": 0.0285, + "step": 24843 + }, + { + "epoch": 67.69482288828338, + "grad_norm": 5.189709663391113, + "learning_rate": 4.992104698059312e-06, + "loss": 0.0577, + "step": 24844 + }, + { + "epoch": 67.6975476839237, + "grad_norm": 2.323056221008301, + "learning_rate": 4.991340857483813e-06, + "loss": 0.047, + "step": 24845 + }, + { + "epoch": 67.70027247956403, + "grad_norm": 4.279284477233887, + "learning_rate": 4.9905770559155905e-06, + "loss": 0.0586, + "step": 24846 + }, + { + "epoch": 67.70299727520435, + "grad_norm": 2.025045871734619, + "learning_rate": 4.989813293360593e-06, + "loss": 0.0442, + "step": 24847 + }, + { + "epoch": 67.70572207084469, + "grad_norm": 3.212538480758667, + "learning_rate": 4.989049569824763e-06, + "loss": 0.0544, + "step": 24848 + }, + { + "epoch": 67.70844686648502, + "grad_norm": 3.816307783126831, + "learning_rate": 4.988285885314059e-06, + "loss": 0.044, + "step": 24849 + }, + { + "epoch": 67.71117166212534, + "grad_norm": 3.193031072616577, + "learning_rate": 4.987522239834422e-06, + "loss": 0.27, + "step": 24850 + }, + { + "epoch": 67.71389645776567, + "grad_norm": 3.969139814376831, + "learning_rate": 4.9867586333918015e-06, + "loss": 0.0459, + "step": 24851 + }, + { + "epoch": 67.71662125340599, + "grad_norm": 2.8488636016845703, + "learning_rate": 4.985995065992139e-06, + "loss": 0.0686, + "step": 24852 + }, + { + "epoch": 67.71934604904632, + "grad_norm": 4.406191349029541, + "learning_rate": 4.985231537641391e-06, + "loss": 0.1313, + "step": 24853 + }, + { + "epoch": 67.72207084468666, + "grad_norm": 2.194641590118408, + "learning_rate": 4.984468048345493e-06, + "loss": 0.0321, + "step": 24854 + }, + { + "epoch": 67.72479564032697, + "grad_norm": 3.4836697578430176, + "learning_rate": 4.983704598110401e-06, + "loss": 0.0835, + "step": 24855 + }, + { + "epoch": 67.7275204359673, + "grad_norm": 3.131699562072754, + "learning_rate": 4.982941186942055e-06, + "loss": 0.1429, + "step": 24856 + }, + { + "epoch": 67.73024523160763, + "grad_norm": 4.213091850280762, + "learning_rate": 4.982177814846398e-06, + "loss": 0.0812, + "step": 24857 + }, + { + "epoch": 67.73297002724796, + "grad_norm": 2.6906919479370117, + "learning_rate": 4.981414481829383e-06, + "loss": 0.0538, + "step": 24858 + }, + { + "epoch": 67.73569482288828, + "grad_norm": 4.27742862701416, + "learning_rate": 4.980651187896951e-06, + "loss": 0.2144, + "step": 24859 + }, + { + "epoch": 67.73841961852861, + "grad_norm": 2.63991117477417, + "learning_rate": 4.979887933055045e-06, + "loss": 0.0729, + "step": 24860 + }, + { + "epoch": 67.74114441416894, + "grad_norm": 3.841693878173828, + "learning_rate": 4.979124717309607e-06, + "loss": 0.0735, + "step": 24861 + }, + { + "epoch": 67.74386920980926, + "grad_norm": 2.9286797046661377, + "learning_rate": 4.978361540666587e-06, + "loss": 0.0447, + "step": 24862 + }, + { + "epoch": 67.7465940054496, + "grad_norm": 4.95592737197876, + "learning_rate": 4.977598403131927e-06, + "loss": 0.1634, + "step": 24863 + }, + { + "epoch": 67.74931880108991, + "grad_norm": 4.124266624450684, + "learning_rate": 4.976835304711565e-06, + "loss": 0.1666, + "step": 24864 + }, + { + "epoch": 67.75204359673025, + "grad_norm": 2.6184325218200684, + "learning_rate": 4.976072245411451e-06, + "loss": 0.0387, + "step": 24865 + }, + { + "epoch": 67.75476839237058, + "grad_norm": 3.3357319831848145, + "learning_rate": 4.9753092252375245e-06, + "loss": 0.0702, + "step": 24866 + }, + { + "epoch": 67.7574931880109, + "grad_norm": 3.164846897125244, + "learning_rate": 4.974546244195729e-06, + "loss": 0.0592, + "step": 24867 + }, + { + "epoch": 67.76021798365123, + "grad_norm": 2.907390832901001, + "learning_rate": 4.973783302292001e-06, + "loss": 0.1629, + "step": 24868 + }, + { + "epoch": 67.76294277929155, + "grad_norm": 3.3718841075897217, + "learning_rate": 4.973020399532291e-06, + "loss": 0.0482, + "step": 24869 + }, + { + "epoch": 67.76566757493188, + "grad_norm": 3.1799652576446533, + "learning_rate": 4.972257535922537e-06, + "loss": 0.1327, + "step": 24870 + }, + { + "epoch": 67.7683923705722, + "grad_norm": 3.9311981201171875, + "learning_rate": 4.971494711468675e-06, + "loss": 0.1101, + "step": 24871 + }, + { + "epoch": 67.77111716621253, + "grad_norm": 3.581341028213501, + "learning_rate": 4.970731926176654e-06, + "loss": 0.1398, + "step": 24872 + }, + { + "epoch": 67.77384196185287, + "grad_norm": 2.3169612884521484, + "learning_rate": 4.969969180052407e-06, + "loss": 0.0444, + "step": 24873 + }, + { + "epoch": 67.77656675749319, + "grad_norm": 2.0783934593200684, + "learning_rate": 4.969206473101883e-06, + "loss": 0.0263, + "step": 24874 + }, + { + "epoch": 67.77929155313352, + "grad_norm": 3.9229013919830322, + "learning_rate": 4.9684438053310155e-06, + "loss": 0.0502, + "step": 24875 + }, + { + "epoch": 67.78201634877384, + "grad_norm": 3.068594455718994, + "learning_rate": 4.967681176745747e-06, + "loss": 0.0882, + "step": 24876 + }, + { + "epoch": 67.78474114441417, + "grad_norm": 3.4225618839263916, + "learning_rate": 4.966918587352011e-06, + "loss": 0.0911, + "step": 24877 + }, + { + "epoch": 67.7874659400545, + "grad_norm": 4.238270282745361, + "learning_rate": 4.966156037155755e-06, + "loss": 0.1074, + "step": 24878 + }, + { + "epoch": 67.79019073569482, + "grad_norm": 4.291094779968262, + "learning_rate": 4.965393526162914e-06, + "loss": 0.0818, + "step": 24879 + }, + { + "epoch": 67.79291553133515, + "grad_norm": 3.67020583152771, + "learning_rate": 4.964631054379426e-06, + "loss": 0.1277, + "step": 24880 + }, + { + "epoch": 67.79564032697547, + "grad_norm": 5.443231105804443, + "learning_rate": 4.963868621811227e-06, + "loss": 0.1818, + "step": 24881 + }, + { + "epoch": 67.7983651226158, + "grad_norm": 3.1344242095947266, + "learning_rate": 4.963106228464258e-06, + "loss": 0.0418, + "step": 24882 + }, + { + "epoch": 67.80108991825612, + "grad_norm": 4.302298069000244, + "learning_rate": 4.962343874344457e-06, + "loss": 0.0737, + "step": 24883 + }, + { + "epoch": 67.80381471389646, + "grad_norm": 3.8121414184570312, + "learning_rate": 4.96158155945776e-06, + "loss": 0.0838, + "step": 24884 + }, + { + "epoch": 67.80653950953679, + "grad_norm": 3.3013153076171875, + "learning_rate": 4.9608192838100995e-06, + "loss": 0.0715, + "step": 24885 + }, + { + "epoch": 67.80926430517711, + "grad_norm": 3.171365261077881, + "learning_rate": 4.96005704740742e-06, + "loss": 0.0612, + "step": 24886 + }, + { + "epoch": 67.81198910081744, + "grad_norm": 5.323923587799072, + "learning_rate": 4.959294850255655e-06, + "loss": 0.0807, + "step": 24887 + }, + { + "epoch": 67.81471389645776, + "grad_norm": 3.057110071182251, + "learning_rate": 4.958532692360735e-06, + "loss": 0.0941, + "step": 24888 + }, + { + "epoch": 67.8174386920981, + "grad_norm": 2.6628201007843018, + "learning_rate": 4.9577705737286e-06, + "loss": 0.0561, + "step": 24889 + }, + { + "epoch": 67.82016348773843, + "grad_norm": 2.3849899768829346, + "learning_rate": 4.957008494365189e-06, + "loss": 0.102, + "step": 24890 + }, + { + "epoch": 67.82288828337875, + "grad_norm": 3.0842764377593994, + "learning_rate": 4.956246454276433e-06, + "loss": 0.054, + "step": 24891 + }, + { + "epoch": 67.82561307901908, + "grad_norm": 3.459657907485962, + "learning_rate": 4.955484453468269e-06, + "loss": 0.0528, + "step": 24892 + }, + { + "epoch": 67.8283378746594, + "grad_norm": 2.9648995399475098, + "learning_rate": 4.954722491946624e-06, + "loss": 0.0465, + "step": 24893 + }, + { + "epoch": 67.83106267029973, + "grad_norm": 4.292356491088867, + "learning_rate": 4.953960569717443e-06, + "loss": 0.0527, + "step": 24894 + }, + { + "epoch": 67.83378746594005, + "grad_norm": 2.9318783283233643, + "learning_rate": 4.953198686786655e-06, + "loss": 0.0459, + "step": 24895 + }, + { + "epoch": 67.83651226158038, + "grad_norm": 3.5212247371673584, + "learning_rate": 4.952436843160192e-06, + "loss": 0.0832, + "step": 24896 + }, + { + "epoch": 67.83923705722071, + "grad_norm": 3.3984742164611816, + "learning_rate": 4.951675038843985e-06, + "loss": 0.1136, + "step": 24897 + }, + { + "epoch": 67.84196185286103, + "grad_norm": 3.9382457733154297, + "learning_rate": 4.950913273843975e-06, + "loss": 0.094, + "step": 24898 + }, + { + "epoch": 67.84468664850137, + "grad_norm": 3.3440463542938232, + "learning_rate": 4.950151548166089e-06, + "loss": 0.0428, + "step": 24899 + }, + { + "epoch": 67.84741144414168, + "grad_norm": 3.871778964996338, + "learning_rate": 4.949389861816259e-06, + "loss": 0.0615, + "step": 24900 + }, + { + "epoch": 67.85013623978202, + "grad_norm": 2.4289021492004395, + "learning_rate": 4.948628214800417e-06, + "loss": 0.0303, + "step": 24901 + }, + { + "epoch": 67.85286103542235, + "grad_norm": 3.30828857421875, + "learning_rate": 4.947866607124499e-06, + "loss": 0.0544, + "step": 24902 + }, + { + "epoch": 67.85558583106267, + "grad_norm": 2.7102503776550293, + "learning_rate": 4.947105038794432e-06, + "loss": 0.0484, + "step": 24903 + }, + { + "epoch": 67.858310626703, + "grad_norm": 2.3424482345581055, + "learning_rate": 4.946343509816149e-06, + "loss": 0.0498, + "step": 24904 + }, + { + "epoch": 67.86103542234332, + "grad_norm": 2.4523189067840576, + "learning_rate": 4.945582020195576e-06, + "loss": 0.0594, + "step": 24905 + }, + { + "epoch": 67.86376021798365, + "grad_norm": 3.603227376937866, + "learning_rate": 4.944820569938649e-06, + "loss": 0.044, + "step": 24906 + }, + { + "epoch": 67.86648501362397, + "grad_norm": 2.3260836601257324, + "learning_rate": 4.9440591590512984e-06, + "loss": 0.0662, + "step": 24907 + }, + { + "epoch": 67.8692098092643, + "grad_norm": 3.8470189571380615, + "learning_rate": 4.9432977875394536e-06, + "loss": 0.1546, + "step": 24908 + }, + { + "epoch": 67.87193460490464, + "grad_norm": 3.7191038131713867, + "learning_rate": 4.942536455409039e-06, + "loss": 0.1139, + "step": 24909 + }, + { + "epoch": 67.87465940054496, + "grad_norm": 4.3344221115112305, + "learning_rate": 4.941775162665992e-06, + "loss": 0.0525, + "step": 24910 + }, + { + "epoch": 67.87738419618529, + "grad_norm": 2.6456716060638428, + "learning_rate": 4.941013909316236e-06, + "loss": 0.2204, + "step": 24911 + }, + { + "epoch": 67.88010899182561, + "grad_norm": 2.9865050315856934, + "learning_rate": 4.940252695365701e-06, + "loss": 0.0631, + "step": 24912 + }, + { + "epoch": 67.88283378746594, + "grad_norm": 6.068676948547363, + "learning_rate": 4.939491520820312e-06, + "loss": 0.0772, + "step": 24913 + }, + { + "epoch": 67.88555858310627, + "grad_norm": 3.0810790061950684, + "learning_rate": 4.938730385686004e-06, + "loss": 0.0483, + "step": 24914 + }, + { + "epoch": 67.88828337874659, + "grad_norm": 2.9013748168945312, + "learning_rate": 4.937969289968701e-06, + "loss": 0.0996, + "step": 24915 + }, + { + "epoch": 67.89100817438693, + "grad_norm": 4.394800662994385, + "learning_rate": 4.93720823367433e-06, + "loss": 0.1282, + "step": 24916 + }, + { + "epoch": 67.89373297002724, + "grad_norm": 2.896500587463379, + "learning_rate": 4.936447216808814e-06, + "loss": 0.0702, + "step": 24917 + }, + { + "epoch": 67.89645776566758, + "grad_norm": 2.685396909713745, + "learning_rate": 4.935686239378088e-06, + "loss": 0.0863, + "step": 24918 + }, + { + "epoch": 67.8991825613079, + "grad_norm": 2.7011332511901855, + "learning_rate": 4.934925301388075e-06, + "loss": 0.0324, + "step": 24919 + }, + { + "epoch": 67.90190735694823, + "grad_norm": 3.0609073638916016, + "learning_rate": 4.9341644028447014e-06, + "loss": 0.0397, + "step": 24920 + }, + { + "epoch": 67.90463215258856, + "grad_norm": 2.5676541328430176, + "learning_rate": 4.933403543753887e-06, + "loss": 0.0358, + "step": 24921 + }, + { + "epoch": 67.90735694822888, + "grad_norm": 2.9928839206695557, + "learning_rate": 4.9326427241215666e-06, + "loss": 0.0719, + "step": 24922 + }, + { + "epoch": 67.91008174386921, + "grad_norm": 2.7477798461914062, + "learning_rate": 4.9318819439536596e-06, + "loss": 0.0999, + "step": 24923 + }, + { + "epoch": 67.91280653950953, + "grad_norm": 4.223602294921875, + "learning_rate": 4.931121203256095e-06, + "loss": 0.0801, + "step": 24924 + }, + { + "epoch": 67.91553133514986, + "grad_norm": 2.8641223907470703, + "learning_rate": 4.9303605020347965e-06, + "loss": 0.1024, + "step": 24925 + }, + { + "epoch": 67.9182561307902, + "grad_norm": 3.264960527420044, + "learning_rate": 4.929599840295683e-06, + "loss": 0.0905, + "step": 24926 + }, + { + "epoch": 67.92098092643052, + "grad_norm": 3.5409579277038574, + "learning_rate": 4.928839218044687e-06, + "loss": 0.087, + "step": 24927 + }, + { + "epoch": 67.92370572207085, + "grad_norm": 3.775388717651367, + "learning_rate": 4.928078635287726e-06, + "loss": 0.0643, + "step": 24928 + }, + { + "epoch": 67.92643051771117, + "grad_norm": 3.0450453758239746, + "learning_rate": 4.927318092030723e-06, + "loss": 0.0672, + "step": 24929 + }, + { + "epoch": 67.9291553133515, + "grad_norm": 4.1666669845581055, + "learning_rate": 4.9265575882796076e-06, + "loss": 0.0853, + "step": 24930 + }, + { + "epoch": 67.93188010899182, + "grad_norm": 3.8314664363861084, + "learning_rate": 4.925797124040298e-06, + "loss": 0.232, + "step": 24931 + }, + { + "epoch": 67.93460490463215, + "grad_norm": 4.507056713104248, + "learning_rate": 4.925036699318717e-06, + "loss": 0.0599, + "step": 24932 + }, + { + "epoch": 67.93732970027249, + "grad_norm": 3.821880578994751, + "learning_rate": 4.9242763141207825e-06, + "loss": 0.1515, + "step": 24933 + }, + { + "epoch": 67.9400544959128, + "grad_norm": 2.9991466999053955, + "learning_rate": 4.9235159684524256e-06, + "loss": 0.1734, + "step": 24934 + }, + { + "epoch": 67.94277929155314, + "grad_norm": 2.7332661151885986, + "learning_rate": 4.922755662319563e-06, + "loss": 0.0352, + "step": 24935 + }, + { + "epoch": 67.94550408719346, + "grad_norm": 4.4129252433776855, + "learning_rate": 4.9219953957281154e-06, + "loss": 0.0785, + "step": 24936 + }, + { + "epoch": 67.94822888283379, + "grad_norm": 2.548818588256836, + "learning_rate": 4.9212351686839995e-06, + "loss": 0.0363, + "step": 24937 + }, + { + "epoch": 67.95095367847412, + "grad_norm": 5.2256646156311035, + "learning_rate": 4.920474981193146e-06, + "loss": 0.1432, + "step": 24938 + }, + { + "epoch": 67.95367847411444, + "grad_norm": 3.511392116546631, + "learning_rate": 4.9197148332614685e-06, + "loss": 0.0745, + "step": 24939 + }, + { + "epoch": 67.95640326975477, + "grad_norm": 2.386901378631592, + "learning_rate": 4.9189547248948856e-06, + "loss": 0.0296, + "step": 24940 + }, + { + "epoch": 67.95912806539509, + "grad_norm": 3.104686975479126, + "learning_rate": 4.918194656099323e-06, + "loss": 0.0769, + "step": 24941 + }, + { + "epoch": 67.96185286103542, + "grad_norm": 3.6968278884887695, + "learning_rate": 4.917434626880694e-06, + "loss": 0.1325, + "step": 24942 + }, + { + "epoch": 67.96457765667574, + "grad_norm": 2.0700976848602295, + "learning_rate": 4.916674637244924e-06, + "loss": 0.0848, + "step": 24943 + }, + { + "epoch": 67.96730245231608, + "grad_norm": 2.490745782852173, + "learning_rate": 4.915914687197928e-06, + "loss": 0.0805, + "step": 24944 + }, + { + "epoch": 67.97002724795641, + "grad_norm": 3.9408082962036133, + "learning_rate": 4.915154776745624e-06, + "loss": 0.0811, + "step": 24945 + }, + { + "epoch": 67.97275204359673, + "grad_norm": 3.8298580646514893, + "learning_rate": 4.914394905893928e-06, + "loss": 0.2028, + "step": 24946 + }, + { + "epoch": 67.97547683923706, + "grad_norm": 8.07292652130127, + "learning_rate": 4.913635074648765e-06, + "loss": 0.0823, + "step": 24947 + }, + { + "epoch": 67.97820163487738, + "grad_norm": 2.2788009643554688, + "learning_rate": 4.912875283016047e-06, + "loss": 0.0249, + "step": 24948 + }, + { + "epoch": 67.98092643051771, + "grad_norm": 3.7298474311828613, + "learning_rate": 4.9121155310016946e-06, + "loss": 0.1421, + "step": 24949 + }, + { + "epoch": 67.98365122615803, + "grad_norm": 5.163436412811279, + "learning_rate": 4.911355818611618e-06, + "loss": 0.153, + "step": 24950 + }, + { + "epoch": 67.98637602179836, + "grad_norm": 3.9633572101593018, + "learning_rate": 4.9105961458517415e-06, + "loss": 0.1678, + "step": 24951 + }, + { + "epoch": 67.9891008174387, + "grad_norm": 4.479075908660889, + "learning_rate": 4.909836512727978e-06, + "loss": 0.1247, + "step": 24952 + }, + { + "epoch": 67.99182561307902, + "grad_norm": 3.044597625732422, + "learning_rate": 4.909076919246242e-06, + "loss": 0.1124, + "step": 24953 + }, + { + "epoch": 67.99455040871935, + "grad_norm": 3.070491313934326, + "learning_rate": 4.908317365412454e-06, + "loss": 0.1288, + "step": 24954 + }, + { + "epoch": 67.99727520435967, + "grad_norm": 3.2853972911834717, + "learning_rate": 4.9075578512325266e-06, + "loss": 0.1325, + "step": 24955 + }, + { + "epoch": 68.0, + "grad_norm": 4.042403221130371, + "learning_rate": 4.9067983767123736e-06, + "loss": 0.1736, + "step": 24956 + }, + { + "epoch": 68.00272479564033, + "grad_norm": 2.7494149208068848, + "learning_rate": 4.906038941857908e-06, + "loss": 0.0768, + "step": 24957 + }, + { + "epoch": 68.00544959128065, + "grad_norm": 3.2249743938446045, + "learning_rate": 4.905279546675047e-06, + "loss": 0.0774, + "step": 24958 + }, + { + "epoch": 68.00817438692098, + "grad_norm": 2.04597806930542, + "learning_rate": 4.904520191169709e-06, + "loss": 0.0732, + "step": 24959 + }, + { + "epoch": 68.0108991825613, + "grad_norm": 3.357067584991455, + "learning_rate": 4.903760875347804e-06, + "loss": 0.0507, + "step": 24960 + }, + { + "epoch": 68.01362397820164, + "grad_norm": 3.263263702392578, + "learning_rate": 4.9030015992152445e-06, + "loss": 0.0539, + "step": 24961 + }, + { + "epoch": 68.01634877384195, + "grad_norm": 3.323880672454834, + "learning_rate": 4.902242362777942e-06, + "loss": 0.1754, + "step": 24962 + }, + { + "epoch": 68.01907356948229, + "grad_norm": 3.205150604248047, + "learning_rate": 4.901483166041815e-06, + "loss": 0.1094, + "step": 24963 + }, + { + "epoch": 68.02179836512262, + "grad_norm": 3.1998703479766846, + "learning_rate": 4.900724009012773e-06, + "loss": 0.0441, + "step": 24964 + }, + { + "epoch": 68.02452316076294, + "grad_norm": 9.504284858703613, + "learning_rate": 4.899964891696728e-06, + "loss": 0.1081, + "step": 24965 + }, + { + "epoch": 68.02724795640327, + "grad_norm": 3.5057647228240967, + "learning_rate": 4.899205814099589e-06, + "loss": 0.083, + "step": 24966 + }, + { + "epoch": 68.02997275204359, + "grad_norm": 8.63381290435791, + "learning_rate": 4.898446776227274e-06, + "loss": 0.1381, + "step": 24967 + }, + { + "epoch": 68.03269754768392, + "grad_norm": 3.1937215328216553, + "learning_rate": 4.897687778085693e-06, + "loss": 0.136, + "step": 24968 + }, + { + "epoch": 68.03542234332426, + "grad_norm": 2.3671205043792725, + "learning_rate": 4.896928819680753e-06, + "loss": 0.0353, + "step": 24969 + }, + { + "epoch": 68.03814713896458, + "grad_norm": 6.201351642608643, + "learning_rate": 4.896169901018365e-06, + "loss": 0.0942, + "step": 24970 + }, + { + "epoch": 68.04087193460491, + "grad_norm": 3.7104909420013428, + "learning_rate": 4.8954110221044435e-06, + "loss": 0.0563, + "step": 24971 + }, + { + "epoch": 68.04359673024523, + "grad_norm": 2.5792465209960938, + "learning_rate": 4.894652182944899e-06, + "loss": 0.122, + "step": 24972 + }, + { + "epoch": 68.04632152588556, + "grad_norm": 2.297308921813965, + "learning_rate": 4.893893383545633e-06, + "loss": 0.1426, + "step": 24973 + }, + { + "epoch": 68.04904632152588, + "grad_norm": 3.3279075622558594, + "learning_rate": 4.893134623912567e-06, + "loss": 0.122, + "step": 24974 + }, + { + "epoch": 68.05177111716621, + "grad_norm": 2.6865179538726807, + "learning_rate": 4.892375904051599e-06, + "loss": 0.1871, + "step": 24975 + }, + { + "epoch": 68.05449591280654, + "grad_norm": 3.0044872760772705, + "learning_rate": 4.891617223968648e-06, + "loss": 0.0392, + "step": 24976 + }, + { + "epoch": 68.05722070844686, + "grad_norm": 4.275487422943115, + "learning_rate": 4.890858583669616e-06, + "loss": 0.1134, + "step": 24977 + }, + { + "epoch": 68.0599455040872, + "grad_norm": 3.2748069763183594, + "learning_rate": 4.89009998316041e-06, + "loss": 0.117, + "step": 24978 + }, + { + "epoch": 68.06267029972751, + "grad_norm": 3.3147456645965576, + "learning_rate": 4.889341422446945e-06, + "loss": 0.1342, + "step": 24979 + }, + { + "epoch": 68.06539509536785, + "grad_norm": 3.7245795726776123, + "learning_rate": 4.888582901535124e-06, + "loss": 0.2111, + "step": 24980 + }, + { + "epoch": 68.06811989100818, + "grad_norm": 2.658000946044922, + "learning_rate": 4.887824420430854e-06, + "loss": 0.1104, + "step": 24981 + }, + { + "epoch": 68.0708446866485, + "grad_norm": 2.3336551189422607, + "learning_rate": 4.887065979140041e-06, + "loss": 0.0396, + "step": 24982 + }, + { + "epoch": 68.07356948228883, + "grad_norm": 3.099041700363159, + "learning_rate": 4.886307577668596e-06, + "loss": 0.1679, + "step": 24983 + }, + { + "epoch": 68.07629427792915, + "grad_norm": 3.471858024597168, + "learning_rate": 4.885549216022424e-06, + "loss": 0.0494, + "step": 24984 + }, + { + "epoch": 68.07901907356948, + "grad_norm": 4.856651782989502, + "learning_rate": 4.8847908942074295e-06, + "loss": 0.0645, + "step": 24985 + }, + { + "epoch": 68.0817438692098, + "grad_norm": 2.4537742137908936, + "learning_rate": 4.884032612229515e-06, + "loss": 0.0337, + "step": 24986 + }, + { + "epoch": 68.08446866485014, + "grad_norm": 3.4039788246154785, + "learning_rate": 4.8832743700945936e-06, + "loss": 0.0667, + "step": 24987 + }, + { + "epoch": 68.08719346049047, + "grad_norm": 3.9975268840789795, + "learning_rate": 4.882516167808568e-06, + "loss": 0.0868, + "step": 24988 + }, + { + "epoch": 68.08991825613079, + "grad_norm": 3.4598822593688965, + "learning_rate": 4.881758005377339e-06, + "loss": 0.0667, + "step": 24989 + }, + { + "epoch": 68.09264305177112, + "grad_norm": 3.3750131130218506, + "learning_rate": 4.880999882806813e-06, + "loss": 0.0661, + "step": 24990 + }, + { + "epoch": 68.09536784741144, + "grad_norm": 2.525282382965088, + "learning_rate": 4.880241800102897e-06, + "loss": 0.0454, + "step": 24991 + }, + { + "epoch": 68.09809264305177, + "grad_norm": 3.315260648727417, + "learning_rate": 4.87948375727149e-06, + "loss": 0.3172, + "step": 24992 + }, + { + "epoch": 68.1008174386921, + "grad_norm": 2.868989944458008, + "learning_rate": 4.878725754318503e-06, + "loss": 0.0721, + "step": 24993 + }, + { + "epoch": 68.10354223433242, + "grad_norm": 5.609745025634766, + "learning_rate": 4.877967791249831e-06, + "loss": 0.1983, + "step": 24994 + }, + { + "epoch": 68.10626702997276, + "grad_norm": 2.8073129653930664, + "learning_rate": 4.877209868071384e-06, + "loss": 0.0581, + "step": 24995 + }, + { + "epoch": 68.10899182561307, + "grad_norm": 3.576669692993164, + "learning_rate": 4.876451984789062e-06, + "loss": 0.1892, + "step": 24996 + }, + { + "epoch": 68.11171662125341, + "grad_norm": 3.127253770828247, + "learning_rate": 4.8756941414087675e-06, + "loss": 0.156, + "step": 24997 + }, + { + "epoch": 68.11444141689373, + "grad_norm": 2.397226572036743, + "learning_rate": 4.874936337936399e-06, + "loss": 0.0437, + "step": 24998 + }, + { + "epoch": 68.11716621253406, + "grad_norm": 2.780616283416748, + "learning_rate": 4.874178574377863e-06, + "loss": 0.0316, + "step": 24999 + }, + { + "epoch": 68.11989100817439, + "grad_norm": 3.2752492427825928, + "learning_rate": 4.8734208507390615e-06, + "loss": 0.0516, + "step": 25000 + }, + { + "epoch": 68.12261580381471, + "grad_norm": 3.1068167686462402, + "learning_rate": 4.872663167025893e-06, + "loss": 0.0899, + "step": 25001 + }, + { + "epoch": 68.12534059945504, + "grad_norm": 3.745326280593872, + "learning_rate": 4.8719055232442535e-06, + "loss": 0.0589, + "step": 25002 + }, + { + "epoch": 68.12806539509536, + "grad_norm": 2.551170825958252, + "learning_rate": 4.871147919400053e-06, + "loss": 0.048, + "step": 25003 + }, + { + "epoch": 68.1307901907357, + "grad_norm": 2.6059932708740234, + "learning_rate": 4.8703903554991885e-06, + "loss": 0.0439, + "step": 25004 + }, + { + "epoch": 68.13351498637603, + "grad_norm": 2.7945291996002197, + "learning_rate": 4.869632831547559e-06, + "loss": 0.0345, + "step": 25005 + }, + { + "epoch": 68.13623978201635, + "grad_norm": 4.376722812652588, + "learning_rate": 4.868875347551059e-06, + "loss": 0.0386, + "step": 25006 + }, + { + "epoch": 68.13896457765668, + "grad_norm": 2.1037650108337402, + "learning_rate": 4.868117903515596e-06, + "loss": 0.0377, + "step": 25007 + }, + { + "epoch": 68.141689373297, + "grad_norm": 3.319108009338379, + "learning_rate": 4.867360499447066e-06, + "loss": 0.05, + "step": 25008 + }, + { + "epoch": 68.14441416893733, + "grad_norm": 2.9765584468841553, + "learning_rate": 4.866603135351365e-06, + "loss": 0.1211, + "step": 25009 + }, + { + "epoch": 68.14713896457765, + "grad_norm": 2.914546251296997, + "learning_rate": 4.8658458112343955e-06, + "loss": 0.0883, + "step": 25010 + }, + { + "epoch": 68.14986376021798, + "grad_norm": 2.722857713699341, + "learning_rate": 4.8650885271020495e-06, + "loss": 0.1046, + "step": 25011 + }, + { + "epoch": 68.15258855585832, + "grad_norm": 3.4026708602905273, + "learning_rate": 4.864331282960234e-06, + "loss": 0.0672, + "step": 25012 + }, + { + "epoch": 68.15531335149863, + "grad_norm": 2.9237442016601562, + "learning_rate": 4.86357407881484e-06, + "loss": 0.0826, + "step": 25013 + }, + { + "epoch": 68.15803814713897, + "grad_norm": 3.331533670425415, + "learning_rate": 4.862816914671763e-06, + "loss": 0.1254, + "step": 25014 + }, + { + "epoch": 68.16076294277929, + "grad_norm": 3.147104024887085, + "learning_rate": 4.862059790536906e-06, + "loss": 0.0859, + "step": 25015 + }, + { + "epoch": 68.16348773841962, + "grad_norm": 2.5917232036590576, + "learning_rate": 4.861302706416162e-06, + "loss": 0.0624, + "step": 25016 + }, + { + "epoch": 68.16621253405995, + "grad_norm": 4.823266983032227, + "learning_rate": 4.860545662315427e-06, + "loss": 0.0767, + "step": 25017 + }, + { + "epoch": 68.16893732970027, + "grad_norm": 3.8482394218444824, + "learning_rate": 4.859788658240593e-06, + "loss": 0.1534, + "step": 25018 + }, + { + "epoch": 68.1716621253406, + "grad_norm": 4.588294506072998, + "learning_rate": 4.859031694197563e-06, + "loss": 0.0899, + "step": 25019 + }, + { + "epoch": 68.17438692098092, + "grad_norm": 2.63802170753479, + "learning_rate": 4.858274770192229e-06, + "loss": 0.1056, + "step": 25020 + }, + { + "epoch": 68.17711171662125, + "grad_norm": 2.652108669281006, + "learning_rate": 4.8575178862304865e-06, + "loss": 0.044, + "step": 25021 + }, + { + "epoch": 68.17983651226157, + "grad_norm": 4.528519630432129, + "learning_rate": 4.856761042318224e-06, + "loss": 0.1687, + "step": 25022 + }, + { + "epoch": 68.1825613079019, + "grad_norm": 5.335216999053955, + "learning_rate": 4.856004238461346e-06, + "loss": 0.0651, + "step": 25023 + }, + { + "epoch": 68.18528610354224, + "grad_norm": 3.355959892272949, + "learning_rate": 4.8552474746657405e-06, + "loss": 0.1393, + "step": 25024 + }, + { + "epoch": 68.18801089918256, + "grad_norm": 3.15427303314209, + "learning_rate": 4.854490750937303e-06, + "loss": 0.1628, + "step": 25025 + }, + { + "epoch": 68.19073569482289, + "grad_norm": 3.5091757774353027, + "learning_rate": 4.853734067281922e-06, + "loss": 0.0499, + "step": 25026 + }, + { + "epoch": 68.19346049046321, + "grad_norm": 3.323369264602661, + "learning_rate": 4.852977423705494e-06, + "loss": 0.0527, + "step": 25027 + }, + { + "epoch": 68.19618528610354, + "grad_norm": 4.669510841369629, + "learning_rate": 4.852220820213915e-06, + "loss": 0.0706, + "step": 25028 + }, + { + "epoch": 68.19891008174388, + "grad_norm": 5.563045978546143, + "learning_rate": 4.851464256813076e-06, + "loss": 0.1015, + "step": 25029 + }, + { + "epoch": 68.2016348773842, + "grad_norm": 3.3602840900421143, + "learning_rate": 4.850707733508868e-06, + "loss": 0.0472, + "step": 25030 + }, + { + "epoch": 68.20435967302453, + "grad_norm": 3.2086257934570312, + "learning_rate": 4.8499512503071775e-06, + "loss": 0.073, + "step": 25031 + }, + { + "epoch": 68.20708446866485, + "grad_norm": 4.109739780426025, + "learning_rate": 4.849194807213905e-06, + "loss": 0.1155, + "step": 25032 + }, + { + "epoch": 68.20980926430518, + "grad_norm": 5.412731170654297, + "learning_rate": 4.848438404234937e-06, + "loss": 0.158, + "step": 25033 + }, + { + "epoch": 68.2125340599455, + "grad_norm": 2.9590957164764404, + "learning_rate": 4.847682041376166e-06, + "loss": 0.042, + "step": 25034 + }, + { + "epoch": 68.21525885558583, + "grad_norm": 2.1525983810424805, + "learning_rate": 4.846925718643478e-06, + "loss": 0.067, + "step": 25035 + }, + { + "epoch": 68.21798365122616, + "grad_norm": 3.3515589237213135, + "learning_rate": 4.846169436042769e-06, + "loss": 0.0527, + "step": 25036 + }, + { + "epoch": 68.22070844686648, + "grad_norm": 2.3968660831451416, + "learning_rate": 4.845413193579927e-06, + "loss": 0.04, + "step": 25037 + }, + { + "epoch": 68.22343324250681, + "grad_norm": 2.7044997215270996, + "learning_rate": 4.844656991260838e-06, + "loss": 0.0377, + "step": 25038 + }, + { + "epoch": 68.22615803814713, + "grad_norm": 3.2693943977355957, + "learning_rate": 4.843900829091398e-06, + "loss": 0.1073, + "step": 25039 + }, + { + "epoch": 68.22888283378747, + "grad_norm": 3.2461183071136475, + "learning_rate": 4.8431447070774916e-06, + "loss": 0.1183, + "step": 25040 + }, + { + "epoch": 68.2316076294278, + "grad_norm": 5.564183235168457, + "learning_rate": 4.842388625225009e-06, + "loss": 0.1141, + "step": 25041 + }, + { + "epoch": 68.23433242506812, + "grad_norm": 6.375480651855469, + "learning_rate": 4.841632583539835e-06, + "loss": 0.0521, + "step": 25042 + }, + { + "epoch": 68.23705722070845, + "grad_norm": 2.3081696033477783, + "learning_rate": 4.840876582027863e-06, + "loss": 0.0383, + "step": 25043 + }, + { + "epoch": 68.23978201634877, + "grad_norm": 3.0546491146087646, + "learning_rate": 4.840120620694974e-06, + "loss": 0.112, + "step": 25044 + }, + { + "epoch": 68.2425068119891, + "grad_norm": 2.5620908737182617, + "learning_rate": 4.839364699547064e-06, + "loss": 0.1705, + "step": 25045 + }, + { + "epoch": 68.24523160762942, + "grad_norm": 3.5948729515075684, + "learning_rate": 4.8386088185900145e-06, + "loss": 0.1684, + "step": 25046 + }, + { + "epoch": 68.24795640326975, + "grad_norm": 3.0221545696258545, + "learning_rate": 4.837852977829711e-06, + "loss": 0.1146, + "step": 25047 + }, + { + "epoch": 68.25068119891009, + "grad_norm": 6.115458965301514, + "learning_rate": 4.837097177272045e-06, + "loss": 0.0545, + "step": 25048 + }, + { + "epoch": 68.2534059945504, + "grad_norm": 3.122903823852539, + "learning_rate": 4.836341416922901e-06, + "loss": 0.1152, + "step": 25049 + }, + { + "epoch": 68.25613079019074, + "grad_norm": 3.8173673152923584, + "learning_rate": 4.835585696788163e-06, + "loss": 0.1432, + "step": 25050 + }, + { + "epoch": 68.25885558583106, + "grad_norm": 2.7445411682128906, + "learning_rate": 4.834830016873715e-06, + "loss": 0.0638, + "step": 25051 + }, + { + "epoch": 68.26158038147139, + "grad_norm": 3.772977590560913, + "learning_rate": 4.834074377185447e-06, + "loss": 0.0469, + "step": 25052 + }, + { + "epoch": 68.26430517711172, + "grad_norm": 3.452272891998291, + "learning_rate": 4.833318777729243e-06, + "loss": 0.1427, + "step": 25053 + }, + { + "epoch": 68.26702997275204, + "grad_norm": 2.9316632747650146, + "learning_rate": 4.832563218510984e-06, + "loss": 0.0623, + "step": 25054 + }, + { + "epoch": 68.26975476839237, + "grad_norm": 3.105860948562622, + "learning_rate": 4.831807699536554e-06, + "loss": 0.0934, + "step": 25055 + }, + { + "epoch": 68.2724795640327, + "grad_norm": 3.162024974822998, + "learning_rate": 4.831052220811843e-06, + "loss": 0.0623, + "step": 25056 + }, + { + "epoch": 68.27520435967303, + "grad_norm": 3.763082504272461, + "learning_rate": 4.8302967823427296e-06, + "loss": 0.0968, + "step": 25057 + }, + { + "epoch": 68.27792915531334, + "grad_norm": 4.577455043792725, + "learning_rate": 4.8295413841350995e-06, + "loss": 0.1031, + "step": 25058 + }, + { + "epoch": 68.28065395095368, + "grad_norm": 3.669177532196045, + "learning_rate": 4.8287860261948305e-06, + "loss": 0.1281, + "step": 25059 + }, + { + "epoch": 68.28337874659401, + "grad_norm": 2.364025831222534, + "learning_rate": 4.828030708527814e-06, + "loss": 0.0313, + "step": 25060 + }, + { + "epoch": 68.28610354223433, + "grad_norm": 2.397878885269165, + "learning_rate": 4.827275431139924e-06, + "loss": 0.0421, + "step": 25061 + }, + { + "epoch": 68.28882833787466, + "grad_norm": 2.458519458770752, + "learning_rate": 4.82652019403705e-06, + "loss": 0.0901, + "step": 25062 + }, + { + "epoch": 68.29155313351498, + "grad_norm": 2.9947876930236816, + "learning_rate": 4.825764997225066e-06, + "loss": 0.1044, + "step": 25063 + }, + { + "epoch": 68.29427792915531, + "grad_norm": 2.8236539363861084, + "learning_rate": 4.825009840709862e-06, + "loss": 0.0447, + "step": 25064 + }, + { + "epoch": 68.29700272479565, + "grad_norm": 2.933349847793579, + "learning_rate": 4.8242547244973144e-06, + "loss": 0.0408, + "step": 25065 + }, + { + "epoch": 68.29972752043597, + "grad_norm": 4.040036678314209, + "learning_rate": 4.823499648593305e-06, + "loss": 0.0641, + "step": 25066 + }, + { + "epoch": 68.3024523160763, + "grad_norm": 4.4302239418029785, + "learning_rate": 4.82274461300371e-06, + "loss": 0.0918, + "step": 25067 + }, + { + "epoch": 68.30517711171662, + "grad_norm": 3.477489709854126, + "learning_rate": 4.821989617734416e-06, + "loss": 0.0495, + "step": 25068 + }, + { + "epoch": 68.30790190735695, + "grad_norm": 3.266461133956909, + "learning_rate": 4.821234662791302e-06, + "loss": 0.0541, + "step": 25069 + }, + { + "epoch": 68.31062670299727, + "grad_norm": 2.8733971118927, + "learning_rate": 4.820479748180245e-06, + "loss": 0.0477, + "step": 25070 + }, + { + "epoch": 68.3133514986376, + "grad_norm": 2.9562008380889893, + "learning_rate": 4.81972487390712e-06, + "loss": 0.0463, + "step": 25071 + }, + { + "epoch": 68.31607629427793, + "grad_norm": 2.757918119430542, + "learning_rate": 4.818970039977816e-06, + "loss": 0.1046, + "step": 25072 + }, + { + "epoch": 68.31880108991825, + "grad_norm": 3.5135529041290283, + "learning_rate": 4.818215246398206e-06, + "loss": 0.0466, + "step": 25073 + }, + { + "epoch": 68.32152588555859, + "grad_norm": 15.699817657470703, + "learning_rate": 4.81746049317417e-06, + "loss": 0.0823, + "step": 25074 + }, + { + "epoch": 68.3242506811989, + "grad_norm": 3.147193431854248, + "learning_rate": 4.81670578031158e-06, + "loss": 0.0471, + "step": 25075 + }, + { + "epoch": 68.32697547683924, + "grad_norm": 3.7153866291046143, + "learning_rate": 4.815951107816322e-06, + "loss": 0.0506, + "step": 25076 + }, + { + "epoch": 68.32970027247957, + "grad_norm": 4.23006534576416, + "learning_rate": 4.815196475694271e-06, + "loss": 0.0737, + "step": 25077 + }, + { + "epoch": 68.33242506811989, + "grad_norm": 3.3838913440704346, + "learning_rate": 4.814441883951299e-06, + "loss": 0.0731, + "step": 25078 + }, + { + "epoch": 68.33514986376022, + "grad_norm": 5.721966743469238, + "learning_rate": 4.813687332593287e-06, + "loss": 0.0741, + "step": 25079 + }, + { + "epoch": 68.33787465940054, + "grad_norm": 4.798506736755371, + "learning_rate": 4.812932821626113e-06, + "loss": 0.2038, + "step": 25080 + }, + { + "epoch": 68.34059945504087, + "grad_norm": 7.884695053100586, + "learning_rate": 4.812178351055653e-06, + "loss": 0.0779, + "step": 25081 + }, + { + "epoch": 68.34332425068119, + "grad_norm": 2.769942283630371, + "learning_rate": 4.811423920887781e-06, + "loss": 0.0533, + "step": 25082 + }, + { + "epoch": 68.34604904632153, + "grad_norm": 2.734086751937866, + "learning_rate": 4.810669531128368e-06, + "loss": 0.0589, + "step": 25083 + }, + { + "epoch": 68.34877384196186, + "grad_norm": 2.627162456512451, + "learning_rate": 4.809915181783298e-06, + "loss": 0.064, + "step": 25084 + }, + { + "epoch": 68.35149863760218, + "grad_norm": 3.023695468902588, + "learning_rate": 4.809160872858442e-06, + "loss": 0.0705, + "step": 25085 + }, + { + "epoch": 68.35422343324251, + "grad_norm": 3.268885374069214, + "learning_rate": 4.8084066043596724e-06, + "loss": 0.0597, + "step": 25086 + }, + { + "epoch": 68.35694822888283, + "grad_norm": 3.398163080215454, + "learning_rate": 4.807652376292863e-06, + "loss": 0.0813, + "step": 25087 + }, + { + "epoch": 68.35967302452316, + "grad_norm": 3.454350709915161, + "learning_rate": 4.806898188663892e-06, + "loss": 0.2177, + "step": 25088 + }, + { + "epoch": 68.3623978201635, + "grad_norm": 4.0141143798828125, + "learning_rate": 4.806144041478632e-06, + "loss": 0.1013, + "step": 25089 + }, + { + "epoch": 68.36512261580381, + "grad_norm": 8.191872596740723, + "learning_rate": 4.8053899347429545e-06, + "loss": 0.2007, + "step": 25090 + }, + { + "epoch": 68.36784741144415, + "grad_norm": 2.948700189590454, + "learning_rate": 4.804635868462729e-06, + "loss": 0.0463, + "step": 25091 + }, + { + "epoch": 68.37057220708446, + "grad_norm": 4.066028594970703, + "learning_rate": 4.803881842643837e-06, + "loss": 0.1249, + "step": 25092 + }, + { + "epoch": 68.3732970027248, + "grad_norm": 2.9195990562438965, + "learning_rate": 4.803127857292145e-06, + "loss": 0.0515, + "step": 25093 + }, + { + "epoch": 68.37602179836512, + "grad_norm": 3.255952835083008, + "learning_rate": 4.802373912413526e-06, + "loss": 0.062, + "step": 25094 + }, + { + "epoch": 68.37874659400545, + "grad_norm": 2.8404171466827393, + "learning_rate": 4.801620008013849e-06, + "loss": 0.0496, + "step": 25095 + }, + { + "epoch": 68.38147138964578, + "grad_norm": 3.142814874649048, + "learning_rate": 4.800866144098987e-06, + "loss": 0.1768, + "step": 25096 + }, + { + "epoch": 68.3841961852861, + "grad_norm": 2.899886131286621, + "learning_rate": 4.800112320674816e-06, + "loss": 0.0634, + "step": 25097 + }, + { + "epoch": 68.38692098092643, + "grad_norm": 2.8207359313964844, + "learning_rate": 4.799358537747203e-06, + "loss": 0.0508, + "step": 25098 + }, + { + "epoch": 68.38964577656675, + "grad_norm": 3.2844810485839844, + "learning_rate": 4.798604795322018e-06, + "loss": 0.2419, + "step": 25099 + }, + { + "epoch": 68.39237057220708, + "grad_norm": 3.1961586475372314, + "learning_rate": 4.797851093405128e-06, + "loss": 0.0828, + "step": 25100 + }, + { + "epoch": 68.39509536784742, + "grad_norm": 2.9002537727355957, + "learning_rate": 4.79709743200241e-06, + "loss": 0.033, + "step": 25101 + }, + { + "epoch": 68.39782016348774, + "grad_norm": 2.4350409507751465, + "learning_rate": 4.7963438111197306e-06, + "loss": 0.0447, + "step": 25102 + }, + { + "epoch": 68.40054495912807, + "grad_norm": 3.0927481651306152, + "learning_rate": 4.795590230762953e-06, + "loss": 0.0529, + "step": 25103 + }, + { + "epoch": 68.40326975476839, + "grad_norm": 2.9737613201141357, + "learning_rate": 4.794836690937955e-06, + "loss": 0.0373, + "step": 25104 + }, + { + "epoch": 68.40599455040872, + "grad_norm": 3.585712432861328, + "learning_rate": 4.794083191650603e-06, + "loss": 0.1791, + "step": 25105 + }, + { + "epoch": 68.40871934604904, + "grad_norm": 2.8583109378814697, + "learning_rate": 4.793329732906762e-06, + "loss": 0.0605, + "step": 25106 + }, + { + "epoch": 68.41144414168937, + "grad_norm": 3.3776392936706543, + "learning_rate": 4.792576314712297e-06, + "loss": 0.0766, + "step": 25107 + }, + { + "epoch": 68.4141689373297, + "grad_norm": 3.646101951599121, + "learning_rate": 4.7918229370730855e-06, + "loss": 0.07, + "step": 25108 + }, + { + "epoch": 68.41689373297002, + "grad_norm": 4.175693035125732, + "learning_rate": 4.7910695999949885e-06, + "loss": 0.0617, + "step": 25109 + }, + { + "epoch": 68.41961852861036, + "grad_norm": 3.119385242462158, + "learning_rate": 4.790316303483874e-06, + "loss": 0.0679, + "step": 25110 + }, + { + "epoch": 68.42234332425068, + "grad_norm": 3.341418504714966, + "learning_rate": 4.7895630475456054e-06, + "loss": 0.0559, + "step": 25111 + }, + { + "epoch": 68.42506811989101, + "grad_norm": 2.7829813957214355, + "learning_rate": 4.788809832186051e-06, + "loss": 0.0468, + "step": 25112 + }, + { + "epoch": 68.42779291553134, + "grad_norm": 4.060194969177246, + "learning_rate": 4.788056657411082e-06, + "loss": 0.0869, + "step": 25113 + }, + { + "epoch": 68.43051771117166, + "grad_norm": 2.6804492473602295, + "learning_rate": 4.787303523226561e-06, + "loss": 0.2156, + "step": 25114 + }, + { + "epoch": 68.433242506812, + "grad_norm": 5.664914608001709, + "learning_rate": 4.786550429638352e-06, + "loss": 0.1709, + "step": 25115 + }, + { + "epoch": 68.43596730245231, + "grad_norm": 2.7411012649536133, + "learning_rate": 4.785797376652315e-06, + "loss": 0.0668, + "step": 25116 + }, + { + "epoch": 68.43869209809264, + "grad_norm": 3.996340036392212, + "learning_rate": 4.785044364274325e-06, + "loss": 0.1414, + "step": 25117 + }, + { + "epoch": 68.44141689373296, + "grad_norm": 2.0779170989990234, + "learning_rate": 4.784291392510242e-06, + "loss": 0.0569, + "step": 25118 + }, + { + "epoch": 68.4441416893733, + "grad_norm": 2.0381622314453125, + "learning_rate": 4.78353846136593e-06, + "loss": 0.0256, + "step": 25119 + }, + { + "epoch": 68.44686648501363, + "grad_norm": 6.922408580780029, + "learning_rate": 4.782785570847248e-06, + "loss": 0.0789, + "step": 25120 + }, + { + "epoch": 68.44959128065395, + "grad_norm": 4.676624774932861, + "learning_rate": 4.782032720960068e-06, + "loss": 0.0395, + "step": 25121 + }, + { + "epoch": 68.45231607629428, + "grad_norm": 3.942620277404785, + "learning_rate": 4.781279911710249e-06, + "loss": 0.0855, + "step": 25122 + }, + { + "epoch": 68.4550408719346, + "grad_norm": 2.670901298522949, + "learning_rate": 4.780527143103655e-06, + "loss": 0.1506, + "step": 25123 + }, + { + "epoch": 68.45776566757493, + "grad_norm": 3.5805327892303467, + "learning_rate": 4.779774415146143e-06, + "loss": 0.1134, + "step": 25124 + }, + { + "epoch": 68.46049046321527, + "grad_norm": 3.4640166759490967, + "learning_rate": 4.779021727843585e-06, + "loss": 0.0546, + "step": 25125 + }, + { + "epoch": 68.46321525885558, + "grad_norm": 2.886509895324707, + "learning_rate": 4.7782690812018365e-06, + "loss": 0.1032, + "step": 25126 + }, + { + "epoch": 68.46594005449592, + "grad_norm": 3.5943520069122314, + "learning_rate": 4.777516475226757e-06, + "loss": 0.0892, + "step": 25127 + }, + { + "epoch": 68.46866485013624, + "grad_norm": 7.02865743637085, + "learning_rate": 4.776763909924215e-06, + "loss": 0.0359, + "step": 25128 + }, + { + "epoch": 68.47138964577657, + "grad_norm": 4.470008850097656, + "learning_rate": 4.776011385300066e-06, + "loss": 0.1249, + "step": 25129 + }, + { + "epoch": 68.47411444141689, + "grad_norm": 3.266449213027954, + "learning_rate": 4.77525890136017e-06, + "loss": 0.0592, + "step": 25130 + }, + { + "epoch": 68.47683923705722, + "grad_norm": 2.963853120803833, + "learning_rate": 4.774506458110393e-06, + "loss": 0.1043, + "step": 25131 + }, + { + "epoch": 68.47956403269755, + "grad_norm": 6.4120073318481445, + "learning_rate": 4.773754055556588e-06, + "loss": 0.0614, + "step": 25132 + }, + { + "epoch": 68.48228882833787, + "grad_norm": 4.997405529022217, + "learning_rate": 4.773001693704622e-06, + "loss": 0.0437, + "step": 25133 + }, + { + "epoch": 68.4850136239782, + "grad_norm": 3.729607343673706, + "learning_rate": 4.77224937256035e-06, + "loss": 0.1769, + "step": 25134 + }, + { + "epoch": 68.48773841961852, + "grad_norm": 3.7368216514587402, + "learning_rate": 4.7714970921296325e-06, + "loss": 0.1098, + "step": 25135 + }, + { + "epoch": 68.49046321525886, + "grad_norm": 3.899833917617798, + "learning_rate": 4.770744852418322e-06, + "loss": 0.0862, + "step": 25136 + }, + { + "epoch": 68.49318801089919, + "grad_norm": 3.8085601329803467, + "learning_rate": 4.769992653432287e-06, + "loss": 0.1327, + "step": 25137 + }, + { + "epoch": 68.49591280653951, + "grad_norm": 2.893799304962158, + "learning_rate": 4.7692404951773815e-06, + "loss": 0.0662, + "step": 25138 + }, + { + "epoch": 68.49863760217984, + "grad_norm": 2.687007427215576, + "learning_rate": 4.768488377659462e-06, + "loss": 0.0639, + "step": 25139 + }, + { + "epoch": 68.50136239782016, + "grad_norm": 3.9088146686553955, + "learning_rate": 4.767736300884384e-06, + "loss": 0.1024, + "step": 25140 + }, + { + "epoch": 68.50408719346049, + "grad_norm": 3.08231520652771, + "learning_rate": 4.766984264858009e-06, + "loss": 0.0434, + "step": 25141 + }, + { + "epoch": 68.50681198910081, + "grad_norm": 2.6814839839935303, + "learning_rate": 4.766232269586193e-06, + "loss": 0.1448, + "step": 25142 + }, + { + "epoch": 68.50953678474114, + "grad_norm": 2.983130693435669, + "learning_rate": 4.7654803150747915e-06, + "loss": 0.1021, + "step": 25143 + }, + { + "epoch": 68.51226158038148, + "grad_norm": 3.5604686737060547, + "learning_rate": 4.764728401329658e-06, + "loss": 0.1013, + "step": 25144 + }, + { + "epoch": 68.5149863760218, + "grad_norm": 4.0818281173706055, + "learning_rate": 4.763976528356654e-06, + "loss": 0.0871, + "step": 25145 + }, + { + "epoch": 68.51771117166213, + "grad_norm": 2.9919230937957764, + "learning_rate": 4.763224696161633e-06, + "loss": 0.0374, + "step": 25146 + }, + { + "epoch": 68.52043596730245, + "grad_norm": 3.354459524154663, + "learning_rate": 4.7624729047504455e-06, + "loss": 0.0532, + "step": 25147 + }, + { + "epoch": 68.52316076294278, + "grad_norm": 6.059757709503174, + "learning_rate": 4.76172115412895e-06, + "loss": 0.1336, + "step": 25148 + }, + { + "epoch": 68.52588555858311, + "grad_norm": 3.0966076850891113, + "learning_rate": 4.760969444303006e-06, + "loss": 0.1218, + "step": 25149 + }, + { + "epoch": 68.52861035422343, + "grad_norm": 3.0650575160980225, + "learning_rate": 4.7602177752784625e-06, + "loss": 0.1357, + "step": 25150 + }, + { + "epoch": 68.53133514986376, + "grad_norm": 3.5466384887695312, + "learning_rate": 4.7594661470611745e-06, + "loss": 0.0509, + "step": 25151 + }, + { + "epoch": 68.53405994550408, + "grad_norm": 10.345356941223145, + "learning_rate": 4.7587145596569925e-06, + "loss": 0.0422, + "step": 25152 + }, + { + "epoch": 68.53678474114442, + "grad_norm": 4.462990760803223, + "learning_rate": 4.757963013071777e-06, + "loss": 0.04, + "step": 25153 + }, + { + "epoch": 68.53950953678473, + "grad_norm": 5.018280029296875, + "learning_rate": 4.7572115073113755e-06, + "loss": 0.1542, + "step": 25154 + }, + { + "epoch": 68.54223433242507, + "grad_norm": 3.254812717437744, + "learning_rate": 4.756460042381642e-06, + "loss": 0.0706, + "step": 25155 + }, + { + "epoch": 68.5449591280654, + "grad_norm": 3.239781141281128, + "learning_rate": 4.755708618288426e-06, + "loss": 0.0707, + "step": 25156 + }, + { + "epoch": 68.54768392370572, + "grad_norm": 2.7286837100982666, + "learning_rate": 4.7549572350375864e-06, + "loss": 0.0435, + "step": 25157 + }, + { + "epoch": 68.55040871934605, + "grad_norm": 3.584249258041382, + "learning_rate": 4.75420589263497e-06, + "loss": 0.0806, + "step": 25158 + }, + { + "epoch": 68.55313351498637, + "grad_norm": 4.158878803253174, + "learning_rate": 4.753454591086431e-06, + "loss": 0.1047, + "step": 25159 + }, + { + "epoch": 68.5558583106267, + "grad_norm": 3.319026231765747, + "learning_rate": 4.7527033303978135e-06, + "loss": 0.047, + "step": 25160 + }, + { + "epoch": 68.55858310626704, + "grad_norm": 4.47884464263916, + "learning_rate": 4.751952110574977e-06, + "loss": 0.0943, + "step": 25161 + }, + { + "epoch": 68.56130790190736, + "grad_norm": 3.4570767879486084, + "learning_rate": 4.75120093162377e-06, + "loss": 0.0436, + "step": 25162 + }, + { + "epoch": 68.56403269754769, + "grad_norm": 2.990640878677368, + "learning_rate": 4.75044979355004e-06, + "loss": 0.0877, + "step": 25163 + }, + { + "epoch": 68.566757493188, + "grad_norm": 3.3707058429718018, + "learning_rate": 4.749698696359635e-06, + "loss": 0.0883, + "step": 25164 + }, + { + "epoch": 68.56948228882834, + "grad_norm": 5.598540306091309, + "learning_rate": 4.748947640058407e-06, + "loss": 0.07, + "step": 25165 + }, + { + "epoch": 68.57220708446866, + "grad_norm": 3.6774098873138428, + "learning_rate": 4.74819662465221e-06, + "loss": 0.1686, + "step": 25166 + }, + { + "epoch": 68.57493188010899, + "grad_norm": 2.633655309677124, + "learning_rate": 4.747445650146888e-06, + "loss": 0.0332, + "step": 25167 + }, + { + "epoch": 68.57765667574932, + "grad_norm": 2.769691228866577, + "learning_rate": 4.746694716548288e-06, + "loss": 0.1756, + "step": 25168 + }, + { + "epoch": 68.58038147138964, + "grad_norm": 3.9401910305023193, + "learning_rate": 4.745943823862263e-06, + "loss": 0.1578, + "step": 25169 + }, + { + "epoch": 68.58310626702998, + "grad_norm": 2.708097457885742, + "learning_rate": 4.745192972094659e-06, + "loss": 0.0359, + "step": 25170 + }, + { + "epoch": 68.5858310626703, + "grad_norm": 3.1952457427978516, + "learning_rate": 4.744442161251323e-06, + "loss": 0.1823, + "step": 25171 + }, + { + "epoch": 68.58855585831063, + "grad_norm": 2.921765089035034, + "learning_rate": 4.743691391338096e-06, + "loss": 0.2089, + "step": 25172 + }, + { + "epoch": 68.59128065395096, + "grad_norm": 2.713057279586792, + "learning_rate": 4.742940662360839e-06, + "loss": 0.0447, + "step": 25173 + }, + { + "epoch": 68.59400544959128, + "grad_norm": 2.8322789669036865, + "learning_rate": 4.742189974325389e-06, + "loss": 0.096, + "step": 25174 + }, + { + "epoch": 68.59673024523161, + "grad_norm": 6.807580471038818, + "learning_rate": 4.741439327237594e-06, + "loss": 0.0619, + "step": 25175 + }, + { + "epoch": 68.59945504087193, + "grad_norm": 3.18601393699646, + "learning_rate": 4.740688721103297e-06, + "loss": 0.1193, + "step": 25176 + }, + { + "epoch": 68.60217983651226, + "grad_norm": 3.1044204235076904, + "learning_rate": 4.739938155928351e-06, + "loss": 0.2166, + "step": 25177 + }, + { + "epoch": 68.60490463215258, + "grad_norm": 3.3225605487823486, + "learning_rate": 4.739187631718597e-06, + "loss": 0.0378, + "step": 25178 + }, + { + "epoch": 68.60762942779292, + "grad_norm": 3.8188860416412354, + "learning_rate": 4.73843714847988e-06, + "loss": 0.1016, + "step": 25179 + }, + { + "epoch": 68.61035422343325, + "grad_norm": 3.6552019119262695, + "learning_rate": 4.737686706218042e-06, + "loss": 0.0608, + "step": 25180 + }, + { + "epoch": 68.61307901907357, + "grad_norm": 2.598064661026001, + "learning_rate": 4.736936304938929e-06, + "loss": 0.1276, + "step": 25181 + }, + { + "epoch": 68.6158038147139, + "grad_norm": 6.786052227020264, + "learning_rate": 4.736185944648393e-06, + "loss": 0.0641, + "step": 25182 + }, + { + "epoch": 68.61852861035422, + "grad_norm": 5.362548828125, + "learning_rate": 4.73543562535227e-06, + "loss": 0.0602, + "step": 25183 + }, + { + "epoch": 68.62125340599455, + "grad_norm": 3.872605085372925, + "learning_rate": 4.734685347056405e-06, + "loss": 0.1098, + "step": 25184 + }, + { + "epoch": 68.62397820163488, + "grad_norm": 3.679784059524536, + "learning_rate": 4.7339351097666375e-06, + "loss": 0.0483, + "step": 25185 + }, + { + "epoch": 68.6267029972752, + "grad_norm": 3.1309032440185547, + "learning_rate": 4.733184913488817e-06, + "loss": 0.042, + "step": 25186 + }, + { + "epoch": 68.62942779291554, + "grad_norm": 4.85702657699585, + "learning_rate": 4.732434758228784e-06, + "loss": 0.1734, + "step": 25187 + }, + { + "epoch": 68.63215258855585, + "grad_norm": 4.458306789398193, + "learning_rate": 4.731684643992375e-06, + "loss": 0.059, + "step": 25188 + }, + { + "epoch": 68.63487738419619, + "grad_norm": 2.068485975265503, + "learning_rate": 4.730934570785441e-06, + "loss": 0.0292, + "step": 25189 + }, + { + "epoch": 68.6376021798365, + "grad_norm": 3.625941753387451, + "learning_rate": 4.730184538613818e-06, + "loss": 0.1159, + "step": 25190 + }, + { + "epoch": 68.64032697547684, + "grad_norm": 3.8161723613739014, + "learning_rate": 4.729434547483349e-06, + "loss": 0.1458, + "step": 25191 + }, + { + "epoch": 68.64305177111717, + "grad_norm": 4.030821323394775, + "learning_rate": 4.72868459739987e-06, + "loss": 0.1822, + "step": 25192 + }, + { + "epoch": 68.64577656675749, + "grad_norm": 3.8183062076568604, + "learning_rate": 4.727934688369229e-06, + "loss": 0.0592, + "step": 25193 + }, + { + "epoch": 68.64850136239782, + "grad_norm": 2.4527411460876465, + "learning_rate": 4.727184820397263e-06, + "loss": 0.0386, + "step": 25194 + }, + { + "epoch": 68.65122615803814, + "grad_norm": 2.4861347675323486, + "learning_rate": 4.7264349934898124e-06, + "loss": 0.1229, + "step": 25195 + }, + { + "epoch": 68.65395095367847, + "grad_norm": 3.8023078441619873, + "learning_rate": 4.725685207652712e-06, + "loss": 0.081, + "step": 25196 + }, + { + "epoch": 68.65667574931881, + "grad_norm": 3.4263360500335693, + "learning_rate": 4.724935462891811e-06, + "loss": 0.0855, + "step": 25197 + }, + { + "epoch": 68.65940054495913, + "grad_norm": 3.7822086811065674, + "learning_rate": 4.724185759212937e-06, + "loss": 0.0851, + "step": 25198 + }, + { + "epoch": 68.66212534059946, + "grad_norm": 3.5324831008911133, + "learning_rate": 4.723436096621939e-06, + "loss": 0.0527, + "step": 25199 + }, + { + "epoch": 68.66485013623978, + "grad_norm": 3.150998830795288, + "learning_rate": 4.722686475124652e-06, + "loss": 0.0605, + "step": 25200 + }, + { + "epoch": 68.66757493188011, + "grad_norm": 4.413564682006836, + "learning_rate": 4.7219368947269074e-06, + "loss": 0.0959, + "step": 25201 + }, + { + "epoch": 68.67029972752043, + "grad_norm": 2.7410242557525635, + "learning_rate": 4.721187355434553e-06, + "loss": 0.0351, + "step": 25202 + }, + { + "epoch": 68.67302452316076, + "grad_norm": 5.757294178009033, + "learning_rate": 4.720437857253421e-06, + "loss": 0.232, + "step": 25203 + }, + { + "epoch": 68.6757493188011, + "grad_norm": 4.090802192687988, + "learning_rate": 4.719688400189349e-06, + "loss": 0.0994, + "step": 25204 + }, + { + "epoch": 68.67847411444141, + "grad_norm": 3.794888973236084, + "learning_rate": 4.718938984248171e-06, + "loss": 0.0756, + "step": 25205 + }, + { + "epoch": 68.68119891008175, + "grad_norm": 3.559938907623291, + "learning_rate": 4.71818960943573e-06, + "loss": 0.1147, + "step": 25206 + }, + { + "epoch": 68.68392370572207, + "grad_norm": 5.694897174835205, + "learning_rate": 4.717440275757858e-06, + "loss": 0.083, + "step": 25207 + }, + { + "epoch": 68.6866485013624, + "grad_norm": 3.655093193054199, + "learning_rate": 4.71669098322039e-06, + "loss": 0.0837, + "step": 25208 + }, + { + "epoch": 68.68937329700273, + "grad_norm": 4.3597235679626465, + "learning_rate": 4.7159417318291604e-06, + "loss": 0.0904, + "step": 25209 + }, + { + "epoch": 68.69209809264305, + "grad_norm": 3.2580018043518066, + "learning_rate": 4.715192521590009e-06, + "loss": 0.0925, + "step": 25210 + }, + { + "epoch": 68.69482288828338, + "grad_norm": 2.5528197288513184, + "learning_rate": 4.7144433525087685e-06, + "loss": 0.1412, + "step": 25211 + }, + { + "epoch": 68.6975476839237, + "grad_norm": 2.148444175720215, + "learning_rate": 4.71369422459127e-06, + "loss": 0.0908, + "step": 25212 + }, + { + "epoch": 68.70027247956403, + "grad_norm": 2.996722936630249, + "learning_rate": 4.712945137843353e-06, + "loss": 0.135, + "step": 25213 + }, + { + "epoch": 68.70299727520435, + "grad_norm": 3.0027120113372803, + "learning_rate": 4.712196092270851e-06, + "loss": 0.087, + "step": 25214 + }, + { + "epoch": 68.70572207084469, + "grad_norm": 3.3666679859161377, + "learning_rate": 4.711447087879595e-06, + "loss": 0.0638, + "step": 25215 + }, + { + "epoch": 68.70844686648502, + "grad_norm": 3.1055893898010254, + "learning_rate": 4.710698124675415e-06, + "loss": 0.1127, + "step": 25216 + }, + { + "epoch": 68.71117166212534, + "grad_norm": 2.238966703414917, + "learning_rate": 4.709949202664147e-06, + "loss": 0.0344, + "step": 25217 + }, + { + "epoch": 68.71389645776567, + "grad_norm": 2.6818714141845703, + "learning_rate": 4.709200321851629e-06, + "loss": 0.0261, + "step": 25218 + }, + { + "epoch": 68.71662125340599, + "grad_norm": 3.0138466358184814, + "learning_rate": 4.708451482243688e-06, + "loss": 0.0363, + "step": 25219 + }, + { + "epoch": 68.71934604904632, + "grad_norm": 3.702580451965332, + "learning_rate": 4.707702683846157e-06, + "loss": 0.1585, + "step": 25220 + }, + { + "epoch": 68.72207084468666, + "grad_norm": 3.066445827484131, + "learning_rate": 4.706953926664863e-06, + "loss": 0.0378, + "step": 25221 + }, + { + "epoch": 68.72479564032697, + "grad_norm": 2.9520070552825928, + "learning_rate": 4.706205210705645e-06, + "loss": 0.059, + "step": 25222 + }, + { + "epoch": 68.7275204359673, + "grad_norm": 10.24441146850586, + "learning_rate": 4.705456535974332e-06, + "loss": 0.052, + "step": 25223 + }, + { + "epoch": 68.73024523160763, + "grad_norm": 3.098729372024536, + "learning_rate": 4.704707902476752e-06, + "loss": 0.0672, + "step": 25224 + }, + { + "epoch": 68.73297002724796, + "grad_norm": 2.529139995574951, + "learning_rate": 4.703959310218733e-06, + "loss": 0.0333, + "step": 25225 + }, + { + "epoch": 68.73569482288828, + "grad_norm": 6.588604927062988, + "learning_rate": 4.703210759206112e-06, + "loss": 0.0867, + "step": 25226 + }, + { + "epoch": 68.73841961852861, + "grad_norm": 3.233839511871338, + "learning_rate": 4.702462249444714e-06, + "loss": 0.1194, + "step": 25227 + }, + { + "epoch": 68.74114441416894, + "grad_norm": 4.281998634338379, + "learning_rate": 4.7017137809403716e-06, + "loss": 0.1756, + "step": 25228 + }, + { + "epoch": 68.74386920980926, + "grad_norm": 4.349316596984863, + "learning_rate": 4.700965353698907e-06, + "loss": 0.0985, + "step": 25229 + }, + { + "epoch": 68.7465940054496, + "grad_norm": 3.625556707382202, + "learning_rate": 4.700216967726157e-06, + "loss": 0.1254, + "step": 25230 + }, + { + "epoch": 68.74931880108991, + "grad_norm": 5.871299743652344, + "learning_rate": 4.699468623027948e-06, + "loss": 0.0972, + "step": 25231 + }, + { + "epoch": 68.75204359673025, + "grad_norm": 3.9378881454467773, + "learning_rate": 4.698720319610105e-06, + "loss": 0.1128, + "step": 25232 + }, + { + "epoch": 68.75476839237058, + "grad_norm": 2.4924910068511963, + "learning_rate": 4.69797205747845e-06, + "loss": 0.0284, + "step": 25233 + }, + { + "epoch": 68.7574931880109, + "grad_norm": 5.077095985412598, + "learning_rate": 4.6972238366388265e-06, + "loss": 0.0569, + "step": 25234 + }, + { + "epoch": 68.76021798365123, + "grad_norm": 3.356592893600464, + "learning_rate": 4.696475657097054e-06, + "loss": 0.0822, + "step": 25235 + }, + { + "epoch": 68.76294277929155, + "grad_norm": 4.1355881690979, + "learning_rate": 4.6957275188589565e-06, + "loss": 0.0346, + "step": 25236 + }, + { + "epoch": 68.76566757493188, + "grad_norm": 4.216447353363037, + "learning_rate": 4.69497942193036e-06, + "loss": 0.0641, + "step": 25237 + }, + { + "epoch": 68.7683923705722, + "grad_norm": 4.259905815124512, + "learning_rate": 4.694231366317096e-06, + "loss": 0.0797, + "step": 25238 + }, + { + "epoch": 68.77111716621253, + "grad_norm": 2.423780918121338, + "learning_rate": 4.693483352024988e-06, + "loss": 0.036, + "step": 25239 + }, + { + "epoch": 68.77384196185287, + "grad_norm": 3.8292150497436523, + "learning_rate": 4.6927353790598595e-06, + "loss": 0.0732, + "step": 25240 + }, + { + "epoch": 68.77656675749319, + "grad_norm": 4.539219856262207, + "learning_rate": 4.691987447427535e-06, + "loss": 0.1038, + "step": 25241 + }, + { + "epoch": 68.77929155313352, + "grad_norm": 2.4098050594329834, + "learning_rate": 4.691239557133844e-06, + "loss": 0.031, + "step": 25242 + }, + { + "epoch": 68.78201634877384, + "grad_norm": 3.4923839569091797, + "learning_rate": 4.690491708184609e-06, + "loss": 0.1443, + "step": 25243 + }, + { + "epoch": 68.78474114441417, + "grad_norm": 2.1044909954071045, + "learning_rate": 4.689743900585654e-06, + "loss": 0.0782, + "step": 25244 + }, + { + "epoch": 68.7874659400545, + "grad_norm": 3.4952354431152344, + "learning_rate": 4.688996134342798e-06, + "loss": 0.082, + "step": 25245 + }, + { + "epoch": 68.79019073569482, + "grad_norm": 4.9752912521362305, + "learning_rate": 4.688248409461873e-06, + "loss": 0.1302, + "step": 25246 + }, + { + "epoch": 68.79291553133515, + "grad_norm": 3.041003942489624, + "learning_rate": 4.687500725948699e-06, + "loss": 0.0425, + "step": 25247 + }, + { + "epoch": 68.79564032697547, + "grad_norm": 3.128225564956665, + "learning_rate": 4.686753083809098e-06, + "loss": 0.2146, + "step": 25248 + }, + { + "epoch": 68.7983651226158, + "grad_norm": 3.4257009029388428, + "learning_rate": 4.68600548304889e-06, + "loss": 0.084, + "step": 25249 + }, + { + "epoch": 68.80108991825612, + "grad_norm": 3.7465832233428955, + "learning_rate": 4.685257923673899e-06, + "loss": 0.2516, + "step": 25250 + }, + { + "epoch": 68.80381471389646, + "grad_norm": 2.69468092918396, + "learning_rate": 4.6845104056899525e-06, + "loss": 0.0383, + "step": 25251 + }, + { + "epoch": 68.80653950953679, + "grad_norm": 2.782733917236328, + "learning_rate": 4.683762929102868e-06, + "loss": 0.036, + "step": 25252 + }, + { + "epoch": 68.80926430517711, + "grad_norm": 12.41683578491211, + "learning_rate": 4.683015493918463e-06, + "loss": 0.0443, + "step": 25253 + }, + { + "epoch": 68.81198910081744, + "grad_norm": 3.2941360473632812, + "learning_rate": 4.682268100142567e-06, + "loss": 0.1425, + "step": 25254 + }, + { + "epoch": 68.81471389645776, + "grad_norm": 3.0366806983947754, + "learning_rate": 4.681520747780994e-06, + "loss": 0.0552, + "step": 25255 + }, + { + "epoch": 68.8174386920981, + "grad_norm": 5.389036655426025, + "learning_rate": 4.680773436839566e-06, + "loss": 0.0725, + "step": 25256 + }, + { + "epoch": 68.82016348773843, + "grad_norm": 4.012606620788574, + "learning_rate": 4.680026167324101e-06, + "loss": 0.144, + "step": 25257 + }, + { + "epoch": 68.82288828337875, + "grad_norm": 3.0946478843688965, + "learning_rate": 4.6792789392404246e-06, + "loss": 0.0747, + "step": 25258 + }, + { + "epoch": 68.82561307901908, + "grad_norm": 3.341019630432129, + "learning_rate": 4.678531752594352e-06, + "loss": 0.0629, + "step": 25259 + }, + { + "epoch": 68.8283378746594, + "grad_norm": 2.997502565383911, + "learning_rate": 4.677784607391703e-06, + "loss": 0.0772, + "step": 25260 + }, + { + "epoch": 68.83106267029973, + "grad_norm": 2.483455181121826, + "learning_rate": 4.677037503638293e-06, + "loss": 0.1807, + "step": 25261 + }, + { + "epoch": 68.83378746594005, + "grad_norm": 3.285806179046631, + "learning_rate": 4.6762904413399465e-06, + "loss": 0.1326, + "step": 25262 + }, + { + "epoch": 68.83651226158038, + "grad_norm": 4.679166793823242, + "learning_rate": 4.675543420502479e-06, + "loss": 0.0922, + "step": 25263 + }, + { + "epoch": 68.83923705722071, + "grad_norm": 2.4225618839263916, + "learning_rate": 4.674796441131708e-06, + "loss": 0.0405, + "step": 25264 + }, + { + "epoch": 68.84196185286103, + "grad_norm": 2.8314013481140137, + "learning_rate": 4.6740495032334475e-06, + "loss": 0.0441, + "step": 25265 + }, + { + "epoch": 68.84468664850137, + "grad_norm": 3.1308062076568604, + "learning_rate": 4.673302606813521e-06, + "loss": 0.0679, + "step": 25266 + }, + { + "epoch": 68.84741144414168, + "grad_norm": 2.5626614093780518, + "learning_rate": 4.67255575187774e-06, + "loss": 0.1095, + "step": 25267 + }, + { + "epoch": 68.85013623978202, + "grad_norm": 4.718066215515137, + "learning_rate": 4.671808938431927e-06, + "loss": 0.1733, + "step": 25268 + }, + { + "epoch": 68.85286103542235, + "grad_norm": 2.801140785217285, + "learning_rate": 4.671062166481893e-06, + "loss": 0.115, + "step": 25269 + }, + { + "epoch": 68.85558583106267, + "grad_norm": 3.2998874187469482, + "learning_rate": 4.670315436033452e-06, + "loss": 0.0647, + "step": 25270 + }, + { + "epoch": 68.858310626703, + "grad_norm": 2.5194222927093506, + "learning_rate": 4.669568747092427e-06, + "loss": 0.0493, + "step": 25271 + }, + { + "epoch": 68.86103542234332, + "grad_norm": 2.6707797050476074, + "learning_rate": 4.668822099664629e-06, + "loss": 0.0793, + "step": 25272 + }, + { + "epoch": 68.86376021798365, + "grad_norm": 3.8744704723358154, + "learning_rate": 4.668075493755873e-06, + "loss": 0.029, + "step": 25273 + }, + { + "epoch": 68.86648501362397, + "grad_norm": 3.476962089538574, + "learning_rate": 4.667328929371969e-06, + "loss": 0.1315, + "step": 25274 + }, + { + "epoch": 68.8692098092643, + "grad_norm": 3.791701078414917, + "learning_rate": 4.66658240651874e-06, + "loss": 0.0587, + "step": 25275 + }, + { + "epoch": 68.87193460490464, + "grad_norm": 2.206984758377075, + "learning_rate": 4.665835925201995e-06, + "loss": 0.0261, + "step": 25276 + }, + { + "epoch": 68.87465940054496, + "grad_norm": 7.005254745483398, + "learning_rate": 4.665089485427546e-06, + "loss": 0.0725, + "step": 25277 + }, + { + "epoch": 68.87738419618529, + "grad_norm": 2.7205026149749756, + "learning_rate": 4.664343087201211e-06, + "loss": 0.0532, + "step": 25278 + }, + { + "epoch": 68.88010899182561, + "grad_norm": 4.036895751953125, + "learning_rate": 4.6635967305288e-06, + "loss": 0.048, + "step": 25279 + }, + { + "epoch": 68.88283378746594, + "grad_norm": 2.835393190383911, + "learning_rate": 4.662850415416127e-06, + "loss": 0.1298, + "step": 25280 + }, + { + "epoch": 68.88555858310627, + "grad_norm": 3.6264708042144775, + "learning_rate": 4.6621041418689985e-06, + "loss": 0.0497, + "step": 25281 + }, + { + "epoch": 68.88828337874659, + "grad_norm": 2.5192103385925293, + "learning_rate": 4.661357909893235e-06, + "loss": 0.0923, + "step": 25282 + }, + { + "epoch": 68.89100817438693, + "grad_norm": 5.387713432312012, + "learning_rate": 4.660611719494644e-06, + "loss": 0.1054, + "step": 25283 + }, + { + "epoch": 68.89373297002724, + "grad_norm": 3.527350902557373, + "learning_rate": 4.6598655706790344e-06, + "loss": 0.0993, + "step": 25284 + }, + { + "epoch": 68.89645776566758, + "grad_norm": 4.775354862213135, + "learning_rate": 4.659119463452223e-06, + "loss": 0.055, + "step": 25285 + }, + { + "epoch": 68.8991825613079, + "grad_norm": 5.509058475494385, + "learning_rate": 4.658373397820013e-06, + "loss": 0.059, + "step": 25286 + }, + { + "epoch": 68.90190735694823, + "grad_norm": 3.4188144207000732, + "learning_rate": 4.657627373788224e-06, + "loss": 0.0444, + "step": 25287 + }, + { + "epoch": 68.90463215258856, + "grad_norm": 2.3662898540496826, + "learning_rate": 4.65688139136266e-06, + "loss": 0.0293, + "step": 25288 + }, + { + "epoch": 68.90735694822888, + "grad_norm": 4.150286674499512, + "learning_rate": 4.656135450549132e-06, + "loss": 0.1194, + "step": 25289 + }, + { + "epoch": 68.91008174386921, + "grad_norm": 3.394137144088745, + "learning_rate": 4.655389551353445e-06, + "loss": 0.0794, + "step": 25290 + }, + { + "epoch": 68.91280653950953, + "grad_norm": 3.964113235473633, + "learning_rate": 4.654643693781417e-06, + "loss": 0.22, + "step": 25291 + }, + { + "epoch": 68.91553133514986, + "grad_norm": 2.2684898376464844, + "learning_rate": 4.653897877838851e-06, + "loss": 0.0394, + "step": 25292 + }, + { + "epoch": 68.9182561307902, + "grad_norm": 2.652017593383789, + "learning_rate": 4.6531521035315566e-06, + "loss": 0.0661, + "step": 25293 + }, + { + "epoch": 68.92098092643052, + "grad_norm": 3.710247278213501, + "learning_rate": 4.652406370865338e-06, + "loss": 0.0798, + "step": 25294 + }, + { + "epoch": 68.92370572207085, + "grad_norm": 4.017529487609863, + "learning_rate": 4.65166067984601e-06, + "loss": 0.0678, + "step": 25295 + }, + { + "epoch": 68.92643051771117, + "grad_norm": 3.1239895820617676, + "learning_rate": 4.650915030479376e-06, + "loss": 0.1691, + "step": 25296 + }, + { + "epoch": 68.9291553133515, + "grad_norm": 2.6684730052948, + "learning_rate": 4.65016942277124e-06, + "loss": 0.278, + "step": 25297 + }, + { + "epoch": 68.93188010899182, + "grad_norm": 1.8895353078842163, + "learning_rate": 4.6494238567274175e-06, + "loss": 0.0257, + "step": 25298 + }, + { + "epoch": 68.93460490463215, + "grad_norm": 3.6534266471862793, + "learning_rate": 4.648678332353709e-06, + "loss": 0.0791, + "step": 25299 + }, + { + "epoch": 68.93732970027249, + "grad_norm": 3.0218663215637207, + "learning_rate": 4.64793284965592e-06, + "loss": 0.0404, + "step": 25300 + }, + { + "epoch": 68.9400544959128, + "grad_norm": 2.994173049926758, + "learning_rate": 4.647187408639855e-06, + "loss": 0.0413, + "step": 25301 + }, + { + "epoch": 68.94277929155314, + "grad_norm": 3.136317491531372, + "learning_rate": 4.646442009311323e-06, + "loss": 0.0766, + "step": 25302 + }, + { + "epoch": 68.94550408719346, + "grad_norm": 3.6843063831329346, + "learning_rate": 4.645696651676131e-06, + "loss": 0.1817, + "step": 25303 + }, + { + "epoch": 68.94822888283379, + "grad_norm": 4.230409145355225, + "learning_rate": 4.644951335740081e-06, + "loss": 0.1955, + "step": 25304 + }, + { + "epoch": 68.95095367847412, + "grad_norm": 3.020812749862671, + "learning_rate": 4.644206061508979e-06, + "loss": 0.1499, + "step": 25305 + }, + { + "epoch": 68.95367847411444, + "grad_norm": 3.0145413875579834, + "learning_rate": 4.643460828988623e-06, + "loss": 0.0394, + "step": 25306 + }, + { + "epoch": 68.95640326975477, + "grad_norm": 2.7844457626342773, + "learning_rate": 4.642715638184825e-06, + "loss": 0.0361, + "step": 25307 + }, + { + "epoch": 68.95912806539509, + "grad_norm": 3.670297861099243, + "learning_rate": 4.641970489103386e-06, + "loss": 0.0626, + "step": 25308 + }, + { + "epoch": 68.96185286103542, + "grad_norm": 3.8738906383514404, + "learning_rate": 4.641225381750109e-06, + "loss": 0.0491, + "step": 25309 + }, + { + "epoch": 68.96457765667574, + "grad_norm": 4.277965068817139, + "learning_rate": 4.640480316130791e-06, + "loss": 0.1066, + "step": 25310 + }, + { + "epoch": 68.96730245231608, + "grad_norm": 2.212169647216797, + "learning_rate": 4.639735292251244e-06, + "loss": 0.0364, + "step": 25311 + }, + { + "epoch": 68.97002724795641, + "grad_norm": 2.7719273567199707, + "learning_rate": 4.638990310117266e-06, + "loss": 0.0607, + "step": 25312 + }, + { + "epoch": 68.97275204359673, + "grad_norm": 4.156070232391357, + "learning_rate": 4.638245369734659e-06, + "loss": 0.056, + "step": 25313 + }, + { + "epoch": 68.97547683923706, + "grad_norm": 2.888261079788208, + "learning_rate": 4.637500471109222e-06, + "loss": 0.0426, + "step": 25314 + }, + { + "epoch": 68.97820163487738, + "grad_norm": 2.8456966876983643, + "learning_rate": 4.6367556142467605e-06, + "loss": 0.0748, + "step": 25315 + }, + { + "epoch": 68.98092643051771, + "grad_norm": 3.2775473594665527, + "learning_rate": 4.636010799153074e-06, + "loss": 0.0408, + "step": 25316 + }, + { + "epoch": 68.98365122615803, + "grad_norm": 3.8727123737335205, + "learning_rate": 4.635266025833964e-06, + "loss": 0.0355, + "step": 25317 + }, + { + "epoch": 68.98637602179836, + "grad_norm": 3.1337437629699707, + "learning_rate": 4.6345212942952255e-06, + "loss": 0.0447, + "step": 25318 + }, + { + "epoch": 68.9891008174387, + "grad_norm": 3.4043190479278564, + "learning_rate": 4.6337766045426625e-06, + "loss": 0.0977, + "step": 25319 + }, + { + "epoch": 68.99182561307902, + "grad_norm": 2.9682180881500244, + "learning_rate": 4.633031956582077e-06, + "loss": 0.0658, + "step": 25320 + }, + { + "epoch": 68.99455040871935, + "grad_norm": 2.725248336791992, + "learning_rate": 4.6322873504192675e-06, + "loss": 0.0964, + "step": 25321 + }, + { + "epoch": 68.99727520435967, + "grad_norm": 2.6156909465789795, + "learning_rate": 4.631542786060027e-06, + "loss": 0.069, + "step": 25322 + }, + { + "epoch": 69.0, + "grad_norm": 3.5765891075134277, + "learning_rate": 4.630798263510162e-06, + "loss": 0.1748, + "step": 25323 + }, + { + "epoch": 69.00272479564033, + "grad_norm": 2.973284959793091, + "learning_rate": 4.630053782775467e-06, + "loss": 0.0512, + "step": 25324 + }, + { + "epoch": 69.00544959128065, + "grad_norm": 2.2170028686523438, + "learning_rate": 4.629309343861741e-06, + "loss": 0.0336, + "step": 25325 + }, + { + "epoch": 69.00817438692098, + "grad_norm": 2.648892641067505, + "learning_rate": 4.628564946774777e-06, + "loss": 0.0665, + "step": 25326 + }, + { + "epoch": 69.0108991825613, + "grad_norm": 3.3921704292297363, + "learning_rate": 4.62782059152038e-06, + "loss": 0.1104, + "step": 25327 + }, + { + "epoch": 69.01362397820164, + "grad_norm": 2.8230392932891846, + "learning_rate": 4.627076278104343e-06, + "loss": 0.0478, + "step": 25328 + }, + { + "epoch": 69.01634877384195, + "grad_norm": 2.938129186630249, + "learning_rate": 4.626332006532464e-06, + "loss": 0.0954, + "step": 25329 + }, + { + "epoch": 69.01907356948229, + "grad_norm": 4.370748996734619, + "learning_rate": 4.625587776810534e-06, + "loss": 0.0938, + "step": 25330 + }, + { + "epoch": 69.02179836512262, + "grad_norm": 2.6737706661224365, + "learning_rate": 4.624843588944357e-06, + "loss": 0.0499, + "step": 25331 + }, + { + "epoch": 69.02452316076294, + "grad_norm": 3.3993330001831055, + "learning_rate": 4.624099442939726e-06, + "loss": 0.0714, + "step": 25332 + }, + { + "epoch": 69.02724795640327, + "grad_norm": 2.5821268558502197, + "learning_rate": 4.623355338802434e-06, + "loss": 0.081, + "step": 25333 + }, + { + "epoch": 69.02997275204359, + "grad_norm": 3.2227485179901123, + "learning_rate": 4.622611276538276e-06, + "loss": 0.0677, + "step": 25334 + }, + { + "epoch": 69.03269754768392, + "grad_norm": 2.1117255687713623, + "learning_rate": 4.62186725615305e-06, + "loss": 0.0333, + "step": 25335 + }, + { + "epoch": 69.03542234332426, + "grad_norm": 3.1656744480133057, + "learning_rate": 4.621123277652546e-06, + "loss": 0.037, + "step": 25336 + }, + { + "epoch": 69.03814713896458, + "grad_norm": 4.241729736328125, + "learning_rate": 4.620379341042564e-06, + "loss": 0.1225, + "step": 25337 + }, + { + "epoch": 69.04087193460491, + "grad_norm": 4.0763349533081055, + "learning_rate": 4.619635446328895e-06, + "loss": 0.0599, + "step": 25338 + }, + { + "epoch": 69.04359673024523, + "grad_norm": 4.741207599639893, + "learning_rate": 4.618891593517328e-06, + "loss": 0.1084, + "step": 25339 + }, + { + "epoch": 69.04632152588556, + "grad_norm": 3.7330992221832275, + "learning_rate": 4.618147782613663e-06, + "loss": 0.0644, + "step": 25340 + }, + { + "epoch": 69.04904632152588, + "grad_norm": 2.286592721939087, + "learning_rate": 4.617404013623692e-06, + "loss": 0.0336, + "step": 25341 + }, + { + "epoch": 69.05177111716621, + "grad_norm": 2.8393232822418213, + "learning_rate": 4.616660286553199e-06, + "loss": 0.061, + "step": 25342 + }, + { + "epoch": 69.05449591280654, + "grad_norm": 2.792849540710449, + "learning_rate": 4.615916601407988e-06, + "loss": 0.1103, + "step": 25343 + }, + { + "epoch": 69.05722070844686, + "grad_norm": 3.050400972366333, + "learning_rate": 4.615172958193845e-06, + "loss": 0.0836, + "step": 25344 + }, + { + "epoch": 69.0599455040872, + "grad_norm": 3.8424429893493652, + "learning_rate": 4.614429356916561e-06, + "loss": 0.1374, + "step": 25345 + }, + { + "epoch": 69.06267029972751, + "grad_norm": 3.551499128341675, + "learning_rate": 4.613685797581925e-06, + "loss": 0.0867, + "step": 25346 + }, + { + "epoch": 69.06539509536785, + "grad_norm": 5.33734655380249, + "learning_rate": 4.612942280195734e-06, + "loss": 0.0901, + "step": 25347 + }, + { + "epoch": 69.06811989100818, + "grad_norm": 2.7843034267425537, + "learning_rate": 4.612198804763775e-06, + "loss": 0.077, + "step": 25348 + }, + { + "epoch": 69.0708446866485, + "grad_norm": 3.4353561401367188, + "learning_rate": 4.611455371291837e-06, + "loss": 0.1888, + "step": 25349 + }, + { + "epoch": 69.07356948228883, + "grad_norm": 3.2494888305664062, + "learning_rate": 4.6107119797857096e-06, + "loss": 0.0602, + "step": 25350 + }, + { + "epoch": 69.07629427792915, + "grad_norm": 2.899702548980713, + "learning_rate": 4.609968630251187e-06, + "loss": 0.056, + "step": 25351 + }, + { + "epoch": 69.07901907356948, + "grad_norm": 2.1720457077026367, + "learning_rate": 4.6092253226940546e-06, + "loss": 0.0361, + "step": 25352 + }, + { + "epoch": 69.0817438692098, + "grad_norm": 2.9516775608062744, + "learning_rate": 4.608482057120099e-06, + "loss": 0.116, + "step": 25353 + }, + { + "epoch": 69.08446866485014, + "grad_norm": 2.660510540008545, + "learning_rate": 4.6077388335351144e-06, + "loss": 0.0417, + "step": 25354 + }, + { + "epoch": 69.08719346049047, + "grad_norm": 5.641421318054199, + "learning_rate": 4.6069956519448836e-06, + "loss": 0.0838, + "step": 25355 + }, + { + "epoch": 69.08991825613079, + "grad_norm": 3.240388870239258, + "learning_rate": 4.606252512355199e-06, + "loss": 0.0466, + "step": 25356 + }, + { + "epoch": 69.09264305177112, + "grad_norm": 3.065953254699707, + "learning_rate": 4.605509414771847e-06, + "loss": 0.185, + "step": 25357 + }, + { + "epoch": 69.09536784741144, + "grad_norm": 2.6469898223876953, + "learning_rate": 4.6047663592006155e-06, + "loss": 0.0436, + "step": 25358 + }, + { + "epoch": 69.09809264305177, + "grad_norm": 3.0340006351470947, + "learning_rate": 4.6040233456472845e-06, + "loss": 0.042, + "step": 25359 + }, + { + "epoch": 69.1008174386921, + "grad_norm": 3.9148831367492676, + "learning_rate": 4.60328037411765e-06, + "loss": 0.0393, + "step": 25360 + }, + { + "epoch": 69.10354223433242, + "grad_norm": 3.3091955184936523, + "learning_rate": 4.602537444617495e-06, + "loss": 0.1229, + "step": 25361 + }, + { + "epoch": 69.10626702997276, + "grad_norm": 2.4060099124908447, + "learning_rate": 4.601794557152602e-06, + "loss": 0.1009, + "step": 25362 + }, + { + "epoch": 69.10899182561307, + "grad_norm": 5.231338977813721, + "learning_rate": 4.60105171172876e-06, + "loss": 0.0999, + "step": 25363 + }, + { + "epoch": 69.11171662125341, + "grad_norm": 2.4197018146514893, + "learning_rate": 4.6003089083517545e-06, + "loss": 0.029, + "step": 25364 + }, + { + "epoch": 69.11444141689373, + "grad_norm": 4.155883312225342, + "learning_rate": 4.599566147027371e-06, + "loss": 0.1456, + "step": 25365 + }, + { + "epoch": 69.11716621253406, + "grad_norm": 10.01461124420166, + "learning_rate": 4.598823427761387e-06, + "loss": 0.0622, + "step": 25366 + }, + { + "epoch": 69.11989100817439, + "grad_norm": 3.3596034049987793, + "learning_rate": 4.598080750559597e-06, + "loss": 0.0503, + "step": 25367 + }, + { + "epoch": 69.12261580381471, + "grad_norm": 2.7877581119537354, + "learning_rate": 4.597338115427781e-06, + "loss": 0.0411, + "step": 25368 + }, + { + "epoch": 69.12534059945504, + "grad_norm": 2.8343818187713623, + "learning_rate": 4.596595522371721e-06, + "loss": 0.0636, + "step": 25369 + }, + { + "epoch": 69.12806539509536, + "grad_norm": 4.523220062255859, + "learning_rate": 4.595852971397197e-06, + "loss": 0.0883, + "step": 25370 + }, + { + "epoch": 69.1307901907357, + "grad_norm": 2.302170991897583, + "learning_rate": 4.595110462509996e-06, + "loss": 0.0339, + "step": 25371 + }, + { + "epoch": 69.13351498637603, + "grad_norm": 2.4652061462402344, + "learning_rate": 4.594367995715905e-06, + "loss": 0.1065, + "step": 25372 + }, + { + "epoch": 69.13623978201635, + "grad_norm": 2.82228946685791, + "learning_rate": 4.593625571020702e-06, + "loss": 0.0816, + "step": 25373 + }, + { + "epoch": 69.13896457765668, + "grad_norm": 2.334242105484009, + "learning_rate": 4.592883188430169e-06, + "loss": 0.0354, + "step": 25374 + }, + { + "epoch": 69.141689373297, + "grad_norm": 2.4624836444854736, + "learning_rate": 4.592140847950085e-06, + "loss": 0.0329, + "step": 25375 + }, + { + "epoch": 69.14441416893733, + "grad_norm": 2.9783990383148193, + "learning_rate": 4.591398549586237e-06, + "loss": 0.1948, + "step": 25376 + }, + { + "epoch": 69.14713896457765, + "grad_norm": 3.096959114074707, + "learning_rate": 4.5906562933444024e-06, + "loss": 0.1198, + "step": 25377 + }, + { + "epoch": 69.14986376021798, + "grad_norm": 3.8093245029449463, + "learning_rate": 4.589914079230363e-06, + "loss": 0.0987, + "step": 25378 + }, + { + "epoch": 69.15258855585832, + "grad_norm": 2.3881402015686035, + "learning_rate": 4.589171907249895e-06, + "loss": 0.0416, + "step": 25379 + }, + { + "epoch": 69.15531335149863, + "grad_norm": 4.455782413482666, + "learning_rate": 4.588429777408785e-06, + "loss": 0.1728, + "step": 25380 + }, + { + "epoch": 69.15803814713897, + "grad_norm": 9.765618324279785, + "learning_rate": 4.587687689712811e-06, + "loss": 0.0506, + "step": 25381 + }, + { + "epoch": 69.16076294277929, + "grad_norm": 3.4322943687438965, + "learning_rate": 4.586945644167751e-06, + "loss": 0.0459, + "step": 25382 + }, + { + "epoch": 69.16348773841962, + "grad_norm": 4.60107421875, + "learning_rate": 4.586203640779379e-06, + "loss": 0.188, + "step": 25383 + }, + { + "epoch": 69.16621253405995, + "grad_norm": 1.8150352239608765, + "learning_rate": 4.5854616795534835e-06, + "loss": 0.0265, + "step": 25384 + }, + { + "epoch": 69.16893732970027, + "grad_norm": 3.624239444732666, + "learning_rate": 4.584719760495838e-06, + "loss": 0.0658, + "step": 25385 + }, + { + "epoch": 69.1716621253406, + "grad_norm": 2.3626153469085693, + "learning_rate": 4.583977883612218e-06, + "loss": 0.0668, + "step": 25386 + }, + { + "epoch": 69.17438692098092, + "grad_norm": 2.6876978874206543, + "learning_rate": 4.583236048908406e-06, + "loss": 0.1338, + "step": 25387 + }, + { + "epoch": 69.17711171662125, + "grad_norm": 3.021451711654663, + "learning_rate": 4.582494256390174e-06, + "loss": 0.0364, + "step": 25388 + }, + { + "epoch": 69.17983651226157, + "grad_norm": 3.472978353500366, + "learning_rate": 4.581752506063306e-06, + "loss": 0.0623, + "step": 25389 + }, + { + "epoch": 69.1825613079019, + "grad_norm": 3.0560572147369385, + "learning_rate": 4.581010797933576e-06, + "loss": 0.077, + "step": 25390 + }, + { + "epoch": 69.18528610354224, + "grad_norm": 2.9825806617736816, + "learning_rate": 4.580269132006755e-06, + "loss": 0.0321, + "step": 25391 + }, + { + "epoch": 69.18801089918256, + "grad_norm": 3.3844103813171387, + "learning_rate": 4.579527508288627e-06, + "loss": 0.0364, + "step": 25392 + }, + { + "epoch": 69.19073569482289, + "grad_norm": 2.671772003173828, + "learning_rate": 4.578785926784966e-06, + "loss": 0.0554, + "step": 25393 + }, + { + "epoch": 69.19346049046321, + "grad_norm": 2.484617233276367, + "learning_rate": 4.578044387501544e-06, + "loss": 0.0392, + "step": 25394 + }, + { + "epoch": 69.19618528610354, + "grad_norm": 3.5257954597473145, + "learning_rate": 4.577302890444134e-06, + "loss": 0.0505, + "step": 25395 + }, + { + "epoch": 69.19891008174388, + "grad_norm": 3.391948699951172, + "learning_rate": 4.57656143561852e-06, + "loss": 0.0438, + "step": 25396 + }, + { + "epoch": 69.2016348773842, + "grad_norm": 4.001677513122559, + "learning_rate": 4.575820023030469e-06, + "loss": 0.1583, + "step": 25397 + }, + { + "epoch": 69.20435967302453, + "grad_norm": 2.1667492389678955, + "learning_rate": 4.575078652685758e-06, + "loss": 0.0436, + "step": 25398 + }, + { + "epoch": 69.20708446866485, + "grad_norm": 3.1260199546813965, + "learning_rate": 4.574337324590156e-06, + "loss": 0.1362, + "step": 25399 + }, + { + "epoch": 69.20980926430518, + "grad_norm": 2.11391282081604, + "learning_rate": 4.573596038749444e-06, + "loss": 0.2222, + "step": 25400 + }, + { + "epoch": 69.2125340599455, + "grad_norm": 2.815260648727417, + "learning_rate": 4.572854795169392e-06, + "loss": 0.0791, + "step": 25401 + }, + { + "epoch": 69.21525885558583, + "grad_norm": 3.2800514698028564, + "learning_rate": 4.572113593855771e-06, + "loss": 0.0716, + "step": 25402 + }, + { + "epoch": 69.21798365122616, + "grad_norm": 2.0049800872802734, + "learning_rate": 4.571372434814352e-06, + "loss": 0.0353, + "step": 25403 + }, + { + "epoch": 69.22070844686648, + "grad_norm": 4.266651630401611, + "learning_rate": 4.570631318050913e-06, + "loss": 0.1376, + "step": 25404 + }, + { + "epoch": 69.22343324250681, + "grad_norm": 4.971512794494629, + "learning_rate": 4.569890243571219e-06, + "loss": 0.0445, + "step": 25405 + }, + { + "epoch": 69.22615803814713, + "grad_norm": 3.709139347076416, + "learning_rate": 4.569149211381049e-06, + "loss": 0.0814, + "step": 25406 + }, + { + "epoch": 69.22888283378747, + "grad_norm": 3.2884321212768555, + "learning_rate": 4.568408221486166e-06, + "loss": 0.1194, + "step": 25407 + }, + { + "epoch": 69.2316076294278, + "grad_norm": 2.227508306503296, + "learning_rate": 4.567667273892349e-06, + "loss": 0.0274, + "step": 25408 + }, + { + "epoch": 69.23433242506812, + "grad_norm": 3.514317750930786, + "learning_rate": 4.566926368605364e-06, + "loss": 0.0488, + "step": 25409 + }, + { + "epoch": 69.23705722070845, + "grad_norm": 7.666079521179199, + "learning_rate": 4.566185505630981e-06, + "loss": 0.2268, + "step": 25410 + }, + { + "epoch": 69.23978201634877, + "grad_norm": 3.4058709144592285, + "learning_rate": 4.565444684974968e-06, + "loss": 0.1507, + "step": 25411 + }, + { + "epoch": 69.2425068119891, + "grad_norm": 3.5763678550720215, + "learning_rate": 4.5647039066431e-06, + "loss": 0.0785, + "step": 25412 + }, + { + "epoch": 69.24523160762942, + "grad_norm": 2.9784834384918213, + "learning_rate": 4.563963170641143e-06, + "loss": 0.1684, + "step": 25413 + }, + { + "epoch": 69.24795640326975, + "grad_norm": 2.819248676300049, + "learning_rate": 4.563222476974866e-06, + "loss": 0.1865, + "step": 25414 + }, + { + "epoch": 69.25068119891009, + "grad_norm": 3.5395994186401367, + "learning_rate": 4.562481825650034e-06, + "loss": 0.0434, + "step": 25415 + }, + { + "epoch": 69.2534059945504, + "grad_norm": 4.175273418426514, + "learning_rate": 4.561741216672422e-06, + "loss": 0.0573, + "step": 25416 + }, + { + "epoch": 69.25613079019074, + "grad_norm": 3.1356163024902344, + "learning_rate": 4.5610006500477935e-06, + "loss": 0.0513, + "step": 25417 + }, + { + "epoch": 69.25885558583106, + "grad_norm": 2.5869336128234863, + "learning_rate": 4.560260125781918e-06, + "loss": 0.0385, + "step": 25418 + }, + { + "epoch": 69.26158038147139, + "grad_norm": 2.9099714756011963, + "learning_rate": 4.559519643880556e-06, + "loss": 0.0331, + "step": 25419 + }, + { + "epoch": 69.26430517711172, + "grad_norm": 3.585111141204834, + "learning_rate": 4.5587792043494865e-06, + "loss": 0.095, + "step": 25420 + }, + { + "epoch": 69.26702997275204, + "grad_norm": 3.7343595027923584, + "learning_rate": 4.558038807194468e-06, + "loss": 0.1624, + "step": 25421 + }, + { + "epoch": 69.26975476839237, + "grad_norm": 5.514522552490234, + "learning_rate": 4.557298452421264e-06, + "loss": 0.0472, + "step": 25422 + }, + { + "epoch": 69.2724795640327, + "grad_norm": 4.171028137207031, + "learning_rate": 4.556558140035648e-06, + "loss": 0.1025, + "step": 25423 + }, + { + "epoch": 69.27520435967303, + "grad_norm": 3.00070858001709, + "learning_rate": 4.555817870043379e-06, + "loss": 0.1122, + "step": 25424 + }, + { + "epoch": 69.27792915531334, + "grad_norm": 3.1932849884033203, + "learning_rate": 4.55507764245023e-06, + "loss": 0.0466, + "step": 25425 + }, + { + "epoch": 69.28065395095368, + "grad_norm": 3.068021535873413, + "learning_rate": 4.554337457261959e-06, + "loss": 0.0559, + "step": 25426 + }, + { + "epoch": 69.28337874659401, + "grad_norm": 3.2480483055114746, + "learning_rate": 4.55359731448433e-06, + "loss": 0.0857, + "step": 25427 + }, + { + "epoch": 69.28610354223433, + "grad_norm": 3.1276259422302246, + "learning_rate": 4.552857214123115e-06, + "loss": 0.0659, + "step": 25428 + }, + { + "epoch": 69.28882833787466, + "grad_norm": 4.520638942718506, + "learning_rate": 4.5521171561840696e-06, + "loss": 0.0964, + "step": 25429 + }, + { + "epoch": 69.29155313351498, + "grad_norm": 4.583598613739014, + "learning_rate": 4.551377140672962e-06, + "loss": 0.111, + "step": 25430 + }, + { + "epoch": 69.29427792915531, + "grad_norm": 1.993520975112915, + "learning_rate": 4.55063716759555e-06, + "loss": 0.0574, + "step": 25431 + }, + { + "epoch": 69.29700272479565, + "grad_norm": 4.2229790687561035, + "learning_rate": 4.549897236957605e-06, + "loss": 0.0444, + "step": 25432 + }, + { + "epoch": 69.29972752043597, + "grad_norm": 3.21101450920105, + "learning_rate": 4.549157348764883e-06, + "loss": 0.053, + "step": 25433 + }, + { + "epoch": 69.3024523160763, + "grad_norm": 3.129916191101074, + "learning_rate": 4.548417503023149e-06, + "loss": 0.0939, + "step": 25434 + }, + { + "epoch": 69.30517711171662, + "grad_norm": 3.284067153930664, + "learning_rate": 4.5476776997381615e-06, + "loss": 0.0561, + "step": 25435 + }, + { + "epoch": 69.30790190735695, + "grad_norm": 2.7819948196411133, + "learning_rate": 4.5469379389156865e-06, + "loss": 0.0524, + "step": 25436 + }, + { + "epoch": 69.31062670299727, + "grad_norm": 2.6426141262054443, + "learning_rate": 4.546198220561484e-06, + "loss": 0.061, + "step": 25437 + }, + { + "epoch": 69.3133514986376, + "grad_norm": 3.2954511642456055, + "learning_rate": 4.545458544681315e-06, + "loss": 0.0492, + "step": 25438 + }, + { + "epoch": 69.31607629427793, + "grad_norm": 3.160815954208374, + "learning_rate": 4.544718911280934e-06, + "loss": 0.1001, + "step": 25439 + }, + { + "epoch": 69.31880108991825, + "grad_norm": 3.6648552417755127, + "learning_rate": 4.5439793203661075e-06, + "loss": 0.066, + "step": 25440 + }, + { + "epoch": 69.32152588555859, + "grad_norm": 2.691915273666382, + "learning_rate": 4.543239771942599e-06, + "loss": 0.0614, + "step": 25441 + }, + { + "epoch": 69.3242506811989, + "grad_norm": 4.521756172180176, + "learning_rate": 4.542500266016162e-06, + "loss": 0.1956, + "step": 25442 + }, + { + "epoch": 69.32697547683924, + "grad_norm": 2.222311496734619, + "learning_rate": 4.541760802592558e-06, + "loss": 0.0263, + "step": 25443 + }, + { + "epoch": 69.32970027247957, + "grad_norm": 3.0697567462921143, + "learning_rate": 4.541021381677541e-06, + "loss": 0.1766, + "step": 25444 + }, + { + "epoch": 69.33242506811989, + "grad_norm": 3.325167417526245, + "learning_rate": 4.540282003276879e-06, + "loss": 0.1471, + "step": 25445 + }, + { + "epoch": 69.33514986376022, + "grad_norm": 2.820826292037964, + "learning_rate": 4.5395426673963235e-06, + "loss": 0.1574, + "step": 25446 + }, + { + "epoch": 69.33787465940054, + "grad_norm": 2.6701645851135254, + "learning_rate": 4.5388033740416344e-06, + "loss": 0.059, + "step": 25447 + }, + { + "epoch": 69.34059945504087, + "grad_norm": 3.161954164505005, + "learning_rate": 4.538064123218565e-06, + "loss": 0.0481, + "step": 25448 + }, + { + "epoch": 69.34332425068119, + "grad_norm": 3.1632397174835205, + "learning_rate": 4.53732491493288e-06, + "loss": 0.1351, + "step": 25449 + }, + { + "epoch": 69.34604904632153, + "grad_norm": 2.487396240234375, + "learning_rate": 4.536585749190334e-06, + "loss": 0.0715, + "step": 25450 + }, + { + "epoch": 69.34877384196186, + "grad_norm": 4.762503147125244, + "learning_rate": 4.535846625996677e-06, + "loss": 0.0933, + "step": 25451 + }, + { + "epoch": 69.35149863760218, + "grad_norm": 2.5551226139068604, + "learning_rate": 4.5351075453576755e-06, + "loss": 0.1213, + "step": 25452 + }, + { + "epoch": 69.35422343324251, + "grad_norm": 3.0940890312194824, + "learning_rate": 4.53436850727908e-06, + "loss": 0.0664, + "step": 25453 + }, + { + "epoch": 69.35694822888283, + "grad_norm": 3.4480948448181152, + "learning_rate": 4.533629511766646e-06, + "loss": 0.176, + "step": 25454 + }, + { + "epoch": 69.35967302452316, + "grad_norm": 3.455458164215088, + "learning_rate": 4.5328905588261274e-06, + "loss": 0.0783, + "step": 25455 + }, + { + "epoch": 69.3623978201635, + "grad_norm": 2.989150047302246, + "learning_rate": 4.53215164846328e-06, + "loss": 0.0788, + "step": 25456 + }, + { + "epoch": 69.36512261580381, + "grad_norm": 3.5107991695404053, + "learning_rate": 4.531412780683864e-06, + "loss": 0.128, + "step": 25457 + }, + { + "epoch": 69.36784741144415, + "grad_norm": 2.281085729598999, + "learning_rate": 4.530673955493629e-06, + "loss": 0.0885, + "step": 25458 + }, + { + "epoch": 69.37057220708446, + "grad_norm": 2.156769037246704, + "learning_rate": 4.529935172898327e-06, + "loss": 0.0369, + "step": 25459 + }, + { + "epoch": 69.3732970027248, + "grad_norm": 3.0936028957366943, + "learning_rate": 4.529196432903713e-06, + "loss": 0.0468, + "step": 25460 + }, + { + "epoch": 69.37602179836512, + "grad_norm": 2.3070435523986816, + "learning_rate": 4.528457735515544e-06, + "loss": 0.0441, + "step": 25461 + }, + { + "epoch": 69.37874659400545, + "grad_norm": 5.0418925285339355, + "learning_rate": 4.5277190807395695e-06, + "loss": 0.0459, + "step": 25462 + }, + { + "epoch": 69.38147138964578, + "grad_norm": 4.551960468292236, + "learning_rate": 4.526980468581543e-06, + "loss": 0.0971, + "step": 25463 + }, + { + "epoch": 69.3841961852861, + "grad_norm": 2.7737889289855957, + "learning_rate": 4.526241899047213e-06, + "loss": 0.038, + "step": 25464 + }, + { + "epoch": 69.38692098092643, + "grad_norm": 2.7282233238220215, + "learning_rate": 4.525503372142339e-06, + "loss": 0.0535, + "step": 25465 + }, + { + "epoch": 69.38964577656675, + "grad_norm": 2.7730906009674072, + "learning_rate": 4.524764887872668e-06, + "loss": 0.0842, + "step": 25466 + }, + { + "epoch": 69.39237057220708, + "grad_norm": 2.8168158531188965, + "learning_rate": 4.524026446243952e-06, + "loss": 0.0758, + "step": 25467 + }, + { + "epoch": 69.39509536784742, + "grad_norm": 3.4718661308288574, + "learning_rate": 4.523288047261938e-06, + "loss": 0.1124, + "step": 25468 + }, + { + "epoch": 69.39782016348774, + "grad_norm": 3.580873966217041, + "learning_rate": 4.522549690932384e-06, + "loss": 0.1165, + "step": 25469 + }, + { + "epoch": 69.40054495912807, + "grad_norm": 2.9290521144866943, + "learning_rate": 4.521811377261036e-06, + "loss": 0.0466, + "step": 25470 + }, + { + "epoch": 69.40326975476839, + "grad_norm": 3.4112048149108887, + "learning_rate": 4.521073106253643e-06, + "loss": 0.048, + "step": 25471 + }, + { + "epoch": 69.40599455040872, + "grad_norm": 2.107800006866455, + "learning_rate": 4.5203348779159585e-06, + "loss": 0.0748, + "step": 25472 + }, + { + "epoch": 69.40871934604904, + "grad_norm": 3.148745059967041, + "learning_rate": 4.51959669225373e-06, + "loss": 0.057, + "step": 25473 + }, + { + "epoch": 69.41144414168937, + "grad_norm": 4.197068691253662, + "learning_rate": 4.518858549272702e-06, + "loss": 0.0384, + "step": 25474 + }, + { + "epoch": 69.4141689373297, + "grad_norm": 4.478817462921143, + "learning_rate": 4.518120448978631e-06, + "loss": 0.058, + "step": 25475 + }, + { + "epoch": 69.41689373297002, + "grad_norm": 3.8297202587127686, + "learning_rate": 4.517382391377258e-06, + "loss": 0.0664, + "step": 25476 + }, + { + "epoch": 69.41961852861036, + "grad_norm": 4.742251873016357, + "learning_rate": 4.516644376474339e-06, + "loss": 0.1049, + "step": 25477 + }, + { + "epoch": 69.42234332425068, + "grad_norm": 2.337071180343628, + "learning_rate": 4.515906404275615e-06, + "loss": 0.0331, + "step": 25478 + }, + { + "epoch": 69.42506811989101, + "grad_norm": 3.4373509883880615, + "learning_rate": 4.515168474786837e-06, + "loss": 0.0445, + "step": 25479 + }, + { + "epoch": 69.42779291553134, + "grad_norm": 3.0513668060302734, + "learning_rate": 4.514430588013746e-06, + "loss": 0.1766, + "step": 25480 + }, + { + "epoch": 69.43051771117166, + "grad_norm": 3.0420408248901367, + "learning_rate": 4.513692743962097e-06, + "loss": 0.0719, + "step": 25481 + }, + { + "epoch": 69.433242506812, + "grad_norm": 2.7636256217956543, + "learning_rate": 4.512954942637633e-06, + "loss": 0.0361, + "step": 25482 + }, + { + "epoch": 69.43596730245231, + "grad_norm": 2.655750036239624, + "learning_rate": 4.512217184046098e-06, + "loss": 0.0628, + "step": 25483 + }, + { + "epoch": 69.43869209809264, + "grad_norm": 2.935687780380249, + "learning_rate": 4.511479468193236e-06, + "loss": 0.1653, + "step": 25484 + }, + { + "epoch": 69.44141689373296, + "grad_norm": 2.878584623336792, + "learning_rate": 4.5107417950848e-06, + "loss": 0.0874, + "step": 25485 + }, + { + "epoch": 69.4441416893733, + "grad_norm": 3.644692897796631, + "learning_rate": 4.510004164726529e-06, + "loss": 0.2839, + "step": 25486 + }, + { + "epoch": 69.44686648501363, + "grad_norm": 2.3344852924346924, + "learning_rate": 4.509266577124169e-06, + "loss": 0.0359, + "step": 25487 + }, + { + "epoch": 69.44959128065395, + "grad_norm": 2.944648265838623, + "learning_rate": 4.508529032283461e-06, + "loss": 0.0493, + "step": 25488 + }, + { + "epoch": 69.45231607629428, + "grad_norm": 3.3743457794189453, + "learning_rate": 4.507791530210155e-06, + "loss": 0.074, + "step": 25489 + }, + { + "epoch": 69.4550408719346, + "grad_norm": 2.828557252883911, + "learning_rate": 4.507054070909992e-06, + "loss": 0.0324, + "step": 25490 + }, + { + "epoch": 69.45776566757493, + "grad_norm": 2.988844871520996, + "learning_rate": 4.506316654388712e-06, + "loss": 0.0744, + "step": 25491 + }, + { + "epoch": 69.46049046321527, + "grad_norm": 3.0800795555114746, + "learning_rate": 4.50557928065206e-06, + "loss": 0.0557, + "step": 25492 + }, + { + "epoch": 69.46321525885558, + "grad_norm": 3.5992672443389893, + "learning_rate": 4.5048419497057835e-06, + "loss": 0.0938, + "step": 25493 + }, + { + "epoch": 69.46594005449592, + "grad_norm": 4.743727684020996, + "learning_rate": 4.504104661555623e-06, + "loss": 0.056, + "step": 25494 + }, + { + "epoch": 69.46866485013624, + "grad_norm": 3.1263489723205566, + "learning_rate": 4.503367416207316e-06, + "loss": 0.0294, + "step": 25495 + }, + { + "epoch": 69.47138964577657, + "grad_norm": 4.683835506439209, + "learning_rate": 4.502630213666605e-06, + "loss": 0.0782, + "step": 25496 + }, + { + "epoch": 69.47411444141689, + "grad_norm": 2.891843557357788, + "learning_rate": 4.501893053939236e-06, + "loss": 0.0497, + "step": 25497 + }, + { + "epoch": 69.47683923705722, + "grad_norm": 3.1541855335235596, + "learning_rate": 4.501155937030946e-06, + "loss": 0.0846, + "step": 25498 + }, + { + "epoch": 69.47956403269755, + "grad_norm": 3.3001279830932617, + "learning_rate": 4.500418862947478e-06, + "loss": 0.0539, + "step": 25499 + }, + { + "epoch": 69.48228882833787, + "grad_norm": 2.4647982120513916, + "learning_rate": 4.4996818316945655e-06, + "loss": 0.0347, + "step": 25500 + }, + { + "epoch": 69.4850136239782, + "grad_norm": 6.2668609619140625, + "learning_rate": 4.498944843277959e-06, + "loss": 0.112, + "step": 25501 + }, + { + "epoch": 69.48773841961852, + "grad_norm": 4.0989203453063965, + "learning_rate": 4.498207897703393e-06, + "loss": 0.0499, + "step": 25502 + }, + { + "epoch": 69.49046321525886, + "grad_norm": 3.043545961380005, + "learning_rate": 4.497470994976606e-06, + "loss": 0.1422, + "step": 25503 + }, + { + "epoch": 69.49318801089919, + "grad_norm": 2.963949680328369, + "learning_rate": 4.496734135103334e-06, + "loss": 0.1138, + "step": 25504 + }, + { + "epoch": 69.49591280653951, + "grad_norm": 2.8195641040802, + "learning_rate": 4.4959973180893235e-06, + "loss": 0.0539, + "step": 25505 + }, + { + "epoch": 69.49863760217984, + "grad_norm": 3.33978533744812, + "learning_rate": 4.49526054394031e-06, + "loss": 0.0545, + "step": 25506 + }, + { + "epoch": 69.50136239782016, + "grad_norm": 2.9912805557250977, + "learning_rate": 4.4945238126620286e-06, + "loss": 0.0379, + "step": 25507 + }, + { + "epoch": 69.50408719346049, + "grad_norm": 4.629179000854492, + "learning_rate": 4.493787124260215e-06, + "loss": 0.054, + "step": 25508 + }, + { + "epoch": 69.50681198910081, + "grad_norm": 4.750308036804199, + "learning_rate": 4.49305047874061e-06, + "loss": 0.1869, + "step": 25509 + }, + { + "epoch": 69.50953678474114, + "grad_norm": 3.1100518703460693, + "learning_rate": 4.492313876108955e-06, + "loss": 0.0395, + "step": 25510 + }, + { + "epoch": 69.51226158038148, + "grad_norm": 3.0238888263702393, + "learning_rate": 4.491577316370982e-06, + "loss": 0.0413, + "step": 25511 + }, + { + "epoch": 69.5149863760218, + "grad_norm": 3.627363681793213, + "learning_rate": 4.490840799532428e-06, + "loss": 0.1171, + "step": 25512 + }, + { + "epoch": 69.51771117166213, + "grad_norm": 3.2774410247802734, + "learning_rate": 4.490104325599024e-06, + "loss": 0.0684, + "step": 25513 + }, + { + "epoch": 69.52043596730245, + "grad_norm": 3.144773483276367, + "learning_rate": 4.489367894576514e-06, + "loss": 0.0516, + "step": 25514 + }, + { + "epoch": 69.52316076294278, + "grad_norm": 4.020216464996338, + "learning_rate": 4.4886315064706295e-06, + "loss": 0.1232, + "step": 25515 + }, + { + "epoch": 69.52588555858311, + "grad_norm": 3.6075801849365234, + "learning_rate": 4.487895161287102e-06, + "loss": 0.0765, + "step": 25516 + }, + { + "epoch": 69.52861035422343, + "grad_norm": 3.4577956199645996, + "learning_rate": 4.487158859031674e-06, + "loss": 0.0423, + "step": 25517 + }, + { + "epoch": 69.53133514986376, + "grad_norm": 4.301992893218994, + "learning_rate": 4.486422599710074e-06, + "loss": 0.1098, + "step": 25518 + }, + { + "epoch": 69.53405994550408, + "grad_norm": 2.895936965942383, + "learning_rate": 4.4856863833280384e-06, + "loss": 0.0528, + "step": 25519 + }, + { + "epoch": 69.53678474114442, + "grad_norm": 2.136328935623169, + "learning_rate": 4.484950209891296e-06, + "loss": 0.035, + "step": 25520 + }, + { + "epoch": 69.53950953678473, + "grad_norm": 4.753259658813477, + "learning_rate": 4.484214079405587e-06, + "loss": 0.1188, + "step": 25521 + }, + { + "epoch": 69.54223433242507, + "grad_norm": 3.827326536178589, + "learning_rate": 4.483477991876642e-06, + "loss": 0.1702, + "step": 25522 + }, + { + "epoch": 69.5449591280654, + "grad_norm": 3.497188091278076, + "learning_rate": 4.482741947310192e-06, + "loss": 0.088, + "step": 25523 + }, + { + "epoch": 69.54768392370572, + "grad_norm": 6.807163715362549, + "learning_rate": 4.482005945711965e-06, + "loss": 0.1857, + "step": 25524 + }, + { + "epoch": 69.55040871934605, + "grad_norm": 3.836564540863037, + "learning_rate": 4.4812699870877e-06, + "loss": 0.0589, + "step": 25525 + }, + { + "epoch": 69.55313351498637, + "grad_norm": 48.24660110473633, + "learning_rate": 4.480534071443131e-06, + "loss": 0.1138, + "step": 25526 + }, + { + "epoch": 69.5558583106267, + "grad_norm": 3.2530205249786377, + "learning_rate": 4.479798198783984e-06, + "loss": 0.0359, + "step": 25527 + }, + { + "epoch": 69.55858310626704, + "grad_norm": 3.3195722103118896, + "learning_rate": 4.479062369115992e-06, + "loss": 0.0471, + "step": 25528 + }, + { + "epoch": 69.56130790190736, + "grad_norm": 3.158198356628418, + "learning_rate": 4.4783265824448795e-06, + "loss": 0.0878, + "step": 25529 + }, + { + "epoch": 69.56403269754769, + "grad_norm": 2.6671762466430664, + "learning_rate": 4.477590838776386e-06, + "loss": 0.0351, + "step": 25530 + }, + { + "epoch": 69.566757493188, + "grad_norm": 3.4229178428649902, + "learning_rate": 4.4768551381162375e-06, + "loss": 0.1534, + "step": 25531 + }, + { + "epoch": 69.56948228882834, + "grad_norm": 7.585022926330566, + "learning_rate": 4.476119480470163e-06, + "loss": 0.1878, + "step": 25532 + }, + { + "epoch": 69.57220708446866, + "grad_norm": 3.3582346439361572, + "learning_rate": 4.475383865843889e-06, + "loss": 0.0483, + "step": 25533 + }, + { + "epoch": 69.57493188010899, + "grad_norm": 3.0538430213928223, + "learning_rate": 4.474648294243151e-06, + "loss": 0.2468, + "step": 25534 + }, + { + "epoch": 69.57765667574932, + "grad_norm": 5.0180792808532715, + "learning_rate": 4.473912765673676e-06, + "loss": 0.1554, + "step": 25535 + }, + { + "epoch": 69.58038147138964, + "grad_norm": 2.2239420413970947, + "learning_rate": 4.473177280141185e-06, + "loss": 0.0411, + "step": 25536 + }, + { + "epoch": 69.58310626702998, + "grad_norm": 2.517350435256958, + "learning_rate": 4.4724418376514155e-06, + "loss": 0.132, + "step": 25537 + }, + { + "epoch": 69.5858310626703, + "grad_norm": 3.0453567504882812, + "learning_rate": 4.47170643821009e-06, + "loss": 0.0819, + "step": 25538 + }, + { + "epoch": 69.58855585831063, + "grad_norm": 2.4413506984710693, + "learning_rate": 4.470971081822938e-06, + "loss": 0.0421, + "step": 25539 + }, + { + "epoch": 69.59128065395096, + "grad_norm": 4.459550857543945, + "learning_rate": 4.470235768495682e-06, + "loss": 0.1374, + "step": 25540 + }, + { + "epoch": 69.59400544959128, + "grad_norm": 3.1329100131988525, + "learning_rate": 4.469500498234055e-06, + "loss": 0.0528, + "step": 25541 + }, + { + "epoch": 69.59673024523161, + "grad_norm": 2.6712231636047363, + "learning_rate": 4.468765271043777e-06, + "loss": 0.0397, + "step": 25542 + }, + { + "epoch": 69.59945504087193, + "grad_norm": 3.0572385787963867, + "learning_rate": 4.4680300869305795e-06, + "loss": 0.0921, + "step": 25543 + }, + { + "epoch": 69.60217983651226, + "grad_norm": 2.4251370429992676, + "learning_rate": 4.467294945900186e-06, + "loss": 0.0479, + "step": 25544 + }, + { + "epoch": 69.60490463215258, + "grad_norm": 2.989567279815674, + "learning_rate": 4.466559847958318e-06, + "loss": 0.1138, + "step": 25545 + }, + { + "epoch": 69.60762942779292, + "grad_norm": 3.232569456100464, + "learning_rate": 4.465824793110708e-06, + "loss": 0.1992, + "step": 25546 + }, + { + "epoch": 69.61035422343325, + "grad_norm": 4.112090110778809, + "learning_rate": 4.4650897813630755e-06, + "loss": 0.0689, + "step": 25547 + }, + { + "epoch": 69.61307901907357, + "grad_norm": 2.628995895385742, + "learning_rate": 4.464354812721147e-06, + "loss": 0.0612, + "step": 25548 + }, + { + "epoch": 69.6158038147139, + "grad_norm": 3.160435199737549, + "learning_rate": 4.46361988719064e-06, + "loss": 0.0529, + "step": 25549 + }, + { + "epoch": 69.61852861035422, + "grad_norm": 3.192359685897827, + "learning_rate": 4.462885004777287e-06, + "loss": 0.1992, + "step": 25550 + }, + { + "epoch": 69.62125340599455, + "grad_norm": 4.834630966186523, + "learning_rate": 4.462150165486807e-06, + "loss": 0.0504, + "step": 25551 + }, + { + "epoch": 69.62397820163488, + "grad_norm": 3.1146316528320312, + "learning_rate": 4.461415369324924e-06, + "loss": 0.1613, + "step": 25552 + }, + { + "epoch": 69.6267029972752, + "grad_norm": 3.7600176334381104, + "learning_rate": 4.460680616297356e-06, + "loss": 0.1573, + "step": 25553 + }, + { + "epoch": 69.62942779291554, + "grad_norm": 3.2461941242218018, + "learning_rate": 4.459945906409832e-06, + "loss": 0.1423, + "step": 25554 + }, + { + "epoch": 69.63215258855585, + "grad_norm": 3.6472384929656982, + "learning_rate": 4.459211239668073e-06, + "loss": 0.0822, + "step": 25555 + }, + { + "epoch": 69.63487738419619, + "grad_norm": 2.415484666824341, + "learning_rate": 4.458476616077797e-06, + "loss": 0.1135, + "step": 25556 + }, + { + "epoch": 69.6376021798365, + "grad_norm": 17.882747650146484, + "learning_rate": 4.457742035644723e-06, + "loss": 0.1495, + "step": 25557 + }, + { + "epoch": 69.64032697547684, + "grad_norm": 3.5511679649353027, + "learning_rate": 4.4570074983745806e-06, + "loss": 0.1856, + "step": 25558 + }, + { + "epoch": 69.64305177111717, + "grad_norm": 4.503655433654785, + "learning_rate": 4.456273004273084e-06, + "loss": 0.0797, + "step": 25559 + }, + { + "epoch": 69.64577656675749, + "grad_norm": 2.438267469406128, + "learning_rate": 4.4555385533459515e-06, + "loss": 0.1115, + "step": 25560 + }, + { + "epoch": 69.64850136239782, + "grad_norm": 3.1369853019714355, + "learning_rate": 4.454804145598907e-06, + "loss": 0.1224, + "step": 25561 + }, + { + "epoch": 69.65122615803814, + "grad_norm": 3.708622455596924, + "learning_rate": 4.4540697810376724e-06, + "loss": 0.1498, + "step": 25562 + }, + { + "epoch": 69.65395095367847, + "grad_norm": 3.237105131149292, + "learning_rate": 4.453335459667964e-06, + "loss": 0.0391, + "step": 25563 + }, + { + "epoch": 69.65667574931881, + "grad_norm": 3.6461849212646484, + "learning_rate": 4.4526011814955e-06, + "loss": 0.046, + "step": 25564 + }, + { + "epoch": 69.65940054495913, + "grad_norm": 2.78324031829834, + "learning_rate": 4.451866946525997e-06, + "loss": 0.0709, + "step": 25565 + }, + { + "epoch": 69.66212534059946, + "grad_norm": 3.4655065536499023, + "learning_rate": 4.451132754765179e-06, + "loss": 0.1083, + "step": 25566 + }, + { + "epoch": 69.66485013623978, + "grad_norm": 3.751417875289917, + "learning_rate": 4.450398606218759e-06, + "loss": 0.1404, + "step": 25567 + }, + { + "epoch": 69.66757493188011, + "grad_norm": 2.905965566635132, + "learning_rate": 4.449664500892456e-06, + "loss": 0.154, + "step": 25568 + }, + { + "epoch": 69.67029972752043, + "grad_norm": 3.733325481414795, + "learning_rate": 4.448930438791986e-06, + "loss": 0.1691, + "step": 25569 + }, + { + "epoch": 69.67302452316076, + "grad_norm": 2.9593799114227295, + "learning_rate": 4.448196419923068e-06, + "loss": 0.0616, + "step": 25570 + }, + { + "epoch": 69.6757493188011, + "grad_norm": 3.1292717456817627, + "learning_rate": 4.447462444291421e-06, + "loss": 0.0477, + "step": 25571 + }, + { + "epoch": 69.67847411444141, + "grad_norm": 2.4466569423675537, + "learning_rate": 4.446728511902755e-06, + "loss": 0.0267, + "step": 25572 + }, + { + "epoch": 69.68119891008175, + "grad_norm": 3.170085906982422, + "learning_rate": 4.445994622762786e-06, + "loss": 0.0603, + "step": 25573 + }, + { + "epoch": 69.68392370572207, + "grad_norm": 3.642721652984619, + "learning_rate": 4.445260776877235e-06, + "loss": 0.1093, + "step": 25574 + }, + { + "epoch": 69.6866485013624, + "grad_norm": 2.6193416118621826, + "learning_rate": 4.444526974251815e-06, + "loss": 0.1013, + "step": 25575 + }, + { + "epoch": 69.68937329700273, + "grad_norm": 2.3695764541625977, + "learning_rate": 4.443793214892241e-06, + "loss": 0.1401, + "step": 25576 + }, + { + "epoch": 69.69209809264305, + "grad_norm": 2.5913591384887695, + "learning_rate": 4.443059498804217e-06, + "loss": 0.0389, + "step": 25577 + }, + { + "epoch": 69.69482288828338, + "grad_norm": 2.943362236022949, + "learning_rate": 4.442325825993475e-06, + "loss": 0.1036, + "step": 25578 + }, + { + "epoch": 69.6975476839237, + "grad_norm": 3.2677478790283203, + "learning_rate": 4.441592196465722e-06, + "loss": 0.1509, + "step": 25579 + }, + { + "epoch": 69.70027247956403, + "grad_norm": 4.0697503089904785, + "learning_rate": 4.440858610226668e-06, + "loss": 0.0494, + "step": 25580 + }, + { + "epoch": 69.70299727520435, + "grad_norm": 2.5456671714782715, + "learning_rate": 4.440125067282026e-06, + "loss": 0.1437, + "step": 25581 + }, + { + "epoch": 69.70572207084469, + "grad_norm": 2.466583251953125, + "learning_rate": 4.439391567637514e-06, + "loss": 0.0759, + "step": 25582 + }, + { + "epoch": 69.70844686648502, + "grad_norm": 3.052860736846924, + "learning_rate": 4.438658111298842e-06, + "loss": 0.0524, + "step": 25583 + }, + { + "epoch": 69.71117166212534, + "grad_norm": 5.271154880523682, + "learning_rate": 4.437924698271721e-06, + "loss": 0.0925, + "step": 25584 + }, + { + "epoch": 69.71389645776567, + "grad_norm": 3.734518051147461, + "learning_rate": 4.437191328561861e-06, + "loss": 0.1157, + "step": 25585 + }, + { + "epoch": 69.71662125340599, + "grad_norm": 2.750703811645508, + "learning_rate": 4.436458002174978e-06, + "loss": 0.1127, + "step": 25586 + }, + { + "epoch": 69.71934604904632, + "grad_norm": 2.8358259201049805, + "learning_rate": 4.435724719116781e-06, + "loss": 0.1227, + "step": 25587 + }, + { + "epoch": 69.72207084468666, + "grad_norm": 3.0903167724609375, + "learning_rate": 4.434991479392983e-06, + "loss": 0.0764, + "step": 25588 + }, + { + "epoch": 69.72479564032697, + "grad_norm": 3.4187843799591064, + "learning_rate": 4.434258283009287e-06, + "loss": 0.0634, + "step": 25589 + }, + { + "epoch": 69.7275204359673, + "grad_norm": 3.107501745223999, + "learning_rate": 4.433525129971412e-06, + "loss": 0.028, + "step": 25590 + }, + { + "epoch": 69.73024523160763, + "grad_norm": 8.434030532836914, + "learning_rate": 4.432792020285065e-06, + "loss": 0.0943, + "step": 25591 + }, + { + "epoch": 69.73297002724796, + "grad_norm": 2.6484265327453613, + "learning_rate": 4.432058953955954e-06, + "loss": 0.0498, + "step": 25592 + }, + { + "epoch": 69.73569482288828, + "grad_norm": 4.696080684661865, + "learning_rate": 4.4313259309897835e-06, + "loss": 0.1324, + "step": 25593 + }, + { + "epoch": 69.73841961852861, + "grad_norm": 3.7561469078063965, + "learning_rate": 4.430592951392269e-06, + "loss": 0.1034, + "step": 25594 + }, + { + "epoch": 69.74114441416894, + "grad_norm": 3.9254508018493652, + "learning_rate": 4.42986001516912e-06, + "loss": 0.1331, + "step": 25595 + }, + { + "epoch": 69.74386920980926, + "grad_norm": 3.06659197807312, + "learning_rate": 4.429127122326044e-06, + "loss": 0.042, + "step": 25596 + }, + { + "epoch": 69.7465940054496, + "grad_norm": 3.235938787460327, + "learning_rate": 4.428394272868746e-06, + "loss": 0.06, + "step": 25597 + }, + { + "epoch": 69.74931880108991, + "grad_norm": 4.666807651519775, + "learning_rate": 4.427661466802929e-06, + "loss": 0.0695, + "step": 25598 + }, + { + "epoch": 69.75204359673025, + "grad_norm": 3.2119932174682617, + "learning_rate": 4.4269287041343105e-06, + "loss": 0.0961, + "step": 25599 + }, + { + "epoch": 69.75476839237058, + "grad_norm": 2.497992753982544, + "learning_rate": 4.42619598486859e-06, + "loss": 0.0415, + "step": 25600 + }, + { + "epoch": 69.7574931880109, + "grad_norm": 3.476628303527832, + "learning_rate": 4.425463309011473e-06, + "loss": 0.1269, + "step": 25601 + }, + { + "epoch": 69.76021798365123, + "grad_norm": 2.7838804721832275, + "learning_rate": 4.4247306765686726e-06, + "loss": 0.0975, + "step": 25602 + }, + { + "epoch": 69.76294277929155, + "grad_norm": 3.8740968704223633, + "learning_rate": 4.42399808754589e-06, + "loss": 0.0683, + "step": 25603 + }, + { + "epoch": 69.76566757493188, + "grad_norm": 3.0945353507995605, + "learning_rate": 4.42326554194883e-06, + "loss": 0.1353, + "step": 25604 + }, + { + "epoch": 69.7683923705722, + "grad_norm": 2.226154088973999, + "learning_rate": 4.422533039783196e-06, + "loss": 0.0273, + "step": 25605 + }, + { + "epoch": 69.77111716621253, + "grad_norm": 4.142420768737793, + "learning_rate": 4.421800581054698e-06, + "loss": 0.1002, + "step": 25606 + }, + { + "epoch": 69.77384196185287, + "grad_norm": 3.0412681102752686, + "learning_rate": 4.421068165769038e-06, + "loss": 0.0761, + "step": 25607 + }, + { + "epoch": 69.77656675749319, + "grad_norm": 3.305342435836792, + "learning_rate": 4.420335793931919e-06, + "loss": 0.0297, + "step": 25608 + }, + { + "epoch": 69.77929155313352, + "grad_norm": 3.126786708831787, + "learning_rate": 4.419603465549042e-06, + "loss": 0.0981, + "step": 25609 + }, + { + "epoch": 69.78201634877384, + "grad_norm": 2.439060688018799, + "learning_rate": 4.418871180626118e-06, + "loss": 0.0776, + "step": 25610 + }, + { + "epoch": 69.78474114441417, + "grad_norm": 3.507622003555298, + "learning_rate": 4.41813893916884e-06, + "loss": 0.0572, + "step": 25611 + }, + { + "epoch": 69.7874659400545, + "grad_norm": 1.6027233600616455, + "learning_rate": 4.417406741182921e-06, + "loss": 0.0211, + "step": 25612 + }, + { + "epoch": 69.79019073569482, + "grad_norm": 2.8347413539886475, + "learning_rate": 4.416674586674059e-06, + "loss": 0.0736, + "step": 25613 + }, + { + "epoch": 69.79291553133515, + "grad_norm": 2.759368896484375, + "learning_rate": 4.415942475647952e-06, + "loss": 0.0456, + "step": 25614 + }, + { + "epoch": 69.79564032697547, + "grad_norm": 4.204044818878174, + "learning_rate": 4.415210408110308e-06, + "loss": 0.0493, + "step": 25615 + }, + { + "epoch": 69.7983651226158, + "grad_norm": 3.0013973712921143, + "learning_rate": 4.414478384066827e-06, + "loss": 0.1487, + "step": 25616 + }, + { + "epoch": 69.80108991825612, + "grad_norm": 2.776397943496704, + "learning_rate": 4.413746403523208e-06, + "loss": 0.0492, + "step": 25617 + }, + { + "epoch": 69.80381471389646, + "grad_norm": 3.0675408840179443, + "learning_rate": 4.413014466485148e-06, + "loss": 0.2052, + "step": 25618 + }, + { + "epoch": 69.80653950953679, + "grad_norm": 2.969741106033325, + "learning_rate": 4.412282572958356e-06, + "loss": 0.0487, + "step": 25619 + }, + { + "epoch": 69.80926430517711, + "grad_norm": 2.379892587661743, + "learning_rate": 4.411550722948527e-06, + "loss": 0.1333, + "step": 25620 + }, + { + "epoch": 69.81198910081744, + "grad_norm": 2.675790548324585, + "learning_rate": 4.410818916461362e-06, + "loss": 0.0952, + "step": 25621 + }, + { + "epoch": 69.81471389645776, + "grad_norm": 3.693694591522217, + "learning_rate": 4.410087153502554e-06, + "loss": 0.0805, + "step": 25622 + }, + { + "epoch": 69.8174386920981, + "grad_norm": 2.791461944580078, + "learning_rate": 4.409355434077812e-06, + "loss": 0.1232, + "step": 25623 + }, + { + "epoch": 69.82016348773843, + "grad_norm": 3.2176051139831543, + "learning_rate": 4.408623758192829e-06, + "loss": 0.0851, + "step": 25624 + }, + { + "epoch": 69.82288828337875, + "grad_norm": 3.1415207386016846, + "learning_rate": 4.4078921258533026e-06, + "loss": 0.0891, + "step": 25625 + }, + { + "epoch": 69.82561307901908, + "grad_norm": 3.862701416015625, + "learning_rate": 4.407160537064934e-06, + "loss": 0.0749, + "step": 25626 + }, + { + "epoch": 69.8283378746594, + "grad_norm": 5.554037570953369, + "learning_rate": 4.40642899183342e-06, + "loss": 0.147, + "step": 25627 + }, + { + "epoch": 69.83106267029973, + "grad_norm": 3.3573391437530518, + "learning_rate": 4.4056974901644565e-06, + "loss": 0.0807, + "step": 25628 + }, + { + "epoch": 69.83378746594005, + "grad_norm": 2.9982717037200928, + "learning_rate": 4.404966032063738e-06, + "loss": 0.0752, + "step": 25629 + }, + { + "epoch": 69.83651226158038, + "grad_norm": 10.977214813232422, + "learning_rate": 4.404234617536964e-06, + "loss": 0.1221, + "step": 25630 + }, + { + "epoch": 69.83923705722071, + "grad_norm": 3.395043134689331, + "learning_rate": 4.403503246589834e-06, + "loss": 0.1199, + "step": 25631 + }, + { + "epoch": 69.84196185286103, + "grad_norm": 2.596799612045288, + "learning_rate": 4.402771919228041e-06, + "loss": 0.0495, + "step": 25632 + }, + { + "epoch": 69.84468664850137, + "grad_norm": 3.859687566757202, + "learning_rate": 4.402040635457279e-06, + "loss": 0.0637, + "step": 25633 + }, + { + "epoch": 69.84741144414168, + "grad_norm": 4.322866439819336, + "learning_rate": 4.401309395283241e-06, + "loss": 0.107, + "step": 25634 + }, + { + "epoch": 69.85013623978202, + "grad_norm": 3.5606908798217773, + "learning_rate": 4.400578198711629e-06, + "loss": 0.1245, + "step": 25635 + }, + { + "epoch": 69.85286103542235, + "grad_norm": 2.4128639698028564, + "learning_rate": 4.399847045748134e-06, + "loss": 0.0301, + "step": 25636 + }, + { + "epoch": 69.85558583106267, + "grad_norm": 3.8043482303619385, + "learning_rate": 4.39911593639845e-06, + "loss": 0.0649, + "step": 25637 + }, + { + "epoch": 69.858310626703, + "grad_norm": 2.828317165374756, + "learning_rate": 4.398384870668267e-06, + "loss": 0.2023, + "step": 25638 + }, + { + "epoch": 69.86103542234332, + "grad_norm": 3.3704493045806885, + "learning_rate": 4.397653848563287e-06, + "loss": 0.0682, + "step": 25639 + }, + { + "epoch": 69.86376021798365, + "grad_norm": 3.1510908603668213, + "learning_rate": 4.396922870089197e-06, + "loss": 0.0609, + "step": 25640 + }, + { + "epoch": 69.86648501362397, + "grad_norm": 3.364135265350342, + "learning_rate": 4.396191935251694e-06, + "loss": 0.1387, + "step": 25641 + }, + { + "epoch": 69.8692098092643, + "grad_norm": 3.898624897003174, + "learning_rate": 4.395461044056462e-06, + "loss": 0.0904, + "step": 25642 + }, + { + "epoch": 69.87193460490464, + "grad_norm": 3.5249741077423096, + "learning_rate": 4.394730196509203e-06, + "loss": 0.0581, + "step": 25643 + }, + { + "epoch": 69.87465940054496, + "grad_norm": 5.282028675079346, + "learning_rate": 4.393999392615604e-06, + "loss": 0.0977, + "step": 25644 + }, + { + "epoch": 69.87738419618529, + "grad_norm": 3.129587173461914, + "learning_rate": 4.393268632381354e-06, + "loss": 0.039, + "step": 25645 + }, + { + "epoch": 69.88010899182561, + "grad_norm": 3.003549814224243, + "learning_rate": 4.392537915812148e-06, + "loss": 0.1757, + "step": 25646 + }, + { + "epoch": 69.88283378746594, + "grad_norm": 2.8321433067321777, + "learning_rate": 4.391807242913679e-06, + "loss": 0.0421, + "step": 25647 + }, + { + "epoch": 69.88555858310627, + "grad_norm": 3.6392486095428467, + "learning_rate": 4.391076613691636e-06, + "loss": 0.0545, + "step": 25648 + }, + { + "epoch": 69.88828337874659, + "grad_norm": 3.471306562423706, + "learning_rate": 4.390346028151708e-06, + "loss": 0.0431, + "step": 25649 + }, + { + "epoch": 69.89100817438693, + "grad_norm": 3.0239179134368896, + "learning_rate": 4.38961548629958e-06, + "loss": 0.0341, + "step": 25650 + }, + { + "epoch": 69.89373297002724, + "grad_norm": 7.585079669952393, + "learning_rate": 4.38888498814095e-06, + "loss": 0.1591, + "step": 25651 + }, + { + "epoch": 69.89645776566758, + "grad_norm": 4.792723655700684, + "learning_rate": 4.388154533681502e-06, + "loss": 0.1317, + "step": 25652 + }, + { + "epoch": 69.8991825613079, + "grad_norm": 3.157466173171997, + "learning_rate": 4.387424122926927e-06, + "loss": 0.0898, + "step": 25653 + }, + { + "epoch": 69.90190735694823, + "grad_norm": 2.9385287761688232, + "learning_rate": 4.386693755882909e-06, + "loss": 0.0555, + "step": 25654 + }, + { + "epoch": 69.90463215258856, + "grad_norm": 3.342075824737549, + "learning_rate": 4.385963432555142e-06, + "loss": 0.073, + "step": 25655 + }, + { + "epoch": 69.90735694822888, + "grad_norm": 3.559858798980713, + "learning_rate": 4.385233152949312e-06, + "loss": 0.101, + "step": 25656 + }, + { + "epoch": 69.91008174386921, + "grad_norm": 4.819878578186035, + "learning_rate": 4.3845029170711055e-06, + "loss": 0.0646, + "step": 25657 + }, + { + "epoch": 69.91280653950953, + "grad_norm": 2.4177775382995605, + "learning_rate": 4.383772724926205e-06, + "loss": 0.1697, + "step": 25658 + }, + { + "epoch": 69.91553133514986, + "grad_norm": 3.4610695838928223, + "learning_rate": 4.383042576520306e-06, + "loss": 0.1073, + "step": 25659 + }, + { + "epoch": 69.9182561307902, + "grad_norm": 4.215226173400879, + "learning_rate": 4.38231247185909e-06, + "loss": 0.1097, + "step": 25660 + }, + { + "epoch": 69.92098092643052, + "grad_norm": 2.705392837524414, + "learning_rate": 4.381582410948244e-06, + "loss": 0.1132, + "step": 25661 + }, + { + "epoch": 69.92370572207085, + "grad_norm": 2.679771900177002, + "learning_rate": 4.380852393793451e-06, + "loss": 0.0356, + "step": 25662 + }, + { + "epoch": 69.92643051771117, + "grad_norm": 3.200523614883423, + "learning_rate": 4.380122420400397e-06, + "loss": 0.0553, + "step": 25663 + }, + { + "epoch": 69.9291553133515, + "grad_norm": 2.936349630355835, + "learning_rate": 4.379392490774773e-06, + "loss": 0.1744, + "step": 25664 + }, + { + "epoch": 69.93188010899182, + "grad_norm": 4.008108139038086, + "learning_rate": 4.378662604922259e-06, + "loss": 0.1185, + "step": 25665 + }, + { + "epoch": 69.93460490463215, + "grad_norm": 5.427388668060303, + "learning_rate": 4.3779327628485365e-06, + "loss": 0.112, + "step": 25666 + }, + { + "epoch": 69.93732970027249, + "grad_norm": 2.4391846656799316, + "learning_rate": 4.377202964559296e-06, + "loss": 0.1328, + "step": 25667 + }, + { + "epoch": 69.9400544959128, + "grad_norm": 2.8574271202087402, + "learning_rate": 4.376473210060219e-06, + "loss": 0.042, + "step": 25668 + }, + { + "epoch": 69.94277929155314, + "grad_norm": 2.2506847381591797, + "learning_rate": 4.375743499356987e-06, + "loss": 0.0739, + "step": 25669 + }, + { + "epoch": 69.94550408719346, + "grad_norm": 3.2817273139953613, + "learning_rate": 4.375013832455279e-06, + "loss": 0.1347, + "step": 25670 + }, + { + "epoch": 69.94822888283379, + "grad_norm": 3.0046727657318115, + "learning_rate": 4.374284209360787e-06, + "loss": 0.0601, + "step": 25671 + }, + { + "epoch": 69.95095367847412, + "grad_norm": 4.249406814575195, + "learning_rate": 4.373554630079187e-06, + "loss": 0.095, + "step": 25672 + }, + { + "epoch": 69.95367847411444, + "grad_norm": 3.763875722885132, + "learning_rate": 4.3728250946161644e-06, + "loss": 0.0977, + "step": 25673 + }, + { + "epoch": 69.95640326975477, + "grad_norm": 3.7556955814361572, + "learning_rate": 4.372095602977394e-06, + "loss": 0.067, + "step": 25674 + }, + { + "epoch": 69.95912806539509, + "grad_norm": 3.5178794860839844, + "learning_rate": 4.371366155168566e-06, + "loss": 0.0613, + "step": 25675 + }, + { + "epoch": 69.96185286103542, + "grad_norm": 3.5529630184173584, + "learning_rate": 4.370636751195357e-06, + "loss": 0.0539, + "step": 25676 + }, + { + "epoch": 69.96457765667574, + "grad_norm": 3.3359811305999756, + "learning_rate": 4.369907391063448e-06, + "loss": 0.1426, + "step": 25677 + }, + { + "epoch": 69.96730245231608, + "grad_norm": 2.9579179286956787, + "learning_rate": 4.369178074778516e-06, + "loss": 0.1469, + "step": 25678 + }, + { + "epoch": 69.97002724795641, + "grad_norm": 3.1833534240722656, + "learning_rate": 4.368448802346247e-06, + "loss": 0.0935, + "step": 25679 + }, + { + "epoch": 69.97275204359673, + "grad_norm": 3.3022069931030273, + "learning_rate": 4.367719573772313e-06, + "loss": 0.0816, + "step": 25680 + }, + { + "epoch": 69.97547683923706, + "grad_norm": 3.098957061767578, + "learning_rate": 4.366990389062402e-06, + "loss": 0.0598, + "step": 25681 + }, + { + "epoch": 69.97820163487738, + "grad_norm": 3.772223711013794, + "learning_rate": 4.366261248222189e-06, + "loss": 0.0484, + "step": 25682 + }, + { + "epoch": 69.98092643051771, + "grad_norm": 2.9102935791015625, + "learning_rate": 4.3655321512573475e-06, + "loss": 0.0849, + "step": 25683 + }, + { + "epoch": 69.98365122615803, + "grad_norm": 4.268817901611328, + "learning_rate": 4.364803098173566e-06, + "loss": 0.0833, + "step": 25684 + }, + { + "epoch": 69.98637602179836, + "grad_norm": 2.0717179775238037, + "learning_rate": 4.364074088976514e-06, + "loss": 0.031, + "step": 25685 + }, + { + "epoch": 69.9891008174387, + "grad_norm": 2.721580743789673, + "learning_rate": 4.363345123671873e-06, + "loss": 0.0813, + "step": 25686 + }, + { + "epoch": 69.99182561307902, + "grad_norm": 5.713351726531982, + "learning_rate": 4.362616202265315e-06, + "loss": 0.0604, + "step": 25687 + }, + { + "epoch": 69.99455040871935, + "grad_norm": 5.006141662597656, + "learning_rate": 4.3618873247625235e-06, + "loss": 0.0677, + "step": 25688 + }, + { + "epoch": 69.99727520435967, + "grad_norm": 4.068763732910156, + "learning_rate": 4.361158491169173e-06, + "loss": 0.1026, + "step": 25689 + }, + { + "epoch": 70.0, + "grad_norm": 3.37605881690979, + "learning_rate": 4.360429701490935e-06, + "loss": 0.0605, + "step": 25690 + }, + { + "epoch": 70.00272479564033, + "grad_norm": 2.612733840942383, + "learning_rate": 4.359700955733492e-06, + "loss": 0.0424, + "step": 25691 + }, + { + "epoch": 70.00544959128065, + "grad_norm": 3.462092161178589, + "learning_rate": 4.358972253902517e-06, + "loss": 0.1157, + "step": 25692 + }, + { + "epoch": 70.00817438692098, + "grad_norm": 2.9180169105529785, + "learning_rate": 4.358243596003684e-06, + "loss": 0.0549, + "step": 25693 + }, + { + "epoch": 70.0108991825613, + "grad_norm": 3.7692203521728516, + "learning_rate": 4.357514982042664e-06, + "loss": 0.1095, + "step": 25694 + }, + { + "epoch": 70.01362397820164, + "grad_norm": 3.2022128105163574, + "learning_rate": 4.3567864120251406e-06, + "loss": 0.1199, + "step": 25695 + }, + { + "epoch": 70.01634877384195, + "grad_norm": 5.526648044586182, + "learning_rate": 4.356057885956782e-06, + "loss": 0.1713, + "step": 25696 + }, + { + "epoch": 70.01907356948229, + "grad_norm": 2.456502914428711, + "learning_rate": 4.35532940384326e-06, + "loss": 0.0632, + "step": 25697 + }, + { + "epoch": 70.02179836512262, + "grad_norm": 3.7020177841186523, + "learning_rate": 4.354600965690255e-06, + "loss": 0.1594, + "step": 25698 + }, + { + "epoch": 70.02452316076294, + "grad_norm": 3.0396926403045654, + "learning_rate": 4.353872571503431e-06, + "loss": 0.1524, + "step": 25699 + }, + { + "epoch": 70.02724795640327, + "grad_norm": 3.463225841522217, + "learning_rate": 4.353144221288471e-06, + "loss": 0.0591, + "step": 25700 + }, + { + "epoch": 70.02997275204359, + "grad_norm": 2.843632698059082, + "learning_rate": 4.352415915051042e-06, + "loss": 0.0925, + "step": 25701 + }, + { + "epoch": 70.03269754768392, + "grad_norm": 2.684150457382202, + "learning_rate": 4.351687652796815e-06, + "loss": 0.08, + "step": 25702 + }, + { + "epoch": 70.03542234332426, + "grad_norm": 2.7099454402923584, + "learning_rate": 4.3509594345314585e-06, + "loss": 0.0472, + "step": 25703 + }, + { + "epoch": 70.03814713896458, + "grad_norm": 2.846945285797119, + "learning_rate": 4.350231260260653e-06, + "loss": 0.0433, + "step": 25704 + }, + { + "epoch": 70.04087193460491, + "grad_norm": 2.798208475112915, + "learning_rate": 4.349503129990065e-06, + "loss": 0.0679, + "step": 25705 + }, + { + "epoch": 70.04359673024523, + "grad_norm": 3.0003740787506104, + "learning_rate": 4.348775043725364e-06, + "loss": 0.0504, + "step": 25706 + }, + { + "epoch": 70.04632152588556, + "grad_norm": 3.941540479660034, + "learning_rate": 4.348047001472217e-06, + "loss": 0.0373, + "step": 25707 + }, + { + "epoch": 70.04904632152588, + "grad_norm": 3.7867789268493652, + "learning_rate": 4.347319003236302e-06, + "loss": 0.1158, + "step": 25708 + }, + { + "epoch": 70.05177111716621, + "grad_norm": 3.8642520904541016, + "learning_rate": 4.346591049023286e-06, + "loss": 0.1307, + "step": 25709 + }, + { + "epoch": 70.05449591280654, + "grad_norm": 3.514848470687866, + "learning_rate": 4.34586313883883e-06, + "loss": 0.0669, + "step": 25710 + }, + { + "epoch": 70.05722070844686, + "grad_norm": 2.442347526550293, + "learning_rate": 4.345135272688617e-06, + "loss": 0.0349, + "step": 25711 + }, + { + "epoch": 70.0599455040872, + "grad_norm": 2.755409002304077, + "learning_rate": 4.3444074505783075e-06, + "loss": 0.0613, + "step": 25712 + }, + { + "epoch": 70.06267029972751, + "grad_norm": 3.864417791366577, + "learning_rate": 4.34367967251357e-06, + "loss": 0.0722, + "step": 25713 + }, + { + "epoch": 70.06539509536785, + "grad_norm": 1.9272481203079224, + "learning_rate": 4.342951938500069e-06, + "loss": 0.0521, + "step": 25714 + }, + { + "epoch": 70.06811989100818, + "grad_norm": 4.0011887550354, + "learning_rate": 4.342224248543479e-06, + "loss": 0.0657, + "step": 25715 + }, + { + "epoch": 70.0708446866485, + "grad_norm": 2.9652342796325684, + "learning_rate": 4.341496602649465e-06, + "loss": 0.0505, + "step": 25716 + }, + { + "epoch": 70.07356948228883, + "grad_norm": 2.233431577682495, + "learning_rate": 4.340769000823695e-06, + "loss": 0.0522, + "step": 25717 + }, + { + "epoch": 70.07629427792915, + "grad_norm": 2.004546880722046, + "learning_rate": 4.340041443071833e-06, + "loss": 0.0246, + "step": 25718 + }, + { + "epoch": 70.07901907356948, + "grad_norm": 2.3655498027801514, + "learning_rate": 4.339313929399543e-06, + "loss": 0.0996, + "step": 25719 + }, + { + "epoch": 70.0817438692098, + "grad_norm": 4.205402851104736, + "learning_rate": 4.338586459812498e-06, + "loss": 0.0624, + "step": 25720 + }, + { + "epoch": 70.08446866485014, + "grad_norm": 3.3054966926574707, + "learning_rate": 4.337859034316358e-06, + "loss": 0.1, + "step": 25721 + }, + { + "epoch": 70.08719346049047, + "grad_norm": 2.6024978160858154, + "learning_rate": 4.337131652916792e-06, + "loss": 0.0862, + "step": 25722 + }, + { + "epoch": 70.08991825613079, + "grad_norm": 3.2785117626190186, + "learning_rate": 4.3364043156194566e-06, + "loss": 0.0414, + "step": 25723 + }, + { + "epoch": 70.09264305177112, + "grad_norm": 2.1956186294555664, + "learning_rate": 4.335677022430027e-06, + "loss": 0.0895, + "step": 25724 + }, + { + "epoch": 70.09536784741144, + "grad_norm": 2.7542428970336914, + "learning_rate": 4.334949773354161e-06, + "loss": 0.0884, + "step": 25725 + }, + { + "epoch": 70.09809264305177, + "grad_norm": 8.024162292480469, + "learning_rate": 4.334222568397526e-06, + "loss": 0.0363, + "step": 25726 + }, + { + "epoch": 70.1008174386921, + "grad_norm": 2.9970154762268066, + "learning_rate": 4.333495407565777e-06, + "loss": 0.2539, + "step": 25727 + }, + { + "epoch": 70.10354223433242, + "grad_norm": 2.9449198246002197, + "learning_rate": 4.33276829086459e-06, + "loss": 0.1015, + "step": 25728 + }, + { + "epoch": 70.10626702997276, + "grad_norm": 2.850621461868286, + "learning_rate": 4.332041218299619e-06, + "loss": 0.1877, + "step": 25729 + }, + { + "epoch": 70.10899182561307, + "grad_norm": 3.671219825744629, + "learning_rate": 4.331314189876528e-06, + "loss": 0.0564, + "step": 25730 + }, + { + "epoch": 70.11171662125341, + "grad_norm": 3.8866076469421387, + "learning_rate": 4.330587205600978e-06, + "loss": 0.0603, + "step": 25731 + }, + { + "epoch": 70.11444141689373, + "grad_norm": 3.623387575149536, + "learning_rate": 4.329860265478631e-06, + "loss": 0.1453, + "step": 25732 + }, + { + "epoch": 70.11716621253406, + "grad_norm": 5.383785724639893, + "learning_rate": 4.329133369515155e-06, + "loss": 0.0817, + "step": 25733 + }, + { + "epoch": 70.11989100817439, + "grad_norm": 3.942452907562256, + "learning_rate": 4.328406517716205e-06, + "loss": 0.188, + "step": 25734 + }, + { + "epoch": 70.12261580381471, + "grad_norm": 4.4679951667785645, + "learning_rate": 4.327679710087438e-06, + "loss": 0.1185, + "step": 25735 + }, + { + "epoch": 70.12534059945504, + "grad_norm": 3.4070608615875244, + "learning_rate": 4.326952946634523e-06, + "loss": 0.1402, + "step": 25736 + }, + { + "epoch": 70.12806539509536, + "grad_norm": 4.057241916656494, + "learning_rate": 4.326226227363116e-06, + "loss": 0.1239, + "step": 25737 + }, + { + "epoch": 70.1307901907357, + "grad_norm": 3.2047441005706787, + "learning_rate": 4.325499552278877e-06, + "loss": 0.0428, + "step": 25738 + }, + { + "epoch": 70.13351498637603, + "grad_norm": 3.029756546020508, + "learning_rate": 4.32477292138746e-06, + "loss": 0.1284, + "step": 25739 + }, + { + "epoch": 70.13623978201635, + "grad_norm": 3.8635129928588867, + "learning_rate": 4.324046334694534e-06, + "loss": 0.0568, + "step": 25740 + }, + { + "epoch": 70.13896457765668, + "grad_norm": 4.335892200469971, + "learning_rate": 4.3233197922057515e-06, + "loss": 0.0934, + "step": 25741 + }, + { + "epoch": 70.141689373297, + "grad_norm": 2.3393070697784424, + "learning_rate": 4.322593293926771e-06, + "loss": 0.1254, + "step": 25742 + }, + { + "epoch": 70.14441416893733, + "grad_norm": 4.349730968475342, + "learning_rate": 4.321866839863249e-06, + "loss": 0.0705, + "step": 25743 + }, + { + "epoch": 70.14713896457765, + "grad_norm": 5.032073020935059, + "learning_rate": 4.321140430020848e-06, + "loss": 0.0822, + "step": 25744 + }, + { + "epoch": 70.14986376021798, + "grad_norm": 2.0033092498779297, + "learning_rate": 4.320414064405223e-06, + "loss": 0.0285, + "step": 25745 + }, + { + "epoch": 70.15258855585832, + "grad_norm": 3.244332790374756, + "learning_rate": 4.319687743022031e-06, + "loss": 0.0398, + "step": 25746 + }, + { + "epoch": 70.15531335149863, + "grad_norm": 4.38469123840332, + "learning_rate": 4.318961465876924e-06, + "loss": 0.1832, + "step": 25747 + }, + { + "epoch": 70.15803814713897, + "grad_norm": 2.730025053024292, + "learning_rate": 4.318235232975565e-06, + "loss": 0.0361, + "step": 25748 + }, + { + "epoch": 70.16076294277929, + "grad_norm": 2.532407522201538, + "learning_rate": 4.317509044323605e-06, + "loss": 0.0421, + "step": 25749 + }, + { + "epoch": 70.16348773841962, + "grad_norm": 3.7165937423706055, + "learning_rate": 4.316782899926704e-06, + "loss": 0.045, + "step": 25750 + }, + { + "epoch": 70.16621253405995, + "grad_norm": 2.5522847175598145, + "learning_rate": 4.316056799790512e-06, + "loss": 0.0396, + "step": 25751 + }, + { + "epoch": 70.16893732970027, + "grad_norm": 2.729966163635254, + "learning_rate": 4.31533074392069e-06, + "loss": 0.0488, + "step": 25752 + }, + { + "epoch": 70.1716621253406, + "grad_norm": 2.9957115650177, + "learning_rate": 4.314604732322889e-06, + "loss": 0.049, + "step": 25753 + }, + { + "epoch": 70.17438692098092, + "grad_norm": 3.1514878273010254, + "learning_rate": 4.313878765002763e-06, + "loss": 0.0741, + "step": 25754 + }, + { + "epoch": 70.17711171662125, + "grad_norm": 2.544762134552002, + "learning_rate": 4.313152841965964e-06, + "loss": 0.0594, + "step": 25755 + }, + { + "epoch": 70.17983651226157, + "grad_norm": 2.818070888519287, + "learning_rate": 4.31242696321815e-06, + "loss": 0.0461, + "step": 25756 + }, + { + "epoch": 70.1825613079019, + "grad_norm": 2.1443002223968506, + "learning_rate": 4.311701128764974e-06, + "loss": 0.1193, + "step": 25757 + }, + { + "epoch": 70.18528610354224, + "grad_norm": 5.600152969360352, + "learning_rate": 4.310975338612084e-06, + "loss": 0.1201, + "step": 25758 + }, + { + "epoch": 70.18801089918256, + "grad_norm": 3.2574639320373535, + "learning_rate": 4.310249592765133e-06, + "loss": 0.0676, + "step": 25759 + }, + { + "epoch": 70.19073569482289, + "grad_norm": 2.508854627609253, + "learning_rate": 4.309523891229777e-06, + "loss": 0.0537, + "step": 25760 + }, + { + "epoch": 70.19346049046321, + "grad_norm": 2.628046751022339, + "learning_rate": 4.3087982340116665e-06, + "loss": 0.0623, + "step": 25761 + }, + { + "epoch": 70.19618528610354, + "grad_norm": 3.702197551727295, + "learning_rate": 4.308072621116453e-06, + "loss": 0.1033, + "step": 25762 + }, + { + "epoch": 70.19891008174388, + "grad_norm": 2.7948198318481445, + "learning_rate": 4.307347052549781e-06, + "loss": 0.0927, + "step": 25763 + }, + { + "epoch": 70.2016348773842, + "grad_norm": 4.994749069213867, + "learning_rate": 4.306621528317312e-06, + "loss": 0.041, + "step": 25764 + }, + { + "epoch": 70.20435967302453, + "grad_norm": 2.5164976119995117, + "learning_rate": 4.305896048424691e-06, + "loss": 0.0393, + "step": 25765 + }, + { + "epoch": 70.20708446866485, + "grad_norm": 3.661639451980591, + "learning_rate": 4.305170612877565e-06, + "loss": 0.048, + "step": 25766 + }, + { + "epoch": 70.20980926430518, + "grad_norm": 3.312103033065796, + "learning_rate": 4.304445221681592e-06, + "loss": 0.0444, + "step": 25767 + }, + { + "epoch": 70.2125340599455, + "grad_norm": 2.6454432010650635, + "learning_rate": 4.3037198748424105e-06, + "loss": 0.0386, + "step": 25768 + }, + { + "epoch": 70.21525885558583, + "grad_norm": 2.856839656829834, + "learning_rate": 4.30299457236568e-06, + "loss": 0.0964, + "step": 25769 + }, + { + "epoch": 70.21798365122616, + "grad_norm": 3.4453814029693604, + "learning_rate": 4.302269314257044e-06, + "loss": 0.0806, + "step": 25770 + }, + { + "epoch": 70.22070844686648, + "grad_norm": 3.521606206893921, + "learning_rate": 4.301544100522151e-06, + "loss": 0.0744, + "step": 25771 + }, + { + "epoch": 70.22343324250681, + "grad_norm": 3.4696497917175293, + "learning_rate": 4.300818931166645e-06, + "loss": 0.0745, + "step": 25772 + }, + { + "epoch": 70.22615803814713, + "grad_norm": 4.244225978851318, + "learning_rate": 4.3000938061961825e-06, + "loss": 0.0535, + "step": 25773 + }, + { + "epoch": 70.22888283378747, + "grad_norm": 2.9358582496643066, + "learning_rate": 4.299368725616405e-06, + "loss": 0.0884, + "step": 25774 + }, + { + "epoch": 70.2316076294278, + "grad_norm": 3.3426084518432617, + "learning_rate": 4.298643689432958e-06, + "loss": 0.0664, + "step": 25775 + }, + { + "epoch": 70.23433242506812, + "grad_norm": 3.7609598636627197, + "learning_rate": 4.297918697651493e-06, + "loss": 0.1675, + "step": 25776 + }, + { + "epoch": 70.23705722070845, + "grad_norm": 3.2763009071350098, + "learning_rate": 4.297193750277654e-06, + "loss": 0.1055, + "step": 25777 + }, + { + "epoch": 70.23978201634877, + "grad_norm": 3.5721278190612793, + "learning_rate": 4.296468847317086e-06, + "loss": 0.0665, + "step": 25778 + }, + { + "epoch": 70.2425068119891, + "grad_norm": 3.158398151397705, + "learning_rate": 4.2957439887754325e-06, + "loss": 0.0466, + "step": 25779 + }, + { + "epoch": 70.24523160762942, + "grad_norm": 2.066787004470825, + "learning_rate": 4.295019174658344e-06, + "loss": 0.154, + "step": 25780 + }, + { + "epoch": 70.24795640326975, + "grad_norm": 3.3044679164886475, + "learning_rate": 4.294294404971464e-06, + "loss": 0.1755, + "step": 25781 + }, + { + "epoch": 70.25068119891009, + "grad_norm": 5.466963291168213, + "learning_rate": 4.293569679720434e-06, + "loss": 0.1676, + "step": 25782 + }, + { + "epoch": 70.2534059945504, + "grad_norm": 3.4783709049224854, + "learning_rate": 4.2928449989108964e-06, + "loss": 0.0965, + "step": 25783 + }, + { + "epoch": 70.25613079019074, + "grad_norm": 2.85040283203125, + "learning_rate": 4.292120362548499e-06, + "loss": 0.0299, + "step": 25784 + }, + { + "epoch": 70.25885558583106, + "grad_norm": 2.3949267864227295, + "learning_rate": 4.291395770638888e-06, + "loss": 0.0344, + "step": 25785 + }, + { + "epoch": 70.26158038147139, + "grad_norm": 2.427435874938965, + "learning_rate": 4.290671223187701e-06, + "loss": 0.1092, + "step": 25786 + }, + { + "epoch": 70.26430517711172, + "grad_norm": 2.70589542388916, + "learning_rate": 4.289946720200585e-06, + "loss": 0.1229, + "step": 25787 + }, + { + "epoch": 70.26702997275204, + "grad_norm": 2.6562418937683105, + "learning_rate": 4.289222261683176e-06, + "loss": 0.0531, + "step": 25788 + }, + { + "epoch": 70.26975476839237, + "grad_norm": 2.682788848876953, + "learning_rate": 4.2884978476411235e-06, + "loss": 0.0811, + "step": 25789 + }, + { + "epoch": 70.2724795640327, + "grad_norm": 3.2893130779266357, + "learning_rate": 4.287773478080066e-06, + "loss": 0.0965, + "step": 25790 + }, + { + "epoch": 70.27520435967303, + "grad_norm": 2.856510639190674, + "learning_rate": 4.287049153005644e-06, + "loss": 0.13, + "step": 25791 + }, + { + "epoch": 70.27792915531334, + "grad_norm": 4.285785675048828, + "learning_rate": 4.286324872423497e-06, + "loss": 0.1433, + "step": 25792 + }, + { + "epoch": 70.28065395095368, + "grad_norm": 2.9691834449768066, + "learning_rate": 4.2856006363392726e-06, + "loss": 0.1299, + "step": 25793 + }, + { + "epoch": 70.28337874659401, + "grad_norm": 2.4945054054260254, + "learning_rate": 4.284876444758604e-06, + "loss": 0.0714, + "step": 25794 + }, + { + "epoch": 70.28610354223433, + "grad_norm": 3.0490522384643555, + "learning_rate": 4.284152297687136e-06, + "loss": 0.0664, + "step": 25795 + }, + { + "epoch": 70.28882833787466, + "grad_norm": 4.4501729011535645, + "learning_rate": 4.2834281951305e-06, + "loss": 0.1, + "step": 25796 + }, + { + "epoch": 70.29155313351498, + "grad_norm": 1.6889508962631226, + "learning_rate": 4.2827041370943465e-06, + "loss": 0.0254, + "step": 25797 + }, + { + "epoch": 70.29427792915531, + "grad_norm": 3.197612762451172, + "learning_rate": 4.2819801235843086e-06, + "loss": 0.066, + "step": 25798 + }, + { + "epoch": 70.29700272479565, + "grad_norm": 2.619960308074951, + "learning_rate": 4.2812561546060215e-06, + "loss": 0.0985, + "step": 25799 + }, + { + "epoch": 70.29972752043597, + "grad_norm": 2.725442409515381, + "learning_rate": 4.280532230165132e-06, + "loss": 0.107, + "step": 25800 + }, + { + "epoch": 70.3024523160763, + "grad_norm": 3.8378942012786865, + "learning_rate": 4.2798083502672695e-06, + "loss": 0.062, + "step": 25801 + }, + { + "epoch": 70.30517711171662, + "grad_norm": 2.5743367671966553, + "learning_rate": 4.2790845149180784e-06, + "loss": 0.0678, + "step": 25802 + }, + { + "epoch": 70.30790190735695, + "grad_norm": 2.618525266647339, + "learning_rate": 4.278360724123194e-06, + "loss": 0.0742, + "step": 25803 + }, + { + "epoch": 70.31062670299727, + "grad_norm": 2.9353785514831543, + "learning_rate": 4.277636977888248e-06, + "loss": 0.039, + "step": 25804 + }, + { + "epoch": 70.3133514986376, + "grad_norm": 3.842531204223633, + "learning_rate": 4.276913276218885e-06, + "loss": 0.0964, + "step": 25805 + }, + { + "epoch": 70.31607629427793, + "grad_norm": 4.603367805480957, + "learning_rate": 4.2761896191207365e-06, + "loss": 0.0517, + "step": 25806 + }, + { + "epoch": 70.31880108991825, + "grad_norm": 2.459416151046753, + "learning_rate": 4.275466006599439e-06, + "loss": 0.0362, + "step": 25807 + }, + { + "epoch": 70.32152588555859, + "grad_norm": 3.6822526454925537, + "learning_rate": 4.2747424386606255e-06, + "loss": 0.0474, + "step": 25808 + }, + { + "epoch": 70.3242506811989, + "grad_norm": 3.025571823120117, + "learning_rate": 4.2740189153099355e-06, + "loss": 0.1482, + "step": 25809 + }, + { + "epoch": 70.32697547683924, + "grad_norm": 3.692002296447754, + "learning_rate": 4.2732954365530034e-06, + "loss": 0.1535, + "step": 25810 + }, + { + "epoch": 70.32970027247957, + "grad_norm": 2.6477317810058594, + "learning_rate": 4.2725720023954605e-06, + "loss": 0.0352, + "step": 25811 + }, + { + "epoch": 70.33242506811989, + "grad_norm": 2.575512647628784, + "learning_rate": 4.27184861284294e-06, + "loss": 0.1223, + "step": 25812 + }, + { + "epoch": 70.33514986376022, + "grad_norm": 13.949918746948242, + "learning_rate": 4.271125267901083e-06, + "loss": 0.0697, + "step": 25813 + }, + { + "epoch": 70.33787465940054, + "grad_norm": 2.2304110527038574, + "learning_rate": 4.2704019675755155e-06, + "loss": 0.039, + "step": 25814 + }, + { + "epoch": 70.34059945504087, + "grad_norm": 3.124695062637329, + "learning_rate": 4.269678711871875e-06, + "loss": 0.0675, + "step": 25815 + }, + { + "epoch": 70.34332425068119, + "grad_norm": 6.387601852416992, + "learning_rate": 4.268955500795788e-06, + "loss": 0.0655, + "step": 25816 + }, + { + "epoch": 70.34604904632153, + "grad_norm": 2.7448737621307373, + "learning_rate": 4.268232334352895e-06, + "loss": 0.0449, + "step": 25817 + }, + { + "epoch": 70.34877384196186, + "grad_norm": 2.030609369277954, + "learning_rate": 4.267509212548821e-06, + "loss": 0.0385, + "step": 25818 + }, + { + "epoch": 70.35149863760218, + "grad_norm": 2.8909125328063965, + "learning_rate": 4.266786135389203e-06, + "loss": 0.1641, + "step": 25819 + }, + { + "epoch": 70.35422343324251, + "grad_norm": 6.593447208404541, + "learning_rate": 4.2660631028796665e-06, + "loss": 0.1597, + "step": 25820 + }, + { + "epoch": 70.35694822888283, + "grad_norm": 2.1756784915924072, + "learning_rate": 4.26534011502585e-06, + "loss": 0.0674, + "step": 25821 + }, + { + "epoch": 70.35967302452316, + "grad_norm": 3.2333314418792725, + "learning_rate": 4.264617171833381e-06, + "loss": 0.2454, + "step": 25822 + }, + { + "epoch": 70.3623978201635, + "grad_norm": 2.5491182804107666, + "learning_rate": 4.263894273307888e-06, + "loss": 0.1337, + "step": 25823 + }, + { + "epoch": 70.36512261580381, + "grad_norm": 3.0634193420410156, + "learning_rate": 4.263171419454998e-06, + "loss": 0.0298, + "step": 25824 + }, + { + "epoch": 70.36784741144415, + "grad_norm": 3.094879150390625, + "learning_rate": 4.262448610280348e-06, + "loss": 0.0624, + "step": 25825 + }, + { + "epoch": 70.37057220708446, + "grad_norm": 1.936737060546875, + "learning_rate": 4.261725845789564e-06, + "loss": 0.0263, + "step": 25826 + }, + { + "epoch": 70.3732970027248, + "grad_norm": 5.852288246154785, + "learning_rate": 4.261003125988275e-06, + "loss": 0.0854, + "step": 25827 + }, + { + "epoch": 70.37602179836512, + "grad_norm": 2.6277921199798584, + "learning_rate": 4.260280450882104e-06, + "loss": 0.1037, + "step": 25828 + }, + { + "epoch": 70.37874659400545, + "grad_norm": 4.712032318115234, + "learning_rate": 4.259557820476689e-06, + "loss": 0.0596, + "step": 25829 + }, + { + "epoch": 70.38147138964578, + "grad_norm": 2.8652727603912354, + "learning_rate": 4.258835234777652e-06, + "loss": 0.0579, + "step": 25830 + }, + { + "epoch": 70.3841961852861, + "grad_norm": 2.4967751502990723, + "learning_rate": 4.2581126937906215e-06, + "loss": 0.0493, + "step": 25831 + }, + { + "epoch": 70.38692098092643, + "grad_norm": 3.6561508178710938, + "learning_rate": 4.257390197521221e-06, + "loss": 0.14, + "step": 25832 + }, + { + "epoch": 70.38964577656675, + "grad_norm": 5.42636251449585, + "learning_rate": 4.256667745975084e-06, + "loss": 0.1609, + "step": 25833 + }, + { + "epoch": 70.39237057220708, + "grad_norm": 3.0732507705688477, + "learning_rate": 4.255945339157834e-06, + "loss": 0.0536, + "step": 25834 + }, + { + "epoch": 70.39509536784742, + "grad_norm": 3.269412040710449, + "learning_rate": 4.255222977075094e-06, + "loss": 0.126, + "step": 25835 + }, + { + "epoch": 70.39782016348774, + "grad_norm": 2.7422266006469727, + "learning_rate": 4.254500659732496e-06, + "loss": 0.0561, + "step": 25836 + }, + { + "epoch": 70.40054495912807, + "grad_norm": 3.6423215866088867, + "learning_rate": 4.253778387135658e-06, + "loss": 0.1019, + "step": 25837 + }, + { + "epoch": 70.40326975476839, + "grad_norm": 3.569866418838501, + "learning_rate": 4.253056159290212e-06, + "loss": 0.0896, + "step": 25838 + }, + { + "epoch": 70.40599455040872, + "grad_norm": 3.734497308731079, + "learning_rate": 4.2523339762017805e-06, + "loss": 0.0434, + "step": 25839 + }, + { + "epoch": 70.40871934604904, + "grad_norm": 3.439307689666748, + "learning_rate": 4.2516118378759826e-06, + "loss": 0.1112, + "step": 25840 + }, + { + "epoch": 70.41144414168937, + "grad_norm": 3.146479368209839, + "learning_rate": 4.250889744318452e-06, + "loss": 0.0579, + "step": 25841 + }, + { + "epoch": 70.4141689373297, + "grad_norm": 3.413196086883545, + "learning_rate": 4.2501676955348045e-06, + "loss": 0.0801, + "step": 25842 + }, + { + "epoch": 70.41689373297002, + "grad_norm": 3.2361388206481934, + "learning_rate": 4.249445691530668e-06, + "loss": 0.0838, + "step": 25843 + }, + { + "epoch": 70.41961852861036, + "grad_norm": 3.2097456455230713, + "learning_rate": 4.24872373231166e-06, + "loss": 0.0547, + "step": 25844 + }, + { + "epoch": 70.42234332425068, + "grad_norm": 6.420253276824951, + "learning_rate": 4.248001817883408e-06, + "loss": 0.0391, + "step": 25845 + }, + { + "epoch": 70.42506811989101, + "grad_norm": 3.8383002281188965, + "learning_rate": 4.247279948251534e-06, + "loss": 0.1797, + "step": 25846 + }, + { + "epoch": 70.42779291553134, + "grad_norm": 3.0335421562194824, + "learning_rate": 4.246558123421658e-06, + "loss": 0.1228, + "step": 25847 + }, + { + "epoch": 70.43051771117166, + "grad_norm": 3.270625114440918, + "learning_rate": 4.2458363433994e-06, + "loss": 0.0631, + "step": 25848 + }, + { + "epoch": 70.433242506812, + "grad_norm": 2.877497673034668, + "learning_rate": 4.245114608190385e-06, + "loss": 0.1059, + "step": 25849 + }, + { + "epoch": 70.43596730245231, + "grad_norm": 3.6067934036254883, + "learning_rate": 4.244392917800234e-06, + "loss": 0.1098, + "step": 25850 + }, + { + "epoch": 70.43869209809264, + "grad_norm": 2.9734182357788086, + "learning_rate": 4.243671272234564e-06, + "loss": 0.0341, + "step": 25851 + }, + { + "epoch": 70.44141689373296, + "grad_norm": 2.876863718032837, + "learning_rate": 4.242949671498995e-06, + "loss": 0.0609, + "step": 25852 + }, + { + "epoch": 70.4441416893733, + "grad_norm": 2.675910472869873, + "learning_rate": 4.242228115599147e-06, + "loss": 0.0461, + "step": 25853 + }, + { + "epoch": 70.44686648501363, + "grad_norm": 2.7128145694732666, + "learning_rate": 4.2415066045406465e-06, + "loss": 0.0781, + "step": 25854 + }, + { + "epoch": 70.44959128065395, + "grad_norm": 3.816506862640381, + "learning_rate": 4.2407851383291055e-06, + "loss": 0.1031, + "step": 25855 + }, + { + "epoch": 70.45231607629428, + "grad_norm": 3.5927624702453613, + "learning_rate": 4.240063716970145e-06, + "loss": 0.1814, + "step": 25856 + }, + { + "epoch": 70.4550408719346, + "grad_norm": 2.925413131713867, + "learning_rate": 4.23934234046938e-06, + "loss": 0.1628, + "step": 25857 + }, + { + "epoch": 70.45776566757493, + "grad_norm": 3.3901381492614746, + "learning_rate": 4.2386210088324355e-06, + "loss": 0.0498, + "step": 25858 + }, + { + "epoch": 70.46049046321527, + "grad_norm": 2.0617852210998535, + "learning_rate": 4.2378997220649235e-06, + "loss": 0.0362, + "step": 25859 + }, + { + "epoch": 70.46321525885558, + "grad_norm": 3.5812828540802, + "learning_rate": 4.23717848017246e-06, + "loss": 0.047, + "step": 25860 + }, + { + "epoch": 70.46594005449592, + "grad_norm": 2.932439088821411, + "learning_rate": 4.236457283160669e-06, + "loss": 0.0564, + "step": 25861 + }, + { + "epoch": 70.46866485013624, + "grad_norm": 2.2549376487731934, + "learning_rate": 4.235736131035163e-06, + "loss": 0.0869, + "step": 25862 + }, + { + "epoch": 70.47138964577657, + "grad_norm": 1.828937292098999, + "learning_rate": 4.235015023801558e-06, + "loss": 0.0252, + "step": 25863 + }, + { + "epoch": 70.47411444141689, + "grad_norm": 4.041618347167969, + "learning_rate": 4.234293961465467e-06, + "loss": 0.0933, + "step": 25864 + }, + { + "epoch": 70.47683923705722, + "grad_norm": 2.6297528743743896, + "learning_rate": 4.233572944032514e-06, + "loss": 0.143, + "step": 25865 + }, + { + "epoch": 70.47956403269755, + "grad_norm": 2.1373395919799805, + "learning_rate": 4.232851971508308e-06, + "loss": 0.0629, + "step": 25866 + }, + { + "epoch": 70.48228882833787, + "grad_norm": 3.39882230758667, + "learning_rate": 4.232131043898465e-06, + "loss": 0.1496, + "step": 25867 + }, + { + "epoch": 70.4850136239782, + "grad_norm": 2.437934398651123, + "learning_rate": 4.231410161208598e-06, + "loss": 0.0359, + "step": 25868 + }, + { + "epoch": 70.48773841961852, + "grad_norm": 2.1555838584899902, + "learning_rate": 4.230689323444322e-06, + "loss": 0.1669, + "step": 25869 + }, + { + "epoch": 70.49046321525886, + "grad_norm": 2.7060513496398926, + "learning_rate": 4.229968530611255e-06, + "loss": 0.1156, + "step": 25870 + }, + { + "epoch": 70.49318801089919, + "grad_norm": 2.6989705562591553, + "learning_rate": 4.229247782715007e-06, + "loss": 0.0523, + "step": 25871 + }, + { + "epoch": 70.49591280653951, + "grad_norm": 2.2723169326782227, + "learning_rate": 4.228527079761192e-06, + "loss": 0.0348, + "step": 25872 + }, + { + "epoch": 70.49863760217984, + "grad_norm": 3.039783477783203, + "learning_rate": 4.2278064217554194e-06, + "loss": 0.0844, + "step": 25873 + }, + { + "epoch": 70.50136239782016, + "grad_norm": 2.909681558609009, + "learning_rate": 4.2270858087033075e-06, + "loss": 0.0731, + "step": 25874 + }, + { + "epoch": 70.50408719346049, + "grad_norm": 3.2307498455047607, + "learning_rate": 4.226365240610465e-06, + "loss": 0.0416, + "step": 25875 + }, + { + "epoch": 70.50681198910081, + "grad_norm": 3.36785626411438, + "learning_rate": 4.225644717482506e-06, + "loss": 0.1876, + "step": 25876 + }, + { + "epoch": 70.50953678474114, + "grad_norm": 3.2695765495300293, + "learning_rate": 4.224924239325035e-06, + "loss": 0.0391, + "step": 25877 + }, + { + "epoch": 70.51226158038148, + "grad_norm": 2.80440092086792, + "learning_rate": 4.224203806143672e-06, + "loss": 0.0435, + "step": 25878 + }, + { + "epoch": 70.5149863760218, + "grad_norm": 3.8948888778686523, + "learning_rate": 4.223483417944024e-06, + "loss": 0.149, + "step": 25879 + }, + { + "epoch": 70.51771117166213, + "grad_norm": 1.9615836143493652, + "learning_rate": 4.2227630747317e-06, + "loss": 0.0629, + "step": 25880 + }, + { + "epoch": 70.52043596730245, + "grad_norm": 2.87920880317688, + "learning_rate": 4.22204277651231e-06, + "loss": 0.0539, + "step": 25881 + }, + { + "epoch": 70.52316076294278, + "grad_norm": 2.286112070083618, + "learning_rate": 4.221322523291467e-06, + "loss": 0.0665, + "step": 25882 + }, + { + "epoch": 70.52588555858311, + "grad_norm": 2.731645107269287, + "learning_rate": 4.2206023150747785e-06, + "loss": 0.1524, + "step": 25883 + }, + { + "epoch": 70.52861035422343, + "grad_norm": 3.801405906677246, + "learning_rate": 4.21988215186785e-06, + "loss": 0.1102, + "step": 25884 + }, + { + "epoch": 70.53133514986376, + "grad_norm": 3.687263250350952, + "learning_rate": 4.2191620336762965e-06, + "loss": 0.1469, + "step": 25885 + }, + { + "epoch": 70.53405994550408, + "grad_norm": 2.582698106765747, + "learning_rate": 4.218441960505723e-06, + "loss": 0.1292, + "step": 25886 + }, + { + "epoch": 70.53678474114442, + "grad_norm": 5.0590410232543945, + "learning_rate": 4.217721932361734e-06, + "loss": 0.0522, + "step": 25887 + }, + { + "epoch": 70.53950953678473, + "grad_norm": 2.432004451751709, + "learning_rate": 4.217001949249944e-06, + "loss": 0.0542, + "step": 25888 + }, + { + "epoch": 70.54223433242507, + "grad_norm": 2.6614952087402344, + "learning_rate": 4.216282011175953e-06, + "loss": 0.1065, + "step": 25889 + }, + { + "epoch": 70.5449591280654, + "grad_norm": 3.007277011871338, + "learning_rate": 4.2155621181453745e-06, + "loss": 0.0856, + "step": 25890 + }, + { + "epoch": 70.54768392370572, + "grad_norm": 3.1674139499664307, + "learning_rate": 4.214842270163813e-06, + "loss": 0.1291, + "step": 25891 + }, + { + "epoch": 70.55040871934605, + "grad_norm": 3.7338919639587402, + "learning_rate": 4.214122467236873e-06, + "loss": 0.151, + "step": 25892 + }, + { + "epoch": 70.55313351498637, + "grad_norm": 3.014159679412842, + "learning_rate": 4.213402709370158e-06, + "loss": 0.1756, + "step": 25893 + }, + { + "epoch": 70.5558583106267, + "grad_norm": 2.431577444076538, + "learning_rate": 4.21268299656928e-06, + "loss": 0.1085, + "step": 25894 + }, + { + "epoch": 70.55858310626704, + "grad_norm": 2.7618846893310547, + "learning_rate": 4.211963328839841e-06, + "loss": 0.0823, + "step": 25895 + }, + { + "epoch": 70.56130790190736, + "grad_norm": 4.54824686050415, + "learning_rate": 4.2112437061874445e-06, + "loss": 0.0673, + "step": 25896 + }, + { + "epoch": 70.56403269754769, + "grad_norm": 3.0391998291015625, + "learning_rate": 4.210524128617692e-06, + "loss": 0.0446, + "step": 25897 + }, + { + "epoch": 70.566757493188, + "grad_norm": 2.9395833015441895, + "learning_rate": 4.209804596136195e-06, + "loss": 0.091, + "step": 25898 + }, + { + "epoch": 70.56948228882834, + "grad_norm": 3.116922616958618, + "learning_rate": 4.209085108748554e-06, + "loss": 0.0931, + "step": 25899 + }, + { + "epoch": 70.57220708446866, + "grad_norm": 5.059455394744873, + "learning_rate": 4.208365666460371e-06, + "loss": 0.0735, + "step": 25900 + }, + { + "epoch": 70.57493188010899, + "grad_norm": 2.790809392929077, + "learning_rate": 4.207646269277247e-06, + "loss": 0.0394, + "step": 25901 + }, + { + "epoch": 70.57765667574932, + "grad_norm": 3.0464560985565186, + "learning_rate": 4.206926917204791e-06, + "loss": 0.0437, + "step": 25902 + }, + { + "epoch": 70.58038147138964, + "grad_norm": 2.7532222270965576, + "learning_rate": 4.2062076102486016e-06, + "loss": 0.1169, + "step": 25903 + }, + { + "epoch": 70.58310626702998, + "grad_norm": 2.997598886489868, + "learning_rate": 4.2054883484142765e-06, + "loss": 0.0469, + "step": 25904 + }, + { + "epoch": 70.5858310626703, + "grad_norm": 2.8382644653320312, + "learning_rate": 4.204769131707422e-06, + "loss": 0.0505, + "step": 25905 + }, + { + "epoch": 70.58855585831063, + "grad_norm": 4.03818416595459, + "learning_rate": 4.204049960133643e-06, + "loss": 0.1391, + "step": 25906 + }, + { + "epoch": 70.59128065395096, + "grad_norm": 3.1195859909057617, + "learning_rate": 4.203330833698536e-06, + "loss": 0.0954, + "step": 25907 + }, + { + "epoch": 70.59400544959128, + "grad_norm": 2.6667582988739014, + "learning_rate": 4.202611752407703e-06, + "loss": 0.0805, + "step": 25908 + }, + { + "epoch": 70.59673024523161, + "grad_norm": 3.4228203296661377, + "learning_rate": 4.201892716266738e-06, + "loss": 0.0639, + "step": 25909 + }, + { + "epoch": 70.59945504087193, + "grad_norm": 2.626016855239868, + "learning_rate": 4.2011737252812505e-06, + "loss": 0.1139, + "step": 25910 + }, + { + "epoch": 70.60217983651226, + "grad_norm": 3.4347877502441406, + "learning_rate": 4.200454779456834e-06, + "loss": 0.0523, + "step": 25911 + }, + { + "epoch": 70.60490463215258, + "grad_norm": 3.0663342475891113, + "learning_rate": 4.199735878799091e-06, + "loss": 0.2209, + "step": 25912 + }, + { + "epoch": 70.60762942779292, + "grad_norm": 3.306182384490967, + "learning_rate": 4.199017023313613e-06, + "loss": 0.0766, + "step": 25913 + }, + { + "epoch": 70.61035422343325, + "grad_norm": 4.746140956878662, + "learning_rate": 4.198298213006008e-06, + "loss": 0.0685, + "step": 25914 + }, + { + "epoch": 70.61307901907357, + "grad_norm": 3.576681613922119, + "learning_rate": 4.19757944788187e-06, + "loss": 0.0785, + "step": 25915 + }, + { + "epoch": 70.6158038147139, + "grad_norm": 2.961754083633423, + "learning_rate": 4.196860727946796e-06, + "loss": 0.0369, + "step": 25916 + }, + { + "epoch": 70.61852861035422, + "grad_norm": 2.2688803672790527, + "learning_rate": 4.19614205320638e-06, + "loss": 0.0481, + "step": 25917 + }, + { + "epoch": 70.62125340599455, + "grad_norm": 2.811814785003662, + "learning_rate": 4.1954234236662275e-06, + "loss": 0.0391, + "step": 25918 + }, + { + "epoch": 70.62397820163488, + "grad_norm": 4.069333553314209, + "learning_rate": 4.19470483933193e-06, + "loss": 0.1037, + "step": 25919 + }, + { + "epoch": 70.6267029972752, + "grad_norm": 2.943814992904663, + "learning_rate": 4.193986300209084e-06, + "loss": 0.0365, + "step": 25920 + }, + { + "epoch": 70.62942779291554, + "grad_norm": 6.791131496429443, + "learning_rate": 4.193267806303283e-06, + "loss": 0.0644, + "step": 25921 + }, + { + "epoch": 70.63215258855585, + "grad_norm": 4.604465007781982, + "learning_rate": 4.192549357620125e-06, + "loss": 0.0799, + "step": 25922 + }, + { + "epoch": 70.63487738419619, + "grad_norm": 2.72743821144104, + "learning_rate": 4.19183095416521e-06, + "loss": 0.0838, + "step": 25923 + }, + { + "epoch": 70.6376021798365, + "grad_norm": 2.7363224029541016, + "learning_rate": 4.191112595944128e-06, + "loss": 0.043, + "step": 25924 + }, + { + "epoch": 70.64032697547684, + "grad_norm": 2.6797404289245605, + "learning_rate": 4.19039428296247e-06, + "loss": 0.0378, + "step": 25925 + }, + { + "epoch": 70.64305177111717, + "grad_norm": 2.8015358448028564, + "learning_rate": 4.189676015225838e-06, + "loss": 0.0956, + "step": 25926 + }, + { + "epoch": 70.64577656675749, + "grad_norm": 2.488412380218506, + "learning_rate": 4.188957792739824e-06, + "loss": 0.074, + "step": 25927 + }, + { + "epoch": 70.64850136239782, + "grad_norm": 2.5805211067199707, + "learning_rate": 4.188239615510018e-06, + "loss": 0.0305, + "step": 25928 + }, + { + "epoch": 70.65122615803814, + "grad_norm": 2.696093797683716, + "learning_rate": 4.1875214835420116e-06, + "loss": 0.0352, + "step": 25929 + }, + { + "epoch": 70.65395095367847, + "grad_norm": 3.0278303623199463, + "learning_rate": 4.186803396841405e-06, + "loss": 0.1216, + "step": 25930 + }, + { + "epoch": 70.65667574931881, + "grad_norm": 3.1114132404327393, + "learning_rate": 4.186085355413785e-06, + "loss": 0.0631, + "step": 25931 + }, + { + "epoch": 70.65940054495913, + "grad_norm": 3.6098079681396484, + "learning_rate": 4.185367359264746e-06, + "loss": 0.0503, + "step": 25932 + }, + { + "epoch": 70.66212534059946, + "grad_norm": 3.1527180671691895, + "learning_rate": 4.184649408399876e-06, + "loss": 0.069, + "step": 25933 + }, + { + "epoch": 70.66485013623978, + "grad_norm": 4.23618745803833, + "learning_rate": 4.183931502824772e-06, + "loss": 0.053, + "step": 25934 + }, + { + "epoch": 70.66757493188011, + "grad_norm": 3.9020419120788574, + "learning_rate": 4.183213642545022e-06, + "loss": 0.0759, + "step": 25935 + }, + { + "epoch": 70.67029972752043, + "grad_norm": 2.308504819869995, + "learning_rate": 4.182495827566217e-06, + "loss": 0.046, + "step": 25936 + }, + { + "epoch": 70.67302452316076, + "grad_norm": 1.9191436767578125, + "learning_rate": 4.181778057893944e-06, + "loss": 0.0359, + "step": 25937 + }, + { + "epoch": 70.6757493188011, + "grad_norm": 3.608513832092285, + "learning_rate": 4.1810603335337964e-06, + "loss": 0.0914, + "step": 25938 + }, + { + "epoch": 70.67847411444141, + "grad_norm": 3.003201961517334, + "learning_rate": 4.180342654491368e-06, + "loss": 0.0913, + "step": 25939 + }, + { + "epoch": 70.68119891008175, + "grad_norm": 3.0630545616149902, + "learning_rate": 4.179625020772242e-06, + "loss": 0.0898, + "step": 25940 + }, + { + "epoch": 70.68392370572207, + "grad_norm": 2.7549078464508057, + "learning_rate": 4.17890743238201e-06, + "loss": 0.1082, + "step": 25941 + }, + { + "epoch": 70.6866485013624, + "grad_norm": 3.135922431945801, + "learning_rate": 4.178189889326255e-06, + "loss": 0.1457, + "step": 25942 + }, + { + "epoch": 70.68937329700273, + "grad_norm": 3.149646043777466, + "learning_rate": 4.177472391610574e-06, + "loss": 0.1164, + "step": 25943 + }, + { + "epoch": 70.69209809264305, + "grad_norm": 2.631542444229126, + "learning_rate": 4.176754939240552e-06, + "loss": 0.0353, + "step": 25944 + }, + { + "epoch": 70.69482288828338, + "grad_norm": 3.2081425189971924, + "learning_rate": 4.176037532221772e-06, + "loss": 0.097, + "step": 25945 + }, + { + "epoch": 70.6975476839237, + "grad_norm": 3.6365292072296143, + "learning_rate": 4.175320170559823e-06, + "loss": 0.041, + "step": 25946 + }, + { + "epoch": 70.70027247956403, + "grad_norm": 2.3372373580932617, + "learning_rate": 4.174602854260297e-06, + "loss": 0.0653, + "step": 25947 + }, + { + "epoch": 70.70299727520435, + "grad_norm": 2.405831813812256, + "learning_rate": 4.173885583328775e-06, + "loss": 0.0461, + "step": 25948 + }, + { + "epoch": 70.70572207084469, + "grad_norm": 2.79573392868042, + "learning_rate": 4.173168357770842e-06, + "loss": 0.0835, + "step": 25949 + }, + { + "epoch": 70.70844686648502, + "grad_norm": 2.502190351486206, + "learning_rate": 4.172451177592089e-06, + "loss": 0.0775, + "step": 25950 + }, + { + "epoch": 70.71117166212534, + "grad_norm": 3.4877779483795166, + "learning_rate": 4.171734042798099e-06, + "loss": 0.075, + "step": 25951 + }, + { + "epoch": 70.71389645776567, + "grad_norm": 2.578361749649048, + "learning_rate": 4.171016953394457e-06, + "loss": 0.0379, + "step": 25952 + }, + { + "epoch": 70.71662125340599, + "grad_norm": 2.6028637886047363, + "learning_rate": 4.1702999093867435e-06, + "loss": 0.0482, + "step": 25953 + }, + { + "epoch": 70.71934604904632, + "grad_norm": 3.591414451599121, + "learning_rate": 4.169582910780551e-06, + "loss": 0.0986, + "step": 25954 + }, + { + "epoch": 70.72207084468666, + "grad_norm": 3.5944488048553467, + "learning_rate": 4.1688659575814535e-06, + "loss": 0.0641, + "step": 25955 + }, + { + "epoch": 70.72479564032697, + "grad_norm": 2.303833484649658, + "learning_rate": 4.168149049795046e-06, + "loss": 0.0593, + "step": 25956 + }, + { + "epoch": 70.7275204359673, + "grad_norm": 2.972484827041626, + "learning_rate": 4.1674321874269055e-06, + "loss": 0.0712, + "step": 25957 + }, + { + "epoch": 70.73024523160763, + "grad_norm": 3.417473793029785, + "learning_rate": 4.166715370482611e-06, + "loss": 0.0587, + "step": 25958 + }, + { + "epoch": 70.73297002724796, + "grad_norm": 3.3364315032958984, + "learning_rate": 4.165998598967754e-06, + "loss": 0.0787, + "step": 25959 + }, + { + "epoch": 70.73569482288828, + "grad_norm": 3.5824971199035645, + "learning_rate": 4.165281872887912e-06, + "loss": 0.0763, + "step": 25960 + }, + { + "epoch": 70.73841961852861, + "grad_norm": 2.5481116771698, + "learning_rate": 4.164565192248667e-06, + "loss": 0.0489, + "step": 25961 + }, + { + "epoch": 70.74114441416894, + "grad_norm": 3.1502392292022705, + "learning_rate": 4.163848557055596e-06, + "loss": 0.1133, + "step": 25962 + }, + { + "epoch": 70.74386920980926, + "grad_norm": 2.2232277393341064, + "learning_rate": 4.163131967314289e-06, + "loss": 0.0336, + "step": 25963 + }, + { + "epoch": 70.7465940054496, + "grad_norm": 2.860795259475708, + "learning_rate": 4.162415423030321e-06, + "loss": 0.0461, + "step": 25964 + }, + { + "epoch": 70.74931880108991, + "grad_norm": 2.332071542739868, + "learning_rate": 4.161698924209275e-06, + "loss": 0.0678, + "step": 25965 + }, + { + "epoch": 70.75204359673025, + "grad_norm": 3.48745059967041, + "learning_rate": 4.160982470856727e-06, + "loss": 0.1695, + "step": 25966 + }, + { + "epoch": 70.75476839237058, + "grad_norm": 3.1752967834472656, + "learning_rate": 4.160266062978262e-06, + "loss": 0.1834, + "step": 25967 + }, + { + "epoch": 70.7574931880109, + "grad_norm": 3.0846974849700928, + "learning_rate": 4.159549700579459e-06, + "loss": 0.0219, + "step": 25968 + }, + { + "epoch": 70.76021798365123, + "grad_norm": 3.33652925491333, + "learning_rate": 4.158833383665892e-06, + "loss": 0.0914, + "step": 25969 + }, + { + "epoch": 70.76294277929155, + "grad_norm": 2.3236277103424072, + "learning_rate": 4.158117112243141e-06, + "loss": 0.0824, + "step": 25970 + }, + { + "epoch": 70.76566757493188, + "grad_norm": 4.714158058166504, + "learning_rate": 4.157400886316788e-06, + "loss": 0.1673, + "step": 25971 + }, + { + "epoch": 70.7683923705722, + "grad_norm": 2.822706460952759, + "learning_rate": 4.15668470589241e-06, + "loss": 0.0381, + "step": 25972 + }, + { + "epoch": 70.77111716621253, + "grad_norm": 3.422696113586426, + "learning_rate": 4.15596857097558e-06, + "loss": 0.0576, + "step": 25973 + }, + { + "epoch": 70.77384196185287, + "grad_norm": 2.4212465286254883, + "learning_rate": 4.155252481571878e-06, + "loss": 0.0307, + "step": 25974 + }, + { + "epoch": 70.77656675749319, + "grad_norm": 2.283277988433838, + "learning_rate": 4.154536437686886e-06, + "loss": 0.0396, + "step": 25975 + }, + { + "epoch": 70.77929155313352, + "grad_norm": 2.959416151046753, + "learning_rate": 4.153820439326175e-06, + "loss": 0.0521, + "step": 25976 + }, + { + "epoch": 70.78201634877384, + "grad_norm": 2.2339015007019043, + "learning_rate": 4.153104486495323e-06, + "loss": 0.0343, + "step": 25977 + }, + { + "epoch": 70.78474114441417, + "grad_norm": 2.94073748588562, + "learning_rate": 4.152388579199901e-06, + "loss": 0.0439, + "step": 25978 + }, + { + "epoch": 70.7874659400545, + "grad_norm": 3.225032329559326, + "learning_rate": 4.151672717445493e-06, + "loss": 0.1102, + "step": 25979 + }, + { + "epoch": 70.79019073569482, + "grad_norm": 3.0006580352783203, + "learning_rate": 4.150956901237668e-06, + "loss": 0.1253, + "step": 25980 + }, + { + "epoch": 70.79291553133515, + "grad_norm": 3.542045831680298, + "learning_rate": 4.1502411305820035e-06, + "loss": 0.0784, + "step": 25981 + }, + { + "epoch": 70.79564032697547, + "grad_norm": 3.6604087352752686, + "learning_rate": 4.1495254054840696e-06, + "loss": 0.2117, + "step": 25982 + }, + { + "epoch": 70.7983651226158, + "grad_norm": 2.596848249435425, + "learning_rate": 4.1488097259494464e-06, + "loss": 0.0434, + "step": 25983 + }, + { + "epoch": 70.80108991825612, + "grad_norm": 2.6084728240966797, + "learning_rate": 4.148094091983705e-06, + "loss": 0.1646, + "step": 25984 + }, + { + "epoch": 70.80381471389646, + "grad_norm": 3.3621985912323, + "learning_rate": 4.147378503592418e-06, + "loss": 0.1964, + "step": 25985 + }, + { + "epoch": 70.80653950953679, + "grad_norm": 3.769082546234131, + "learning_rate": 4.146662960781156e-06, + "loss": 0.0913, + "step": 25986 + }, + { + "epoch": 70.80926430517711, + "grad_norm": 2.646458864212036, + "learning_rate": 4.145947463555499e-06, + "loss": 0.0423, + "step": 25987 + }, + { + "epoch": 70.81198910081744, + "grad_norm": 4.7483391761779785, + "learning_rate": 4.1452320119210136e-06, + "loss": 0.0302, + "step": 25988 + }, + { + "epoch": 70.81471389645776, + "grad_norm": 3.348487138748169, + "learning_rate": 4.144516605883272e-06, + "loss": 0.0766, + "step": 25989 + }, + { + "epoch": 70.8174386920981, + "grad_norm": 3.6103594303131104, + "learning_rate": 4.14380124544784e-06, + "loss": 0.1516, + "step": 25990 + }, + { + "epoch": 70.82016348773843, + "grad_norm": 3.0230557918548584, + "learning_rate": 4.143085930620303e-06, + "loss": 0.1126, + "step": 25991 + }, + { + "epoch": 70.82288828337875, + "grad_norm": 5.467724800109863, + "learning_rate": 4.142370661406224e-06, + "loss": 0.0657, + "step": 25992 + }, + { + "epoch": 70.82561307901908, + "grad_norm": 3.4226467609405518, + "learning_rate": 4.141655437811174e-06, + "loss": 0.1201, + "step": 25993 + }, + { + "epoch": 70.8283378746594, + "grad_norm": 3.245389223098755, + "learning_rate": 4.140940259840719e-06, + "loss": 0.1575, + "step": 25994 + }, + { + "epoch": 70.83106267029973, + "grad_norm": 2.476825475692749, + "learning_rate": 4.140225127500437e-06, + "loss": 0.0518, + "step": 25995 + }, + { + "epoch": 70.83378746594005, + "grad_norm": 3.047578811645508, + "learning_rate": 4.139510040795892e-06, + "loss": 0.0637, + "step": 25996 + }, + { + "epoch": 70.83651226158038, + "grad_norm": 2.880866765975952, + "learning_rate": 4.138794999732655e-06, + "loss": 0.0289, + "step": 25997 + }, + { + "epoch": 70.83923705722071, + "grad_norm": 3.4764673709869385, + "learning_rate": 4.138080004316289e-06, + "loss": 0.079, + "step": 25998 + }, + { + "epoch": 70.84196185286103, + "grad_norm": 3.865513324737549, + "learning_rate": 4.137365054552372e-06, + "loss": 0.1019, + "step": 25999 + }, + { + "epoch": 70.84468664850137, + "grad_norm": 2.4694693088531494, + "learning_rate": 4.136650150446468e-06, + "loss": 0.0377, + "step": 26000 + }, + { + "epoch": 70.84741144414168, + "grad_norm": 3.7884268760681152, + "learning_rate": 4.135935292004143e-06, + "loss": 0.1641, + "step": 26001 + }, + { + "epoch": 70.85013623978202, + "grad_norm": 2.340000629425049, + "learning_rate": 4.135220479230961e-06, + "loss": 0.076, + "step": 26002 + }, + { + "epoch": 70.85286103542235, + "grad_norm": 2.3376033306121826, + "learning_rate": 4.134505712132498e-06, + "loss": 0.0408, + "step": 26003 + }, + { + "epoch": 70.85558583106267, + "grad_norm": 2.3368735313415527, + "learning_rate": 4.133790990714316e-06, + "loss": 0.0497, + "step": 26004 + }, + { + "epoch": 70.858310626703, + "grad_norm": 3.3468737602233887, + "learning_rate": 4.133076314981979e-06, + "loss": 0.1053, + "step": 26005 + }, + { + "epoch": 70.86103542234332, + "grad_norm": 2.214991569519043, + "learning_rate": 4.132361684941053e-06, + "loss": 0.0491, + "step": 26006 + }, + { + "epoch": 70.86376021798365, + "grad_norm": 2.790736675262451, + "learning_rate": 4.131647100597105e-06, + "loss": 0.0403, + "step": 26007 + }, + { + "epoch": 70.86648501362397, + "grad_norm": 3.3679144382476807, + "learning_rate": 4.130932561955704e-06, + "loss": 0.158, + "step": 26008 + }, + { + "epoch": 70.8692098092643, + "grad_norm": 2.829746723175049, + "learning_rate": 4.13021806902241e-06, + "loss": 0.0355, + "step": 26009 + }, + { + "epoch": 70.87193460490464, + "grad_norm": 3.5523321628570557, + "learning_rate": 4.12950362180279e-06, + "loss": 0.0962, + "step": 26010 + }, + { + "epoch": 70.87465940054496, + "grad_norm": 2.690026044845581, + "learning_rate": 4.128789220302404e-06, + "loss": 0.0773, + "step": 26011 + }, + { + "epoch": 70.87738419618529, + "grad_norm": 2.1563637256622314, + "learning_rate": 4.128074864526821e-06, + "loss": 0.0261, + "step": 26012 + }, + { + "epoch": 70.88010899182561, + "grad_norm": 3.8262779712677, + "learning_rate": 4.127360554481602e-06, + "loss": 0.1447, + "step": 26013 + }, + { + "epoch": 70.88283378746594, + "grad_norm": 2.838820695877075, + "learning_rate": 4.126646290172307e-06, + "loss": 0.0839, + "step": 26014 + }, + { + "epoch": 70.88555858310627, + "grad_norm": 2.9895541667938232, + "learning_rate": 4.125932071604505e-06, + "loss": 0.0793, + "step": 26015 + }, + { + "epoch": 70.88828337874659, + "grad_norm": 5.860555171966553, + "learning_rate": 4.125217898783756e-06, + "loss": 0.0819, + "step": 26016 + }, + { + "epoch": 70.89100817438693, + "grad_norm": 3.254020929336548, + "learning_rate": 4.124503771715619e-06, + "loss": 0.0414, + "step": 26017 + }, + { + "epoch": 70.89373297002724, + "grad_norm": 3.3897457122802734, + "learning_rate": 4.123789690405655e-06, + "loss": 0.0878, + "step": 26018 + }, + { + "epoch": 70.89645776566758, + "grad_norm": 4.130880832672119, + "learning_rate": 4.1230756548594305e-06, + "loss": 0.0962, + "step": 26019 + }, + { + "epoch": 70.8991825613079, + "grad_norm": 2.7152228355407715, + "learning_rate": 4.122361665082505e-06, + "loss": 0.0319, + "step": 26020 + }, + { + "epoch": 70.90190735694823, + "grad_norm": 2.5247933864593506, + "learning_rate": 4.121647721080436e-06, + "loss": 0.0282, + "step": 26021 + }, + { + "epoch": 70.90463215258856, + "grad_norm": 3.517009973526001, + "learning_rate": 4.120933822858784e-06, + "loss": 0.127, + "step": 26022 + }, + { + "epoch": 70.90735694822888, + "grad_norm": 2.396376132965088, + "learning_rate": 4.120219970423112e-06, + "loss": 0.205, + "step": 26023 + }, + { + "epoch": 70.91008174386921, + "grad_norm": 3.3002827167510986, + "learning_rate": 4.119506163778974e-06, + "loss": 0.0691, + "step": 26024 + }, + { + "epoch": 70.91280653950953, + "grad_norm": 3.1291379928588867, + "learning_rate": 4.1187924029319374e-06, + "loss": 0.0411, + "step": 26025 + }, + { + "epoch": 70.91553133514986, + "grad_norm": 5.469636917114258, + "learning_rate": 4.118078687887556e-06, + "loss": 0.055, + "step": 26026 + }, + { + "epoch": 70.9182561307902, + "grad_norm": 2.640181064605713, + "learning_rate": 4.117365018651385e-06, + "loss": 0.0946, + "step": 26027 + }, + { + "epoch": 70.92098092643052, + "grad_norm": 3.6619114875793457, + "learning_rate": 4.1166513952289885e-06, + "loss": 0.0475, + "step": 26028 + }, + { + "epoch": 70.92370572207085, + "grad_norm": 3.9255616664886475, + "learning_rate": 4.115937817625923e-06, + "loss": 0.1015, + "step": 26029 + }, + { + "epoch": 70.92643051771117, + "grad_norm": 2.6056079864501953, + "learning_rate": 4.1152242858477435e-06, + "loss": 0.2065, + "step": 26030 + }, + { + "epoch": 70.9291553133515, + "grad_norm": 3.3639891147613525, + "learning_rate": 4.114510799900003e-06, + "loss": 0.0343, + "step": 26031 + }, + { + "epoch": 70.93188010899182, + "grad_norm": 3.2747297286987305, + "learning_rate": 4.113797359788269e-06, + "loss": 0.055, + "step": 26032 + }, + { + "epoch": 70.93460490463215, + "grad_norm": 2.6767966747283936, + "learning_rate": 4.11308396551809e-06, + "loss": 0.0361, + "step": 26033 + }, + { + "epoch": 70.93732970027249, + "grad_norm": 3.1328749656677246, + "learning_rate": 4.11237061709502e-06, + "loss": 0.0398, + "step": 26034 + }, + { + "epoch": 70.9400544959128, + "grad_norm": 3.5282037258148193, + "learning_rate": 4.111657314524623e-06, + "loss": 0.069, + "step": 26035 + }, + { + "epoch": 70.94277929155314, + "grad_norm": 2.897711992263794, + "learning_rate": 4.110944057812449e-06, + "loss": 0.0635, + "step": 26036 + }, + { + "epoch": 70.94550408719346, + "grad_norm": 2.598701238632202, + "learning_rate": 4.110230846964053e-06, + "loss": 0.082, + "step": 26037 + }, + { + "epoch": 70.94822888283379, + "grad_norm": 3.073129653930664, + "learning_rate": 4.109517681984986e-06, + "loss": 0.0628, + "step": 26038 + }, + { + "epoch": 70.95095367847412, + "grad_norm": 2.4614381790161133, + "learning_rate": 4.108804562880809e-06, + "loss": 0.0339, + "step": 26039 + }, + { + "epoch": 70.95367847411444, + "grad_norm": 4.100926876068115, + "learning_rate": 4.108091489657072e-06, + "loss": 0.1, + "step": 26040 + }, + { + "epoch": 70.95640326975477, + "grad_norm": 5.091050624847412, + "learning_rate": 4.107378462319327e-06, + "loss": 0.1347, + "step": 26041 + }, + { + "epoch": 70.95912806539509, + "grad_norm": 12.523394584655762, + "learning_rate": 4.106665480873131e-06, + "loss": 0.0619, + "step": 26042 + }, + { + "epoch": 70.96185286103542, + "grad_norm": 4.1175103187561035, + "learning_rate": 4.105952545324031e-06, + "loss": 0.1031, + "step": 26043 + }, + { + "epoch": 70.96457765667574, + "grad_norm": 3.6107232570648193, + "learning_rate": 4.105239655677586e-06, + "loss": 0.1041, + "step": 26044 + }, + { + "epoch": 70.96730245231608, + "grad_norm": 3.0365426540374756, + "learning_rate": 4.104526811939347e-06, + "loss": 0.0681, + "step": 26045 + }, + { + "epoch": 70.97002724795641, + "grad_norm": 2.794994592666626, + "learning_rate": 4.103814014114862e-06, + "loss": 0.0465, + "step": 26046 + }, + { + "epoch": 70.97275204359673, + "grad_norm": 5.480357646942139, + "learning_rate": 4.10310126220968e-06, + "loss": 0.1777, + "step": 26047 + }, + { + "epoch": 70.97547683923706, + "grad_norm": 4.1183061599731445, + "learning_rate": 4.102388556229358e-06, + "loss": 0.1387, + "step": 26048 + }, + { + "epoch": 70.97820163487738, + "grad_norm": 2.9127626419067383, + "learning_rate": 4.101675896179446e-06, + "loss": 0.0362, + "step": 26049 + }, + { + "epoch": 70.98092643051771, + "grad_norm": 3.8233654499053955, + "learning_rate": 4.100963282065492e-06, + "loss": 0.25, + "step": 26050 + }, + { + "epoch": 70.98365122615803, + "grad_norm": 2.501060724258423, + "learning_rate": 4.100250713893043e-06, + "loss": 0.0319, + "step": 26051 + }, + { + "epoch": 70.98637602179836, + "grad_norm": 4.0335516929626465, + "learning_rate": 4.099538191667654e-06, + "loss": 0.0705, + "step": 26052 + }, + { + "epoch": 70.9891008174387, + "grad_norm": 2.2477872371673584, + "learning_rate": 4.098825715394872e-06, + "loss": 0.0394, + "step": 26053 + }, + { + "epoch": 70.99182561307902, + "grad_norm": 2.850425958633423, + "learning_rate": 4.098113285080245e-06, + "loss": 0.0631, + "step": 26054 + }, + { + "epoch": 70.99455040871935, + "grad_norm": 3.4741532802581787, + "learning_rate": 4.097400900729319e-06, + "loss": 0.2365, + "step": 26055 + }, + { + "epoch": 70.99727520435967, + "grad_norm": 3.390138864517212, + "learning_rate": 4.0966885623476485e-06, + "loss": 0.0896, + "step": 26056 + }, + { + "epoch": 71.0, + "grad_norm": 7.1555657386779785, + "learning_rate": 4.095976269940777e-06, + "loss": 0.1655, + "step": 26057 + }, + { + "epoch": 71.00272479564033, + "grad_norm": 2.8527214527130127, + "learning_rate": 4.095264023514248e-06, + "loss": 0.0885, + "step": 26058 + }, + { + "epoch": 71.00544959128065, + "grad_norm": 3.099708318710327, + "learning_rate": 4.094551823073614e-06, + "loss": 0.1058, + "step": 26059 + }, + { + "epoch": 71.00817438692098, + "grad_norm": 1.9717785120010376, + "learning_rate": 4.093839668624423e-06, + "loss": 0.0329, + "step": 26060 + }, + { + "epoch": 71.0108991825613, + "grad_norm": 2.0244579315185547, + "learning_rate": 4.0931275601722194e-06, + "loss": 0.0348, + "step": 26061 + }, + { + "epoch": 71.01362397820164, + "grad_norm": 2.797454595565796, + "learning_rate": 4.092415497722547e-06, + "loss": 0.0442, + "step": 26062 + }, + { + "epoch": 71.01634877384195, + "grad_norm": 3.133096694946289, + "learning_rate": 4.091703481280951e-06, + "loss": 0.0616, + "step": 26063 + }, + { + "epoch": 71.01907356948229, + "grad_norm": 3.9310803413391113, + "learning_rate": 4.090991510852979e-06, + "loss": 0.1391, + "step": 26064 + }, + { + "epoch": 71.02179836512262, + "grad_norm": 4.202494144439697, + "learning_rate": 4.090279586444177e-06, + "loss": 0.0672, + "step": 26065 + }, + { + "epoch": 71.02452316076294, + "grad_norm": 4.340561389923096, + "learning_rate": 4.089567708060087e-06, + "loss": 0.0555, + "step": 26066 + }, + { + "epoch": 71.02724795640327, + "grad_norm": 3.2145681381225586, + "learning_rate": 4.08885587570625e-06, + "loss": 0.0755, + "step": 26067 + }, + { + "epoch": 71.02997275204359, + "grad_norm": 2.5824227333068848, + "learning_rate": 4.088144089388216e-06, + "loss": 0.1028, + "step": 26068 + }, + { + "epoch": 71.03269754768392, + "grad_norm": 3.8116767406463623, + "learning_rate": 4.087432349111527e-06, + "loss": 0.0409, + "step": 26069 + }, + { + "epoch": 71.03542234332426, + "grad_norm": 2.5581002235412598, + "learning_rate": 4.086720654881723e-06, + "loss": 0.0396, + "step": 26070 + }, + { + "epoch": 71.03814713896458, + "grad_norm": 2.855933427810669, + "learning_rate": 4.086009006704345e-06, + "loss": 0.0517, + "step": 26071 + }, + { + "epoch": 71.04087193460491, + "grad_norm": 2.431560516357422, + "learning_rate": 4.085297404584942e-06, + "loss": 0.0293, + "step": 26072 + }, + { + "epoch": 71.04359673024523, + "grad_norm": 2.369784355163574, + "learning_rate": 4.0845858485290535e-06, + "loss": 0.0846, + "step": 26073 + }, + { + "epoch": 71.04632152588556, + "grad_norm": 2.523799419403076, + "learning_rate": 4.0838743385422195e-06, + "loss": 0.039, + "step": 26074 + }, + { + "epoch": 71.04904632152588, + "grad_norm": 2.0205631256103516, + "learning_rate": 4.083162874629978e-06, + "loss": 0.0347, + "step": 26075 + }, + { + "epoch": 71.05177111716621, + "grad_norm": 2.60185170173645, + "learning_rate": 4.082451456797873e-06, + "loss": 0.0305, + "step": 26076 + }, + { + "epoch": 71.05449591280654, + "grad_norm": 3.9647903442382812, + "learning_rate": 4.08174008505145e-06, + "loss": 0.1401, + "step": 26077 + }, + { + "epoch": 71.05722070844686, + "grad_norm": 4.09466028213501, + "learning_rate": 4.081028759396245e-06, + "loss": 0.0725, + "step": 26078 + }, + { + "epoch": 71.0599455040872, + "grad_norm": 3.022454261779785, + "learning_rate": 4.080317479837793e-06, + "loss": 0.0576, + "step": 26079 + }, + { + "epoch": 71.06267029972751, + "grad_norm": 4.466739654541016, + "learning_rate": 4.079606246381642e-06, + "loss": 0.0723, + "step": 26080 + }, + { + "epoch": 71.06539509536785, + "grad_norm": 3.1590499877929688, + "learning_rate": 4.0788950590333265e-06, + "loss": 0.0515, + "step": 26081 + }, + { + "epoch": 71.06811989100818, + "grad_norm": 2.5963423252105713, + "learning_rate": 4.078183917798386e-06, + "loss": 0.0456, + "step": 26082 + }, + { + "epoch": 71.0708446866485, + "grad_norm": 3.6453804969787598, + "learning_rate": 4.0774728226823556e-06, + "loss": 0.0561, + "step": 26083 + }, + { + "epoch": 71.07356948228883, + "grad_norm": 3.618593215942383, + "learning_rate": 4.07676177369078e-06, + "loss": 0.083, + "step": 26084 + }, + { + "epoch": 71.07629427792915, + "grad_norm": 2.215276002883911, + "learning_rate": 4.076050770829192e-06, + "loss": 0.0389, + "step": 26085 + }, + { + "epoch": 71.07901907356948, + "grad_norm": 3.5353288650512695, + "learning_rate": 4.075339814103131e-06, + "loss": 0.0706, + "step": 26086 + }, + { + "epoch": 71.0817438692098, + "grad_norm": 2.7013566493988037, + "learning_rate": 4.074628903518129e-06, + "loss": 0.0413, + "step": 26087 + }, + { + "epoch": 71.08446866485014, + "grad_norm": 2.762425422668457, + "learning_rate": 4.073918039079729e-06, + "loss": 0.0934, + "step": 26088 + }, + { + "epoch": 71.08719346049047, + "grad_norm": 3.5204782485961914, + "learning_rate": 4.073207220793465e-06, + "loss": 0.0751, + "step": 26089 + }, + { + "epoch": 71.08991825613079, + "grad_norm": 3.8314247131347656, + "learning_rate": 4.072496448664872e-06, + "loss": 0.1176, + "step": 26090 + }, + { + "epoch": 71.09264305177112, + "grad_norm": 1.8714334964752197, + "learning_rate": 4.071785722699484e-06, + "loss": 0.0521, + "step": 26091 + }, + { + "epoch": 71.09536784741144, + "grad_norm": 3.3808674812316895, + "learning_rate": 4.07107504290284e-06, + "loss": 0.0588, + "step": 26092 + }, + { + "epoch": 71.09809264305177, + "grad_norm": 2.3348703384399414, + "learning_rate": 4.0703644092804695e-06, + "loss": 0.1567, + "step": 26093 + }, + { + "epoch": 71.1008174386921, + "grad_norm": 2.7863707542419434, + "learning_rate": 4.069653821837913e-06, + "loss": 0.0605, + "step": 26094 + }, + { + "epoch": 71.10354223433242, + "grad_norm": 3.885864019393921, + "learning_rate": 4.068943280580704e-06, + "loss": 0.1171, + "step": 26095 + }, + { + "epoch": 71.10626702997276, + "grad_norm": 3.8391263484954834, + "learning_rate": 4.068232785514368e-06, + "loss": 0.0768, + "step": 26096 + }, + { + "epoch": 71.10899182561307, + "grad_norm": 6.129915237426758, + "learning_rate": 4.067522336644448e-06, + "loss": 0.0483, + "step": 26097 + }, + { + "epoch": 71.11171662125341, + "grad_norm": 4.418376445770264, + "learning_rate": 4.0668119339764746e-06, + "loss": 0.0855, + "step": 26098 + }, + { + "epoch": 71.11444141689373, + "grad_norm": 2.6548573970794678, + "learning_rate": 4.066101577515974e-06, + "loss": 0.0302, + "step": 26099 + }, + { + "epoch": 71.11716621253406, + "grad_norm": 3.826864004135132, + "learning_rate": 4.065391267268487e-06, + "loss": 0.087, + "step": 26100 + }, + { + "epoch": 71.11989100817439, + "grad_norm": 2.5251123905181885, + "learning_rate": 4.064681003239543e-06, + "loss": 0.1032, + "step": 26101 + }, + { + "epoch": 71.12261580381471, + "grad_norm": 2.869708776473999, + "learning_rate": 4.063970785434671e-06, + "loss": 0.1286, + "step": 26102 + }, + { + "epoch": 71.12534059945504, + "grad_norm": 3.617197275161743, + "learning_rate": 4.0632606138594e-06, + "loss": 0.0651, + "step": 26103 + }, + { + "epoch": 71.12806539509536, + "grad_norm": 1.9999364614486694, + "learning_rate": 4.062550488519268e-06, + "loss": 0.0355, + "step": 26104 + }, + { + "epoch": 71.1307901907357, + "grad_norm": 3.306886672973633, + "learning_rate": 4.0618404094198016e-06, + "loss": 0.0713, + "step": 26105 + }, + { + "epoch": 71.13351498637603, + "grad_norm": 3.030975103378296, + "learning_rate": 4.061130376566531e-06, + "loss": 0.0258, + "step": 26106 + }, + { + "epoch": 71.13623978201635, + "grad_norm": 2.435028076171875, + "learning_rate": 4.060420389964983e-06, + "loss": 0.04, + "step": 26107 + }, + { + "epoch": 71.13896457765668, + "grad_norm": 2.20660400390625, + "learning_rate": 4.059710449620693e-06, + "loss": 0.1839, + "step": 26108 + }, + { + "epoch": 71.141689373297, + "grad_norm": 4.439379692077637, + "learning_rate": 4.0590005555391865e-06, + "loss": 0.1027, + "step": 26109 + }, + { + "epoch": 71.14441416893733, + "grad_norm": 3.1821601390838623, + "learning_rate": 4.0582907077259894e-06, + "loss": 0.1882, + "step": 26110 + }, + { + "epoch": 71.14713896457765, + "grad_norm": 3.6115283966064453, + "learning_rate": 4.057580906186637e-06, + "loss": 0.0664, + "step": 26111 + }, + { + "epoch": 71.14986376021798, + "grad_norm": 3.003767728805542, + "learning_rate": 4.056871150926649e-06, + "loss": 0.0875, + "step": 26112 + }, + { + "epoch": 71.15258855585832, + "grad_norm": 3.3359696865081787, + "learning_rate": 4.056161441951561e-06, + "loss": 0.0916, + "step": 26113 + }, + { + "epoch": 71.15531335149863, + "grad_norm": 2.4242122173309326, + "learning_rate": 4.055451779266896e-06, + "loss": 0.105, + "step": 26114 + }, + { + "epoch": 71.15803814713897, + "grad_norm": 2.911146402359009, + "learning_rate": 4.0547421628781815e-06, + "loss": 0.0528, + "step": 26115 + }, + { + "epoch": 71.16076294277929, + "grad_norm": 3.8165996074676514, + "learning_rate": 4.05403259279094e-06, + "loss": 0.1203, + "step": 26116 + }, + { + "epoch": 71.16348773841962, + "grad_norm": 2.963271379470825, + "learning_rate": 4.053323069010704e-06, + "loss": 0.0522, + "step": 26117 + }, + { + "epoch": 71.16621253405995, + "grad_norm": 2.903336763381958, + "learning_rate": 4.052613591542998e-06, + "loss": 0.0382, + "step": 26118 + }, + { + "epoch": 71.16893732970027, + "grad_norm": 2.796835422515869, + "learning_rate": 4.051904160393345e-06, + "loss": 0.128, + "step": 26119 + }, + { + "epoch": 71.1716621253406, + "grad_norm": 2.7993125915527344, + "learning_rate": 4.051194775567268e-06, + "loss": 0.0348, + "step": 26120 + }, + { + "epoch": 71.17438692098092, + "grad_norm": 3.7094621658325195, + "learning_rate": 4.050485437070297e-06, + "loss": 0.0987, + "step": 26121 + }, + { + "epoch": 71.17711171662125, + "grad_norm": 2.9672060012817383, + "learning_rate": 4.049776144907955e-06, + "loss": 0.0529, + "step": 26122 + }, + { + "epoch": 71.17983651226157, + "grad_norm": 2.5991804599761963, + "learning_rate": 4.0490668990857615e-06, + "loss": 0.0952, + "step": 26123 + }, + { + "epoch": 71.1825613079019, + "grad_norm": 3.1416094303131104, + "learning_rate": 4.048357699609246e-06, + "loss": 0.1398, + "step": 26124 + }, + { + "epoch": 71.18528610354224, + "grad_norm": 2.1139564514160156, + "learning_rate": 4.047648546483931e-06, + "loss": 0.0409, + "step": 26125 + }, + { + "epoch": 71.18801089918256, + "grad_norm": 2.8843088150024414, + "learning_rate": 4.046939439715336e-06, + "loss": 0.0394, + "step": 26126 + }, + { + "epoch": 71.19073569482289, + "grad_norm": 3.3568787574768066, + "learning_rate": 4.046230379308982e-06, + "loss": 0.1828, + "step": 26127 + }, + { + "epoch": 71.19346049046321, + "grad_norm": 2.49369215965271, + "learning_rate": 4.045521365270394e-06, + "loss": 0.1426, + "step": 26128 + }, + { + "epoch": 71.19618528610354, + "grad_norm": 2.4332704544067383, + "learning_rate": 4.044812397605098e-06, + "loss": 0.0322, + "step": 26129 + }, + { + "epoch": 71.19891008174388, + "grad_norm": 4.03870153427124, + "learning_rate": 4.044103476318612e-06, + "loss": 0.0394, + "step": 26130 + }, + { + "epoch": 71.2016348773842, + "grad_norm": 2.979018211364746, + "learning_rate": 4.043394601416455e-06, + "loss": 0.0368, + "step": 26131 + }, + { + "epoch": 71.20435967302453, + "grad_norm": 2.245609760284424, + "learning_rate": 4.042685772904146e-06, + "loss": 0.0373, + "step": 26132 + }, + { + "epoch": 71.20708446866485, + "grad_norm": 3.806074857711792, + "learning_rate": 4.041976990787212e-06, + "loss": 0.0623, + "step": 26133 + }, + { + "epoch": 71.20980926430518, + "grad_norm": 2.555792808532715, + "learning_rate": 4.041268255071169e-06, + "loss": 0.1072, + "step": 26134 + }, + { + "epoch": 71.2125340599455, + "grad_norm": 3.141249179840088, + "learning_rate": 4.040559565761537e-06, + "loss": 0.0808, + "step": 26135 + }, + { + "epoch": 71.21525885558583, + "grad_norm": 3.3116321563720703, + "learning_rate": 4.039850922863833e-06, + "loss": 0.1353, + "step": 26136 + }, + { + "epoch": 71.21798365122616, + "grad_norm": 3.131275177001953, + "learning_rate": 4.03914232638358e-06, + "loss": 0.0482, + "step": 26137 + }, + { + "epoch": 71.22070844686648, + "grad_norm": 2.9546279907226562, + "learning_rate": 4.038433776326297e-06, + "loss": 0.0392, + "step": 26138 + }, + { + "epoch": 71.22343324250681, + "grad_norm": 2.3739166259765625, + "learning_rate": 4.037725272697498e-06, + "loss": 0.1232, + "step": 26139 + }, + { + "epoch": 71.22615803814713, + "grad_norm": 2.883281707763672, + "learning_rate": 4.0370168155027e-06, + "loss": 0.0467, + "step": 26140 + }, + { + "epoch": 71.22888283378747, + "grad_norm": 3.404445171356201, + "learning_rate": 4.036308404747426e-06, + "loss": 0.1129, + "step": 26141 + }, + { + "epoch": 71.2316076294278, + "grad_norm": 3.4998667240142822, + "learning_rate": 4.035600040437191e-06, + "loss": 0.0872, + "step": 26142 + }, + { + "epoch": 71.23433242506812, + "grad_norm": 18.2752742767334, + "learning_rate": 4.034891722577511e-06, + "loss": 0.0834, + "step": 26143 + }, + { + "epoch": 71.23705722070845, + "grad_norm": 3.492717981338501, + "learning_rate": 4.034183451173897e-06, + "loss": 0.0403, + "step": 26144 + }, + { + "epoch": 71.23978201634877, + "grad_norm": 2.7523624897003174, + "learning_rate": 4.033475226231872e-06, + "loss": 0.0685, + "step": 26145 + }, + { + "epoch": 71.2425068119891, + "grad_norm": 3.1481869220733643, + "learning_rate": 4.032767047756954e-06, + "loss": 0.0726, + "step": 26146 + }, + { + "epoch": 71.24523160762942, + "grad_norm": 2.7452948093414307, + "learning_rate": 4.032058915754653e-06, + "loss": 0.1341, + "step": 26147 + }, + { + "epoch": 71.24795640326975, + "grad_norm": 3.3518741130828857, + "learning_rate": 4.031350830230482e-06, + "loss": 0.0424, + "step": 26148 + }, + { + "epoch": 71.25068119891009, + "grad_norm": 3.4906837940216064, + "learning_rate": 4.0306427911899614e-06, + "loss": 0.1093, + "step": 26149 + }, + { + "epoch": 71.2534059945504, + "grad_norm": 2.8083479404449463, + "learning_rate": 4.029934798638603e-06, + "loss": 0.1589, + "step": 26150 + }, + { + "epoch": 71.25613079019074, + "grad_norm": 4.763759136199951, + "learning_rate": 4.02922685258192e-06, + "loss": 0.0315, + "step": 26151 + }, + { + "epoch": 71.25885558583106, + "grad_norm": 2.4466710090637207, + "learning_rate": 4.028518953025423e-06, + "loss": 0.0445, + "step": 26152 + }, + { + "epoch": 71.26158038147139, + "grad_norm": 3.23868465423584, + "learning_rate": 4.027811099974632e-06, + "loss": 0.0849, + "step": 26153 + }, + { + "epoch": 71.26430517711172, + "grad_norm": 2.836198329925537, + "learning_rate": 4.0271032934350555e-06, + "loss": 0.0887, + "step": 26154 + }, + { + "epoch": 71.26702997275204, + "grad_norm": 2.9903182983398438, + "learning_rate": 4.026395533412206e-06, + "loss": 0.0384, + "step": 26155 + }, + { + "epoch": 71.26975476839237, + "grad_norm": 2.2511773109436035, + "learning_rate": 4.025687819911593e-06, + "loss": 0.0327, + "step": 26156 + }, + { + "epoch": 71.2724795640327, + "grad_norm": 2.0673069953918457, + "learning_rate": 4.024980152938735e-06, + "loss": 0.0277, + "step": 26157 + }, + { + "epoch": 71.27520435967303, + "grad_norm": 2.301643133163452, + "learning_rate": 4.0242725324991375e-06, + "loss": 0.0329, + "step": 26158 + }, + { + "epoch": 71.27792915531334, + "grad_norm": 3.1151835918426514, + "learning_rate": 4.023564958598314e-06, + "loss": 0.0521, + "step": 26159 + }, + { + "epoch": 71.28065395095368, + "grad_norm": 2.144178628921509, + "learning_rate": 4.0228574312417715e-06, + "loss": 0.0312, + "step": 26160 + }, + { + "epoch": 71.28337874659401, + "grad_norm": 3.044750452041626, + "learning_rate": 4.022149950435026e-06, + "loss": 0.0292, + "step": 26161 + }, + { + "epoch": 71.28610354223433, + "grad_norm": 3.113910436630249, + "learning_rate": 4.02144251618358e-06, + "loss": 0.1339, + "step": 26162 + }, + { + "epoch": 71.28882833787466, + "grad_norm": 3.3358335494995117, + "learning_rate": 4.020735128492952e-06, + "loss": 0.1451, + "step": 26163 + }, + { + "epoch": 71.29155313351498, + "grad_norm": 3.408358097076416, + "learning_rate": 4.020027787368642e-06, + "loss": 0.1037, + "step": 26164 + }, + { + "epoch": 71.29427792915531, + "grad_norm": 3.093109130859375, + "learning_rate": 4.019320492816167e-06, + "loss": 0.0286, + "step": 26165 + }, + { + "epoch": 71.29700272479565, + "grad_norm": 3.21688175201416, + "learning_rate": 4.018613244841031e-06, + "loss": 0.1308, + "step": 26166 + }, + { + "epoch": 71.29972752043597, + "grad_norm": 2.772951364517212, + "learning_rate": 4.017906043448744e-06, + "loss": 0.0465, + "step": 26167 + }, + { + "epoch": 71.3024523160763, + "grad_norm": 2.1212408542633057, + "learning_rate": 4.017198888644807e-06, + "loss": 0.0362, + "step": 26168 + }, + { + "epoch": 71.30517711171662, + "grad_norm": 2.960747480392456, + "learning_rate": 4.016491780434737e-06, + "loss": 0.1397, + "step": 26169 + }, + { + "epoch": 71.30790190735695, + "grad_norm": 2.8554725646972656, + "learning_rate": 4.015784718824036e-06, + "loss": 0.0732, + "step": 26170 + }, + { + "epoch": 71.31062670299727, + "grad_norm": 3.2245540618896484, + "learning_rate": 4.015077703818211e-06, + "loss": 0.0425, + "step": 26171 + }, + { + "epoch": 71.3133514986376, + "grad_norm": 7.894142150878906, + "learning_rate": 4.014370735422765e-06, + "loss": 0.2433, + "step": 26172 + }, + { + "epoch": 71.31607629427793, + "grad_norm": 2.4632678031921387, + "learning_rate": 4.013663813643211e-06, + "loss": 0.05, + "step": 26173 + }, + { + "epoch": 71.31880108991825, + "grad_norm": 2.931635856628418, + "learning_rate": 4.012956938485049e-06, + "loss": 0.0764, + "step": 26174 + }, + { + "epoch": 71.32152588555859, + "grad_norm": 2.721539258956909, + "learning_rate": 4.012250109953787e-06, + "loss": 0.0351, + "step": 26175 + }, + { + "epoch": 71.3242506811989, + "grad_norm": 4.405660152435303, + "learning_rate": 4.011543328054924e-06, + "loss": 0.1693, + "step": 26176 + }, + { + "epoch": 71.32697547683924, + "grad_norm": 3.629136562347412, + "learning_rate": 4.010836592793973e-06, + "loss": 0.1972, + "step": 26177 + }, + { + "epoch": 71.32970027247957, + "grad_norm": 2.7203550338745117, + "learning_rate": 4.010129904176434e-06, + "loss": 0.0352, + "step": 26178 + }, + { + "epoch": 71.33242506811989, + "grad_norm": 2.688110113143921, + "learning_rate": 4.009423262207807e-06, + "loss": 0.048, + "step": 26179 + }, + { + "epoch": 71.33514986376022, + "grad_norm": 4.946422576904297, + "learning_rate": 4.0087166668936015e-06, + "loss": 0.119, + "step": 26180 + }, + { + "epoch": 71.33787465940054, + "grad_norm": 2.342850923538208, + "learning_rate": 4.008010118239315e-06, + "loss": 0.0248, + "step": 26181 + }, + { + "epoch": 71.34059945504087, + "grad_norm": 3.7198307514190674, + "learning_rate": 4.007303616250457e-06, + "loss": 0.1265, + "step": 26182 + }, + { + "epoch": 71.34332425068119, + "grad_norm": 2.975597381591797, + "learning_rate": 4.006597160932524e-06, + "loss": 0.2323, + "step": 26183 + }, + { + "epoch": 71.34604904632153, + "grad_norm": 4.063631534576416, + "learning_rate": 4.005890752291021e-06, + "loss": 0.1785, + "step": 26184 + }, + { + "epoch": 71.34877384196186, + "grad_norm": 2.9268012046813965, + "learning_rate": 4.005184390331443e-06, + "loss": 0.0501, + "step": 26185 + }, + { + "epoch": 71.35149863760218, + "grad_norm": 4.783208847045898, + "learning_rate": 4.0044780750593005e-06, + "loss": 0.0939, + "step": 26186 + }, + { + "epoch": 71.35422343324251, + "grad_norm": 2.9689512252807617, + "learning_rate": 4.003771806480089e-06, + "loss": 0.0388, + "step": 26187 + }, + { + "epoch": 71.35694822888283, + "grad_norm": 3.088300943374634, + "learning_rate": 4.003065584599306e-06, + "loss": 0.0851, + "step": 26188 + }, + { + "epoch": 71.35967302452316, + "grad_norm": 3.1855874061584473, + "learning_rate": 4.002359409422459e-06, + "loss": 0.0867, + "step": 26189 + }, + { + "epoch": 71.3623978201635, + "grad_norm": 2.78861665725708, + "learning_rate": 4.001653280955045e-06, + "loss": 0.0306, + "step": 26190 + }, + { + "epoch": 71.36512261580381, + "grad_norm": 1.984560489654541, + "learning_rate": 4.000947199202562e-06, + "loss": 0.0306, + "step": 26191 + }, + { + "epoch": 71.36784741144415, + "grad_norm": 3.627943515777588, + "learning_rate": 4.000241164170504e-06, + "loss": 0.0842, + "step": 26192 + }, + { + "epoch": 71.37057220708446, + "grad_norm": 4.622325897216797, + "learning_rate": 3.99953517586438e-06, + "loss": 0.1576, + "step": 26193 + }, + { + "epoch": 71.3732970027248, + "grad_norm": 3.2991983890533447, + "learning_rate": 3.9988292342896816e-06, + "loss": 0.0565, + "step": 26194 + }, + { + "epoch": 71.37602179836512, + "grad_norm": 2.1634292602539062, + "learning_rate": 3.998123339451908e-06, + "loss": 0.1563, + "step": 26195 + }, + { + "epoch": 71.37874659400545, + "grad_norm": 2.7750957012176514, + "learning_rate": 3.997417491356554e-06, + "loss": 0.123, + "step": 26196 + }, + { + "epoch": 71.38147138964578, + "grad_norm": 2.795283794403076, + "learning_rate": 3.996711690009119e-06, + "loss": 0.0364, + "step": 26197 + }, + { + "epoch": 71.3841961852861, + "grad_norm": 4.920372486114502, + "learning_rate": 3.996005935415104e-06, + "loss": 0.0764, + "step": 26198 + }, + { + "epoch": 71.38692098092643, + "grad_norm": 2.1958577632904053, + "learning_rate": 3.995300227580001e-06, + "loss": 0.0689, + "step": 26199 + }, + { + "epoch": 71.38964577656675, + "grad_norm": 3.190755844116211, + "learning_rate": 3.994594566509306e-06, + "loss": 0.2097, + "step": 26200 + }, + { + "epoch": 71.39237057220708, + "grad_norm": 3.133312463760376, + "learning_rate": 3.993888952208513e-06, + "loss": 0.0411, + "step": 26201 + }, + { + "epoch": 71.39509536784742, + "grad_norm": 2.8266334533691406, + "learning_rate": 3.993183384683124e-06, + "loss": 0.0562, + "step": 26202 + }, + { + "epoch": 71.39782016348774, + "grad_norm": 2.8147099018096924, + "learning_rate": 3.992477863938628e-06, + "loss": 0.1085, + "step": 26203 + }, + { + "epoch": 71.40054495912807, + "grad_norm": 3.9899539947509766, + "learning_rate": 3.99177238998052e-06, + "loss": 0.176, + "step": 26204 + }, + { + "epoch": 71.40326975476839, + "grad_norm": 3.109407424926758, + "learning_rate": 3.991066962814293e-06, + "loss": 0.2846, + "step": 26205 + }, + { + "epoch": 71.40599455040872, + "grad_norm": 2.2918648719787598, + "learning_rate": 3.990361582445447e-06, + "loss": 0.0436, + "step": 26206 + }, + { + "epoch": 71.40871934604904, + "grad_norm": 2.409806966781616, + "learning_rate": 3.989656248879471e-06, + "loss": 0.0365, + "step": 26207 + }, + { + "epoch": 71.41144414168937, + "grad_norm": 2.9081597328186035, + "learning_rate": 3.988950962121855e-06, + "loss": 0.0596, + "step": 26208 + }, + { + "epoch": 71.4141689373297, + "grad_norm": 4.1911725997924805, + "learning_rate": 3.988245722178099e-06, + "loss": 0.0565, + "step": 26209 + }, + { + "epoch": 71.41689373297002, + "grad_norm": 3.6818454265594482, + "learning_rate": 3.987540529053692e-06, + "loss": 0.1558, + "step": 26210 + }, + { + "epoch": 71.41961852861036, + "grad_norm": 2.782841920852661, + "learning_rate": 3.9868353827541265e-06, + "loss": 0.0653, + "step": 26211 + }, + { + "epoch": 71.42234332425068, + "grad_norm": 2.2606873512268066, + "learning_rate": 3.986130283284889e-06, + "loss": 0.0553, + "step": 26212 + }, + { + "epoch": 71.42506811989101, + "grad_norm": 3.6367404460906982, + "learning_rate": 3.985425230651479e-06, + "loss": 0.068, + "step": 26213 + }, + { + "epoch": 71.42779291553134, + "grad_norm": 1.963287353515625, + "learning_rate": 3.98472022485938e-06, + "loss": 0.0345, + "step": 26214 + }, + { + "epoch": 71.43051771117166, + "grad_norm": 3.1251213550567627, + "learning_rate": 3.984015265914091e-06, + "loss": 0.0858, + "step": 26215 + }, + { + "epoch": 71.433242506812, + "grad_norm": 3.200543165206909, + "learning_rate": 3.983310353821096e-06, + "loss": 0.0414, + "step": 26216 + }, + { + "epoch": 71.43596730245231, + "grad_norm": 3.0238993167877197, + "learning_rate": 3.982605488585884e-06, + "loss": 0.0729, + "step": 26217 + }, + { + "epoch": 71.43869209809264, + "grad_norm": 2.651211738586426, + "learning_rate": 3.9819006702139496e-06, + "loss": 0.1423, + "step": 26218 + }, + { + "epoch": 71.44141689373296, + "grad_norm": 2.6668174266815186, + "learning_rate": 3.981195898710779e-06, + "loss": 0.0756, + "step": 26219 + }, + { + "epoch": 71.4441416893733, + "grad_norm": 2.347923755645752, + "learning_rate": 3.9804911740818604e-06, + "loss": 0.1214, + "step": 26220 + }, + { + "epoch": 71.44686648501363, + "grad_norm": 3.0171802043914795, + "learning_rate": 3.97978649633268e-06, + "loss": 0.0752, + "step": 26221 + }, + { + "epoch": 71.44959128065395, + "grad_norm": 4.0918402671813965, + "learning_rate": 3.979081865468733e-06, + "loss": 0.1401, + "step": 26222 + }, + { + "epoch": 71.45231607629428, + "grad_norm": 2.6300928592681885, + "learning_rate": 3.978377281495502e-06, + "loss": 0.0601, + "step": 26223 + }, + { + "epoch": 71.4550408719346, + "grad_norm": 7.589695453643799, + "learning_rate": 3.977672744418475e-06, + "loss": 0.0908, + "step": 26224 + }, + { + "epoch": 71.45776566757493, + "grad_norm": 3.170612096786499, + "learning_rate": 3.976968254243135e-06, + "loss": 0.0498, + "step": 26225 + }, + { + "epoch": 71.46049046321527, + "grad_norm": 3.535686731338501, + "learning_rate": 3.976263810974977e-06, + "loss": 0.0463, + "step": 26226 + }, + { + "epoch": 71.46321525885558, + "grad_norm": 2.5216078758239746, + "learning_rate": 3.975559414619481e-06, + "loss": 0.0892, + "step": 26227 + }, + { + "epoch": 71.46594005449592, + "grad_norm": 3.490795612335205, + "learning_rate": 3.974855065182135e-06, + "loss": 0.0565, + "step": 26228 + }, + { + "epoch": 71.46866485013624, + "grad_norm": 3.58577823638916, + "learning_rate": 3.974150762668421e-06, + "loss": 0.0384, + "step": 26229 + }, + { + "epoch": 71.47138964577657, + "grad_norm": 3.07975435256958, + "learning_rate": 3.973446507083829e-06, + "loss": 0.0493, + "step": 26230 + }, + { + "epoch": 71.47411444141689, + "grad_norm": 4.166622638702393, + "learning_rate": 3.9727422984338384e-06, + "loss": 0.0915, + "step": 26231 + }, + { + "epoch": 71.47683923705722, + "grad_norm": 2.069585084915161, + "learning_rate": 3.972038136723941e-06, + "loss": 0.0372, + "step": 26232 + }, + { + "epoch": 71.47956403269755, + "grad_norm": 2.160964250564575, + "learning_rate": 3.971334021959613e-06, + "loss": 0.0457, + "step": 26233 + }, + { + "epoch": 71.48228882833787, + "grad_norm": 2.3658523559570312, + "learning_rate": 3.970629954146346e-06, + "loss": 0.0383, + "step": 26234 + }, + { + "epoch": 71.4850136239782, + "grad_norm": 3.285229444503784, + "learning_rate": 3.9699259332896165e-06, + "loss": 0.0618, + "step": 26235 + }, + { + "epoch": 71.48773841961852, + "grad_norm": 3.133434772491455, + "learning_rate": 3.969221959394911e-06, + "loss": 0.1925, + "step": 26236 + }, + { + "epoch": 71.49046321525886, + "grad_norm": 3.400329828262329, + "learning_rate": 3.9685180324677074e-06, + "loss": 0.1674, + "step": 26237 + }, + { + "epoch": 71.49318801089919, + "grad_norm": 2.832056760787964, + "learning_rate": 3.967814152513495e-06, + "loss": 0.0374, + "step": 26238 + }, + { + "epoch": 71.49591280653951, + "grad_norm": 3.7763254642486572, + "learning_rate": 3.967110319537751e-06, + "loss": 0.0504, + "step": 26239 + }, + { + "epoch": 71.49863760217984, + "grad_norm": 4.347590446472168, + "learning_rate": 3.966406533545959e-06, + "loss": 0.1006, + "step": 26240 + }, + { + "epoch": 71.50136239782016, + "grad_norm": 4.205351829528809, + "learning_rate": 3.965702794543594e-06, + "loss": 0.1328, + "step": 26241 + }, + { + "epoch": 71.50408719346049, + "grad_norm": 2.371041774749756, + "learning_rate": 3.964999102536145e-06, + "loss": 0.0659, + "step": 26242 + }, + { + "epoch": 71.50681198910081, + "grad_norm": 3.883790969848633, + "learning_rate": 3.96429545752909e-06, + "loss": 0.0662, + "step": 26243 + }, + { + "epoch": 71.50953678474114, + "grad_norm": 3.13887882232666, + "learning_rate": 3.963591859527906e-06, + "loss": 0.0958, + "step": 26244 + }, + { + "epoch": 71.51226158038148, + "grad_norm": 6.1765336990356445, + "learning_rate": 3.962888308538072e-06, + "loss": 0.1708, + "step": 26245 + }, + { + "epoch": 71.5149863760218, + "grad_norm": 2.49947190284729, + "learning_rate": 3.962184804565074e-06, + "loss": 0.0383, + "step": 26246 + }, + { + "epoch": 71.51771117166213, + "grad_norm": 2.4722323417663574, + "learning_rate": 3.961481347614385e-06, + "loss": 0.0578, + "step": 26247 + }, + { + "epoch": 71.52043596730245, + "grad_norm": 3.1850924491882324, + "learning_rate": 3.9607779376914814e-06, + "loss": 0.1161, + "step": 26248 + }, + { + "epoch": 71.52316076294278, + "grad_norm": 2.3899035453796387, + "learning_rate": 3.9600745748018445e-06, + "loss": 0.0372, + "step": 26249 + }, + { + "epoch": 71.52588555858311, + "grad_norm": 3.3634681701660156, + "learning_rate": 3.959371258950956e-06, + "loss": 0.1709, + "step": 26250 + }, + { + "epoch": 71.52861035422343, + "grad_norm": 3.508753538131714, + "learning_rate": 3.95866799014429e-06, + "loss": 0.0387, + "step": 26251 + }, + { + "epoch": 71.53133514986376, + "grad_norm": 3.0704305171966553, + "learning_rate": 3.957964768387324e-06, + "loss": 0.0405, + "step": 26252 + }, + { + "epoch": 71.53405994550408, + "grad_norm": 4.232667446136475, + "learning_rate": 3.957261593685529e-06, + "loss": 0.0623, + "step": 26253 + }, + { + "epoch": 71.53678474114442, + "grad_norm": 2.996190309524536, + "learning_rate": 3.9565584660443916e-06, + "loss": 0.0457, + "step": 26254 + }, + { + "epoch": 71.53950953678473, + "grad_norm": 3.1058871746063232, + "learning_rate": 3.955855385469381e-06, + "loss": 0.0413, + "step": 26255 + }, + { + "epoch": 71.54223433242507, + "grad_norm": 3.577069044113159, + "learning_rate": 3.955152351965974e-06, + "loss": 0.1313, + "step": 26256 + }, + { + "epoch": 71.5449591280654, + "grad_norm": 2.307096242904663, + "learning_rate": 3.954449365539643e-06, + "loss": 0.0737, + "step": 26257 + }, + { + "epoch": 71.54768392370572, + "grad_norm": 5.829807281494141, + "learning_rate": 3.953746426195869e-06, + "loss": 0.1635, + "step": 26258 + }, + { + "epoch": 71.55040871934605, + "grad_norm": 2.726738691329956, + "learning_rate": 3.953043533940124e-06, + "loss": 0.084, + "step": 26259 + }, + { + "epoch": 71.55313351498637, + "grad_norm": 2.659027099609375, + "learning_rate": 3.95234068877788e-06, + "loss": 0.0737, + "step": 26260 + }, + { + "epoch": 71.5558583106267, + "grad_norm": 3.3079888820648193, + "learning_rate": 3.951637890714609e-06, + "loss": 0.1624, + "step": 26261 + }, + { + "epoch": 71.55858310626704, + "grad_norm": 3.218881607055664, + "learning_rate": 3.950935139755792e-06, + "loss": 0.0938, + "step": 26262 + }, + { + "epoch": 71.56130790190736, + "grad_norm": 5.3799333572387695, + "learning_rate": 3.950232435906897e-06, + "loss": 0.0394, + "step": 26263 + }, + { + "epoch": 71.56403269754769, + "grad_norm": 3.419832944869995, + "learning_rate": 3.949529779173397e-06, + "loss": 0.0458, + "step": 26264 + }, + { + "epoch": 71.566757493188, + "grad_norm": 2.9798130989074707, + "learning_rate": 3.9488271695607595e-06, + "loss": 0.0911, + "step": 26265 + }, + { + "epoch": 71.56948228882834, + "grad_norm": 2.677361249923706, + "learning_rate": 3.948124607074463e-06, + "loss": 0.0869, + "step": 26266 + }, + { + "epoch": 71.57220708446866, + "grad_norm": 3.440507650375366, + "learning_rate": 3.94742209171998e-06, + "loss": 0.0583, + "step": 26267 + }, + { + "epoch": 71.57493188010899, + "grad_norm": 2.4000511169433594, + "learning_rate": 3.946719623502778e-06, + "loss": 0.0308, + "step": 26268 + }, + { + "epoch": 71.57765667574932, + "grad_norm": 3.487424850463867, + "learning_rate": 3.9460172024283305e-06, + "loss": 0.0305, + "step": 26269 + }, + { + "epoch": 71.58038147138964, + "grad_norm": 3.9430429935455322, + "learning_rate": 3.945314828502102e-06, + "loss": 0.0402, + "step": 26270 + }, + { + "epoch": 71.58310626702998, + "grad_norm": 2.019660234451294, + "learning_rate": 3.94461250172957e-06, + "loss": 0.0251, + "step": 26271 + }, + { + "epoch": 71.5858310626703, + "grad_norm": 2.686077117919922, + "learning_rate": 3.9439102221162016e-06, + "loss": 0.0975, + "step": 26272 + }, + { + "epoch": 71.58855585831063, + "grad_norm": 3.871405601501465, + "learning_rate": 3.943207989667461e-06, + "loss": 0.0735, + "step": 26273 + }, + { + "epoch": 71.59128065395096, + "grad_norm": 3.2200605869293213, + "learning_rate": 3.9425058043888265e-06, + "loss": 0.1172, + "step": 26274 + }, + { + "epoch": 71.59400544959128, + "grad_norm": 3.149120807647705, + "learning_rate": 3.941803666285761e-06, + "loss": 0.0427, + "step": 26275 + }, + { + "epoch": 71.59673024523161, + "grad_norm": 4.132558822631836, + "learning_rate": 3.941101575363733e-06, + "loss": 0.1327, + "step": 26276 + }, + { + "epoch": 71.59945504087193, + "grad_norm": 3.762106418609619, + "learning_rate": 3.9403995316282084e-06, + "loss": 0.0541, + "step": 26277 + }, + { + "epoch": 71.60217983651226, + "grad_norm": 4.901472568511963, + "learning_rate": 3.93969753508466e-06, + "loss": 0.0663, + "step": 26278 + }, + { + "epoch": 71.60490463215258, + "grad_norm": 6.244317531585693, + "learning_rate": 3.938995585738552e-06, + "loss": 0.1002, + "step": 26279 + }, + { + "epoch": 71.60762942779292, + "grad_norm": 3.195518732070923, + "learning_rate": 3.9382936835953525e-06, + "loss": 0.0531, + "step": 26280 + }, + { + "epoch": 71.61035422343325, + "grad_norm": 2.8734614849090576, + "learning_rate": 3.937591828660522e-06, + "loss": 0.0616, + "step": 26281 + }, + { + "epoch": 71.61307901907357, + "grad_norm": 2.5066661834716797, + "learning_rate": 3.9368900209395325e-06, + "loss": 0.097, + "step": 26282 + }, + { + "epoch": 71.6158038147139, + "grad_norm": 3.8755085468292236, + "learning_rate": 3.936188260437851e-06, + "loss": 0.0554, + "step": 26283 + }, + { + "epoch": 71.61852861035422, + "grad_norm": 30.757774353027344, + "learning_rate": 3.935486547160939e-06, + "loss": 0.1705, + "step": 26284 + }, + { + "epoch": 71.62125340599455, + "grad_norm": 2.776183843612671, + "learning_rate": 3.9347848811142644e-06, + "loss": 0.1033, + "step": 26285 + }, + { + "epoch": 71.62397820163488, + "grad_norm": 3.173003911972046, + "learning_rate": 3.934083262303287e-06, + "loss": 0.0992, + "step": 26286 + }, + { + "epoch": 71.6267029972752, + "grad_norm": 5.0574822425842285, + "learning_rate": 3.933381690733475e-06, + "loss": 0.0563, + "step": 26287 + }, + { + "epoch": 71.62942779291554, + "grad_norm": 2.7327327728271484, + "learning_rate": 3.932680166410293e-06, + "loss": 0.1241, + "step": 26288 + }, + { + "epoch": 71.63215258855585, + "grad_norm": 3.556267023086548, + "learning_rate": 3.931978689339202e-06, + "loss": 0.0832, + "step": 26289 + }, + { + "epoch": 71.63487738419619, + "grad_norm": 4.194163799285889, + "learning_rate": 3.9312772595256624e-06, + "loss": 0.0529, + "step": 26290 + }, + { + "epoch": 71.6376021798365, + "grad_norm": 2.6678009033203125, + "learning_rate": 3.9305758769751436e-06, + "loss": 0.0417, + "step": 26291 + }, + { + "epoch": 71.64032697547684, + "grad_norm": 3.616098403930664, + "learning_rate": 3.9298745416931035e-06, + "loss": 0.1153, + "step": 26292 + }, + { + "epoch": 71.64305177111717, + "grad_norm": 3.521211862564087, + "learning_rate": 3.9291732536850056e-06, + "loss": 0.0982, + "step": 26293 + }, + { + "epoch": 71.64577656675749, + "grad_norm": 3.013974905014038, + "learning_rate": 3.928472012956308e-06, + "loss": 0.0566, + "step": 26294 + }, + { + "epoch": 71.64850136239782, + "grad_norm": 3.37339448928833, + "learning_rate": 3.927770819512479e-06, + "loss": 0.1105, + "step": 26295 + }, + { + "epoch": 71.65122615803814, + "grad_norm": 3.3436920642852783, + "learning_rate": 3.927069673358976e-06, + "loss": 0.0822, + "step": 26296 + }, + { + "epoch": 71.65395095367847, + "grad_norm": 2.712724447250366, + "learning_rate": 3.926368574501253e-06, + "loss": 0.1009, + "step": 26297 + }, + { + "epoch": 71.65667574931881, + "grad_norm": 3.7425286769866943, + "learning_rate": 3.925667522944781e-06, + "loss": 0.0403, + "step": 26298 + }, + { + "epoch": 71.65940054495913, + "grad_norm": 2.209707498550415, + "learning_rate": 3.924966518695015e-06, + "loss": 0.0651, + "step": 26299 + }, + { + "epoch": 71.66212534059946, + "grad_norm": 2.2464306354522705, + "learning_rate": 3.92426556175741e-06, + "loss": 0.0383, + "step": 26300 + }, + { + "epoch": 71.66485013623978, + "grad_norm": 4.439968585968018, + "learning_rate": 3.923564652137433e-06, + "loss": 0.0688, + "step": 26301 + }, + { + "epoch": 71.66757493188011, + "grad_norm": 3.5255579948425293, + "learning_rate": 3.922863789840535e-06, + "loss": 0.1391, + "step": 26302 + }, + { + "epoch": 71.67029972752043, + "grad_norm": 3.0047080516815186, + "learning_rate": 3.922162974872182e-06, + "loss": 0.1164, + "step": 26303 + }, + { + "epoch": 71.67302452316076, + "grad_norm": 2.442917585372925, + "learning_rate": 3.9214622072378285e-06, + "loss": 0.0364, + "step": 26304 + }, + { + "epoch": 71.6757493188011, + "grad_norm": 3.430983543395996, + "learning_rate": 3.920761486942932e-06, + "loss": 0.1244, + "step": 26305 + }, + { + "epoch": 71.67847411444141, + "grad_norm": 2.698504686355591, + "learning_rate": 3.920060813992945e-06, + "loss": 0.055, + "step": 26306 + }, + { + "epoch": 71.68119891008175, + "grad_norm": 3.5199246406555176, + "learning_rate": 3.9193601883933326e-06, + "loss": 0.0574, + "step": 26307 + }, + { + "epoch": 71.68392370572207, + "grad_norm": 3.5285394191741943, + "learning_rate": 3.918659610149548e-06, + "loss": 0.0875, + "step": 26308 + }, + { + "epoch": 71.6866485013624, + "grad_norm": 3.1933979988098145, + "learning_rate": 3.917959079267045e-06, + "loss": 0.041, + "step": 26309 + }, + { + "epoch": 71.68937329700273, + "grad_norm": 2.9126813411712646, + "learning_rate": 3.917258595751279e-06, + "loss": 0.0882, + "step": 26310 + }, + { + "epoch": 71.69209809264305, + "grad_norm": 2.869687080383301, + "learning_rate": 3.916558159607711e-06, + "loss": 0.1528, + "step": 26311 + }, + { + "epoch": 71.69482288828338, + "grad_norm": 2.973262071609497, + "learning_rate": 3.9158577708417915e-06, + "loss": 0.1139, + "step": 26312 + }, + { + "epoch": 71.6975476839237, + "grad_norm": 3.114274740219116, + "learning_rate": 3.915157429458976e-06, + "loss": 0.1605, + "step": 26313 + }, + { + "epoch": 71.70027247956403, + "grad_norm": 2.112484931945801, + "learning_rate": 3.914457135464714e-06, + "loss": 0.0661, + "step": 26314 + }, + { + "epoch": 71.70299727520435, + "grad_norm": 2.825071334838867, + "learning_rate": 3.913756888864468e-06, + "loss": 0.1418, + "step": 26315 + }, + { + "epoch": 71.70572207084469, + "grad_norm": 3.551366090774536, + "learning_rate": 3.913056689663689e-06, + "loss": 0.0697, + "step": 26316 + }, + { + "epoch": 71.70844686648502, + "grad_norm": 3.1092236042022705, + "learning_rate": 3.912356537867823e-06, + "loss": 0.0747, + "step": 26317 + }, + { + "epoch": 71.71117166212534, + "grad_norm": 3.4141645431518555, + "learning_rate": 3.91165643348233e-06, + "loss": 0.046, + "step": 26318 + }, + { + "epoch": 71.71389645776567, + "grad_norm": 2.809612512588501, + "learning_rate": 3.910956376512664e-06, + "loss": 0.0571, + "step": 26319 + }, + { + "epoch": 71.71662125340599, + "grad_norm": 3.1274161338806152, + "learning_rate": 3.9102563669642724e-06, + "loss": 0.0474, + "step": 26320 + }, + { + "epoch": 71.71934604904632, + "grad_norm": 4.481291770935059, + "learning_rate": 3.909556404842609e-06, + "loss": 0.0911, + "step": 26321 + }, + { + "epoch": 71.72207084468666, + "grad_norm": 2.82544207572937, + "learning_rate": 3.908856490153121e-06, + "loss": 0.188, + "step": 26322 + }, + { + "epoch": 71.72479564032697, + "grad_norm": 2.664330005645752, + "learning_rate": 3.9081566229012665e-06, + "loss": 0.1044, + "step": 26323 + }, + { + "epoch": 71.7275204359673, + "grad_norm": 5.151984691619873, + "learning_rate": 3.907456803092492e-06, + "loss": 0.1964, + "step": 26324 + }, + { + "epoch": 71.73024523160763, + "grad_norm": 3.0860400199890137, + "learning_rate": 3.906757030732248e-06, + "loss": 0.0324, + "step": 26325 + }, + { + "epoch": 71.73297002724796, + "grad_norm": 2.922128677368164, + "learning_rate": 3.90605730582598e-06, + "loss": 0.0481, + "step": 26326 + }, + { + "epoch": 71.73569482288828, + "grad_norm": 2.772878885269165, + "learning_rate": 3.905357628379145e-06, + "loss": 0.0254, + "step": 26327 + }, + { + "epoch": 71.73841961852861, + "grad_norm": 2.7073915004730225, + "learning_rate": 3.9046579983971885e-06, + "loss": 0.0363, + "step": 26328 + }, + { + "epoch": 71.74114441416894, + "grad_norm": 2.901749849319458, + "learning_rate": 3.90395841588556e-06, + "loss": 0.0688, + "step": 26329 + }, + { + "epoch": 71.74386920980926, + "grad_norm": 2.3532776832580566, + "learning_rate": 3.903258880849703e-06, + "loss": 0.1116, + "step": 26330 + }, + { + "epoch": 71.7465940054496, + "grad_norm": 3.113292932510376, + "learning_rate": 3.902559393295073e-06, + "loss": 0.1108, + "step": 26331 + }, + { + "epoch": 71.74931880108991, + "grad_norm": 2.981163740158081, + "learning_rate": 3.901859953227115e-06, + "loss": 0.1457, + "step": 26332 + }, + { + "epoch": 71.75204359673025, + "grad_norm": 2.9588096141815186, + "learning_rate": 3.901160560651276e-06, + "loss": 0.0501, + "step": 26333 + }, + { + "epoch": 71.75476839237058, + "grad_norm": 3.4545843601226807, + "learning_rate": 3.900461215572997e-06, + "loss": 0.2941, + "step": 26334 + }, + { + "epoch": 71.7574931880109, + "grad_norm": 2.8437490463256836, + "learning_rate": 3.899761917997731e-06, + "loss": 0.0642, + "step": 26335 + }, + { + "epoch": 71.76021798365123, + "grad_norm": 2.816551685333252, + "learning_rate": 3.899062667930926e-06, + "loss": 0.1101, + "step": 26336 + }, + { + "epoch": 71.76294277929155, + "grad_norm": 3.1201517581939697, + "learning_rate": 3.898363465378025e-06, + "loss": 0.1431, + "step": 26337 + }, + { + "epoch": 71.76566757493188, + "grad_norm": 2.708270788192749, + "learning_rate": 3.897664310344469e-06, + "loss": 0.0624, + "step": 26338 + }, + { + "epoch": 71.7683923705722, + "grad_norm": 2.9582321643829346, + "learning_rate": 3.89696520283571e-06, + "loss": 0.0549, + "step": 26339 + }, + { + "epoch": 71.77111716621253, + "grad_norm": 2.193305492401123, + "learning_rate": 3.89626614285719e-06, + "loss": 0.0343, + "step": 26340 + }, + { + "epoch": 71.77384196185287, + "grad_norm": 2.9289002418518066, + "learning_rate": 3.895567130414353e-06, + "loss": 0.0742, + "step": 26341 + }, + { + "epoch": 71.77656675749319, + "grad_norm": 3.2769899368286133, + "learning_rate": 3.894868165512639e-06, + "loss": 0.053, + "step": 26342 + }, + { + "epoch": 71.77929155313352, + "grad_norm": 2.773853302001953, + "learning_rate": 3.894169248157499e-06, + "loss": 0.1123, + "step": 26343 + }, + { + "epoch": 71.78201634877384, + "grad_norm": 2.5914247035980225, + "learning_rate": 3.8934703783543715e-06, + "loss": 0.035, + "step": 26344 + }, + { + "epoch": 71.78474114441417, + "grad_norm": 2.399165391921997, + "learning_rate": 3.8927715561087006e-06, + "loss": 0.076, + "step": 26345 + }, + { + "epoch": 71.7874659400545, + "grad_norm": 2.775571823120117, + "learning_rate": 3.892072781425926e-06, + "loss": 0.0432, + "step": 26346 + }, + { + "epoch": 71.79019073569482, + "grad_norm": 2.0114197731018066, + "learning_rate": 3.8913740543114945e-06, + "loss": 0.024, + "step": 26347 + }, + { + "epoch": 71.79291553133515, + "grad_norm": 2.244875192642212, + "learning_rate": 3.8906753747708446e-06, + "loss": 0.0509, + "step": 26348 + }, + { + "epoch": 71.79564032697547, + "grad_norm": 4.468997955322266, + "learning_rate": 3.889976742809419e-06, + "loss": 0.2228, + "step": 26349 + }, + { + "epoch": 71.7983651226158, + "grad_norm": 2.7303740978240967, + "learning_rate": 3.889278158432654e-06, + "loss": 0.0358, + "step": 26350 + }, + { + "epoch": 71.80108991825612, + "grad_norm": 2.245702028274536, + "learning_rate": 3.888579621645995e-06, + "loss": 0.0303, + "step": 26351 + }, + { + "epoch": 71.80381471389646, + "grad_norm": 3.6175475120544434, + "learning_rate": 3.887881132454884e-06, + "loss": 0.1734, + "step": 26352 + }, + { + "epoch": 71.80653950953679, + "grad_norm": 3.4484775066375732, + "learning_rate": 3.887182690864758e-06, + "loss": 0.1582, + "step": 26353 + }, + { + "epoch": 71.80926430517711, + "grad_norm": 2.438727855682373, + "learning_rate": 3.886484296881057e-06, + "loss": 0.0757, + "step": 26354 + }, + { + "epoch": 71.81198910081744, + "grad_norm": 3.8565361499786377, + "learning_rate": 3.885785950509215e-06, + "loss": 0.0535, + "step": 26355 + }, + { + "epoch": 71.81471389645776, + "grad_norm": 3.1182069778442383, + "learning_rate": 3.88508765175468e-06, + "loss": 0.1748, + "step": 26356 + }, + { + "epoch": 71.8174386920981, + "grad_norm": 2.419715642929077, + "learning_rate": 3.8843894006228844e-06, + "loss": 0.0406, + "step": 26357 + }, + { + "epoch": 71.82016348773843, + "grad_norm": 2.741055965423584, + "learning_rate": 3.883691197119267e-06, + "loss": 0.0665, + "step": 26358 + }, + { + "epoch": 71.82288828337875, + "grad_norm": 4.048133850097656, + "learning_rate": 3.8829930412492636e-06, + "loss": 0.0986, + "step": 26359 + }, + { + "epoch": 71.82561307901908, + "grad_norm": 3.7205846309661865, + "learning_rate": 3.882294933018316e-06, + "loss": 0.1283, + "step": 26360 + }, + { + "epoch": 71.8283378746594, + "grad_norm": 4.266384601593018, + "learning_rate": 3.881596872431859e-06, + "loss": 0.0458, + "step": 26361 + }, + { + "epoch": 71.83106267029973, + "grad_norm": 2.6132822036743164, + "learning_rate": 3.880898859495326e-06, + "loss": 0.0901, + "step": 26362 + }, + { + "epoch": 71.83378746594005, + "grad_norm": 3.58284592628479, + "learning_rate": 3.880200894214158e-06, + "loss": 0.1006, + "step": 26363 + }, + { + "epoch": 71.83651226158038, + "grad_norm": 3.521472692489624, + "learning_rate": 3.879502976593788e-06, + "loss": 0.1067, + "step": 26364 + }, + { + "epoch": 71.83923705722071, + "grad_norm": 3.137671709060669, + "learning_rate": 3.878805106639653e-06, + "loss": 0.0787, + "step": 26365 + }, + { + "epoch": 71.84196185286103, + "grad_norm": 2.116220474243164, + "learning_rate": 3.8781072843571836e-06, + "loss": 0.0921, + "step": 26366 + }, + { + "epoch": 71.84468664850137, + "grad_norm": 2.7314095497131348, + "learning_rate": 3.87740950975182e-06, + "loss": 0.1198, + "step": 26367 + }, + { + "epoch": 71.84741144414168, + "grad_norm": 5.4813714027404785, + "learning_rate": 3.876711782828991e-06, + "loss": 0.0661, + "step": 26368 + }, + { + "epoch": 71.85013623978202, + "grad_norm": 2.426462411880493, + "learning_rate": 3.876014103594137e-06, + "loss": 0.0348, + "step": 26369 + }, + { + "epoch": 71.85286103542235, + "grad_norm": 3.680140256881714, + "learning_rate": 3.8753164720526884e-06, + "loss": 0.0466, + "step": 26370 + }, + { + "epoch": 71.85558583106267, + "grad_norm": 2.6533203125, + "learning_rate": 3.874618888210074e-06, + "loss": 0.1256, + "step": 26371 + }, + { + "epoch": 71.858310626703, + "grad_norm": 2.9805591106414795, + "learning_rate": 3.873921352071734e-06, + "loss": 0.158, + "step": 26372 + }, + { + "epoch": 71.86103542234332, + "grad_norm": 4.2799835205078125, + "learning_rate": 3.873223863643098e-06, + "loss": 0.2181, + "step": 26373 + }, + { + "epoch": 71.86376021798365, + "grad_norm": 3.869594097137451, + "learning_rate": 3.872526422929597e-06, + "loss": 0.0439, + "step": 26374 + }, + { + "epoch": 71.86648501362397, + "grad_norm": 3.964195728302002, + "learning_rate": 3.87182902993666e-06, + "loss": 0.1073, + "step": 26375 + }, + { + "epoch": 71.8692098092643, + "grad_norm": 2.9525675773620605, + "learning_rate": 3.871131684669725e-06, + "loss": 0.1821, + "step": 26376 + }, + { + "epoch": 71.87193460490464, + "grad_norm": 1.5886871814727783, + "learning_rate": 3.870434387134217e-06, + "loss": 0.0285, + "step": 26377 + }, + { + "epoch": 71.87465940054496, + "grad_norm": 3.222775459289551, + "learning_rate": 3.869737137335571e-06, + "loss": 0.0326, + "step": 26378 + }, + { + "epoch": 71.87738419618529, + "grad_norm": 2.483813524246216, + "learning_rate": 3.869039935279211e-06, + "loss": 0.0505, + "step": 26379 + }, + { + "epoch": 71.88010899182561, + "grad_norm": 3.57271146774292, + "learning_rate": 3.868342780970573e-06, + "loss": 0.0895, + "step": 26380 + }, + { + "epoch": 71.88283378746594, + "grad_norm": 1.9605324268341064, + "learning_rate": 3.867645674415085e-06, + "loss": 0.0333, + "step": 26381 + }, + { + "epoch": 71.88555858310627, + "grad_norm": 2.846683979034424, + "learning_rate": 3.8669486156181715e-06, + "loss": 0.05, + "step": 26382 + }, + { + "epoch": 71.88828337874659, + "grad_norm": 3.698002338409424, + "learning_rate": 3.866251604585268e-06, + "loss": 0.1028, + "step": 26383 + }, + { + "epoch": 71.89100817438693, + "grad_norm": 3.3943450450897217, + "learning_rate": 3.8655546413218005e-06, + "loss": 0.0591, + "step": 26384 + }, + { + "epoch": 71.89373297002724, + "grad_norm": 3.743924140930176, + "learning_rate": 3.864857725833194e-06, + "loss": 0.0486, + "step": 26385 + }, + { + "epoch": 71.89645776566758, + "grad_norm": 2.5327439308166504, + "learning_rate": 3.864160858124877e-06, + "loss": 0.0634, + "step": 26386 + }, + { + "epoch": 71.8991825613079, + "grad_norm": 2.6696815490722656, + "learning_rate": 3.863464038202276e-06, + "loss": 0.1281, + "step": 26387 + }, + { + "epoch": 71.90190735694823, + "grad_norm": 3.199040412902832, + "learning_rate": 3.862767266070824e-06, + "loss": 0.1714, + "step": 26388 + }, + { + "epoch": 71.90463215258856, + "grad_norm": 4.53518009185791, + "learning_rate": 3.8620705417359425e-06, + "loss": 0.0669, + "step": 26389 + }, + { + "epoch": 71.90735694822888, + "grad_norm": 4.8748884201049805, + "learning_rate": 3.861373865203059e-06, + "loss": 0.2236, + "step": 26390 + }, + { + "epoch": 71.91008174386921, + "grad_norm": 1.7121739387512207, + "learning_rate": 3.860677236477594e-06, + "loss": 0.0233, + "step": 26391 + }, + { + "epoch": 71.91280653950953, + "grad_norm": 4.375126361846924, + "learning_rate": 3.859980655564981e-06, + "loss": 0.0794, + "step": 26392 + }, + { + "epoch": 71.91553133514986, + "grad_norm": 2.77117657661438, + "learning_rate": 3.85928412247064e-06, + "loss": 0.0369, + "step": 26393 + }, + { + "epoch": 71.9182561307902, + "grad_norm": 2.893740653991699, + "learning_rate": 3.858587637199998e-06, + "loss": 0.0628, + "step": 26394 + }, + { + "epoch": 71.92098092643052, + "grad_norm": 3.6848340034484863, + "learning_rate": 3.857891199758473e-06, + "loss": 0.0715, + "step": 26395 + }, + { + "epoch": 71.92370572207085, + "grad_norm": 6.501197814941406, + "learning_rate": 3.8571948101514975e-06, + "loss": 0.0872, + "step": 26396 + }, + { + "epoch": 71.92643051771117, + "grad_norm": 3.519993543624878, + "learning_rate": 3.856498468384492e-06, + "loss": 0.0452, + "step": 26397 + }, + { + "epoch": 71.9291553133515, + "grad_norm": 3.886000871658325, + "learning_rate": 3.855802174462878e-06, + "loss": 0.0637, + "step": 26398 + }, + { + "epoch": 71.93188010899182, + "grad_norm": 2.6100046634674072, + "learning_rate": 3.8551059283920755e-06, + "loss": 0.0962, + "step": 26399 + }, + { + "epoch": 71.93460490463215, + "grad_norm": 3.729602813720703, + "learning_rate": 3.854409730177514e-06, + "loss": 0.0734, + "step": 26400 + }, + { + "epoch": 71.93732970027249, + "grad_norm": 3.0738816261291504, + "learning_rate": 3.8537135798246114e-06, + "loss": 0.0362, + "step": 26401 + }, + { + "epoch": 71.9400544959128, + "grad_norm": 2.7986834049224854, + "learning_rate": 3.8530174773387894e-06, + "loss": 0.0629, + "step": 26402 + }, + { + "epoch": 71.94277929155314, + "grad_norm": 3.095090627670288, + "learning_rate": 3.852321422725464e-06, + "loss": 0.0345, + "step": 26403 + }, + { + "epoch": 71.94550408719346, + "grad_norm": 5.287209987640381, + "learning_rate": 3.851625415990066e-06, + "loss": 0.0429, + "step": 26404 + }, + { + "epoch": 71.94822888283379, + "grad_norm": 2.890679121017456, + "learning_rate": 3.850929457138013e-06, + "loss": 0.139, + "step": 26405 + }, + { + "epoch": 71.95095367847412, + "grad_norm": 1.8992841243743896, + "learning_rate": 3.850233546174723e-06, + "loss": 0.0239, + "step": 26406 + }, + { + "epoch": 71.95367847411444, + "grad_norm": 2.375065326690674, + "learning_rate": 3.849537683105613e-06, + "loss": 0.0324, + "step": 26407 + }, + { + "epoch": 71.95640326975477, + "grad_norm": 4.101001262664795, + "learning_rate": 3.848841867936109e-06, + "loss": 0.1392, + "step": 26408 + }, + { + "epoch": 71.95912806539509, + "grad_norm": 2.77616810798645, + "learning_rate": 3.848146100671627e-06, + "loss": 0.0633, + "step": 26409 + }, + { + "epoch": 71.96185286103542, + "grad_norm": 3.357628583908081, + "learning_rate": 3.847450381317584e-06, + "loss": 0.044, + "step": 26410 + }, + { + "epoch": 71.96457765667574, + "grad_norm": 3.925208330154419, + "learning_rate": 3.8467547098793965e-06, + "loss": 0.0698, + "step": 26411 + }, + { + "epoch": 71.96730245231608, + "grad_norm": 3.3535728454589844, + "learning_rate": 3.846059086362489e-06, + "loss": 0.1013, + "step": 26412 + }, + { + "epoch": 71.97002724795641, + "grad_norm": 3.7744178771972656, + "learning_rate": 3.845363510772275e-06, + "loss": 0.1563, + "step": 26413 + }, + { + "epoch": 71.97275204359673, + "grad_norm": 3.1011741161346436, + "learning_rate": 3.844667983114172e-06, + "loss": 0.0599, + "step": 26414 + }, + { + "epoch": 71.97547683923706, + "grad_norm": 3.228482484817505, + "learning_rate": 3.843972503393594e-06, + "loss": 0.0707, + "step": 26415 + }, + { + "epoch": 71.97820163487738, + "grad_norm": 3.153712034225464, + "learning_rate": 3.843277071615962e-06, + "loss": 0.05, + "step": 26416 + }, + { + "epoch": 71.98092643051771, + "grad_norm": 6.8295769691467285, + "learning_rate": 3.842581687786691e-06, + "loss": 0.0461, + "step": 26417 + }, + { + "epoch": 71.98365122615803, + "grad_norm": 2.7410759925842285, + "learning_rate": 3.841886351911195e-06, + "loss": 0.0578, + "step": 26418 + }, + { + "epoch": 71.98637602179836, + "grad_norm": 3.6840834617614746, + "learning_rate": 3.841191063994887e-06, + "loss": 0.0611, + "step": 26419 + }, + { + "epoch": 71.9891008174387, + "grad_norm": 3.9045000076293945, + "learning_rate": 3.840495824043184e-06, + "loss": 0.0844, + "step": 26420 + }, + { + "epoch": 71.99182561307902, + "grad_norm": 1.457475185394287, + "learning_rate": 3.839800632061505e-06, + "loss": 0.0176, + "step": 26421 + }, + { + "epoch": 71.99455040871935, + "grad_norm": 4.588175296783447, + "learning_rate": 3.839105488055261e-06, + "loss": 0.0848, + "step": 26422 + }, + { + "epoch": 71.99727520435967, + "grad_norm": 4.111020565032959, + "learning_rate": 3.838410392029861e-06, + "loss": 0.0451, + "step": 26423 + }, + { + "epoch": 72.0, + "grad_norm": 3.852811813354492, + "learning_rate": 3.837715343990727e-06, + "loss": 0.1726, + "step": 26424 + }, + { + "epoch": 72.00272479564033, + "grad_norm": 3.460327625274658, + "learning_rate": 3.837020343943267e-06, + "loss": 0.0799, + "step": 26425 + }, + { + "epoch": 72.00544959128065, + "grad_norm": 4.512401103973389, + "learning_rate": 3.836325391892894e-06, + "loss": 0.1293, + "step": 26426 + }, + { + "epoch": 72.00817438692098, + "grad_norm": 4.811865329742432, + "learning_rate": 3.8356304878450165e-06, + "loss": 0.0375, + "step": 26427 + }, + { + "epoch": 72.0108991825613, + "grad_norm": 3.8618597984313965, + "learning_rate": 3.834935631805055e-06, + "loss": 0.1019, + "step": 26428 + }, + { + "epoch": 72.01362397820164, + "grad_norm": 3.3924152851104736, + "learning_rate": 3.834240823778416e-06, + "loss": 0.0459, + "step": 26429 + }, + { + "epoch": 72.01634877384195, + "grad_norm": 2.285546064376831, + "learning_rate": 3.833546063770512e-06, + "loss": 0.0358, + "step": 26430 + }, + { + "epoch": 72.01907356948229, + "grad_norm": 3.3915133476257324, + "learning_rate": 3.8328513517867475e-06, + "loss": 0.0485, + "step": 26431 + }, + { + "epoch": 72.02179836512262, + "grad_norm": 2.707864761352539, + "learning_rate": 3.832156687832542e-06, + "loss": 0.1161, + "step": 26432 + }, + { + "epoch": 72.02452316076294, + "grad_norm": 3.833160638809204, + "learning_rate": 3.831462071913302e-06, + "loss": 0.1003, + "step": 26433 + }, + { + "epoch": 72.02724795640327, + "grad_norm": 3.3467867374420166, + "learning_rate": 3.8307675040344375e-06, + "loss": 0.0579, + "step": 26434 + }, + { + "epoch": 72.02997275204359, + "grad_norm": 1.303076148033142, + "learning_rate": 3.830072984201353e-06, + "loss": 0.0191, + "step": 26435 + }, + { + "epoch": 72.03269754768392, + "grad_norm": 4.522215366363525, + "learning_rate": 3.829378512419465e-06, + "loss": 0.1038, + "step": 26436 + }, + { + "epoch": 72.03542234332426, + "grad_norm": 3.8533568382263184, + "learning_rate": 3.828684088694174e-06, + "loss": 0.1413, + "step": 26437 + }, + { + "epoch": 72.03814713896458, + "grad_norm": 3.332747459411621, + "learning_rate": 3.827989713030899e-06, + "loss": 0.0996, + "step": 26438 + }, + { + "epoch": 72.04087193460491, + "grad_norm": 2.6036112308502197, + "learning_rate": 3.827295385435039e-06, + "loss": 0.1129, + "step": 26439 + }, + { + "epoch": 72.04359673024523, + "grad_norm": 2.8100404739379883, + "learning_rate": 3.826601105912001e-06, + "loss": 0.0762, + "step": 26440 + }, + { + "epoch": 72.04632152588556, + "grad_norm": 2.9402518272399902, + "learning_rate": 3.825906874467199e-06, + "loss": 0.0324, + "step": 26441 + }, + { + "epoch": 72.04904632152588, + "grad_norm": 3.8927853107452393, + "learning_rate": 3.825212691106035e-06, + "loss": 0.0726, + "step": 26442 + }, + { + "epoch": 72.05177111716621, + "grad_norm": 3.7210917472839355, + "learning_rate": 3.824518555833916e-06, + "loss": 0.1208, + "step": 26443 + }, + { + "epoch": 72.05449591280654, + "grad_norm": 2.8822295665740967, + "learning_rate": 3.823824468656245e-06, + "loss": 0.0375, + "step": 26444 + }, + { + "epoch": 72.05722070844686, + "grad_norm": 9.227213859558105, + "learning_rate": 3.823130429578432e-06, + "loss": 0.0432, + "step": 26445 + }, + { + "epoch": 72.0599455040872, + "grad_norm": 2.4599592685699463, + "learning_rate": 3.822436438605881e-06, + "loss": 0.0275, + "step": 26446 + }, + { + "epoch": 72.06267029972751, + "grad_norm": 4.226046085357666, + "learning_rate": 3.821742495743993e-06, + "loss": 0.067, + "step": 26447 + }, + { + "epoch": 72.06539509536785, + "grad_norm": 3.2443578243255615, + "learning_rate": 3.82104860099818e-06, + "loss": 0.0379, + "step": 26448 + }, + { + "epoch": 72.06811989100818, + "grad_norm": 3.0962071418762207, + "learning_rate": 3.8203547543738395e-06, + "loss": 0.047, + "step": 26449 + }, + { + "epoch": 72.0708446866485, + "grad_norm": 2.8933916091918945, + "learning_rate": 3.819660955876378e-06, + "loss": 0.032, + "step": 26450 + }, + { + "epoch": 72.07356948228883, + "grad_norm": 4.149245738983154, + "learning_rate": 3.818967205511196e-06, + "loss": 0.1032, + "step": 26451 + }, + { + "epoch": 72.07629427792915, + "grad_norm": 5.366902828216553, + "learning_rate": 3.8182735032837015e-06, + "loss": 0.1421, + "step": 26452 + }, + { + "epoch": 72.07901907356948, + "grad_norm": 2.3826136589050293, + "learning_rate": 3.817579849199293e-06, + "loss": 0.0374, + "step": 26453 + }, + { + "epoch": 72.0817438692098, + "grad_norm": 2.4784250259399414, + "learning_rate": 3.816886243263371e-06, + "loss": 0.0509, + "step": 26454 + }, + { + "epoch": 72.08446866485014, + "grad_norm": 3.469705581665039, + "learning_rate": 3.816192685481344e-06, + "loss": 0.0487, + "step": 26455 + }, + { + "epoch": 72.08719346049047, + "grad_norm": 2.6644678115844727, + "learning_rate": 3.8154991758586045e-06, + "loss": 0.0463, + "step": 26456 + }, + { + "epoch": 72.08991825613079, + "grad_norm": 2.715855836868286, + "learning_rate": 3.814805714400562e-06, + "loss": 0.0289, + "step": 26457 + }, + { + "epoch": 72.09264305177112, + "grad_norm": 2.837583065032959, + "learning_rate": 3.8141123011126135e-06, + "loss": 0.1801, + "step": 26458 + }, + { + "epoch": 72.09536784741144, + "grad_norm": 4.77943754196167, + "learning_rate": 3.8134189360001604e-06, + "loss": 0.1445, + "step": 26459 + }, + { + "epoch": 72.09809264305177, + "grad_norm": 2.1811513900756836, + "learning_rate": 3.8127256190685968e-06, + "loss": 0.2314, + "step": 26460 + }, + { + "epoch": 72.1008174386921, + "grad_norm": 3.9631247520446777, + "learning_rate": 3.8120323503233315e-06, + "loss": 0.0357, + "step": 26461 + }, + { + "epoch": 72.10354223433242, + "grad_norm": 2.710859537124634, + "learning_rate": 3.811339129769758e-06, + "loss": 0.0996, + "step": 26462 + }, + { + "epoch": 72.10626702997276, + "grad_norm": 3.615741014480591, + "learning_rate": 3.810645957413277e-06, + "loss": 0.0389, + "step": 26463 + }, + { + "epoch": 72.10899182561307, + "grad_norm": 3.7355191707611084, + "learning_rate": 3.8099528332592817e-06, + "loss": 0.0818, + "step": 26464 + }, + { + "epoch": 72.11171662125341, + "grad_norm": 2.5932669639587402, + "learning_rate": 3.8092597573131796e-06, + "loss": 0.0276, + "step": 26465 + }, + { + "epoch": 72.11444141689373, + "grad_norm": 4.68644380569458, + "learning_rate": 3.8085667295803617e-06, + "loss": 0.1885, + "step": 26466 + }, + { + "epoch": 72.11716621253406, + "grad_norm": 4.039291858673096, + "learning_rate": 3.8078737500662277e-06, + "loss": 0.1143, + "step": 26467 + }, + { + "epoch": 72.11989100817439, + "grad_norm": 2.1027610301971436, + "learning_rate": 3.8071808187761696e-06, + "loss": 0.0307, + "step": 26468 + }, + { + "epoch": 72.12261580381471, + "grad_norm": 2.5047619342803955, + "learning_rate": 3.8064879357155915e-06, + "loss": 0.1368, + "step": 26469 + }, + { + "epoch": 72.12534059945504, + "grad_norm": 3.0962514877319336, + "learning_rate": 3.8057951008898865e-06, + "loss": 0.1067, + "step": 26470 + }, + { + "epoch": 72.12806539509536, + "grad_norm": 2.2265589237213135, + "learning_rate": 3.8051023143044464e-06, + "loss": 0.0193, + "step": 26471 + }, + { + "epoch": 72.1307901907357, + "grad_norm": 2.836852788925171, + "learning_rate": 3.8044095759646694e-06, + "loss": 0.0558, + "step": 26472 + }, + { + "epoch": 72.13351498637603, + "grad_norm": 5.074002742767334, + "learning_rate": 3.8037168858759556e-06, + "loss": 0.2786, + "step": 26473 + }, + { + "epoch": 72.13623978201635, + "grad_norm": 2.991013765335083, + "learning_rate": 3.8030242440436947e-06, + "loss": 0.0744, + "step": 26474 + }, + { + "epoch": 72.13896457765668, + "grad_norm": 3.196929931640625, + "learning_rate": 3.802331650473281e-06, + "loss": 0.0702, + "step": 26475 + }, + { + "epoch": 72.141689373297, + "grad_norm": 5.008358478546143, + "learning_rate": 3.8016391051701063e-06, + "loss": 0.0489, + "step": 26476 + }, + { + "epoch": 72.14441416893733, + "grad_norm": 2.833855152130127, + "learning_rate": 3.8009466081395707e-06, + "loss": 0.0647, + "step": 26477 + }, + { + "epoch": 72.14713896457765, + "grad_norm": 2.50533390045166, + "learning_rate": 3.8002541593870624e-06, + "loss": 0.0335, + "step": 26478 + }, + { + "epoch": 72.14986376021798, + "grad_norm": 2.8171579837799072, + "learning_rate": 3.7995617589179758e-06, + "loss": 0.0969, + "step": 26479 + }, + { + "epoch": 72.15258855585832, + "grad_norm": 2.2267115116119385, + "learning_rate": 3.7988694067376987e-06, + "loss": 0.0515, + "step": 26480 + }, + { + "epoch": 72.15531335149863, + "grad_norm": 3.8708081245422363, + "learning_rate": 3.7981771028516303e-06, + "loss": 0.0396, + "step": 26481 + }, + { + "epoch": 72.15803814713897, + "grad_norm": 2.921945571899414, + "learning_rate": 3.7974848472651593e-06, + "loss": 0.1003, + "step": 26482 + }, + { + "epoch": 72.16076294277929, + "grad_norm": 2.610873222351074, + "learning_rate": 3.7967926399836775e-06, + "loss": 0.0532, + "step": 26483 + }, + { + "epoch": 72.16348773841962, + "grad_norm": 2.5172135829925537, + "learning_rate": 3.796100481012571e-06, + "loss": 0.0315, + "step": 26484 + }, + { + "epoch": 72.16621253405995, + "grad_norm": 2.580249071121216, + "learning_rate": 3.7954083703572376e-06, + "loss": 0.0455, + "step": 26485 + }, + { + "epoch": 72.16893732970027, + "grad_norm": 3.4453303813934326, + "learning_rate": 3.7947163080230644e-06, + "loss": 0.1394, + "step": 26486 + }, + { + "epoch": 72.1716621253406, + "grad_norm": 2.4160969257354736, + "learning_rate": 3.7940242940154404e-06, + "loss": 0.0503, + "step": 26487 + }, + { + "epoch": 72.17438692098092, + "grad_norm": 5.730032920837402, + "learning_rate": 3.793332328339752e-06, + "loss": 0.0362, + "step": 26488 + }, + { + "epoch": 72.17711171662125, + "grad_norm": 3.2699761390686035, + "learning_rate": 3.7926404110013913e-06, + "loss": 0.1083, + "step": 26489 + }, + { + "epoch": 72.17983651226157, + "grad_norm": 3.17868971824646, + "learning_rate": 3.791948542005751e-06, + "loss": 0.0805, + "step": 26490 + }, + { + "epoch": 72.1825613079019, + "grad_norm": 2.672743797302246, + "learning_rate": 3.791256721358216e-06, + "loss": 0.096, + "step": 26491 + }, + { + "epoch": 72.18528610354224, + "grad_norm": 9.494412422180176, + "learning_rate": 3.7905649490641704e-06, + "loss": 0.1418, + "step": 26492 + }, + { + "epoch": 72.18801089918256, + "grad_norm": 2.820760726928711, + "learning_rate": 3.789873225129009e-06, + "loss": 0.0324, + "step": 26493 + }, + { + "epoch": 72.19073569482289, + "grad_norm": 6.814089298248291, + "learning_rate": 3.789181549558114e-06, + "loss": 0.1112, + "step": 26494 + }, + { + "epoch": 72.19346049046321, + "grad_norm": 3.728151559829712, + "learning_rate": 3.788489922356874e-06, + "loss": 0.0513, + "step": 26495 + }, + { + "epoch": 72.19618528610354, + "grad_norm": 3.132028579711914, + "learning_rate": 3.787798343530671e-06, + "loss": 0.035, + "step": 26496 + }, + { + "epoch": 72.19891008174388, + "grad_norm": 3.118652820587158, + "learning_rate": 3.7871068130848974e-06, + "loss": 0.0731, + "step": 26497 + }, + { + "epoch": 72.2016348773842, + "grad_norm": 3.4296882152557373, + "learning_rate": 3.7864153310249376e-06, + "loss": 0.0977, + "step": 26498 + }, + { + "epoch": 72.20435967302453, + "grad_norm": 2.929823637008667, + "learning_rate": 3.7857238973561737e-06, + "loss": 0.048, + "step": 26499 + }, + { + "epoch": 72.20708446866485, + "grad_norm": 4.002386569976807, + "learning_rate": 3.785032512083989e-06, + "loss": 0.0714, + "step": 26500 + }, + { + "epoch": 72.20980926430518, + "grad_norm": 2.456514835357666, + "learning_rate": 3.784341175213775e-06, + "loss": 0.0449, + "step": 26501 + }, + { + "epoch": 72.2125340599455, + "grad_norm": 2.193502187728882, + "learning_rate": 3.7836498867509108e-06, + "loss": 0.098, + "step": 26502 + }, + { + "epoch": 72.21525885558583, + "grad_norm": 3.205998420715332, + "learning_rate": 3.782958646700782e-06, + "loss": 0.1279, + "step": 26503 + }, + { + "epoch": 72.21798365122616, + "grad_norm": 3.640317916870117, + "learning_rate": 3.7822674550687676e-06, + "loss": 0.1048, + "step": 26504 + }, + { + "epoch": 72.22070844686648, + "grad_norm": 2.3547284603118896, + "learning_rate": 3.7815763118602577e-06, + "loss": 0.0247, + "step": 26505 + }, + { + "epoch": 72.22343324250681, + "grad_norm": 2.100797176361084, + "learning_rate": 3.7808852170806275e-06, + "loss": 0.0365, + "step": 26506 + }, + { + "epoch": 72.22615803814713, + "grad_norm": 1.5812318325042725, + "learning_rate": 3.780194170735266e-06, + "loss": 0.0248, + "step": 26507 + }, + { + "epoch": 72.22888283378747, + "grad_norm": 4.499730110168457, + "learning_rate": 3.779503172829554e-06, + "loss": 0.0948, + "step": 26508 + }, + { + "epoch": 72.2316076294278, + "grad_norm": 2.98199725151062, + "learning_rate": 3.778812223368866e-06, + "loss": 0.124, + "step": 26509 + }, + { + "epoch": 72.23433242506812, + "grad_norm": 3.3595364093780518, + "learning_rate": 3.778121322358592e-06, + "loss": 0.0216, + "step": 26510 + }, + { + "epoch": 72.23705722070845, + "grad_norm": 2.3541762828826904, + "learning_rate": 3.77743046980411e-06, + "loss": 0.0295, + "step": 26511 + }, + { + "epoch": 72.23978201634877, + "grad_norm": 3.811251401901245, + "learning_rate": 3.7767396657107936e-06, + "loss": 0.0624, + "step": 26512 + }, + { + "epoch": 72.2425068119891, + "grad_norm": 2.8131866455078125, + "learning_rate": 3.776048910084034e-06, + "loss": 0.0616, + "step": 26513 + }, + { + "epoch": 72.24523160762942, + "grad_norm": 2.430534601211548, + "learning_rate": 3.7753582029292037e-06, + "loss": 0.1069, + "step": 26514 + }, + { + "epoch": 72.24795640326975, + "grad_norm": 2.720771074295044, + "learning_rate": 3.774667544251683e-06, + "loss": 0.0496, + "step": 26515 + }, + { + "epoch": 72.25068119891009, + "grad_norm": 3.8845908641815186, + "learning_rate": 3.773976934056849e-06, + "loss": 0.0476, + "step": 26516 + }, + { + "epoch": 72.2534059945504, + "grad_norm": 3.750916004180908, + "learning_rate": 3.7732863723500855e-06, + "loss": 0.0674, + "step": 26517 + }, + { + "epoch": 72.25613079019074, + "grad_norm": 2.2411701679229736, + "learning_rate": 3.7725958591367675e-06, + "loss": 0.0319, + "step": 26518 + }, + { + "epoch": 72.25885558583106, + "grad_norm": 3.2152843475341797, + "learning_rate": 3.7719053944222715e-06, + "loss": 0.1024, + "step": 26519 + }, + { + "epoch": 72.26158038147139, + "grad_norm": 2.3171660900115967, + "learning_rate": 3.7712149782119733e-06, + "loss": 0.0278, + "step": 26520 + }, + { + "epoch": 72.26430517711172, + "grad_norm": 3.022448778152466, + "learning_rate": 3.770524610511256e-06, + "loss": 0.0471, + "step": 26521 + }, + { + "epoch": 72.26702997275204, + "grad_norm": 2.9819817543029785, + "learning_rate": 3.7698342913254913e-06, + "loss": 0.1696, + "step": 26522 + }, + { + "epoch": 72.26975476839237, + "grad_norm": 3.3681530952453613, + "learning_rate": 3.769144020660054e-06, + "loss": 0.0702, + "step": 26523 + }, + { + "epoch": 72.2724795640327, + "grad_norm": 3.5201833248138428, + "learning_rate": 3.7684537985203263e-06, + "loss": 0.128, + "step": 26524 + }, + { + "epoch": 72.27520435967303, + "grad_norm": 3.9061806201934814, + "learning_rate": 3.7677636249116755e-06, + "loss": 0.0609, + "step": 26525 + }, + { + "epoch": 72.27792915531334, + "grad_norm": 2.433267831802368, + "learning_rate": 3.7670734998394855e-06, + "loss": 0.1045, + "step": 26526 + }, + { + "epoch": 72.28065395095368, + "grad_norm": 3.156240224838257, + "learning_rate": 3.7663834233091257e-06, + "loss": 0.0474, + "step": 26527 + }, + { + "epoch": 72.28337874659401, + "grad_norm": 2.4976119995117188, + "learning_rate": 3.765693395325971e-06, + "loss": 0.0323, + "step": 26528 + }, + { + "epoch": 72.28610354223433, + "grad_norm": 4.028443813323975, + "learning_rate": 3.765003415895393e-06, + "loss": 0.1099, + "step": 26529 + }, + { + "epoch": 72.28882833787466, + "grad_norm": 2.569737672805786, + "learning_rate": 3.76431348502277e-06, + "loss": 0.0506, + "step": 26530 + }, + { + "epoch": 72.29155313351498, + "grad_norm": 3.3727774620056152, + "learning_rate": 3.7636236027134733e-06, + "loss": 0.0491, + "step": 26531 + }, + { + "epoch": 72.29427792915531, + "grad_norm": 10.414998054504395, + "learning_rate": 3.7629337689728763e-06, + "loss": 0.051, + "step": 26532 + }, + { + "epoch": 72.29700272479565, + "grad_norm": 2.196016788482666, + "learning_rate": 3.762243983806345e-06, + "loss": 0.0331, + "step": 26533 + }, + { + "epoch": 72.29972752043597, + "grad_norm": 4.307570457458496, + "learning_rate": 3.7615542472192624e-06, + "loss": 0.0653, + "step": 26534 + }, + { + "epoch": 72.3024523160763, + "grad_norm": 3.4602112770080566, + "learning_rate": 3.7608645592169935e-06, + "loss": 0.0495, + "step": 26535 + }, + { + "epoch": 72.30517711171662, + "grad_norm": 2.949125289916992, + "learning_rate": 3.7601749198049064e-06, + "loss": 0.0538, + "step": 26536 + }, + { + "epoch": 72.30790190735695, + "grad_norm": 3.042327880859375, + "learning_rate": 3.75948532898838e-06, + "loss": 0.1376, + "step": 26537 + }, + { + "epoch": 72.31062670299727, + "grad_norm": 3.713318109512329, + "learning_rate": 3.758795786772782e-06, + "loss": 0.0448, + "step": 26538 + }, + { + "epoch": 72.3133514986376, + "grad_norm": 3.653341770172119, + "learning_rate": 3.7581062931634802e-06, + "loss": 0.088, + "step": 26539 + }, + { + "epoch": 72.31607629427793, + "grad_norm": 2.4039220809936523, + "learning_rate": 3.7574168481658435e-06, + "loss": 0.0694, + "step": 26540 + }, + { + "epoch": 72.31880108991825, + "grad_norm": 2.4391045570373535, + "learning_rate": 3.7567274517852424e-06, + "loss": 0.0649, + "step": 26541 + }, + { + "epoch": 72.32152588555859, + "grad_norm": 2.974087715148926, + "learning_rate": 3.756038104027051e-06, + "loss": 0.167, + "step": 26542 + }, + { + "epoch": 72.3242506811989, + "grad_norm": 2.3259406089782715, + "learning_rate": 3.7553488048966346e-06, + "loss": 0.04, + "step": 26543 + }, + { + "epoch": 72.32697547683924, + "grad_norm": 3.064772844314575, + "learning_rate": 3.75465955439936e-06, + "loss": 0.0509, + "step": 26544 + }, + { + "epoch": 72.32970027247957, + "grad_norm": 2.7310149669647217, + "learning_rate": 3.7539703525405925e-06, + "loss": 0.048, + "step": 26545 + }, + { + "epoch": 72.33242506811989, + "grad_norm": 2.478053569793701, + "learning_rate": 3.7532811993257056e-06, + "loss": 0.0353, + "step": 26546 + }, + { + "epoch": 72.33514986376022, + "grad_norm": 2.859170436859131, + "learning_rate": 3.752592094760065e-06, + "loss": 0.0429, + "step": 26547 + }, + { + "epoch": 72.33787465940054, + "grad_norm": 3.3203647136688232, + "learning_rate": 3.751903038849034e-06, + "loss": 0.0537, + "step": 26548 + }, + { + "epoch": 72.34059945504087, + "grad_norm": 3.221702814102173, + "learning_rate": 3.7512140315979794e-06, + "loss": 0.1904, + "step": 26549 + }, + { + "epoch": 72.34332425068119, + "grad_norm": 2.855668783187866, + "learning_rate": 3.750525073012271e-06, + "loss": 0.1714, + "step": 26550 + }, + { + "epoch": 72.34604904632153, + "grad_norm": 3.7057361602783203, + "learning_rate": 3.7498361630972733e-06, + "loss": 0.0936, + "step": 26551 + }, + { + "epoch": 72.34877384196186, + "grad_norm": 2.206052303314209, + "learning_rate": 3.7491473018583503e-06, + "loss": 0.0285, + "step": 26552 + }, + { + "epoch": 72.35149863760218, + "grad_norm": 2.6182804107666016, + "learning_rate": 3.7484584893008634e-06, + "loss": 0.0312, + "step": 26553 + }, + { + "epoch": 72.35422343324251, + "grad_norm": 2.748892307281494, + "learning_rate": 3.7477697254301836e-06, + "loss": 0.0283, + "step": 26554 + }, + { + "epoch": 72.35694822888283, + "grad_norm": 3.3066937923431396, + "learning_rate": 3.7470810102516717e-06, + "loss": 0.0997, + "step": 26555 + }, + { + "epoch": 72.35967302452316, + "grad_norm": 2.5142152309417725, + "learning_rate": 3.7463923437706896e-06, + "loss": 0.0376, + "step": 26556 + }, + { + "epoch": 72.3623978201635, + "grad_norm": 2.5725595951080322, + "learning_rate": 3.7457037259926043e-06, + "loss": 0.0853, + "step": 26557 + }, + { + "epoch": 72.36512261580381, + "grad_norm": 2.77140212059021, + "learning_rate": 3.7450151569227743e-06, + "loss": 0.0989, + "step": 26558 + }, + { + "epoch": 72.36784741144415, + "grad_norm": 2.4653334617614746, + "learning_rate": 3.744326636566569e-06, + "loss": 0.0472, + "step": 26559 + }, + { + "epoch": 72.37057220708446, + "grad_norm": 3.0174481868743896, + "learning_rate": 3.7436381649293463e-06, + "loss": 0.0407, + "step": 26560 + }, + { + "epoch": 72.3732970027248, + "grad_norm": 3.057506561279297, + "learning_rate": 3.7429497420164638e-06, + "loss": 0.1448, + "step": 26561 + }, + { + "epoch": 72.37602179836512, + "grad_norm": 2.8814988136291504, + "learning_rate": 3.742261367833292e-06, + "loss": 0.0594, + "step": 26562 + }, + { + "epoch": 72.37874659400545, + "grad_norm": 3.040027618408203, + "learning_rate": 3.741573042385187e-06, + "loss": 0.0563, + "step": 26563 + }, + { + "epoch": 72.38147138964578, + "grad_norm": 2.5569448471069336, + "learning_rate": 3.740884765677509e-06, + "loss": 0.0541, + "step": 26564 + }, + { + "epoch": 72.3841961852861, + "grad_norm": 3.7037227153778076, + "learning_rate": 3.740196537715617e-06, + "loss": 0.0613, + "step": 26565 + }, + { + "epoch": 72.38692098092643, + "grad_norm": 2.6009268760681152, + "learning_rate": 3.7395083585048752e-06, + "loss": 0.0523, + "step": 26566 + }, + { + "epoch": 72.38964577656675, + "grad_norm": 4.700798034667969, + "learning_rate": 3.7388202280506413e-06, + "loss": 0.0878, + "step": 26567 + }, + { + "epoch": 72.39237057220708, + "grad_norm": 2.977999210357666, + "learning_rate": 3.738132146358273e-06, + "loss": 0.1726, + "step": 26568 + }, + { + "epoch": 72.39509536784742, + "grad_norm": 2.9839766025543213, + "learning_rate": 3.7374441134331276e-06, + "loss": 0.2143, + "step": 26569 + }, + { + "epoch": 72.39782016348774, + "grad_norm": 3.3047571182250977, + "learning_rate": 3.7367561292805686e-06, + "loss": 0.1686, + "step": 26570 + }, + { + "epoch": 72.40054495912807, + "grad_norm": 3.0683958530426025, + "learning_rate": 3.736068193905952e-06, + "loss": 0.1967, + "step": 26571 + }, + { + "epoch": 72.40326975476839, + "grad_norm": 1.989783525466919, + "learning_rate": 3.7353803073146343e-06, + "loss": 0.0271, + "step": 26572 + }, + { + "epoch": 72.40599455040872, + "grad_norm": 3.054657220840454, + "learning_rate": 3.73469246951197e-06, + "loss": 0.0312, + "step": 26573 + }, + { + "epoch": 72.40871934604904, + "grad_norm": 2.4195311069488525, + "learning_rate": 3.7340046805033224e-06, + "loss": 0.1068, + "step": 26574 + }, + { + "epoch": 72.41144414168937, + "grad_norm": 2.761606454849243, + "learning_rate": 3.7333169402940407e-06, + "loss": 0.234, + "step": 26575 + }, + { + "epoch": 72.4141689373297, + "grad_norm": 3.4567863941192627, + "learning_rate": 3.732629248889489e-06, + "loss": 0.1427, + "step": 26576 + }, + { + "epoch": 72.41689373297002, + "grad_norm": 3.849689245223999, + "learning_rate": 3.7319416062950154e-06, + "loss": 0.1498, + "step": 26577 + }, + { + "epoch": 72.41961852861036, + "grad_norm": 2.1619315147399902, + "learning_rate": 3.731254012515982e-06, + "loss": 0.0286, + "step": 26578 + }, + { + "epoch": 72.42234332425068, + "grad_norm": 3.229844570159912, + "learning_rate": 3.7305664675577415e-06, + "loss": 0.0593, + "step": 26579 + }, + { + "epoch": 72.42506811989101, + "grad_norm": 3.447657585144043, + "learning_rate": 3.729878971425647e-06, + "loss": 0.0839, + "step": 26580 + }, + { + "epoch": 72.42779291553134, + "grad_norm": 2.009647846221924, + "learning_rate": 3.72919152412505e-06, + "loss": 0.0259, + "step": 26581 + }, + { + "epoch": 72.43051771117166, + "grad_norm": 4.244502067565918, + "learning_rate": 3.7285041256613095e-06, + "loss": 0.0511, + "step": 26582 + }, + { + "epoch": 72.433242506812, + "grad_norm": 3.3259167671203613, + "learning_rate": 3.7278167760397788e-06, + "loss": 0.1067, + "step": 26583 + }, + { + "epoch": 72.43596730245231, + "grad_norm": 3.9733872413635254, + "learning_rate": 3.7271294752658093e-06, + "loss": 0.0612, + "step": 26584 + }, + { + "epoch": 72.43869209809264, + "grad_norm": 2.89430832862854, + "learning_rate": 3.7264422233447496e-06, + "loss": 0.046, + "step": 26585 + }, + { + "epoch": 72.44141689373296, + "grad_norm": 3.904181957244873, + "learning_rate": 3.7257550202819593e-06, + "loss": 0.3219, + "step": 26586 + }, + { + "epoch": 72.4441416893733, + "grad_norm": 2.950934886932373, + "learning_rate": 3.7250678660827867e-06, + "loss": 0.0394, + "step": 26587 + }, + { + "epoch": 72.44686648501363, + "grad_norm": 3.6347861289978027, + "learning_rate": 3.724380760752584e-06, + "loss": 0.0587, + "step": 26588 + }, + { + "epoch": 72.44959128065395, + "grad_norm": 3.4159059524536133, + "learning_rate": 3.723693704296698e-06, + "loss": 0.0834, + "step": 26589 + }, + { + "epoch": 72.45231607629428, + "grad_norm": 3.026069164276123, + "learning_rate": 3.723006696720487e-06, + "loss": 0.1139, + "step": 26590 + }, + { + "epoch": 72.4550408719346, + "grad_norm": 4.08567476272583, + "learning_rate": 3.7223197380292986e-06, + "loss": 0.0452, + "step": 26591 + }, + { + "epoch": 72.45776566757493, + "grad_norm": 3.3417935371398926, + "learning_rate": 3.7216328282284776e-06, + "loss": 0.2245, + "step": 26592 + }, + { + "epoch": 72.46049046321527, + "grad_norm": 3.017200231552124, + "learning_rate": 3.7209459673233817e-06, + "loss": 0.0349, + "step": 26593 + }, + { + "epoch": 72.46321525885558, + "grad_norm": 3.1273984909057617, + "learning_rate": 3.7202591553193534e-06, + "loss": 0.0397, + "step": 26594 + }, + { + "epoch": 72.46594005449592, + "grad_norm": 3.3112401962280273, + "learning_rate": 3.7195723922217487e-06, + "loss": 0.0501, + "step": 26595 + }, + { + "epoch": 72.46866485013624, + "grad_norm": 5.199794292449951, + "learning_rate": 3.7188856780359117e-06, + "loss": 0.0353, + "step": 26596 + }, + { + "epoch": 72.47138964577657, + "grad_norm": 4.355407238006592, + "learning_rate": 3.718199012767186e-06, + "loss": 0.3405, + "step": 26597 + }, + { + "epoch": 72.47411444141689, + "grad_norm": 3.16474986076355, + "learning_rate": 3.7175123964209293e-06, + "loss": 0.0604, + "step": 26598 + }, + { + "epoch": 72.47683923705722, + "grad_norm": 3.2281923294067383, + "learning_rate": 3.716825829002484e-06, + "loss": 0.0713, + "step": 26599 + }, + { + "epoch": 72.47956403269755, + "grad_norm": 3.2811269760131836, + "learning_rate": 3.716139310517196e-06, + "loss": 0.1078, + "step": 26600 + }, + { + "epoch": 72.48228882833787, + "grad_norm": 2.6293327808380127, + "learning_rate": 3.7154528409704095e-06, + "loss": 0.1453, + "step": 26601 + }, + { + "epoch": 72.4850136239782, + "grad_norm": 4.739869594573975, + "learning_rate": 3.714766420367478e-06, + "loss": 0.0462, + "step": 26602 + }, + { + "epoch": 72.48773841961852, + "grad_norm": 2.9011590480804443, + "learning_rate": 3.7140800487137428e-06, + "loss": 0.0772, + "step": 26603 + }, + { + "epoch": 72.49046321525886, + "grad_norm": 3.0490882396698, + "learning_rate": 3.71339372601455e-06, + "loss": 0.0356, + "step": 26604 + }, + { + "epoch": 72.49318801089919, + "grad_norm": 2.6441643238067627, + "learning_rate": 3.7127074522752416e-06, + "loss": 0.0935, + "step": 26605 + }, + { + "epoch": 72.49591280653951, + "grad_norm": 3.0331103801727295, + "learning_rate": 3.712021227501168e-06, + "loss": 0.0676, + "step": 26606 + }, + { + "epoch": 72.49863760217984, + "grad_norm": 3.3428590297698975, + "learning_rate": 3.711335051697671e-06, + "loss": 0.1346, + "step": 26607 + }, + { + "epoch": 72.50136239782016, + "grad_norm": 2.761168956756592, + "learning_rate": 3.710648924870094e-06, + "loss": 0.0494, + "step": 26608 + }, + { + "epoch": 72.50408719346049, + "grad_norm": 2.2414186000823975, + "learning_rate": 3.709962847023777e-06, + "loss": 0.1006, + "step": 26609 + }, + { + "epoch": 72.50681198910081, + "grad_norm": 1.9201786518096924, + "learning_rate": 3.709276818164067e-06, + "loss": 0.1983, + "step": 26610 + }, + { + "epoch": 72.50953678474114, + "grad_norm": 2.128126621246338, + "learning_rate": 3.708590838296311e-06, + "loss": 0.0338, + "step": 26611 + }, + { + "epoch": 72.51226158038148, + "grad_norm": 5.717984199523926, + "learning_rate": 3.7079049074258465e-06, + "loss": 0.0615, + "step": 26612 + }, + { + "epoch": 72.5149863760218, + "grad_norm": 2.956634283065796, + "learning_rate": 3.7072190255580153e-06, + "loss": 0.0443, + "step": 26613 + }, + { + "epoch": 72.51771117166213, + "grad_norm": 3.8963871002197266, + "learning_rate": 3.7065331926981573e-06, + "loss": 0.0396, + "step": 26614 + }, + { + "epoch": 72.52043596730245, + "grad_norm": 2.367657423019409, + "learning_rate": 3.7058474088516194e-06, + "loss": 0.0296, + "step": 26615 + }, + { + "epoch": 72.52316076294278, + "grad_norm": 3.041741132736206, + "learning_rate": 3.7051616740237396e-06, + "loss": 0.0977, + "step": 26616 + }, + { + "epoch": 72.52588555858311, + "grad_norm": 2.3505899906158447, + "learning_rate": 3.7044759882198576e-06, + "loss": 0.0529, + "step": 26617 + }, + { + "epoch": 72.52861035422343, + "grad_norm": 2.8662209510803223, + "learning_rate": 3.703790351445311e-06, + "loss": 0.1394, + "step": 26618 + }, + { + "epoch": 72.53133514986376, + "grad_norm": 3.9677467346191406, + "learning_rate": 3.703104763705446e-06, + "loss": 0.0593, + "step": 26619 + }, + { + "epoch": 72.53405994550408, + "grad_norm": 3.4518957138061523, + "learning_rate": 3.702419225005598e-06, + "loss": 0.1954, + "step": 26620 + }, + { + "epoch": 72.53678474114442, + "grad_norm": 2.4246394634246826, + "learning_rate": 3.701733735351103e-06, + "loss": 0.055, + "step": 26621 + }, + { + "epoch": 72.53950953678473, + "grad_norm": 2.5853323936462402, + "learning_rate": 3.701048294747307e-06, + "loss": 0.0369, + "step": 26622 + }, + { + "epoch": 72.54223433242507, + "grad_norm": 3.6149227619171143, + "learning_rate": 3.7003629031995436e-06, + "loss": 0.1518, + "step": 26623 + }, + { + "epoch": 72.5449591280654, + "grad_norm": 3.3796393871307373, + "learning_rate": 3.6996775607131507e-06, + "loss": 0.0401, + "step": 26624 + }, + { + "epoch": 72.54768392370572, + "grad_norm": 3.288841724395752, + "learning_rate": 3.698992267293464e-06, + "loss": 0.0923, + "step": 26625 + }, + { + "epoch": 72.55040871934605, + "grad_norm": 3.312417984008789, + "learning_rate": 3.6983070229458216e-06, + "loss": 0.0473, + "step": 26626 + }, + { + "epoch": 72.55313351498637, + "grad_norm": 2.734294891357422, + "learning_rate": 3.6976218276755647e-06, + "loss": 0.0445, + "step": 26627 + }, + { + "epoch": 72.5558583106267, + "grad_norm": 2.6206490993499756, + "learning_rate": 3.696936681488027e-06, + "loss": 0.0338, + "step": 26628 + }, + { + "epoch": 72.55858310626704, + "grad_norm": 2.402534246444702, + "learning_rate": 3.696251584388544e-06, + "loss": 0.0339, + "step": 26629 + }, + { + "epoch": 72.56130790190736, + "grad_norm": 3.5467193126678467, + "learning_rate": 3.6955665363824455e-06, + "loss": 0.1125, + "step": 26630 + }, + { + "epoch": 72.56403269754769, + "grad_norm": 3.2578461170196533, + "learning_rate": 3.694881537475077e-06, + "loss": 0.048, + "step": 26631 + }, + { + "epoch": 72.566757493188, + "grad_norm": 3.4806723594665527, + "learning_rate": 3.6941965876717667e-06, + "loss": 0.065, + "step": 26632 + }, + { + "epoch": 72.56948228882834, + "grad_norm": 3.2064919471740723, + "learning_rate": 3.693511686977852e-06, + "loss": 0.0941, + "step": 26633 + }, + { + "epoch": 72.57220708446866, + "grad_norm": 2.320227861404419, + "learning_rate": 3.692826835398661e-06, + "loss": 0.0995, + "step": 26634 + }, + { + "epoch": 72.57493188010899, + "grad_norm": 3.9799299240112305, + "learning_rate": 3.692142032939535e-06, + "loss": 0.1618, + "step": 26635 + }, + { + "epoch": 72.57765667574932, + "grad_norm": 2.474313497543335, + "learning_rate": 3.6914572796058033e-06, + "loss": 0.0265, + "step": 26636 + }, + { + "epoch": 72.58038147138964, + "grad_norm": 3.85147762298584, + "learning_rate": 3.6907725754028e-06, + "loss": 0.0505, + "step": 26637 + }, + { + "epoch": 72.58310626702998, + "grad_norm": 2.8720130920410156, + "learning_rate": 3.6900879203358543e-06, + "loss": 0.0906, + "step": 26638 + }, + { + "epoch": 72.5858310626703, + "grad_norm": 4.143994331359863, + "learning_rate": 3.6894033144103025e-06, + "loss": 0.2785, + "step": 26639 + }, + { + "epoch": 72.58855585831063, + "grad_norm": 2.5250139236450195, + "learning_rate": 3.6887187576314755e-06, + "loss": 0.0484, + "step": 26640 + }, + { + "epoch": 72.59128065395096, + "grad_norm": 2.678302526473999, + "learning_rate": 3.688034250004704e-06, + "loss": 0.0388, + "step": 26641 + }, + { + "epoch": 72.59400544959128, + "grad_norm": 3.1381940841674805, + "learning_rate": 3.687349791535314e-06, + "loss": 0.0447, + "step": 26642 + }, + { + "epoch": 72.59673024523161, + "grad_norm": 2.558359146118164, + "learning_rate": 3.6866653822286457e-06, + "loss": 0.0561, + "step": 26643 + }, + { + "epoch": 72.59945504087193, + "grad_norm": 2.7017393112182617, + "learning_rate": 3.685981022090019e-06, + "loss": 0.0344, + "step": 26644 + }, + { + "epoch": 72.60217983651226, + "grad_norm": 3.1276755332946777, + "learning_rate": 3.685296711124774e-06, + "loss": 0.0422, + "step": 26645 + }, + { + "epoch": 72.60490463215258, + "grad_norm": 4.713883876800537, + "learning_rate": 3.684612449338231e-06, + "loss": 0.1321, + "step": 26646 + }, + { + "epoch": 72.60762942779292, + "grad_norm": 2.7960073947906494, + "learning_rate": 3.6839282367357256e-06, + "loss": 0.0768, + "step": 26647 + }, + { + "epoch": 72.61035422343325, + "grad_norm": 2.353724479675293, + "learning_rate": 3.683244073322584e-06, + "loss": 0.0423, + "step": 26648 + }, + { + "epoch": 72.61307901907357, + "grad_norm": 2.059302568435669, + "learning_rate": 3.682559959104135e-06, + "loss": 0.0322, + "step": 26649 + }, + { + "epoch": 72.6158038147139, + "grad_norm": 5.215627193450928, + "learning_rate": 3.6818758940857014e-06, + "loss": 0.0433, + "step": 26650 + }, + { + "epoch": 72.61852861035422, + "grad_norm": 2.479736089706421, + "learning_rate": 3.6811918782726197e-06, + "loss": 0.0568, + "step": 26651 + }, + { + "epoch": 72.62125340599455, + "grad_norm": 7.511143684387207, + "learning_rate": 3.680507911670211e-06, + "loss": 0.0508, + "step": 26652 + }, + { + "epoch": 72.62397820163488, + "grad_norm": 2.905149221420288, + "learning_rate": 3.6798239942838042e-06, + "loss": 0.0319, + "step": 26653 + }, + { + "epoch": 72.6267029972752, + "grad_norm": 3.5439958572387695, + "learning_rate": 3.679140126118721e-06, + "loss": 0.0714, + "step": 26654 + }, + { + "epoch": 72.62942779291554, + "grad_norm": 2.8212172985076904, + "learning_rate": 3.6784563071802935e-06, + "loss": 0.0584, + "step": 26655 + }, + { + "epoch": 72.63215258855585, + "grad_norm": 2.913501739501953, + "learning_rate": 3.677772537473846e-06, + "loss": 0.0654, + "step": 26656 + }, + { + "epoch": 72.63487738419619, + "grad_norm": 3.516343832015991, + "learning_rate": 3.6770888170047026e-06, + "loss": 0.0756, + "step": 26657 + }, + { + "epoch": 72.6376021798365, + "grad_norm": 2.9517154693603516, + "learning_rate": 3.6764051457781836e-06, + "loss": 0.0375, + "step": 26658 + }, + { + "epoch": 72.64032697547684, + "grad_norm": 2.010986804962158, + "learning_rate": 3.6757215237996225e-06, + "loss": 0.0317, + "step": 26659 + }, + { + "epoch": 72.64305177111717, + "grad_norm": 2.282716751098633, + "learning_rate": 3.6750379510743374e-06, + "loss": 0.0457, + "step": 26660 + }, + { + "epoch": 72.64577656675749, + "grad_norm": 2.6153957843780518, + "learning_rate": 3.6743544276076503e-06, + "loss": 0.0641, + "step": 26661 + }, + { + "epoch": 72.64850136239782, + "grad_norm": 2.0542514324188232, + "learning_rate": 3.6736709534048877e-06, + "loss": 0.0901, + "step": 26662 + }, + { + "epoch": 72.65122615803814, + "grad_norm": 2.8648242950439453, + "learning_rate": 3.6729875284713746e-06, + "loss": 0.1693, + "step": 26663 + }, + { + "epoch": 72.65395095367847, + "grad_norm": 3.498901605606079, + "learning_rate": 3.6723041528124314e-06, + "loss": 0.1068, + "step": 26664 + }, + { + "epoch": 72.65667574931881, + "grad_norm": 2.831108808517456, + "learning_rate": 3.67162082643338e-06, + "loss": 0.06, + "step": 26665 + }, + { + "epoch": 72.65940054495913, + "grad_norm": 1.8966275453567505, + "learning_rate": 3.6709375493395383e-06, + "loss": 0.098, + "step": 26666 + }, + { + "epoch": 72.66212534059946, + "grad_norm": 2.278327465057373, + "learning_rate": 3.670254321536235e-06, + "loss": 0.026, + "step": 26667 + }, + { + "epoch": 72.66485013623978, + "grad_norm": 2.6790900230407715, + "learning_rate": 3.6695711430287873e-06, + "loss": 0.0507, + "step": 26668 + }, + { + "epoch": 72.66757493188011, + "grad_norm": 3.771758794784546, + "learning_rate": 3.6688880138225158e-06, + "loss": 0.057, + "step": 26669 + }, + { + "epoch": 72.67029972752043, + "grad_norm": 4.955124855041504, + "learning_rate": 3.6682049339227364e-06, + "loss": 0.1053, + "step": 26670 + }, + { + "epoch": 72.67302452316076, + "grad_norm": 3.757066011428833, + "learning_rate": 3.6675219033347775e-06, + "loss": 0.1213, + "step": 26671 + }, + { + "epoch": 72.6757493188011, + "grad_norm": 3.1228342056274414, + "learning_rate": 3.6668389220639545e-06, + "loss": 0.075, + "step": 26672 + }, + { + "epoch": 72.67847411444141, + "grad_norm": 3.0710763931274414, + "learning_rate": 3.6661559901155852e-06, + "loss": 0.0684, + "step": 26673 + }, + { + "epoch": 72.68119891008175, + "grad_norm": 3.2185308933258057, + "learning_rate": 3.6654731074949856e-06, + "loss": 0.0791, + "step": 26674 + }, + { + "epoch": 72.68392370572207, + "grad_norm": 7.934180736541748, + "learning_rate": 3.6647902742074825e-06, + "loss": 0.1657, + "step": 26675 + }, + { + "epoch": 72.6866485013624, + "grad_norm": 4.300521373748779, + "learning_rate": 3.6641074902583875e-06, + "loss": 0.0225, + "step": 26676 + }, + { + "epoch": 72.68937329700273, + "grad_norm": 2.9716007709503174, + "learning_rate": 3.66342475565302e-06, + "loss": 0.064, + "step": 26677 + }, + { + "epoch": 72.69209809264305, + "grad_norm": 3.14971661567688, + "learning_rate": 3.662742070396693e-06, + "loss": 0.0609, + "step": 26678 + }, + { + "epoch": 72.69482288828338, + "grad_norm": 3.2120299339294434, + "learning_rate": 3.662059434494727e-06, + "loss": 0.0929, + "step": 26679 + }, + { + "epoch": 72.6975476839237, + "grad_norm": 3.51916766166687, + "learning_rate": 3.6613768479524413e-06, + "loss": 0.1384, + "step": 26680 + }, + { + "epoch": 72.70027247956403, + "grad_norm": 4.655309677124023, + "learning_rate": 3.660694310775148e-06, + "loss": 0.1508, + "step": 26681 + }, + { + "epoch": 72.70299727520435, + "grad_norm": 3.1374423503875732, + "learning_rate": 3.6600118229681646e-06, + "loss": 0.0478, + "step": 26682 + }, + { + "epoch": 72.70572207084469, + "grad_norm": 2.7924439907073975, + "learning_rate": 3.6593293845368018e-06, + "loss": 0.0433, + "step": 26683 + }, + { + "epoch": 72.70844686648502, + "grad_norm": 3.6497044563293457, + "learning_rate": 3.65864699548638e-06, + "loss": 0.1211, + "step": 26684 + }, + { + "epoch": 72.71117166212534, + "grad_norm": 3.0881779193878174, + "learning_rate": 3.6579646558222117e-06, + "loss": 0.1173, + "step": 26685 + }, + { + "epoch": 72.71389645776567, + "grad_norm": 3.23443603515625, + "learning_rate": 3.657282365549607e-06, + "loss": 0.164, + "step": 26686 + }, + { + "epoch": 72.71662125340599, + "grad_norm": 3.1497604846954346, + "learning_rate": 3.656600124673887e-06, + "loss": 0.0569, + "step": 26687 + }, + { + "epoch": 72.71934604904632, + "grad_norm": 2.4993958473205566, + "learning_rate": 3.6559179332003603e-06, + "loss": 0.0498, + "step": 26688 + }, + { + "epoch": 72.72207084468666, + "grad_norm": 2.9620442390441895, + "learning_rate": 3.6552357911343416e-06, + "loss": 0.1731, + "step": 26689 + }, + { + "epoch": 72.72479564032697, + "grad_norm": 3.671299695968628, + "learning_rate": 3.654553698481138e-06, + "loss": 0.0831, + "step": 26690 + }, + { + "epoch": 72.7275204359673, + "grad_norm": 3.332897901535034, + "learning_rate": 3.6538716552460708e-06, + "loss": 0.0389, + "step": 26691 + }, + { + "epoch": 72.73024523160763, + "grad_norm": 3.292475461959839, + "learning_rate": 3.6531896614344454e-06, + "loss": 0.1481, + "step": 26692 + }, + { + "epoch": 72.73297002724796, + "grad_norm": 2.9264400005340576, + "learning_rate": 3.6525077170515755e-06, + "loss": 0.0834, + "step": 26693 + }, + { + "epoch": 72.73569482288828, + "grad_norm": 4.83539342880249, + "learning_rate": 3.651825822102767e-06, + "loss": 0.0667, + "step": 26694 + }, + { + "epoch": 72.73841961852861, + "grad_norm": 3.4476091861724854, + "learning_rate": 3.6511439765933355e-06, + "loss": 0.0489, + "step": 26695 + }, + { + "epoch": 72.74114441416894, + "grad_norm": 2.714822292327881, + "learning_rate": 3.6504621805285935e-06, + "loss": 0.0454, + "step": 26696 + }, + { + "epoch": 72.74386920980926, + "grad_norm": 2.8618080615997314, + "learning_rate": 3.6497804339138463e-06, + "loss": 0.046, + "step": 26697 + }, + { + "epoch": 72.7465940054496, + "grad_norm": 2.8192522525787354, + "learning_rate": 3.649098736754406e-06, + "loss": 0.2039, + "step": 26698 + }, + { + "epoch": 72.74931880108991, + "grad_norm": 2.843562602996826, + "learning_rate": 3.648417089055577e-06, + "loss": 0.0672, + "step": 26699 + }, + { + "epoch": 72.75204359673025, + "grad_norm": 3.9819788932800293, + "learning_rate": 3.647735490822675e-06, + "loss": 0.1324, + "step": 26700 + }, + { + "epoch": 72.75476839237058, + "grad_norm": 11.397708892822266, + "learning_rate": 3.647053942061004e-06, + "loss": 0.1266, + "step": 26701 + }, + { + "epoch": 72.7574931880109, + "grad_norm": 3.057208299636841, + "learning_rate": 3.646372442775873e-06, + "loss": 0.0311, + "step": 26702 + }, + { + "epoch": 72.76021798365123, + "grad_norm": 2.358063220977783, + "learning_rate": 3.645690992972585e-06, + "loss": 0.0453, + "step": 26703 + }, + { + "epoch": 72.76294277929155, + "grad_norm": 1.9550522565841675, + "learning_rate": 3.6450095926564542e-06, + "loss": 0.1477, + "step": 26704 + }, + { + "epoch": 72.76566757493188, + "grad_norm": 3.588242769241333, + "learning_rate": 3.6443282418327853e-06, + "loss": 0.1253, + "step": 26705 + }, + { + "epoch": 72.7683923705722, + "grad_norm": 2.846660852432251, + "learning_rate": 3.6436469405068787e-06, + "loss": 0.066, + "step": 26706 + }, + { + "epoch": 72.77111716621253, + "grad_norm": 7.941333770751953, + "learning_rate": 3.642965688684049e-06, + "loss": 0.1424, + "step": 26707 + }, + { + "epoch": 72.77384196185287, + "grad_norm": 2.316028118133545, + "learning_rate": 3.6422844863695983e-06, + "loss": 0.0395, + "step": 26708 + }, + { + "epoch": 72.77656675749319, + "grad_norm": 3.421424150466919, + "learning_rate": 3.6416033335688306e-06, + "loss": 0.0837, + "step": 26709 + }, + { + "epoch": 72.77929155313352, + "grad_norm": 2.974992513656616, + "learning_rate": 3.6409222302870494e-06, + "loss": 0.1099, + "step": 26710 + }, + { + "epoch": 72.78201634877384, + "grad_norm": 2.0351364612579346, + "learning_rate": 3.640241176529563e-06, + "loss": 0.0329, + "step": 26711 + }, + { + "epoch": 72.78474114441417, + "grad_norm": 3.1755497455596924, + "learning_rate": 3.6395601723016714e-06, + "loss": 0.0704, + "step": 26712 + }, + { + "epoch": 72.7874659400545, + "grad_norm": 2.6936593055725098, + "learning_rate": 3.638879217608684e-06, + "loss": 0.0381, + "step": 26713 + }, + { + "epoch": 72.79019073569482, + "grad_norm": 2.541172504425049, + "learning_rate": 3.6381983124558994e-06, + "loss": 0.05, + "step": 26714 + }, + { + "epoch": 72.79291553133515, + "grad_norm": 2.3149075508117676, + "learning_rate": 3.637517456848619e-06, + "loss": 0.0375, + "step": 26715 + }, + { + "epoch": 72.79564032697547, + "grad_norm": 2.674375295639038, + "learning_rate": 3.6368366507921514e-06, + "loss": 0.0748, + "step": 26716 + }, + { + "epoch": 72.7983651226158, + "grad_norm": 3.304030656814575, + "learning_rate": 3.636155894291795e-06, + "loss": 0.0609, + "step": 26717 + }, + { + "epoch": 72.80108991825612, + "grad_norm": 2.0676522254943848, + "learning_rate": 3.6354751873528515e-06, + "loss": 0.0558, + "step": 26718 + }, + { + "epoch": 72.80381471389646, + "grad_norm": 1.728627324104309, + "learning_rate": 3.634794529980619e-06, + "loss": 0.027, + "step": 26719 + }, + { + "epoch": 72.80653950953679, + "grad_norm": 2.3659069538116455, + "learning_rate": 3.6341139221804057e-06, + "loss": 0.0548, + "step": 26720 + }, + { + "epoch": 72.80926430517711, + "grad_norm": 3.3464324474334717, + "learning_rate": 3.633433363957507e-06, + "loss": 0.0561, + "step": 26721 + }, + { + "epoch": 72.81198910081744, + "grad_norm": 4.956269264221191, + "learning_rate": 3.6327528553172252e-06, + "loss": 0.0505, + "step": 26722 + }, + { + "epoch": 72.81471389645776, + "grad_norm": 2.6530561447143555, + "learning_rate": 3.6320723962648564e-06, + "loss": 0.0955, + "step": 26723 + }, + { + "epoch": 72.8174386920981, + "grad_norm": 3.5711658000946045, + "learning_rate": 3.631391986805706e-06, + "loss": 0.1004, + "step": 26724 + }, + { + "epoch": 72.82016348773843, + "grad_norm": 3.119831085205078, + "learning_rate": 3.6307116269450692e-06, + "loss": 0.1096, + "step": 26725 + }, + { + "epoch": 72.82288828337875, + "grad_norm": 2.1545567512512207, + "learning_rate": 3.630031316688245e-06, + "loss": 0.0499, + "step": 26726 + }, + { + "epoch": 72.82561307901908, + "grad_norm": 5.135312080383301, + "learning_rate": 3.62935105604053e-06, + "loss": 0.0863, + "step": 26727 + }, + { + "epoch": 72.8283378746594, + "grad_norm": 3.198873996734619, + "learning_rate": 3.628670845007226e-06, + "loss": 0.172, + "step": 26728 + }, + { + "epoch": 72.83106267029973, + "grad_norm": 2.5908055305480957, + "learning_rate": 3.6279906835936287e-06, + "loss": 0.047, + "step": 26729 + }, + { + "epoch": 72.83378746594005, + "grad_norm": 10.214290618896484, + "learning_rate": 3.627310571805032e-06, + "loss": 0.0654, + "step": 26730 + }, + { + "epoch": 72.83651226158038, + "grad_norm": 2.863939046859741, + "learning_rate": 3.626630509646735e-06, + "loss": 0.1027, + "step": 26731 + }, + { + "epoch": 72.83923705722071, + "grad_norm": 2.706066370010376, + "learning_rate": 3.625950497124038e-06, + "loss": 0.0346, + "step": 26732 + }, + { + "epoch": 72.84196185286103, + "grad_norm": 3.4561679363250732, + "learning_rate": 3.6252705342422335e-06, + "loss": 0.071, + "step": 26733 + }, + { + "epoch": 72.84468664850137, + "grad_norm": 3.2190403938293457, + "learning_rate": 3.6245906210066163e-06, + "loss": 0.058, + "step": 26734 + }, + { + "epoch": 72.84741144414168, + "grad_norm": 2.655494213104248, + "learning_rate": 3.6239107574224785e-06, + "loss": 0.08, + "step": 26735 + }, + { + "epoch": 72.85013623978202, + "grad_norm": 3.1073572635650635, + "learning_rate": 3.623230943495123e-06, + "loss": 0.062, + "step": 26736 + }, + { + "epoch": 72.85286103542235, + "grad_norm": 2.9819273948669434, + "learning_rate": 3.6225511792298397e-06, + "loss": 0.0703, + "step": 26737 + }, + { + "epoch": 72.85558583106267, + "grad_norm": 3.415374517440796, + "learning_rate": 3.621871464631922e-06, + "loss": 0.0901, + "step": 26738 + }, + { + "epoch": 72.858310626703, + "grad_norm": 2.0922327041625977, + "learning_rate": 3.6211917997066603e-06, + "loss": 0.0298, + "step": 26739 + }, + { + "epoch": 72.86103542234332, + "grad_norm": 3.240495204925537, + "learning_rate": 3.620512184459356e-06, + "loss": 0.1008, + "step": 26740 + }, + { + "epoch": 72.86376021798365, + "grad_norm": 4.21572732925415, + "learning_rate": 3.619832618895297e-06, + "loss": 0.1594, + "step": 26741 + }, + { + "epoch": 72.86648501362397, + "grad_norm": 3.3194217681884766, + "learning_rate": 3.619153103019776e-06, + "loss": 0.244, + "step": 26742 + }, + { + "epoch": 72.8692098092643, + "grad_norm": 2.888566732406616, + "learning_rate": 3.6184736368380813e-06, + "loss": 0.2054, + "step": 26743 + }, + { + "epoch": 72.87193460490464, + "grad_norm": 2.522555351257324, + "learning_rate": 3.6177942203555125e-06, + "loss": 0.049, + "step": 26744 + }, + { + "epoch": 72.87465940054496, + "grad_norm": 2.3681910037994385, + "learning_rate": 3.617114853577357e-06, + "loss": 0.0834, + "step": 26745 + }, + { + "epoch": 72.87738419618529, + "grad_norm": 2.3938636779785156, + "learning_rate": 3.6164355365089067e-06, + "loss": 0.0289, + "step": 26746 + }, + { + "epoch": 72.88010899182561, + "grad_norm": 2.468428373336792, + "learning_rate": 3.615756269155446e-06, + "loss": 0.029, + "step": 26747 + }, + { + "epoch": 72.88283378746594, + "grad_norm": 2.586638927459717, + "learning_rate": 3.61507705152227e-06, + "loss": 0.1221, + "step": 26748 + }, + { + "epoch": 72.88555858310627, + "grad_norm": 2.7505125999450684, + "learning_rate": 3.6143978836146733e-06, + "loss": 0.0405, + "step": 26749 + }, + { + "epoch": 72.88828337874659, + "grad_norm": 3.3790388107299805, + "learning_rate": 3.613718765437939e-06, + "loss": 0.0671, + "step": 26750 + }, + { + "epoch": 72.89100817438693, + "grad_norm": 3.445241928100586, + "learning_rate": 3.6130396969973546e-06, + "loss": 0.0962, + "step": 26751 + }, + { + "epoch": 72.89373297002724, + "grad_norm": 2.545253038406372, + "learning_rate": 3.6123606782982147e-06, + "loss": 0.0629, + "step": 26752 + }, + { + "epoch": 72.89645776566758, + "grad_norm": 2.597722291946411, + "learning_rate": 3.6116817093458034e-06, + "loss": 0.0369, + "step": 26753 + }, + { + "epoch": 72.8991825613079, + "grad_norm": 4.2187581062316895, + "learning_rate": 3.61100279014541e-06, + "loss": 0.1163, + "step": 26754 + }, + { + "epoch": 72.90190735694823, + "grad_norm": 2.331432819366455, + "learning_rate": 3.610323920702319e-06, + "loss": 0.0714, + "step": 26755 + }, + { + "epoch": 72.90463215258856, + "grad_norm": 2.561901807785034, + "learning_rate": 3.6096451010218214e-06, + "loss": 0.2032, + "step": 26756 + }, + { + "epoch": 72.90735694822888, + "grad_norm": 4.418798923492432, + "learning_rate": 3.6089663311092025e-06, + "loss": 0.0755, + "step": 26757 + }, + { + "epoch": 72.91008174386921, + "grad_norm": 2.8942484855651855, + "learning_rate": 3.6082876109697485e-06, + "loss": 0.0472, + "step": 26758 + }, + { + "epoch": 72.91280653950953, + "grad_norm": 3.2254064083099365, + "learning_rate": 3.607608940608741e-06, + "loss": 0.0389, + "step": 26759 + }, + { + "epoch": 72.91553133514986, + "grad_norm": 2.458869457244873, + "learning_rate": 3.606930320031474e-06, + "loss": 0.0553, + "step": 26760 + }, + { + "epoch": 72.9182561307902, + "grad_norm": 2.1937780380249023, + "learning_rate": 3.606251749243227e-06, + "loss": 0.0553, + "step": 26761 + }, + { + "epoch": 72.92098092643052, + "grad_norm": 3.7588653564453125, + "learning_rate": 3.605573228249285e-06, + "loss": 0.034, + "step": 26762 + }, + { + "epoch": 72.92370572207085, + "grad_norm": 2.7398927211761475, + "learning_rate": 3.604894757054931e-06, + "loss": 0.0645, + "step": 26763 + }, + { + "epoch": 72.92643051771117, + "grad_norm": 3.0189967155456543, + "learning_rate": 3.604216335665449e-06, + "loss": 0.0494, + "step": 26764 + }, + { + "epoch": 72.9291553133515, + "grad_norm": 2.9006359577178955, + "learning_rate": 3.603537964086129e-06, + "loss": 0.0943, + "step": 26765 + }, + { + "epoch": 72.93188010899182, + "grad_norm": 2.7495157718658447, + "learning_rate": 3.6028596423222484e-06, + "loss": 0.0894, + "step": 26766 + }, + { + "epoch": 72.93460490463215, + "grad_norm": 3.0567915439605713, + "learning_rate": 3.602181370379092e-06, + "loss": 0.0565, + "step": 26767 + }, + { + "epoch": 72.93732970027249, + "grad_norm": 2.584810972213745, + "learning_rate": 3.601503148261938e-06, + "loss": 0.0321, + "step": 26768 + }, + { + "epoch": 72.9400544959128, + "grad_norm": 3.017181396484375, + "learning_rate": 3.6008249759760737e-06, + "loss": 0.0334, + "step": 26769 + }, + { + "epoch": 72.94277929155314, + "grad_norm": 2.5840861797332764, + "learning_rate": 3.600146853526779e-06, + "loss": 0.0415, + "step": 26770 + }, + { + "epoch": 72.94550408719346, + "grad_norm": 5.155364036560059, + "learning_rate": 3.5994687809193317e-06, + "loss": 0.1858, + "step": 26771 + }, + { + "epoch": 72.94822888283379, + "grad_norm": 4.191073417663574, + "learning_rate": 3.598790758159019e-06, + "loss": 0.0839, + "step": 26772 + }, + { + "epoch": 72.95095367847412, + "grad_norm": 2.381028890609741, + "learning_rate": 3.5981127852511178e-06, + "loss": 0.1546, + "step": 26773 + }, + { + "epoch": 72.95367847411444, + "grad_norm": 3.2304797172546387, + "learning_rate": 3.5974348622009083e-06, + "loss": 0.0593, + "step": 26774 + }, + { + "epoch": 72.95640326975477, + "grad_norm": 4.244482517242432, + "learning_rate": 3.5967569890136654e-06, + "loss": 0.0524, + "step": 26775 + }, + { + "epoch": 72.95912806539509, + "grad_norm": 4.18062162399292, + "learning_rate": 3.596079165694677e-06, + "loss": 0.0507, + "step": 26776 + }, + { + "epoch": 72.96185286103542, + "grad_norm": 2.614755153656006, + "learning_rate": 3.595401392249218e-06, + "loss": 0.0442, + "step": 26777 + }, + { + "epoch": 72.96457765667574, + "grad_norm": 3.563538074493408, + "learning_rate": 3.5947236686825683e-06, + "loss": 0.0445, + "step": 26778 + }, + { + "epoch": 72.96730245231608, + "grad_norm": 2.8035526275634766, + "learning_rate": 3.5940459949999995e-06, + "loss": 0.0846, + "step": 26779 + }, + { + "epoch": 72.97002724795641, + "grad_norm": 2.8743069171905518, + "learning_rate": 3.593368371206798e-06, + "loss": 0.1351, + "step": 26780 + }, + { + "epoch": 72.97275204359673, + "grad_norm": 3.3925259113311768, + "learning_rate": 3.5926907973082335e-06, + "loss": 0.0862, + "step": 26781 + }, + { + "epoch": 72.97547683923706, + "grad_norm": 23.501739501953125, + "learning_rate": 3.5920132733095912e-06, + "loss": 0.2362, + "step": 26782 + }, + { + "epoch": 72.97820163487738, + "grad_norm": 3.532512664794922, + "learning_rate": 3.5913357992161422e-06, + "loss": 0.1372, + "step": 26783 + }, + { + "epoch": 72.98092643051771, + "grad_norm": 2.8155605792999268, + "learning_rate": 3.5906583750331614e-06, + "loss": 0.1241, + "step": 26784 + }, + { + "epoch": 72.98365122615803, + "grad_norm": 2.777841091156006, + "learning_rate": 3.5899810007659296e-06, + "loss": 0.0543, + "step": 26785 + }, + { + "epoch": 72.98637602179836, + "grad_norm": 3.0467355251312256, + "learning_rate": 3.589303676419721e-06, + "loss": 0.1655, + "step": 26786 + }, + { + "epoch": 72.9891008174387, + "grad_norm": 3.370142698287964, + "learning_rate": 3.5886264019998074e-06, + "loss": 0.0341, + "step": 26787 + }, + { + "epoch": 72.99182561307902, + "grad_norm": 4.560024261474609, + "learning_rate": 3.5879491775114618e-06, + "loss": 0.0792, + "step": 26788 + }, + { + "epoch": 72.99455040871935, + "grad_norm": 2.4999136924743652, + "learning_rate": 3.587272002959965e-06, + "loss": 0.0627, + "step": 26789 + }, + { + "epoch": 72.99727520435967, + "grad_norm": 3.5428922176361084, + "learning_rate": 3.5865948783505877e-06, + "loss": 0.1156, + "step": 26790 + }, + { + "epoch": 73.0, + "grad_norm": 5.0766706466674805, + "learning_rate": 3.585917803688603e-06, + "loss": 0.0837, + "step": 26791 + }, + { + "epoch": 73.00272479564033, + "grad_norm": 3.724759101867676, + "learning_rate": 3.585240778979281e-06, + "loss": 0.2373, + "step": 26792 + }, + { + "epoch": 73.00544959128065, + "grad_norm": 3.019198417663574, + "learning_rate": 3.584563804227901e-06, + "loss": 0.1205, + "step": 26793 + }, + { + "epoch": 73.00817438692098, + "grad_norm": 9.265463829040527, + "learning_rate": 3.583886879439731e-06, + "loss": 0.0701, + "step": 26794 + }, + { + "epoch": 73.0108991825613, + "grad_norm": 3.006812334060669, + "learning_rate": 3.58321000462004e-06, + "loss": 0.2511, + "step": 26795 + }, + { + "epoch": 73.01362397820164, + "grad_norm": 2.4832189083099365, + "learning_rate": 3.582533179774107e-06, + "loss": 0.1251, + "step": 26796 + }, + { + "epoch": 73.01634877384195, + "grad_norm": 2.5576279163360596, + "learning_rate": 3.581856404907198e-06, + "loss": 0.0389, + "step": 26797 + }, + { + "epoch": 73.01907356948229, + "grad_norm": 2.908736228942871, + "learning_rate": 3.5811796800245857e-06, + "loss": 0.1208, + "step": 26798 + }, + { + "epoch": 73.02179836512262, + "grad_norm": 1.714284896850586, + "learning_rate": 3.580503005131536e-06, + "loss": 0.0199, + "step": 26799 + }, + { + "epoch": 73.02452316076294, + "grad_norm": 3.5295302867889404, + "learning_rate": 3.579826380233322e-06, + "loss": 0.1732, + "step": 26800 + }, + { + "epoch": 73.02724795640327, + "grad_norm": 1.9285814762115479, + "learning_rate": 3.579149805335217e-06, + "loss": 0.0325, + "step": 26801 + }, + { + "epoch": 73.02997275204359, + "grad_norm": 2.4395298957824707, + "learning_rate": 3.578473280442486e-06, + "loss": 0.0834, + "step": 26802 + }, + { + "epoch": 73.03269754768392, + "grad_norm": 3.9300200939178467, + "learning_rate": 3.5777968055603996e-06, + "loss": 0.0854, + "step": 26803 + }, + { + "epoch": 73.03542234332426, + "grad_norm": 2.8045382499694824, + "learning_rate": 3.57712038069422e-06, + "loss": 0.0413, + "step": 26804 + }, + { + "epoch": 73.03814713896458, + "grad_norm": 5.196256637573242, + "learning_rate": 3.5764440058492255e-06, + "loss": 0.0957, + "step": 26805 + }, + { + "epoch": 73.04087193460491, + "grad_norm": 5.014540672302246, + "learning_rate": 3.5757676810306775e-06, + "loss": 0.0618, + "step": 26806 + }, + { + "epoch": 73.04359673024523, + "grad_norm": 3.0821545124053955, + "learning_rate": 3.5750914062438437e-06, + "loss": 0.0332, + "step": 26807 + }, + { + "epoch": 73.04632152588556, + "grad_norm": 4.059762001037598, + "learning_rate": 3.5744151814939874e-06, + "loss": 0.0518, + "step": 26808 + }, + { + "epoch": 73.04904632152588, + "grad_norm": 5.413859844207764, + "learning_rate": 3.5737390067863833e-06, + "loss": 0.1173, + "step": 26809 + }, + { + "epoch": 73.05177111716621, + "grad_norm": 3.953683853149414, + "learning_rate": 3.5730628821262926e-06, + "loss": 0.0988, + "step": 26810 + }, + { + "epoch": 73.05449591280654, + "grad_norm": 2.2801594734191895, + "learning_rate": 3.5723868075189817e-06, + "loss": 0.1122, + "step": 26811 + }, + { + "epoch": 73.05722070844686, + "grad_norm": 2.5937554836273193, + "learning_rate": 3.5717107829697117e-06, + "loss": 0.0432, + "step": 26812 + }, + { + "epoch": 73.0599455040872, + "grad_norm": 2.5698869228363037, + "learning_rate": 3.5710348084837543e-06, + "loss": 0.0367, + "step": 26813 + }, + { + "epoch": 73.06267029972751, + "grad_norm": 2.673501968383789, + "learning_rate": 3.5703588840663706e-06, + "loss": 0.0431, + "step": 26814 + }, + { + "epoch": 73.06539509536785, + "grad_norm": 3.987767219543457, + "learning_rate": 3.569683009722826e-06, + "loss": 0.0652, + "step": 26815 + }, + { + "epoch": 73.06811989100818, + "grad_norm": 3.394280195236206, + "learning_rate": 3.5690071854583763e-06, + "loss": 0.0586, + "step": 26816 + }, + { + "epoch": 73.0708446866485, + "grad_norm": 1.5364474058151245, + "learning_rate": 3.5683314112782972e-06, + "loss": 0.0171, + "step": 26817 + }, + { + "epoch": 73.07356948228883, + "grad_norm": 3.1772634983062744, + "learning_rate": 3.567655687187848e-06, + "loss": 0.06, + "step": 26818 + }, + { + "epoch": 73.07629427792915, + "grad_norm": 2.79032039642334, + "learning_rate": 3.566980013192288e-06, + "loss": 0.0966, + "step": 26819 + }, + { + "epoch": 73.07901907356948, + "grad_norm": 1.816536545753479, + "learning_rate": 3.566304389296877e-06, + "loss": 0.0203, + "step": 26820 + }, + { + "epoch": 73.0817438692098, + "grad_norm": 2.7905635833740234, + "learning_rate": 3.5656288155068842e-06, + "loss": 0.048, + "step": 26821 + }, + { + "epoch": 73.08446866485014, + "grad_norm": 3.276249408721924, + "learning_rate": 3.5649532918275675e-06, + "loss": 0.063, + "step": 26822 + }, + { + "epoch": 73.08719346049047, + "grad_norm": 3.8438339233398438, + "learning_rate": 3.5642778182641867e-06, + "loss": 0.1294, + "step": 26823 + }, + { + "epoch": 73.08991825613079, + "grad_norm": 5.634337425231934, + "learning_rate": 3.563602394822e-06, + "loss": 0.0623, + "step": 26824 + }, + { + "epoch": 73.09264305177112, + "grad_norm": 1.9742017984390259, + "learning_rate": 3.562927021506275e-06, + "loss": 0.0255, + "step": 26825 + }, + { + "epoch": 73.09536784741144, + "grad_norm": 3.014936685562134, + "learning_rate": 3.5622516983222656e-06, + "loss": 0.0507, + "step": 26826 + }, + { + "epoch": 73.09809264305177, + "grad_norm": 3.8650033473968506, + "learning_rate": 3.561576425275234e-06, + "loss": 0.1377, + "step": 26827 + }, + { + "epoch": 73.1008174386921, + "grad_norm": 2.649522066116333, + "learning_rate": 3.5609012023704338e-06, + "loss": 0.0836, + "step": 26828 + }, + { + "epoch": 73.10354223433242, + "grad_norm": 1.812314510345459, + "learning_rate": 3.560226029613132e-06, + "loss": 0.0416, + "step": 26829 + }, + { + "epoch": 73.10626702997276, + "grad_norm": 3.097317934036255, + "learning_rate": 3.5595509070085822e-06, + "loss": 0.0644, + "step": 26830 + }, + { + "epoch": 73.10899182561307, + "grad_norm": 1.8639962673187256, + "learning_rate": 3.558875834562042e-06, + "loss": 0.0397, + "step": 26831 + }, + { + "epoch": 73.11171662125341, + "grad_norm": 3.5851614475250244, + "learning_rate": 3.558200812278767e-06, + "loss": 0.0797, + "step": 26832 + }, + { + "epoch": 73.11444141689373, + "grad_norm": 2.8216004371643066, + "learning_rate": 3.557525840164017e-06, + "loss": 0.0516, + "step": 26833 + }, + { + "epoch": 73.11716621253406, + "grad_norm": 3.30781888961792, + "learning_rate": 3.5568509182230503e-06, + "loss": 0.1132, + "step": 26834 + }, + { + "epoch": 73.11989100817439, + "grad_norm": 2.6572554111480713, + "learning_rate": 3.5561760464611227e-06, + "loss": 0.1412, + "step": 26835 + }, + { + "epoch": 73.12261580381471, + "grad_norm": 2.784372329711914, + "learning_rate": 3.555501224883484e-06, + "loss": 0.058, + "step": 26836 + }, + { + "epoch": 73.12534059945504, + "grad_norm": 3.348184823989868, + "learning_rate": 3.554826453495399e-06, + "loss": 0.1309, + "step": 26837 + }, + { + "epoch": 73.12806539509536, + "grad_norm": 2.4507763385772705, + "learning_rate": 3.554151732302118e-06, + "loss": 0.2144, + "step": 26838 + }, + { + "epoch": 73.1307901907357, + "grad_norm": 2.553067684173584, + "learning_rate": 3.553477061308895e-06, + "loss": 0.0471, + "step": 26839 + }, + { + "epoch": 73.13351498637603, + "grad_norm": 4.398159980773926, + "learning_rate": 3.5528024405209825e-06, + "loss": 0.1645, + "step": 26840 + }, + { + "epoch": 73.13623978201635, + "grad_norm": 2.97829008102417, + "learning_rate": 3.55212786994364e-06, + "loss": 0.1687, + "step": 26841 + }, + { + "epoch": 73.13896457765668, + "grad_norm": 2.869852066040039, + "learning_rate": 3.551453349582119e-06, + "loss": 0.0626, + "step": 26842 + }, + { + "epoch": 73.141689373297, + "grad_norm": 2.9041504859924316, + "learning_rate": 3.550778879441671e-06, + "loss": 0.0608, + "step": 26843 + }, + { + "epoch": 73.14441416893733, + "grad_norm": 8.342033386230469, + "learning_rate": 3.550104459527546e-06, + "loss": 0.0615, + "step": 26844 + }, + { + "epoch": 73.14713896457765, + "grad_norm": 3.2290289402008057, + "learning_rate": 3.549430089845004e-06, + "loss": 0.0406, + "step": 26845 + }, + { + "epoch": 73.14986376021798, + "grad_norm": 2.333523988723755, + "learning_rate": 3.5487557703992927e-06, + "loss": 0.045, + "step": 26846 + }, + { + "epoch": 73.15258855585832, + "grad_norm": 3.0763156414031982, + "learning_rate": 3.5480815011956626e-06, + "loss": 0.1394, + "step": 26847 + }, + { + "epoch": 73.15531335149863, + "grad_norm": 3.40331768989563, + "learning_rate": 3.5474072822393635e-06, + "loss": 0.0488, + "step": 26848 + }, + { + "epoch": 73.15803814713897, + "grad_norm": 2.91113018989563, + "learning_rate": 3.546733113535653e-06, + "loss": 0.0419, + "step": 26849 + }, + { + "epoch": 73.16076294277929, + "grad_norm": 3.1495656967163086, + "learning_rate": 3.5460589950897726e-06, + "loss": 0.0999, + "step": 26850 + }, + { + "epoch": 73.16348773841962, + "grad_norm": 2.792149305343628, + "learning_rate": 3.545384926906982e-06, + "loss": 0.0665, + "step": 26851 + }, + { + "epoch": 73.16621253405995, + "grad_norm": 3.9560298919677734, + "learning_rate": 3.5447109089925247e-06, + "loss": 0.0591, + "step": 26852 + }, + { + "epoch": 73.16893732970027, + "grad_norm": 2.1874496936798096, + "learning_rate": 3.5440369413516474e-06, + "loss": 0.0312, + "step": 26853 + }, + { + "epoch": 73.1716621253406, + "grad_norm": 2.985170841217041, + "learning_rate": 3.5433630239896064e-06, + "loss": 0.0884, + "step": 26854 + }, + { + "epoch": 73.17438692098092, + "grad_norm": 2.814131736755371, + "learning_rate": 3.542689156911647e-06, + "loss": 0.0693, + "step": 26855 + }, + { + "epoch": 73.17711171662125, + "grad_norm": 2.8599281311035156, + "learning_rate": 3.542015340123016e-06, + "loss": 0.0653, + "step": 26856 + }, + { + "epoch": 73.17983651226157, + "grad_norm": 2.7674167156219482, + "learning_rate": 3.541341573628958e-06, + "loss": 0.1506, + "step": 26857 + }, + { + "epoch": 73.1825613079019, + "grad_norm": 4.389822483062744, + "learning_rate": 3.5406678574347287e-06, + "loss": 0.0493, + "step": 26858 + }, + { + "epoch": 73.18528610354224, + "grad_norm": 2.5432190895080566, + "learning_rate": 3.5399941915455695e-06, + "loss": 0.0734, + "step": 26859 + }, + { + "epoch": 73.18801089918256, + "grad_norm": 3.0489144325256348, + "learning_rate": 3.5393205759667237e-06, + "loss": 0.2063, + "step": 26860 + }, + { + "epoch": 73.19073569482289, + "grad_norm": 3.039339303970337, + "learning_rate": 3.5386470107034443e-06, + "loss": 0.1709, + "step": 26861 + }, + { + "epoch": 73.19346049046321, + "grad_norm": 2.7697556018829346, + "learning_rate": 3.5379734957609748e-06, + "loss": 0.048, + "step": 26862 + }, + { + "epoch": 73.19618528610354, + "grad_norm": 2.4593348503112793, + "learning_rate": 3.5373000311445604e-06, + "loss": 0.0749, + "step": 26863 + }, + { + "epoch": 73.19891008174388, + "grad_norm": 2.915950059890747, + "learning_rate": 3.536626616859441e-06, + "loss": 0.0623, + "step": 26864 + }, + { + "epoch": 73.2016348773842, + "grad_norm": 3.1317269802093506, + "learning_rate": 3.5359532529108687e-06, + "loss": 0.1221, + "step": 26865 + }, + { + "epoch": 73.20435967302453, + "grad_norm": 3.3596508502960205, + "learning_rate": 3.535279939304085e-06, + "loss": 0.1033, + "step": 26866 + }, + { + "epoch": 73.20708446866485, + "grad_norm": 3.8590259552001953, + "learning_rate": 3.53460667604433e-06, + "loss": 0.1652, + "step": 26867 + }, + { + "epoch": 73.20980926430518, + "grad_norm": 2.1116504669189453, + "learning_rate": 3.5339334631368527e-06, + "loss": 0.037, + "step": 26868 + }, + { + "epoch": 73.2125340599455, + "grad_norm": 2.5465245246887207, + "learning_rate": 3.5332603005868906e-06, + "loss": 0.2003, + "step": 26869 + }, + { + "epoch": 73.21525885558583, + "grad_norm": 4.480618953704834, + "learning_rate": 3.532587188399692e-06, + "loss": 0.0864, + "step": 26870 + }, + { + "epoch": 73.21798365122616, + "grad_norm": 4.117570877075195, + "learning_rate": 3.531914126580497e-06, + "loss": 0.0868, + "step": 26871 + }, + { + "epoch": 73.22070844686648, + "grad_norm": 2.355170488357544, + "learning_rate": 3.531241115134546e-06, + "loss": 0.0279, + "step": 26872 + }, + { + "epoch": 73.22343324250681, + "grad_norm": 4.68784236907959, + "learning_rate": 3.530568154067078e-06, + "loss": 0.038, + "step": 26873 + }, + { + "epoch": 73.22615803814713, + "grad_norm": 1.8216328620910645, + "learning_rate": 3.52989524338334e-06, + "loss": 0.031, + "step": 26874 + }, + { + "epoch": 73.22888283378747, + "grad_norm": 3.390501022338867, + "learning_rate": 3.5292223830885696e-06, + "loss": 0.0874, + "step": 26875 + }, + { + "epoch": 73.2316076294278, + "grad_norm": 2.6133570671081543, + "learning_rate": 3.528549573188007e-06, + "loss": 0.0349, + "step": 26876 + }, + { + "epoch": 73.23433242506812, + "grad_norm": 2.759392499923706, + "learning_rate": 3.527876813686889e-06, + "loss": 0.074, + "step": 26877 + }, + { + "epoch": 73.23705722070845, + "grad_norm": 3.0409185886383057, + "learning_rate": 3.5272041045904615e-06, + "loss": 0.0486, + "step": 26878 + }, + { + "epoch": 73.23978201634877, + "grad_norm": 3.128284215927124, + "learning_rate": 3.52653144590396e-06, + "loss": 0.0843, + "step": 26879 + }, + { + "epoch": 73.2425068119891, + "grad_norm": 4.041402339935303, + "learning_rate": 3.5258588376326198e-06, + "loss": 0.098, + "step": 26880 + }, + { + "epoch": 73.24523160762942, + "grad_norm": 2.9336047172546387, + "learning_rate": 3.525186279781686e-06, + "loss": 0.0996, + "step": 26881 + }, + { + "epoch": 73.24795640326975, + "grad_norm": 2.2768266201019287, + "learning_rate": 3.524513772356393e-06, + "loss": 0.0269, + "step": 26882 + }, + { + "epoch": 73.25068119891009, + "grad_norm": 2.5622401237487793, + "learning_rate": 3.5238413153619788e-06, + "loss": 0.028, + "step": 26883 + }, + { + "epoch": 73.2534059945504, + "grad_norm": 2.184340715408325, + "learning_rate": 3.5231689088036757e-06, + "loss": 0.0284, + "step": 26884 + }, + { + "epoch": 73.25613079019074, + "grad_norm": 3.16709566116333, + "learning_rate": 3.522496552686725e-06, + "loss": 0.0851, + "step": 26885 + }, + { + "epoch": 73.25885558583106, + "grad_norm": 3.5944974422454834, + "learning_rate": 3.5218242470163667e-06, + "loss": 0.0303, + "step": 26886 + }, + { + "epoch": 73.26158038147139, + "grad_norm": 2.809340476989746, + "learning_rate": 3.521151991797832e-06, + "loss": 0.0643, + "step": 26887 + }, + { + "epoch": 73.26430517711172, + "grad_norm": 2.621263027191162, + "learning_rate": 3.5204797870363573e-06, + "loss": 0.0615, + "step": 26888 + }, + { + "epoch": 73.26702997275204, + "grad_norm": 2.7322444915771484, + "learning_rate": 3.5198076327371744e-06, + "loss": 0.0627, + "step": 26889 + }, + { + "epoch": 73.26975476839237, + "grad_norm": 3.0294265747070312, + "learning_rate": 3.519135528905524e-06, + "loss": 0.1357, + "step": 26890 + }, + { + "epoch": 73.2724795640327, + "grad_norm": 2.9210681915283203, + "learning_rate": 3.5184634755466374e-06, + "loss": 0.0312, + "step": 26891 + }, + { + "epoch": 73.27520435967303, + "grad_norm": 2.321434736251831, + "learning_rate": 3.5177914726657493e-06, + "loss": 0.0318, + "step": 26892 + }, + { + "epoch": 73.27792915531334, + "grad_norm": 2.2671425342559814, + "learning_rate": 3.5171195202680887e-06, + "loss": 0.0356, + "step": 26893 + }, + { + "epoch": 73.28065395095368, + "grad_norm": 2.8914756774902344, + "learning_rate": 3.516447618358896e-06, + "loss": 0.0507, + "step": 26894 + }, + { + "epoch": 73.28337874659401, + "grad_norm": 2.2265446186065674, + "learning_rate": 3.5157757669434e-06, + "loss": 0.1225, + "step": 26895 + }, + { + "epoch": 73.28610354223433, + "grad_norm": 2.8981120586395264, + "learning_rate": 3.515103966026835e-06, + "loss": 0.1077, + "step": 26896 + }, + { + "epoch": 73.28882833787466, + "grad_norm": 4.0132646560668945, + "learning_rate": 3.5144322156144274e-06, + "loss": 0.0407, + "step": 26897 + }, + { + "epoch": 73.29155313351498, + "grad_norm": 2.233222007751465, + "learning_rate": 3.5137605157114164e-06, + "loss": 0.0305, + "step": 26898 + }, + { + "epoch": 73.29427792915531, + "grad_norm": 1.9654173851013184, + "learning_rate": 3.51308886632303e-06, + "loss": 0.0269, + "step": 26899 + }, + { + "epoch": 73.29700272479565, + "grad_norm": 2.161252975463867, + "learning_rate": 3.512417267454499e-06, + "loss": 0.0472, + "step": 26900 + }, + { + "epoch": 73.29972752043597, + "grad_norm": 2.825688123703003, + "learning_rate": 3.5117457191110495e-06, + "loss": 0.0636, + "step": 26901 + }, + { + "epoch": 73.3024523160763, + "grad_norm": 3.0534720420837402, + "learning_rate": 3.5110742212979156e-06, + "loss": 0.052, + "step": 26902 + }, + { + "epoch": 73.30517711171662, + "grad_norm": 2.1501169204711914, + "learning_rate": 3.5104027740203305e-06, + "loss": 0.0364, + "step": 26903 + }, + { + "epoch": 73.30790190735695, + "grad_norm": 2.993039608001709, + "learning_rate": 3.5097313772835195e-06, + "loss": 0.0481, + "step": 26904 + }, + { + "epoch": 73.31062670299727, + "grad_norm": 3.8253333568573, + "learning_rate": 3.509060031092708e-06, + "loss": 0.0461, + "step": 26905 + }, + { + "epoch": 73.3133514986376, + "grad_norm": 1.8563841581344604, + "learning_rate": 3.508388735453132e-06, + "loss": 0.0314, + "step": 26906 + }, + { + "epoch": 73.31607629427793, + "grad_norm": 2.2914717197418213, + "learning_rate": 3.507717490370015e-06, + "loss": 0.0321, + "step": 26907 + }, + { + "epoch": 73.31880108991825, + "grad_norm": 3.319343328475952, + "learning_rate": 3.507046295848585e-06, + "loss": 0.0388, + "step": 26908 + }, + { + "epoch": 73.32152588555859, + "grad_norm": 2.9802682399749756, + "learning_rate": 3.506375151894067e-06, + "loss": 0.0704, + "step": 26909 + }, + { + "epoch": 73.3242506811989, + "grad_norm": 3.0829756259918213, + "learning_rate": 3.505704058511694e-06, + "loss": 0.0415, + "step": 26910 + }, + { + "epoch": 73.32697547683924, + "grad_norm": 3.8320634365081787, + "learning_rate": 3.505033015706688e-06, + "loss": 0.1334, + "step": 26911 + }, + { + "epoch": 73.32970027247957, + "grad_norm": 4.733470916748047, + "learning_rate": 3.5043620234842757e-06, + "loss": 0.072, + "step": 26912 + }, + { + "epoch": 73.33242506811989, + "grad_norm": 2.269888401031494, + "learning_rate": 3.5036910818496792e-06, + "loss": 0.0341, + "step": 26913 + }, + { + "epoch": 73.33514986376022, + "grad_norm": 2.475080966949463, + "learning_rate": 3.5030201908081316e-06, + "loss": 0.2342, + "step": 26914 + }, + { + "epoch": 73.33787465940054, + "grad_norm": 3.1076841354370117, + "learning_rate": 3.5023493503648543e-06, + "loss": 0.0559, + "step": 26915 + }, + { + "epoch": 73.34059945504087, + "grad_norm": 4.108279705047607, + "learning_rate": 3.5016785605250702e-06, + "loss": 0.0649, + "step": 26916 + }, + { + "epoch": 73.34332425068119, + "grad_norm": 3.272644519805908, + "learning_rate": 3.5010078212940012e-06, + "loss": 0.0421, + "step": 26917 + }, + { + "epoch": 73.34604904632153, + "grad_norm": 2.5600414276123047, + "learning_rate": 3.5003371326768778e-06, + "loss": 0.0698, + "step": 26918 + }, + { + "epoch": 73.34877384196186, + "grad_norm": 3.030984878540039, + "learning_rate": 3.499666494678915e-06, + "loss": 0.0685, + "step": 26919 + }, + { + "epoch": 73.35149863760218, + "grad_norm": 2.884631395339966, + "learning_rate": 3.4989959073053447e-06, + "loss": 0.0444, + "step": 26920 + }, + { + "epoch": 73.35422343324251, + "grad_norm": 5.614757537841797, + "learning_rate": 3.498325370561385e-06, + "loss": 0.0651, + "step": 26921 + }, + { + "epoch": 73.35694822888283, + "grad_norm": 3.0250747203826904, + "learning_rate": 3.497654884452254e-06, + "loss": 0.092, + "step": 26922 + }, + { + "epoch": 73.35967302452316, + "grad_norm": 2.085069179534912, + "learning_rate": 3.4969844489831817e-06, + "loss": 0.0547, + "step": 26923 + }, + { + "epoch": 73.3623978201635, + "grad_norm": 2.7650771141052246, + "learning_rate": 3.496314064159385e-06, + "loss": 0.0411, + "step": 26924 + }, + { + "epoch": 73.36512261580381, + "grad_norm": 4.291244029998779, + "learning_rate": 3.495643729986081e-06, + "loss": 0.1238, + "step": 26925 + }, + { + "epoch": 73.36784741144415, + "grad_norm": 3.3603227138519287, + "learning_rate": 3.494973446468499e-06, + "loss": 0.1567, + "step": 26926 + }, + { + "epoch": 73.37057220708446, + "grad_norm": 2.3697690963745117, + "learning_rate": 3.4943032136118537e-06, + "loss": 0.1454, + "step": 26927 + }, + { + "epoch": 73.3732970027248, + "grad_norm": 2.098708391189575, + "learning_rate": 3.493633031421365e-06, + "loss": 0.0315, + "step": 26928 + }, + { + "epoch": 73.37602179836512, + "grad_norm": 2.689488410949707, + "learning_rate": 3.4929628999022502e-06, + "loss": 0.0404, + "step": 26929 + }, + { + "epoch": 73.37874659400545, + "grad_norm": 2.8799092769622803, + "learning_rate": 3.492292819059734e-06, + "loss": 0.055, + "step": 26930 + }, + { + "epoch": 73.38147138964578, + "grad_norm": 5.110519886016846, + "learning_rate": 3.491622788899033e-06, + "loss": 0.0582, + "step": 26931 + }, + { + "epoch": 73.3841961852861, + "grad_norm": 2.9135501384735107, + "learning_rate": 3.490952809425363e-06, + "loss": 0.0838, + "step": 26932 + }, + { + "epoch": 73.38692098092643, + "grad_norm": 3.180020570755005, + "learning_rate": 3.4902828806439394e-06, + "loss": 0.1259, + "step": 26933 + }, + { + "epoch": 73.38964577656675, + "grad_norm": 2.6474556922912598, + "learning_rate": 3.4896130025599874e-06, + "loss": 0.0837, + "step": 26934 + }, + { + "epoch": 73.39237057220708, + "grad_norm": 2.575450897216797, + "learning_rate": 3.4889431751787195e-06, + "loss": 0.0458, + "step": 26935 + }, + { + "epoch": 73.39509536784742, + "grad_norm": 2.345289468765259, + "learning_rate": 3.4882733985053487e-06, + "loss": 0.0453, + "step": 26936 + }, + { + "epoch": 73.39782016348774, + "grad_norm": 2.388676881790161, + "learning_rate": 3.4876036725450992e-06, + "loss": 0.0397, + "step": 26937 + }, + { + "epoch": 73.40054495912807, + "grad_norm": 2.2997653484344482, + "learning_rate": 3.486933997303179e-06, + "loss": 0.0381, + "step": 26938 + }, + { + "epoch": 73.40326975476839, + "grad_norm": 3.0745630264282227, + "learning_rate": 3.486264372784811e-06, + "loss": 0.0784, + "step": 26939 + }, + { + "epoch": 73.40599455040872, + "grad_norm": 2.604595899581909, + "learning_rate": 3.4855947989952054e-06, + "loss": 0.0541, + "step": 26940 + }, + { + "epoch": 73.40871934604904, + "grad_norm": 2.5068633556365967, + "learning_rate": 3.484925275939579e-06, + "loss": 0.082, + "step": 26941 + }, + { + "epoch": 73.41144414168937, + "grad_norm": 3.6491236686706543, + "learning_rate": 3.484255803623141e-06, + "loss": 0.0739, + "step": 26942 + }, + { + "epoch": 73.4141689373297, + "grad_norm": 2.814690351486206, + "learning_rate": 3.483586382051113e-06, + "loss": 0.1959, + "step": 26943 + }, + { + "epoch": 73.41689373297002, + "grad_norm": 3.3637218475341797, + "learning_rate": 3.4829170112287037e-06, + "loss": 0.0246, + "step": 26944 + }, + { + "epoch": 73.41961852861036, + "grad_norm": 3.7373859882354736, + "learning_rate": 3.4822476911611236e-06, + "loss": 0.0738, + "step": 26945 + }, + { + "epoch": 73.42234332425068, + "grad_norm": 2.808173894882202, + "learning_rate": 3.481578421853593e-06, + "loss": 0.2099, + "step": 26946 + }, + { + "epoch": 73.42506811989101, + "grad_norm": 4.274862289428711, + "learning_rate": 3.480909203311319e-06, + "loss": 0.2475, + "step": 26947 + }, + { + "epoch": 73.42779291553134, + "grad_norm": 3.3537137508392334, + "learning_rate": 3.480240035539515e-06, + "loss": 0.1645, + "step": 26948 + }, + { + "epoch": 73.43051771117166, + "grad_norm": 8.587748527526855, + "learning_rate": 3.479570918543388e-06, + "loss": 0.0923, + "step": 26949 + }, + { + "epoch": 73.433242506812, + "grad_norm": 2.934614896774292, + "learning_rate": 3.478901852328156e-06, + "loss": 0.0681, + "step": 26950 + }, + { + "epoch": 73.43596730245231, + "grad_norm": 3.0182249546051025, + "learning_rate": 3.478232836899026e-06, + "loss": 0.2357, + "step": 26951 + }, + { + "epoch": 73.43869209809264, + "grad_norm": 2.791226387023926, + "learning_rate": 3.4775638722612095e-06, + "loss": 0.0634, + "step": 26952 + }, + { + "epoch": 73.44141689373296, + "grad_norm": 4.563493251800537, + "learning_rate": 3.4768949584199118e-06, + "loss": 0.0832, + "step": 26953 + }, + { + "epoch": 73.4441416893733, + "grad_norm": 2.327061891555786, + "learning_rate": 3.476226095380347e-06, + "loss": 0.0479, + "step": 26954 + }, + { + "epoch": 73.44686648501363, + "grad_norm": 4.2786149978637695, + "learning_rate": 3.4755572831477267e-06, + "loss": 0.0615, + "step": 26955 + }, + { + "epoch": 73.44959128065395, + "grad_norm": 3.3000879287719727, + "learning_rate": 3.4748885217272554e-06, + "loss": 0.0679, + "step": 26956 + }, + { + "epoch": 73.45231607629428, + "grad_norm": 3.506911039352417, + "learning_rate": 3.4742198111241434e-06, + "loss": 0.1641, + "step": 26957 + }, + { + "epoch": 73.4550408719346, + "grad_norm": 2.9512298107147217, + "learning_rate": 3.473551151343594e-06, + "loss": 0.0411, + "step": 26958 + }, + { + "epoch": 73.45776566757493, + "grad_norm": 1.7537989616394043, + "learning_rate": 3.472882542390821e-06, + "loss": 0.024, + "step": 26959 + }, + { + "epoch": 73.46049046321527, + "grad_norm": 3.0269646644592285, + "learning_rate": 3.472213984271028e-06, + "loss": 0.0323, + "step": 26960 + }, + { + "epoch": 73.46321525885558, + "grad_norm": 2.1651768684387207, + "learning_rate": 3.471545476989423e-06, + "loss": 0.0435, + "step": 26961 + }, + { + "epoch": 73.46594005449592, + "grad_norm": 9.547691345214844, + "learning_rate": 3.470877020551209e-06, + "loss": 0.0543, + "step": 26962 + }, + { + "epoch": 73.46866485013624, + "grad_norm": 3.3503215312957764, + "learning_rate": 3.4702086149615975e-06, + "loss": 0.0611, + "step": 26963 + }, + { + "epoch": 73.47138964577657, + "grad_norm": 2.7280259132385254, + "learning_rate": 3.469540260225791e-06, + "loss": 0.0358, + "step": 26964 + }, + { + "epoch": 73.47411444141689, + "grad_norm": 2.4752163887023926, + "learning_rate": 3.468871956348995e-06, + "loss": 0.0427, + "step": 26965 + }, + { + "epoch": 73.47683923705722, + "grad_norm": 3.0498499870300293, + "learning_rate": 3.4682037033364115e-06, + "loss": 0.0215, + "step": 26966 + }, + { + "epoch": 73.47956403269755, + "grad_norm": 2.865424394607544, + "learning_rate": 3.4675355011932486e-06, + "loss": 0.0552, + "step": 26967 + }, + { + "epoch": 73.48228882833787, + "grad_norm": 2.940736770629883, + "learning_rate": 3.4668673499247108e-06, + "loss": 0.0393, + "step": 26968 + }, + { + "epoch": 73.4850136239782, + "grad_norm": 3.774017095565796, + "learning_rate": 3.4661992495359953e-06, + "loss": 0.0905, + "step": 26969 + }, + { + "epoch": 73.48773841961852, + "grad_norm": 3.683938503265381, + "learning_rate": 3.4655312000323137e-06, + "loss": 0.0574, + "step": 26970 + }, + { + "epoch": 73.49046321525886, + "grad_norm": 2.332352876663208, + "learning_rate": 3.464863201418861e-06, + "loss": 0.0668, + "step": 26971 + }, + { + "epoch": 73.49318801089919, + "grad_norm": 6.582822799682617, + "learning_rate": 3.464195253700847e-06, + "loss": 0.0527, + "step": 26972 + }, + { + "epoch": 73.49591280653951, + "grad_norm": 2.8384523391723633, + "learning_rate": 3.4635273568834703e-06, + "loss": 0.1161, + "step": 26973 + }, + { + "epoch": 73.49863760217984, + "grad_norm": 2.0593514442443848, + "learning_rate": 3.4628595109719286e-06, + "loss": 0.0277, + "step": 26974 + }, + { + "epoch": 73.50136239782016, + "grad_norm": 2.9547767639160156, + "learning_rate": 3.46219171597143e-06, + "loss": 0.0347, + "step": 26975 + }, + { + "epoch": 73.50408719346049, + "grad_norm": 3.8641443252563477, + "learning_rate": 3.4615239718871718e-06, + "loss": 0.0797, + "step": 26976 + }, + { + "epoch": 73.50681198910081, + "grad_norm": 3.758315324783325, + "learning_rate": 3.460856278724355e-06, + "loss": 0.1119, + "step": 26977 + }, + { + "epoch": 73.50953678474114, + "grad_norm": 3.827413320541382, + "learning_rate": 3.4601886364881754e-06, + "loss": 0.0715, + "step": 26978 + }, + { + "epoch": 73.51226158038148, + "grad_norm": 3.5978944301605225, + "learning_rate": 3.459521045183839e-06, + "loss": 0.0527, + "step": 26979 + }, + { + "epoch": 73.5149863760218, + "grad_norm": 3.1433017253875732, + "learning_rate": 3.4588535048165427e-06, + "loss": 0.1333, + "step": 26980 + }, + { + "epoch": 73.51771117166213, + "grad_norm": 3.6058473587036133, + "learning_rate": 3.4581860153914846e-06, + "loss": 0.0464, + "step": 26981 + }, + { + "epoch": 73.52043596730245, + "grad_norm": 3.056950092315674, + "learning_rate": 3.4575185769138596e-06, + "loss": 0.0651, + "step": 26982 + }, + { + "epoch": 73.52316076294278, + "grad_norm": 2.929863691329956, + "learning_rate": 3.4568511893888734e-06, + "loss": 0.066, + "step": 26983 + }, + { + "epoch": 73.52588555858311, + "grad_norm": 2.9831643104553223, + "learning_rate": 3.4561838528217197e-06, + "loss": 0.1566, + "step": 26984 + }, + { + "epoch": 73.52861035422343, + "grad_norm": 3.8312771320343018, + "learning_rate": 3.455516567217595e-06, + "loss": 0.0826, + "step": 26985 + }, + { + "epoch": 73.53133514986376, + "grad_norm": 3.1933791637420654, + "learning_rate": 3.4548493325816933e-06, + "loss": 0.0866, + "step": 26986 + }, + { + "epoch": 73.53405994550408, + "grad_norm": 2.4331719875335693, + "learning_rate": 3.4541821489192175e-06, + "loss": 0.0262, + "step": 26987 + }, + { + "epoch": 73.53678474114442, + "grad_norm": 2.7866642475128174, + "learning_rate": 3.453515016235357e-06, + "loss": 0.0759, + "step": 26988 + }, + { + "epoch": 73.53950953678473, + "grad_norm": 3.1756632328033447, + "learning_rate": 3.452847934535315e-06, + "loss": 0.0363, + "step": 26989 + }, + { + "epoch": 73.54223433242507, + "grad_norm": 4.05295991897583, + "learning_rate": 3.452180903824279e-06, + "loss": 0.1147, + "step": 26990 + }, + { + "epoch": 73.5449591280654, + "grad_norm": 3.641073226928711, + "learning_rate": 3.4515139241074504e-06, + "loss": 0.0383, + "step": 26991 + }, + { + "epoch": 73.54768392370572, + "grad_norm": 2.5837535858154297, + "learning_rate": 3.4508469953900205e-06, + "loss": 0.0386, + "step": 26992 + }, + { + "epoch": 73.55040871934605, + "grad_norm": 3.5125057697296143, + "learning_rate": 3.4501801176771844e-06, + "loss": 0.0497, + "step": 26993 + }, + { + "epoch": 73.55313351498637, + "grad_norm": 4.435265064239502, + "learning_rate": 3.44951329097413e-06, + "loss": 0.1471, + "step": 26994 + }, + { + "epoch": 73.5558583106267, + "grad_norm": 2.2139368057250977, + "learning_rate": 3.4488465152860593e-06, + "loss": 0.0328, + "step": 26995 + }, + { + "epoch": 73.55858310626704, + "grad_norm": 2.945382833480835, + "learning_rate": 3.4481797906181613e-06, + "loss": 0.0815, + "step": 26996 + }, + { + "epoch": 73.56130790190736, + "grad_norm": 3.154387950897217, + "learning_rate": 3.4475131169756284e-06, + "loss": 0.1188, + "step": 26997 + }, + { + "epoch": 73.56403269754769, + "grad_norm": 2.3312432765960693, + "learning_rate": 3.4468464943636483e-06, + "loss": 0.083, + "step": 26998 + }, + { + "epoch": 73.566757493188, + "grad_norm": 3.159672260284424, + "learning_rate": 3.4461799227874204e-06, + "loss": 0.0406, + "step": 26999 + }, + { + "epoch": 73.56948228882834, + "grad_norm": 4.261843681335449, + "learning_rate": 3.445513402252132e-06, + "loss": 0.0729, + "step": 27000 + }, + { + "epoch": 73.57220708446866, + "grad_norm": 2.7450103759765625, + "learning_rate": 3.444846932762975e-06, + "loss": 0.0806, + "step": 27001 + }, + { + "epoch": 73.57493188010899, + "grad_norm": 2.718365430831909, + "learning_rate": 3.444180514325135e-06, + "loss": 0.0262, + "step": 27002 + }, + { + "epoch": 73.57765667574932, + "grad_norm": 3.1965343952178955, + "learning_rate": 3.4435141469438103e-06, + "loss": 0.0765, + "step": 27003 + }, + { + "epoch": 73.58038147138964, + "grad_norm": 2.8067641258239746, + "learning_rate": 3.442847830624186e-06, + "loss": 0.0713, + "step": 27004 + }, + { + "epoch": 73.58310626702998, + "grad_norm": 3.0505402088165283, + "learning_rate": 3.4421815653714487e-06, + "loss": 0.2842, + "step": 27005 + }, + { + "epoch": 73.5858310626703, + "grad_norm": 5.876389503479004, + "learning_rate": 3.4415153511907928e-06, + "loss": 0.1074, + "step": 27006 + }, + { + "epoch": 73.58855585831063, + "grad_norm": 2.9681506156921387, + "learning_rate": 3.440849188087402e-06, + "loss": 0.0418, + "step": 27007 + }, + { + "epoch": 73.59128065395096, + "grad_norm": 3.5146090984344482, + "learning_rate": 3.440183076066469e-06, + "loss": 0.0464, + "step": 27008 + }, + { + "epoch": 73.59400544959128, + "grad_norm": 2.744197368621826, + "learning_rate": 3.43951701513318e-06, + "loss": 0.046, + "step": 27009 + }, + { + "epoch": 73.59673024523161, + "grad_norm": 3.572244882583618, + "learning_rate": 3.438851005292717e-06, + "loss": 0.0952, + "step": 27010 + }, + { + "epoch": 73.59945504087193, + "grad_norm": 4.2489776611328125, + "learning_rate": 3.438185046550275e-06, + "loss": 0.1632, + "step": 27011 + }, + { + "epoch": 73.60217983651226, + "grad_norm": 3.1429290771484375, + "learning_rate": 3.4375191389110376e-06, + "loss": 0.0349, + "step": 27012 + }, + { + "epoch": 73.60490463215258, + "grad_norm": 1.8757532835006714, + "learning_rate": 3.4368532823801893e-06, + "loss": 0.0264, + "step": 27013 + }, + { + "epoch": 73.60762942779292, + "grad_norm": 2.5090415477752686, + "learning_rate": 3.4361874769629123e-06, + "loss": 0.1728, + "step": 27014 + }, + { + "epoch": 73.61035422343325, + "grad_norm": 3.9638609886169434, + "learning_rate": 3.4355217226644e-06, + "loss": 0.0622, + "step": 27015 + }, + { + "epoch": 73.61307901907357, + "grad_norm": 2.4548087120056152, + "learning_rate": 3.434856019489833e-06, + "loss": 0.0261, + "step": 27016 + }, + { + "epoch": 73.6158038147139, + "grad_norm": 1.9381762742996216, + "learning_rate": 3.4341903674443967e-06, + "loss": 0.0293, + "step": 27017 + }, + { + "epoch": 73.61852861035422, + "grad_norm": 3.3661253452301025, + "learning_rate": 3.4335247665332704e-06, + "loss": 0.1087, + "step": 27018 + }, + { + "epoch": 73.62125340599455, + "grad_norm": 2.90206241607666, + "learning_rate": 3.432859216761645e-06, + "loss": 0.1134, + "step": 27019 + }, + { + "epoch": 73.62397820163488, + "grad_norm": 3.3400230407714844, + "learning_rate": 3.432193718134701e-06, + "loss": 0.0483, + "step": 27020 + }, + { + "epoch": 73.6267029972752, + "grad_norm": 2.2868094444274902, + "learning_rate": 3.4315282706576215e-06, + "loss": 0.0374, + "step": 27021 + }, + { + "epoch": 73.62942779291554, + "grad_norm": 2.2642598152160645, + "learning_rate": 3.430862874335584e-06, + "loss": 0.0415, + "step": 27022 + }, + { + "epoch": 73.63215258855585, + "grad_norm": 2.777907609939575, + "learning_rate": 3.4301975291737756e-06, + "loss": 0.0542, + "step": 27023 + }, + { + "epoch": 73.63487738419619, + "grad_norm": 3.489509344100952, + "learning_rate": 3.4295322351773807e-06, + "loss": 0.0942, + "step": 27024 + }, + { + "epoch": 73.6376021798365, + "grad_norm": 2.6100316047668457, + "learning_rate": 3.4288669923515784e-06, + "loss": 0.1175, + "step": 27025 + }, + { + "epoch": 73.64032697547684, + "grad_norm": 2.0358309745788574, + "learning_rate": 3.4282018007015472e-06, + "loss": 0.0279, + "step": 27026 + }, + { + "epoch": 73.64305177111717, + "grad_norm": 2.29683518409729, + "learning_rate": 3.4275366602324654e-06, + "loss": 0.0857, + "step": 27027 + }, + { + "epoch": 73.64577656675749, + "grad_norm": 5.21312141418457, + "learning_rate": 3.4268715709495203e-06, + "loss": 0.0718, + "step": 27028 + }, + { + "epoch": 73.64850136239782, + "grad_norm": 2.5061144828796387, + "learning_rate": 3.4262065328578876e-06, + "loss": 0.1363, + "step": 27029 + }, + { + "epoch": 73.65122615803814, + "grad_norm": 4.060135841369629, + "learning_rate": 3.4255415459627473e-06, + "loss": 0.1865, + "step": 27030 + }, + { + "epoch": 73.65395095367847, + "grad_norm": 4.575860023498535, + "learning_rate": 3.4248766102692744e-06, + "loss": 0.0757, + "step": 27031 + }, + { + "epoch": 73.65667574931881, + "grad_norm": 3.948610305786133, + "learning_rate": 3.4242117257826536e-06, + "loss": 0.0531, + "step": 27032 + }, + { + "epoch": 73.65940054495913, + "grad_norm": 5.607536315917969, + "learning_rate": 3.4235468925080607e-06, + "loss": 0.0486, + "step": 27033 + }, + { + "epoch": 73.66212534059946, + "grad_norm": 2.4876418113708496, + "learning_rate": 3.4228821104506694e-06, + "loss": 0.142, + "step": 27034 + }, + { + "epoch": 73.66485013623978, + "grad_norm": 3.045175313949585, + "learning_rate": 3.4222173796156643e-06, + "loss": 0.3281, + "step": 27035 + }, + { + "epoch": 73.66757493188011, + "grad_norm": 1.4952892065048218, + "learning_rate": 3.4215527000082183e-06, + "loss": 0.0228, + "step": 27036 + }, + { + "epoch": 73.67029972752043, + "grad_norm": 2.856586456298828, + "learning_rate": 3.420888071633508e-06, + "loss": 0.1139, + "step": 27037 + }, + { + "epoch": 73.67302452316076, + "grad_norm": 2.9633374214172363, + "learning_rate": 3.4202234944967062e-06, + "loss": 0.1319, + "step": 27038 + }, + { + "epoch": 73.6757493188011, + "grad_norm": 2.963578701019287, + "learning_rate": 3.4195589686029927e-06, + "loss": 0.0939, + "step": 27039 + }, + { + "epoch": 73.67847411444141, + "grad_norm": 2.4921133518218994, + "learning_rate": 3.418894493957545e-06, + "loss": 0.0971, + "step": 27040 + }, + { + "epoch": 73.68119891008175, + "grad_norm": 3.038226842880249, + "learning_rate": 3.418230070565535e-06, + "loss": 0.0568, + "step": 27041 + }, + { + "epoch": 73.68392370572207, + "grad_norm": 2.7386224269866943, + "learning_rate": 3.417565698432138e-06, + "loss": 0.0379, + "step": 27042 + }, + { + "epoch": 73.6866485013624, + "grad_norm": 2.886458158493042, + "learning_rate": 3.4169013775625235e-06, + "loss": 0.0497, + "step": 27043 + }, + { + "epoch": 73.68937329700273, + "grad_norm": 6.311750411987305, + "learning_rate": 3.416237107961873e-06, + "loss": 0.1695, + "step": 27044 + }, + { + "epoch": 73.69209809264305, + "grad_norm": 2.677231788635254, + "learning_rate": 3.415572889635356e-06, + "loss": 0.0498, + "step": 27045 + }, + { + "epoch": 73.69482288828338, + "grad_norm": 2.985056161880493, + "learning_rate": 3.414908722588145e-06, + "loss": 0.0837, + "step": 27046 + }, + { + "epoch": 73.6975476839237, + "grad_norm": 2.018767833709717, + "learning_rate": 3.41424460682541e-06, + "loss": 0.0817, + "step": 27047 + }, + { + "epoch": 73.70027247956403, + "grad_norm": 4.268989086151123, + "learning_rate": 3.413580542352328e-06, + "loss": 0.0722, + "step": 27048 + }, + { + "epoch": 73.70299727520435, + "grad_norm": 2.608004570007324, + "learning_rate": 3.412916529174071e-06, + "loss": 0.0453, + "step": 27049 + }, + { + "epoch": 73.70572207084469, + "grad_norm": 3.135223150253296, + "learning_rate": 3.4122525672958063e-06, + "loss": 0.193, + "step": 27050 + }, + { + "epoch": 73.70844686648502, + "grad_norm": 3.511472702026367, + "learning_rate": 3.411588656722704e-06, + "loss": 0.1021, + "step": 27051 + }, + { + "epoch": 73.71117166212534, + "grad_norm": 2.338649034500122, + "learning_rate": 3.4109247974599413e-06, + "loss": 0.0454, + "step": 27052 + }, + { + "epoch": 73.71389645776567, + "grad_norm": 2.984248399734497, + "learning_rate": 3.4102609895126824e-06, + "loss": 0.1779, + "step": 27053 + }, + { + "epoch": 73.71662125340599, + "grad_norm": 3.1859493255615234, + "learning_rate": 3.4095972328860973e-06, + "loss": 0.0532, + "step": 27054 + }, + { + "epoch": 73.71934604904632, + "grad_norm": 3.8830037117004395, + "learning_rate": 3.4089335275853585e-06, + "loss": 0.0443, + "step": 27055 + }, + { + "epoch": 73.72207084468666, + "grad_norm": 5.8974504470825195, + "learning_rate": 3.408269873615635e-06, + "loss": 0.1181, + "step": 27056 + }, + { + "epoch": 73.72479564032697, + "grad_norm": 3.8796021938323975, + "learning_rate": 3.407606270982089e-06, + "loss": 0.0687, + "step": 27057 + }, + { + "epoch": 73.7275204359673, + "grad_norm": 2.5573911666870117, + "learning_rate": 3.4069427196898973e-06, + "loss": 0.0217, + "step": 27058 + }, + { + "epoch": 73.73024523160763, + "grad_norm": 3.0410897731781006, + "learning_rate": 3.4062792197442197e-06, + "loss": 0.1233, + "step": 27059 + }, + { + "epoch": 73.73297002724796, + "grad_norm": 2.8239598274230957, + "learning_rate": 3.4056157711502304e-06, + "loss": 0.0787, + "step": 27060 + }, + { + "epoch": 73.73569482288828, + "grad_norm": 2.4992105960845947, + "learning_rate": 3.404952373913093e-06, + "loss": 0.1163, + "step": 27061 + }, + { + "epoch": 73.73841961852861, + "grad_norm": 3.2608139514923096, + "learning_rate": 3.4042890280379748e-06, + "loss": 0.1182, + "step": 27062 + }, + { + "epoch": 73.74114441416894, + "grad_norm": 2.4933953285217285, + "learning_rate": 3.403625733530038e-06, + "loss": 0.0467, + "step": 27063 + }, + { + "epoch": 73.74386920980926, + "grad_norm": 3.406280517578125, + "learning_rate": 3.402962490394456e-06, + "loss": 0.0725, + "step": 27064 + }, + { + "epoch": 73.7465940054496, + "grad_norm": 3.1564791202545166, + "learning_rate": 3.402299298636388e-06, + "loss": 0.0855, + "step": 27065 + }, + { + "epoch": 73.74931880108991, + "grad_norm": 3.5999932289123535, + "learning_rate": 3.401636158261001e-06, + "loss": 0.0436, + "step": 27066 + }, + { + "epoch": 73.75204359673025, + "grad_norm": 4.174797534942627, + "learning_rate": 3.4009730692734576e-06, + "loss": 0.0261, + "step": 27067 + }, + { + "epoch": 73.75476839237058, + "grad_norm": 2.6065797805786133, + "learning_rate": 3.4003100316789252e-06, + "loss": 0.0829, + "step": 27068 + }, + { + "epoch": 73.7574931880109, + "grad_norm": 3.2122576236724854, + "learning_rate": 3.399647045482567e-06, + "loss": 0.0468, + "step": 27069 + }, + { + "epoch": 73.76021798365123, + "grad_norm": 3.098024845123291, + "learning_rate": 3.398984110689544e-06, + "loss": 0.0522, + "step": 27070 + }, + { + "epoch": 73.76294277929155, + "grad_norm": 2.635446548461914, + "learning_rate": 3.398321227305018e-06, + "loss": 0.0716, + "step": 27071 + }, + { + "epoch": 73.76566757493188, + "grad_norm": 4.597242832183838, + "learning_rate": 3.3976583953341567e-06, + "loss": 0.0338, + "step": 27072 + }, + { + "epoch": 73.7683923705722, + "grad_norm": 2.7145698070526123, + "learning_rate": 3.396995614782119e-06, + "loss": 0.0444, + "step": 27073 + }, + { + "epoch": 73.77111716621253, + "grad_norm": 2.6254477500915527, + "learning_rate": 3.3963328856540633e-06, + "loss": 0.1218, + "step": 27074 + }, + { + "epoch": 73.77384196185287, + "grad_norm": 3.306751012802124, + "learning_rate": 3.3956702079551563e-06, + "loss": 0.0382, + "step": 27075 + }, + { + "epoch": 73.77656675749319, + "grad_norm": 3.099379062652588, + "learning_rate": 3.3950075816905593e-06, + "loss": 0.0506, + "step": 27076 + }, + { + "epoch": 73.77929155313352, + "grad_norm": 2.3745014667510986, + "learning_rate": 3.3943450068654303e-06, + "loss": 0.0286, + "step": 27077 + }, + { + "epoch": 73.78201634877384, + "grad_norm": 1.9496448040008545, + "learning_rate": 3.39368248348493e-06, + "loss": 0.0256, + "step": 27078 + }, + { + "epoch": 73.78474114441417, + "grad_norm": 2.7493364810943604, + "learning_rate": 3.3930200115542143e-06, + "loss": 0.1075, + "step": 27079 + }, + { + "epoch": 73.7874659400545, + "grad_norm": 3.410435676574707, + "learning_rate": 3.39235759107845e-06, + "loss": 0.1226, + "step": 27080 + }, + { + "epoch": 73.79019073569482, + "grad_norm": 1.8335320949554443, + "learning_rate": 3.391695222062793e-06, + "loss": 0.0644, + "step": 27081 + }, + { + "epoch": 73.79291553133515, + "grad_norm": 3.351548194885254, + "learning_rate": 3.391032904512399e-06, + "loss": 0.1441, + "step": 27082 + }, + { + "epoch": 73.79564032697547, + "grad_norm": 2.729797601699829, + "learning_rate": 3.3903706384324266e-06, + "loss": 0.0472, + "step": 27083 + }, + { + "epoch": 73.7983651226158, + "grad_norm": 3.343799114227295, + "learning_rate": 3.3897084238280366e-06, + "loss": 0.0427, + "step": 27084 + }, + { + "epoch": 73.80108991825612, + "grad_norm": 2.955580949783325, + "learning_rate": 3.389046260704385e-06, + "loss": 0.0447, + "step": 27085 + }, + { + "epoch": 73.80381471389646, + "grad_norm": 3.754732370376587, + "learning_rate": 3.3883841490666293e-06, + "loss": 0.1153, + "step": 27086 + }, + { + "epoch": 73.80653950953679, + "grad_norm": 6.577873706817627, + "learning_rate": 3.3877220889199213e-06, + "loss": 0.1361, + "step": 27087 + }, + { + "epoch": 73.80926430517711, + "grad_norm": 4.125805377960205, + "learning_rate": 3.387060080269423e-06, + "loss": 0.0805, + "step": 27088 + }, + { + "epoch": 73.81198910081744, + "grad_norm": 2.5797054767608643, + "learning_rate": 3.3863981231202892e-06, + "loss": 0.0347, + "step": 27089 + }, + { + "epoch": 73.81471389645776, + "grad_norm": 5.194318771362305, + "learning_rate": 3.385736217477674e-06, + "loss": 0.0739, + "step": 27090 + }, + { + "epoch": 73.8174386920981, + "grad_norm": 2.0635688304901123, + "learning_rate": 3.3850743633467286e-06, + "loss": 0.0432, + "step": 27091 + }, + { + "epoch": 73.82016348773843, + "grad_norm": 3.3392269611358643, + "learning_rate": 3.384412560732612e-06, + "loss": 0.1498, + "step": 27092 + }, + { + "epoch": 73.82288828337875, + "grad_norm": 3.1805264949798584, + "learning_rate": 3.383750809640479e-06, + "loss": 0.1225, + "step": 27093 + }, + { + "epoch": 73.82561307901908, + "grad_norm": 2.010472297668457, + "learning_rate": 3.3830891100754837e-06, + "loss": 0.1257, + "step": 27094 + }, + { + "epoch": 73.8283378746594, + "grad_norm": 3.9813106060028076, + "learning_rate": 3.382427462042772e-06, + "loss": 0.0586, + "step": 27095 + }, + { + "epoch": 73.83106267029973, + "grad_norm": 2.3568520545959473, + "learning_rate": 3.3817658655475074e-06, + "loss": 0.0579, + "step": 27096 + }, + { + "epoch": 73.83378746594005, + "grad_norm": 2.9525599479675293, + "learning_rate": 3.3811043205948366e-06, + "loss": 0.0617, + "step": 27097 + }, + { + "epoch": 73.83651226158038, + "grad_norm": 3.1131997108459473, + "learning_rate": 3.3804428271899127e-06, + "loss": 0.108, + "step": 27098 + }, + { + "epoch": 73.83923705722071, + "grad_norm": 2.993835926055908, + "learning_rate": 3.3797813853378827e-06, + "loss": 0.037, + "step": 27099 + }, + { + "epoch": 73.84196185286103, + "grad_norm": 2.7033605575561523, + "learning_rate": 3.3791199950439057e-06, + "loss": 0.1039, + "step": 27100 + }, + { + "epoch": 73.84468664850137, + "grad_norm": 2.3294596672058105, + "learning_rate": 3.3784586563131293e-06, + "loss": 0.0421, + "step": 27101 + }, + { + "epoch": 73.84741144414168, + "grad_norm": 14.998466491699219, + "learning_rate": 3.3777973691507047e-06, + "loss": 0.168, + "step": 27102 + }, + { + "epoch": 73.85013623978202, + "grad_norm": 2.1214687824249268, + "learning_rate": 3.3771361335617767e-06, + "loss": 0.0691, + "step": 27103 + }, + { + "epoch": 73.85286103542235, + "grad_norm": 2.2651479244232178, + "learning_rate": 3.376474949551504e-06, + "loss": 0.0391, + "step": 27104 + }, + { + "epoch": 73.85558583106267, + "grad_norm": 2.9230926036834717, + "learning_rate": 3.375813817125029e-06, + "loss": 0.0271, + "step": 27105 + }, + { + "epoch": 73.858310626703, + "grad_norm": 2.500877618789673, + "learning_rate": 3.3751527362875045e-06, + "loss": 0.0363, + "step": 27106 + }, + { + "epoch": 73.86103542234332, + "grad_norm": 4.30499267578125, + "learning_rate": 3.374491707044073e-06, + "loss": 0.0638, + "step": 27107 + }, + { + "epoch": 73.86376021798365, + "grad_norm": 3.7821364402770996, + "learning_rate": 3.3738307293998874e-06, + "loss": 0.0236, + "step": 27108 + }, + { + "epoch": 73.86648501362397, + "grad_norm": 2.388015031814575, + "learning_rate": 3.373169803360098e-06, + "loss": 0.037, + "step": 27109 + }, + { + "epoch": 73.8692098092643, + "grad_norm": 2.4646902084350586, + "learning_rate": 3.3725089289298483e-06, + "loss": 0.1281, + "step": 27110 + }, + { + "epoch": 73.87193460490464, + "grad_norm": 6.184477806091309, + "learning_rate": 3.371848106114287e-06, + "loss": 0.0604, + "step": 27111 + }, + { + "epoch": 73.87465940054496, + "grad_norm": 2.7357826232910156, + "learning_rate": 3.371187334918555e-06, + "loss": 0.0882, + "step": 27112 + }, + { + "epoch": 73.87738419618529, + "grad_norm": 3.2358157634735107, + "learning_rate": 3.370526615347807e-06, + "loss": 0.0877, + "step": 27113 + }, + { + "epoch": 73.88010899182561, + "grad_norm": 2.986412525177002, + "learning_rate": 3.369865947407184e-06, + "loss": 0.0349, + "step": 27114 + }, + { + "epoch": 73.88283378746594, + "grad_norm": 3.93294358253479, + "learning_rate": 3.36920533110183e-06, + "loss": 0.0363, + "step": 27115 + }, + { + "epoch": 73.88555858310627, + "grad_norm": 3.0998787879943848, + "learning_rate": 3.36854476643689e-06, + "loss": 0.0582, + "step": 27116 + }, + { + "epoch": 73.88828337874659, + "grad_norm": 12.342453956604004, + "learning_rate": 3.3678842534175126e-06, + "loss": 0.0829, + "step": 27117 + }, + { + "epoch": 73.89100817438693, + "grad_norm": 2.846457004547119, + "learning_rate": 3.367223792048839e-06, + "loss": 0.0673, + "step": 27118 + }, + { + "epoch": 73.89373297002724, + "grad_norm": 4.059755325317383, + "learning_rate": 3.36656338233601e-06, + "loss": 0.0643, + "step": 27119 + }, + { + "epoch": 73.89645776566758, + "grad_norm": 4.853326320648193, + "learning_rate": 3.365903024284175e-06, + "loss": 0.0854, + "step": 27120 + }, + { + "epoch": 73.8991825613079, + "grad_norm": 3.6625607013702393, + "learning_rate": 3.3652427178984748e-06, + "loss": 0.0558, + "step": 27121 + }, + { + "epoch": 73.90190735694823, + "grad_norm": 2.529726982116699, + "learning_rate": 3.3645824631840496e-06, + "loss": 0.1225, + "step": 27122 + }, + { + "epoch": 73.90463215258856, + "grad_norm": 2.7696170806884766, + "learning_rate": 3.36392226014604e-06, + "loss": 0.0381, + "step": 27123 + }, + { + "epoch": 73.90735694822888, + "grad_norm": 3.455655097961426, + "learning_rate": 3.363262108789592e-06, + "loss": 0.0453, + "step": 27124 + }, + { + "epoch": 73.91008174386921, + "grad_norm": 3.9635257720947266, + "learning_rate": 3.3626020091198443e-06, + "loss": 0.0882, + "step": 27125 + }, + { + "epoch": 73.91280653950953, + "grad_norm": 2.7167911529541016, + "learning_rate": 3.3619419611419403e-06, + "loss": 0.0357, + "step": 27126 + }, + { + "epoch": 73.91553133514986, + "grad_norm": 2.969172477722168, + "learning_rate": 3.3612819648610184e-06, + "loss": 0.0334, + "step": 27127 + }, + { + "epoch": 73.9182561307902, + "grad_norm": 3.717292547225952, + "learning_rate": 3.360622020282216e-06, + "loss": 0.0478, + "step": 27128 + }, + { + "epoch": 73.92098092643052, + "grad_norm": 4.75085973739624, + "learning_rate": 3.359962127410679e-06, + "loss": 0.046, + "step": 27129 + }, + { + "epoch": 73.92370572207085, + "grad_norm": 2.781536817550659, + "learning_rate": 3.3593022862515436e-06, + "loss": 0.041, + "step": 27130 + }, + { + "epoch": 73.92643051771117, + "grad_norm": 2.7844009399414062, + "learning_rate": 3.358642496809947e-06, + "loss": 0.0322, + "step": 27131 + }, + { + "epoch": 73.9291553133515, + "grad_norm": 3.279512882232666, + "learning_rate": 3.3579827590910274e-06, + "loss": 0.0511, + "step": 27132 + }, + { + "epoch": 73.93188010899182, + "grad_norm": 2.986257553100586, + "learning_rate": 3.3573230730999264e-06, + "loss": 0.092, + "step": 27133 + }, + { + "epoch": 73.93460490463215, + "grad_norm": 2.8432276248931885, + "learning_rate": 3.3566634388417798e-06, + "loss": 0.0986, + "step": 27134 + }, + { + "epoch": 73.93732970027249, + "grad_norm": 2.8598997592926025, + "learning_rate": 3.3560038563217244e-06, + "loss": 0.0708, + "step": 27135 + }, + { + "epoch": 73.9400544959128, + "grad_norm": 4.491633892059326, + "learning_rate": 3.355344325544894e-06, + "loss": 0.117, + "step": 27136 + }, + { + "epoch": 73.94277929155314, + "grad_norm": 3.8423354625701904, + "learning_rate": 3.354684846516432e-06, + "loss": 0.0404, + "step": 27137 + }, + { + "epoch": 73.94550408719346, + "grad_norm": 2.9154446125030518, + "learning_rate": 3.354025419241469e-06, + "loss": 0.0848, + "step": 27138 + }, + { + "epoch": 73.94822888283379, + "grad_norm": 4.642427921295166, + "learning_rate": 3.3533660437251438e-06, + "loss": 0.2037, + "step": 27139 + }, + { + "epoch": 73.95095367847412, + "grad_norm": 2.829484462738037, + "learning_rate": 3.352706719972585e-06, + "loss": 0.0841, + "step": 27140 + }, + { + "epoch": 73.95367847411444, + "grad_norm": 3.3154149055480957, + "learning_rate": 3.3520474479889365e-06, + "loss": 0.0518, + "step": 27141 + }, + { + "epoch": 73.95640326975477, + "grad_norm": 3.962322235107422, + "learning_rate": 3.3513882277793287e-06, + "loss": 0.0691, + "step": 27142 + }, + { + "epoch": 73.95912806539509, + "grad_norm": 2.514549732208252, + "learning_rate": 3.3507290593488916e-06, + "loss": 0.0885, + "step": 27143 + }, + { + "epoch": 73.96185286103542, + "grad_norm": 2.186782121658325, + "learning_rate": 3.350069942702763e-06, + "loss": 0.1245, + "step": 27144 + }, + { + "epoch": 73.96457765667574, + "grad_norm": 2.092263698577881, + "learning_rate": 3.349410877846079e-06, + "loss": 0.0359, + "step": 27145 + }, + { + "epoch": 73.96730245231608, + "grad_norm": 3.4706501960754395, + "learning_rate": 3.348751864783969e-06, + "loss": 0.1299, + "step": 27146 + }, + { + "epoch": 73.97002724795641, + "grad_norm": 2.9542319774627686, + "learning_rate": 3.3480929035215647e-06, + "loss": 0.1941, + "step": 27147 + }, + { + "epoch": 73.97275204359673, + "grad_norm": 3.0135879516601562, + "learning_rate": 3.3474339940639965e-06, + "loss": 0.0414, + "step": 27148 + }, + { + "epoch": 73.97547683923706, + "grad_norm": 3.0829758644104004, + "learning_rate": 3.3467751364164013e-06, + "loss": 0.0813, + "step": 27149 + }, + { + "epoch": 73.97820163487738, + "grad_norm": 2.953204870223999, + "learning_rate": 3.3461163305839074e-06, + "loss": 0.0436, + "step": 27150 + }, + { + "epoch": 73.98092643051771, + "grad_norm": 2.9540188312530518, + "learning_rate": 3.3454575765716446e-06, + "loss": 0.0531, + "step": 27151 + }, + { + "epoch": 73.98365122615803, + "grad_norm": 4.306671619415283, + "learning_rate": 3.3447988743847402e-06, + "loss": 0.1042, + "step": 27152 + }, + { + "epoch": 73.98637602179836, + "grad_norm": 2.209057331085205, + "learning_rate": 3.3441402240283325e-06, + "loss": 0.1337, + "step": 27153 + }, + { + "epoch": 73.9891008174387, + "grad_norm": 2.6406970024108887, + "learning_rate": 3.3434816255075464e-06, + "loss": 0.0736, + "step": 27154 + }, + { + "epoch": 73.99182561307902, + "grad_norm": 2.883601665496826, + "learning_rate": 3.3428230788275106e-06, + "loss": 0.0501, + "step": 27155 + }, + { + "epoch": 73.99455040871935, + "grad_norm": 2.4726920127868652, + "learning_rate": 3.3421645839933514e-06, + "loss": 0.0774, + "step": 27156 + }, + { + "epoch": 73.99727520435967, + "grad_norm": 2.8331825733184814, + "learning_rate": 3.3415061410102036e-06, + "loss": 0.1124, + "step": 27157 + }, + { + "epoch": 74.0, + "grad_norm": 5.509169101715088, + "learning_rate": 3.3408477498831917e-06, + "loss": 0.2008, + "step": 27158 + }, + { + "epoch": 74.00272479564033, + "grad_norm": 2.4617745876312256, + "learning_rate": 3.3401894106174427e-06, + "loss": 0.0408, + "step": 27159 + }, + { + "epoch": 74.00544959128065, + "grad_norm": 2.893810987472534, + "learning_rate": 3.3395311232180783e-06, + "loss": 0.0524, + "step": 27160 + }, + { + "epoch": 74.00817438692098, + "grad_norm": 2.2738749980926514, + "learning_rate": 3.3388728876902378e-06, + "loss": 0.0448, + "step": 27161 + }, + { + "epoch": 74.0108991825613, + "grad_norm": 2.066929340362549, + "learning_rate": 3.3382147040390402e-06, + "loss": 0.0301, + "step": 27162 + }, + { + "epoch": 74.01362397820164, + "grad_norm": 3.5921077728271484, + "learning_rate": 3.3375565722696123e-06, + "loss": 0.0858, + "step": 27163 + }, + { + "epoch": 74.01634877384195, + "grad_norm": 3.013620138168335, + "learning_rate": 3.336898492387076e-06, + "loss": 0.153, + "step": 27164 + }, + { + "epoch": 74.01907356948229, + "grad_norm": 2.7107770442962646, + "learning_rate": 3.3362404643965628e-06, + "loss": 0.0401, + "step": 27165 + }, + { + "epoch": 74.02179836512262, + "grad_norm": 2.825683355331421, + "learning_rate": 3.335582488303195e-06, + "loss": 0.0418, + "step": 27166 + }, + { + "epoch": 74.02452316076294, + "grad_norm": 3.1012535095214844, + "learning_rate": 3.3349245641120965e-06, + "loss": 0.0438, + "step": 27167 + }, + { + "epoch": 74.02724795640327, + "grad_norm": 2.699633836746216, + "learning_rate": 3.334266691828387e-06, + "loss": 0.0291, + "step": 27168 + }, + { + "epoch": 74.02997275204359, + "grad_norm": 2.9676756858825684, + "learning_rate": 3.3336088714571977e-06, + "loss": 0.1213, + "step": 27169 + }, + { + "epoch": 74.03269754768392, + "grad_norm": 5.069844722747803, + "learning_rate": 3.3329511030036476e-06, + "loss": 0.0487, + "step": 27170 + }, + { + "epoch": 74.03542234332426, + "grad_norm": 2.047196626663208, + "learning_rate": 3.33229338647286e-06, + "loss": 0.137, + "step": 27171 + }, + { + "epoch": 74.03814713896458, + "grad_norm": 2.680666208267212, + "learning_rate": 3.3316357218699535e-06, + "loss": 0.1425, + "step": 27172 + }, + { + "epoch": 74.04087193460491, + "grad_norm": 3.8923232555389404, + "learning_rate": 3.330978109200057e-06, + "loss": 0.1451, + "step": 27173 + }, + { + "epoch": 74.04359673024523, + "grad_norm": 2.742316961288452, + "learning_rate": 3.3303205484682878e-06, + "loss": 0.0578, + "step": 27174 + }, + { + "epoch": 74.04632152588556, + "grad_norm": 2.411404848098755, + "learning_rate": 3.329663039679768e-06, + "loss": 0.1779, + "step": 27175 + }, + { + "epoch": 74.04904632152588, + "grad_norm": 3.542120933532715, + "learning_rate": 3.329005582839614e-06, + "loss": 0.0407, + "step": 27176 + }, + { + "epoch": 74.05177111716621, + "grad_norm": 2.5981528759002686, + "learning_rate": 3.3283481779529503e-06, + "loss": 0.0433, + "step": 27177 + }, + { + "epoch": 74.05449591280654, + "grad_norm": 3.1827433109283447, + "learning_rate": 3.3276908250249e-06, + "loss": 0.0744, + "step": 27178 + }, + { + "epoch": 74.05722070844686, + "grad_norm": 2.6564531326293945, + "learning_rate": 3.327033524060578e-06, + "loss": 0.0686, + "step": 27179 + }, + { + "epoch": 74.0599455040872, + "grad_norm": 2.9468657970428467, + "learning_rate": 3.3263762750651043e-06, + "loss": 0.0564, + "step": 27180 + }, + { + "epoch": 74.06267029972751, + "grad_norm": 3.285318613052368, + "learning_rate": 3.325719078043593e-06, + "loss": 0.0664, + "step": 27181 + }, + { + "epoch": 74.06539509536785, + "grad_norm": 1.8797310590744019, + "learning_rate": 3.3250619330011715e-06, + "loss": 0.0299, + "step": 27182 + }, + { + "epoch": 74.06811989100818, + "grad_norm": 2.1970951557159424, + "learning_rate": 3.324404839942953e-06, + "loss": 0.0534, + "step": 27183 + }, + { + "epoch": 74.0708446866485, + "grad_norm": 2.397085189819336, + "learning_rate": 3.3237477988740508e-06, + "loss": 0.0339, + "step": 27184 + }, + { + "epoch": 74.07356948228883, + "grad_norm": 3.1384451389312744, + "learning_rate": 3.3230908097995885e-06, + "loss": 0.0392, + "step": 27185 + }, + { + "epoch": 74.07629427792915, + "grad_norm": 2.7506701946258545, + "learning_rate": 3.322433872724681e-06, + "loss": 0.0712, + "step": 27186 + }, + { + "epoch": 74.07901907356948, + "grad_norm": 2.195390224456787, + "learning_rate": 3.3217769876544437e-06, + "loss": 0.0418, + "step": 27187 + }, + { + "epoch": 74.0817438692098, + "grad_norm": 2.8584413528442383, + "learning_rate": 3.3211201545939885e-06, + "loss": 0.0401, + "step": 27188 + }, + { + "epoch": 74.08446866485014, + "grad_norm": 2.165010690689087, + "learning_rate": 3.320463373548438e-06, + "loss": 0.0532, + "step": 27189 + }, + { + "epoch": 74.08719346049047, + "grad_norm": 2.679511070251465, + "learning_rate": 3.319806644522904e-06, + "loss": 0.04, + "step": 27190 + }, + { + "epoch": 74.08991825613079, + "grad_norm": 3.2109289169311523, + "learning_rate": 3.3191499675225e-06, + "loss": 0.0686, + "step": 27191 + }, + { + "epoch": 74.09264305177112, + "grad_norm": 3.273088216781616, + "learning_rate": 3.318493342552339e-06, + "loss": 0.0536, + "step": 27192 + }, + { + "epoch": 74.09536784741144, + "grad_norm": 2.2636821269989014, + "learning_rate": 3.3178367696175396e-06, + "loss": 0.08, + "step": 27193 + }, + { + "epoch": 74.09809264305177, + "grad_norm": 1.867721438407898, + "learning_rate": 3.3171802487232087e-06, + "loss": 0.1226, + "step": 27194 + }, + { + "epoch": 74.1008174386921, + "grad_norm": 2.4035680294036865, + "learning_rate": 3.3165237798744665e-06, + "loss": 0.0996, + "step": 27195 + }, + { + "epoch": 74.10354223433242, + "grad_norm": 2.8854174613952637, + "learning_rate": 3.3158673630764216e-06, + "loss": 0.0377, + "step": 27196 + }, + { + "epoch": 74.10626702997276, + "grad_norm": 2.278005838394165, + "learning_rate": 3.315210998334184e-06, + "loss": 0.0347, + "step": 27197 + }, + { + "epoch": 74.10899182561307, + "grad_norm": 3.0782861709594727, + "learning_rate": 3.314554685652871e-06, + "loss": 0.0407, + "step": 27198 + }, + { + "epoch": 74.11171662125341, + "grad_norm": 4.853907585144043, + "learning_rate": 3.3138984250375903e-06, + "loss": 0.0712, + "step": 27199 + }, + { + "epoch": 74.11444141689373, + "grad_norm": 3.5312323570251465, + "learning_rate": 3.313242216493454e-06, + "loss": 0.0998, + "step": 27200 + }, + { + "epoch": 74.11716621253406, + "grad_norm": 2.485520601272583, + "learning_rate": 3.3125860600255686e-06, + "loss": 0.0353, + "step": 27201 + }, + { + "epoch": 74.11989100817439, + "grad_norm": 4.5134172439575195, + "learning_rate": 3.3119299556390516e-06, + "loss": 0.0634, + "step": 27202 + }, + { + "epoch": 74.12261580381471, + "grad_norm": 1.728415608406067, + "learning_rate": 3.3112739033390083e-06, + "loss": 0.0255, + "step": 27203 + }, + { + "epoch": 74.12534059945504, + "grad_norm": 4.402983665466309, + "learning_rate": 3.3106179031305497e-06, + "loss": 0.0326, + "step": 27204 + }, + { + "epoch": 74.12806539509536, + "grad_norm": 2.5725178718566895, + "learning_rate": 3.309961955018779e-06, + "loss": 0.1255, + "step": 27205 + }, + { + "epoch": 74.1307901907357, + "grad_norm": 2.395601511001587, + "learning_rate": 3.3093060590088132e-06, + "loss": 0.1171, + "step": 27206 + }, + { + "epoch": 74.13351498637603, + "grad_norm": 3.410938024520874, + "learning_rate": 3.3086502151057564e-06, + "loss": 0.0776, + "step": 27207 + }, + { + "epoch": 74.13623978201635, + "grad_norm": 2.5566298961639404, + "learning_rate": 3.3079944233147123e-06, + "loss": 0.06, + "step": 27208 + }, + { + "epoch": 74.13896457765668, + "grad_norm": 3.42567777633667, + "learning_rate": 3.307338683640796e-06, + "loss": 0.1214, + "step": 27209 + }, + { + "epoch": 74.141689373297, + "grad_norm": 3.425590991973877, + "learning_rate": 3.306682996089111e-06, + "loss": 0.093, + "step": 27210 + }, + { + "epoch": 74.14441416893733, + "grad_norm": 3.416318416595459, + "learning_rate": 3.30602736066476e-06, + "loss": 0.1777, + "step": 27211 + }, + { + "epoch": 74.14713896457765, + "grad_norm": 3.309035062789917, + "learning_rate": 3.3053717773728556e-06, + "loss": 0.2189, + "step": 27212 + }, + { + "epoch": 74.14986376021798, + "grad_norm": 3.4633026123046875, + "learning_rate": 3.3047162462184965e-06, + "loss": 0.0384, + "step": 27213 + }, + { + "epoch": 74.15258855585832, + "grad_norm": 2.273061990737915, + "learning_rate": 3.304060767206796e-06, + "loss": 0.0318, + "step": 27214 + }, + { + "epoch": 74.15531335149863, + "grad_norm": 4.014997482299805, + "learning_rate": 3.3034053403428547e-06, + "loss": 0.0629, + "step": 27215 + }, + { + "epoch": 74.15803814713897, + "grad_norm": 9.901772499084473, + "learning_rate": 3.3027499656317773e-06, + "loss": 0.1588, + "step": 27216 + }, + { + "epoch": 74.16076294277929, + "grad_norm": 2.357943058013916, + "learning_rate": 3.302094643078664e-06, + "loss": 0.0382, + "step": 27217 + }, + { + "epoch": 74.16348773841962, + "grad_norm": 3.563890218734741, + "learning_rate": 3.301439372688624e-06, + "loss": 0.165, + "step": 27218 + }, + { + "epoch": 74.16621253405995, + "grad_norm": 1.481551170349121, + "learning_rate": 3.3007841544667606e-06, + "loss": 0.0162, + "step": 27219 + }, + { + "epoch": 74.16893732970027, + "grad_norm": 1.9927772283554077, + "learning_rate": 3.300128988418173e-06, + "loss": 0.0314, + "step": 27220 + }, + { + "epoch": 74.1716621253406, + "grad_norm": 2.6529672145843506, + "learning_rate": 3.2994738745479628e-06, + "loss": 0.0431, + "step": 27221 + }, + { + "epoch": 74.17438692098092, + "grad_norm": 3.6385836601257324, + "learning_rate": 3.2988188128612374e-06, + "loss": 0.0459, + "step": 27222 + }, + { + "epoch": 74.17711171662125, + "grad_norm": 2.179558753967285, + "learning_rate": 3.2981638033630956e-06, + "loss": 0.0325, + "step": 27223 + }, + { + "epoch": 74.17983651226157, + "grad_norm": 3.6399078369140625, + "learning_rate": 3.297508846058639e-06, + "loss": 0.0885, + "step": 27224 + }, + { + "epoch": 74.1825613079019, + "grad_norm": 3.046405076980591, + "learning_rate": 3.2968539409529632e-06, + "loss": 0.0281, + "step": 27225 + }, + { + "epoch": 74.18528610354224, + "grad_norm": 3.1456198692321777, + "learning_rate": 3.2961990880511773e-06, + "loss": 0.0977, + "step": 27226 + }, + { + "epoch": 74.18801089918256, + "grad_norm": 2.7781946659088135, + "learning_rate": 3.2955442873583765e-06, + "loss": 0.0759, + "step": 27227 + }, + { + "epoch": 74.19073569482289, + "grad_norm": 2.615128993988037, + "learning_rate": 3.2948895388796585e-06, + "loss": 0.0274, + "step": 27228 + }, + { + "epoch": 74.19346049046321, + "grad_norm": 4.8917083740234375, + "learning_rate": 3.2942348426201244e-06, + "loss": 0.0238, + "step": 27229 + }, + { + "epoch": 74.19618528610354, + "grad_norm": 2.16357421875, + "learning_rate": 3.293580198584877e-06, + "loss": 0.0294, + "step": 27230 + }, + { + "epoch": 74.19891008174388, + "grad_norm": 2.5870048999786377, + "learning_rate": 3.2929256067790117e-06, + "loss": 0.0522, + "step": 27231 + }, + { + "epoch": 74.2016348773842, + "grad_norm": 2.3557868003845215, + "learning_rate": 3.292271067207625e-06, + "loss": 0.2176, + "step": 27232 + }, + { + "epoch": 74.20435967302453, + "grad_norm": 3.6504061222076416, + "learning_rate": 3.2916165798758127e-06, + "loss": 0.1255, + "step": 27233 + }, + { + "epoch": 74.20708446866485, + "grad_norm": 2.0222890377044678, + "learning_rate": 3.2909621447886773e-06, + "loss": 0.0349, + "step": 27234 + }, + { + "epoch": 74.20980926430518, + "grad_norm": 3.4126057624816895, + "learning_rate": 3.2903077619513135e-06, + "loss": 0.0624, + "step": 27235 + }, + { + "epoch": 74.2125340599455, + "grad_norm": 3.1359829902648926, + "learning_rate": 3.2896534313688165e-06, + "loss": 0.0958, + "step": 27236 + }, + { + "epoch": 74.21525885558583, + "grad_norm": 3.701328754425049, + "learning_rate": 3.2889991530462793e-06, + "loss": 0.0965, + "step": 27237 + }, + { + "epoch": 74.21798365122616, + "grad_norm": 2.533704996109009, + "learning_rate": 3.2883449269888034e-06, + "loss": 0.0507, + "step": 27238 + }, + { + "epoch": 74.22070844686648, + "grad_norm": 2.3656082153320312, + "learning_rate": 3.287690753201482e-06, + "loss": 0.0458, + "step": 27239 + }, + { + "epoch": 74.22343324250681, + "grad_norm": 2.510498523712158, + "learning_rate": 3.2870366316894086e-06, + "loss": 0.0416, + "step": 27240 + }, + { + "epoch": 74.22615803814713, + "grad_norm": 2.279121160507202, + "learning_rate": 3.2863825624576752e-06, + "loss": 0.1041, + "step": 27241 + }, + { + "epoch": 74.22888283378747, + "grad_norm": 2.8952863216400146, + "learning_rate": 3.2857285455113807e-06, + "loss": 0.1, + "step": 27242 + }, + { + "epoch": 74.2316076294278, + "grad_norm": 2.5696914196014404, + "learning_rate": 3.2850745808556174e-06, + "loss": 0.0292, + "step": 27243 + }, + { + "epoch": 74.23433242506812, + "grad_norm": 2.5835812091827393, + "learning_rate": 3.284420668495476e-06, + "loss": 0.0625, + "step": 27244 + }, + { + "epoch": 74.23705722070845, + "grad_norm": 3.5429649353027344, + "learning_rate": 3.2837668084360476e-06, + "loss": 0.0728, + "step": 27245 + }, + { + "epoch": 74.23978201634877, + "grad_norm": 2.635214328765869, + "learning_rate": 3.2831130006824274e-06, + "loss": 0.0596, + "step": 27246 + }, + { + "epoch": 74.2425068119891, + "grad_norm": 3.1904172897338867, + "learning_rate": 3.2824592452397097e-06, + "loss": 0.0781, + "step": 27247 + }, + { + "epoch": 74.24523160762942, + "grad_norm": 2.6193346977233887, + "learning_rate": 3.2818055421129837e-06, + "loss": 0.0857, + "step": 27248 + }, + { + "epoch": 74.24795640326975, + "grad_norm": 2.1958374977111816, + "learning_rate": 3.281151891307336e-06, + "loss": 0.0554, + "step": 27249 + }, + { + "epoch": 74.25068119891009, + "grad_norm": 2.411705732345581, + "learning_rate": 3.280498292827864e-06, + "loss": 0.0324, + "step": 27250 + }, + { + "epoch": 74.2534059945504, + "grad_norm": 2.6255908012390137, + "learning_rate": 3.2798447466796557e-06, + "loss": 0.0736, + "step": 27251 + }, + { + "epoch": 74.25613079019074, + "grad_norm": 3.314282178878784, + "learning_rate": 3.2791912528678004e-06, + "loss": 0.1105, + "step": 27252 + }, + { + "epoch": 74.25885558583106, + "grad_norm": 2.7014825344085693, + "learning_rate": 3.2785378113973843e-06, + "loss": 0.0394, + "step": 27253 + }, + { + "epoch": 74.26158038147139, + "grad_norm": 2.0100409984588623, + "learning_rate": 3.277884422273502e-06, + "loss": 0.0471, + "step": 27254 + }, + { + "epoch": 74.26430517711172, + "grad_norm": 3.3638100624084473, + "learning_rate": 3.277231085501239e-06, + "loss": 0.0718, + "step": 27255 + }, + { + "epoch": 74.26702997275204, + "grad_norm": 2.4385015964508057, + "learning_rate": 3.2765778010856854e-06, + "loss": 0.0228, + "step": 27256 + }, + { + "epoch": 74.26975476839237, + "grad_norm": 2.5477700233459473, + "learning_rate": 3.275924569031923e-06, + "loss": 0.0393, + "step": 27257 + }, + { + "epoch": 74.2724795640327, + "grad_norm": 2.120997190475464, + "learning_rate": 3.275271389345047e-06, + "loss": 0.0376, + "step": 27258 + }, + { + "epoch": 74.27520435967303, + "grad_norm": 2.6655328273773193, + "learning_rate": 3.2746182620301416e-06, + "loss": 0.172, + "step": 27259 + }, + { + "epoch": 74.27792915531334, + "grad_norm": 2.456432580947876, + "learning_rate": 3.2739651870922926e-06, + "loss": 0.0377, + "step": 27260 + }, + { + "epoch": 74.28065395095368, + "grad_norm": 2.6079587936401367, + "learning_rate": 3.273312164536583e-06, + "loss": 0.0541, + "step": 27261 + }, + { + "epoch": 74.28337874659401, + "grad_norm": 3.5972044467926025, + "learning_rate": 3.272659194368104e-06, + "loss": 0.0997, + "step": 27262 + }, + { + "epoch": 74.28610354223433, + "grad_norm": 2.5031604766845703, + "learning_rate": 3.2720062765919368e-06, + "loss": 0.0635, + "step": 27263 + }, + { + "epoch": 74.28882833787466, + "grad_norm": 2.1376121044158936, + "learning_rate": 3.2713534112131705e-06, + "loss": 0.0237, + "step": 27264 + }, + { + "epoch": 74.29155313351498, + "grad_norm": 3.359450578689575, + "learning_rate": 3.2707005982368877e-06, + "loss": 0.1266, + "step": 27265 + }, + { + "epoch": 74.29427792915531, + "grad_norm": 2.4304559230804443, + "learning_rate": 3.2700478376681686e-06, + "loss": 0.0349, + "step": 27266 + }, + { + "epoch": 74.29700272479565, + "grad_norm": 2.10734224319458, + "learning_rate": 3.269395129512104e-06, + "loss": 0.0816, + "step": 27267 + }, + { + "epoch": 74.29972752043597, + "grad_norm": 2.9545388221740723, + "learning_rate": 3.268742473773774e-06, + "loss": 0.0568, + "step": 27268 + }, + { + "epoch": 74.3024523160763, + "grad_norm": 2.317762613296509, + "learning_rate": 3.2680898704582562e-06, + "loss": 0.0915, + "step": 27269 + }, + { + "epoch": 74.30517711171662, + "grad_norm": 2.382387638092041, + "learning_rate": 3.267437319570642e-06, + "loss": 0.1144, + "step": 27270 + }, + { + "epoch": 74.30790190735695, + "grad_norm": 3.6725282669067383, + "learning_rate": 3.2667848211160093e-06, + "loss": 0.0893, + "step": 27271 + }, + { + "epoch": 74.31062670299727, + "grad_norm": 4.105287551879883, + "learning_rate": 3.26613237509944e-06, + "loss": 0.0815, + "step": 27272 + }, + { + "epoch": 74.3133514986376, + "grad_norm": 12.403950691223145, + "learning_rate": 3.265479981526011e-06, + "loss": 0.11, + "step": 27273 + }, + { + "epoch": 74.31607629427793, + "grad_norm": 2.5986974239349365, + "learning_rate": 3.2648276404008104e-06, + "loss": 0.0958, + "step": 27274 + }, + { + "epoch": 74.31880108991825, + "grad_norm": 3.031984806060791, + "learning_rate": 3.2641753517289164e-06, + "loss": 0.0336, + "step": 27275 + }, + { + "epoch": 74.32152588555859, + "grad_norm": 2.4086272716522217, + "learning_rate": 3.2635231155154067e-06, + "loss": 0.0877, + "step": 27276 + }, + { + "epoch": 74.3242506811989, + "grad_norm": 4.058390140533447, + "learning_rate": 3.2628709317653593e-06, + "loss": 0.0777, + "step": 27277 + }, + { + "epoch": 74.32697547683924, + "grad_norm": 3.4180104732513428, + "learning_rate": 3.2622188004838594e-06, + "loss": 0.0354, + "step": 27278 + }, + { + "epoch": 74.32970027247957, + "grad_norm": 3.0404999256134033, + "learning_rate": 3.2615667216759837e-06, + "loss": 0.0519, + "step": 27279 + }, + { + "epoch": 74.33242506811989, + "grad_norm": 3.8097989559173584, + "learning_rate": 3.260914695346805e-06, + "loss": 0.0366, + "step": 27280 + }, + { + "epoch": 74.33514986376022, + "grad_norm": 2.1361637115478516, + "learning_rate": 3.2602627215014093e-06, + "loss": 0.0604, + "step": 27281 + }, + { + "epoch": 74.33787465940054, + "grad_norm": 3.0930285453796387, + "learning_rate": 3.259610800144868e-06, + "loss": 0.0418, + "step": 27282 + }, + { + "epoch": 74.34059945504087, + "grad_norm": 3.5604248046875, + "learning_rate": 3.2589589312822634e-06, + "loss": 0.2219, + "step": 27283 + }, + { + "epoch": 74.34332425068119, + "grad_norm": 3.0186381340026855, + "learning_rate": 3.2583071149186695e-06, + "loss": 0.1285, + "step": 27284 + }, + { + "epoch": 74.34604904632153, + "grad_norm": 4.4371466636657715, + "learning_rate": 3.2576553510591636e-06, + "loss": 0.1368, + "step": 27285 + }, + { + "epoch": 74.34877384196186, + "grad_norm": 2.5523457527160645, + "learning_rate": 3.257003639708818e-06, + "loss": 0.1301, + "step": 27286 + }, + { + "epoch": 74.35149863760218, + "grad_norm": 4.00749397277832, + "learning_rate": 3.256351980872713e-06, + "loss": 0.0779, + "step": 27287 + }, + { + "epoch": 74.35422343324251, + "grad_norm": 2.7158422470092773, + "learning_rate": 3.2557003745559224e-06, + "loss": 0.0338, + "step": 27288 + }, + { + "epoch": 74.35694822888283, + "grad_norm": 2.823284149169922, + "learning_rate": 3.25504882076352e-06, + "loss": 0.0979, + "step": 27289 + }, + { + "epoch": 74.35967302452316, + "grad_norm": 4.403693199157715, + "learning_rate": 3.2543973195005764e-06, + "loss": 0.0682, + "step": 27290 + }, + { + "epoch": 74.3623978201635, + "grad_norm": 2.1391823291778564, + "learning_rate": 3.2537458707721735e-06, + "loss": 0.0244, + "step": 27291 + }, + { + "epoch": 74.36512261580381, + "grad_norm": 4.027947902679443, + "learning_rate": 3.2530944745833803e-06, + "loss": 0.1552, + "step": 27292 + }, + { + "epoch": 74.36784741144415, + "grad_norm": 2.293487071990967, + "learning_rate": 3.2524431309392667e-06, + "loss": 0.0498, + "step": 27293 + }, + { + "epoch": 74.37057220708446, + "grad_norm": 2.6919054985046387, + "learning_rate": 3.2517918398449133e-06, + "loss": 0.0395, + "step": 27294 + }, + { + "epoch": 74.3732970027248, + "grad_norm": 1.9174407720565796, + "learning_rate": 3.251140601305387e-06, + "loss": 0.0276, + "step": 27295 + }, + { + "epoch": 74.37602179836512, + "grad_norm": 2.551849603652954, + "learning_rate": 3.2504894153257603e-06, + "loss": 0.1889, + "step": 27296 + }, + { + "epoch": 74.37874659400545, + "grad_norm": 3.521094799041748, + "learning_rate": 3.2498382819111017e-06, + "loss": 0.0504, + "step": 27297 + }, + { + "epoch": 74.38147138964578, + "grad_norm": 3.04475998878479, + "learning_rate": 3.2491872010664847e-06, + "loss": 0.2605, + "step": 27298 + }, + { + "epoch": 74.3841961852861, + "grad_norm": 2.8988218307495117, + "learning_rate": 3.2485361727969846e-06, + "loss": 0.0897, + "step": 27299 + }, + { + "epoch": 74.38692098092643, + "grad_norm": 3.369778871536255, + "learning_rate": 3.2478851971076675e-06, + "loss": 0.1045, + "step": 27300 + }, + { + "epoch": 74.38964577656675, + "grad_norm": 3.181368827819824, + "learning_rate": 3.2472342740036033e-06, + "loss": 0.0827, + "step": 27301 + }, + { + "epoch": 74.39237057220708, + "grad_norm": 1.9666175842285156, + "learning_rate": 3.246583403489857e-06, + "loss": 0.0548, + "step": 27302 + }, + { + "epoch": 74.39509536784742, + "grad_norm": 3.336275100708008, + "learning_rate": 3.2459325855715063e-06, + "loss": 0.0313, + "step": 27303 + }, + { + "epoch": 74.39782016348774, + "grad_norm": 2.77612566947937, + "learning_rate": 3.245281820253614e-06, + "loss": 0.0394, + "step": 27304 + }, + { + "epoch": 74.40054495912807, + "grad_norm": 2.6531143188476562, + "learning_rate": 3.2446311075412508e-06, + "loss": 0.068, + "step": 27305 + }, + { + "epoch": 74.40326975476839, + "grad_norm": 3.5499050617218018, + "learning_rate": 3.243980447439479e-06, + "loss": 0.068, + "step": 27306 + }, + { + "epoch": 74.40599455040872, + "grad_norm": 3.847198247909546, + "learning_rate": 3.243329839953373e-06, + "loss": 0.0618, + "step": 27307 + }, + { + "epoch": 74.40871934604904, + "grad_norm": 2.1634271144866943, + "learning_rate": 3.2426792850879974e-06, + "loss": 0.0325, + "step": 27308 + }, + { + "epoch": 74.41144414168937, + "grad_norm": 2.917853355407715, + "learning_rate": 3.2420287828484175e-06, + "loss": 0.055, + "step": 27309 + }, + { + "epoch": 74.4141689373297, + "grad_norm": 3.1917197704315186, + "learning_rate": 3.2413783332396977e-06, + "loss": 0.1354, + "step": 27310 + }, + { + "epoch": 74.41689373297002, + "grad_norm": 4.102021217346191, + "learning_rate": 3.240727936266909e-06, + "loss": 0.0614, + "step": 27311 + }, + { + "epoch": 74.41961852861036, + "grad_norm": 2.5872745513916016, + "learning_rate": 3.2400775919351123e-06, + "loss": 0.0473, + "step": 27312 + }, + { + "epoch": 74.42234332425068, + "grad_norm": 3.0297534465789795, + "learning_rate": 3.2394273002493747e-06, + "loss": 0.092, + "step": 27313 + }, + { + "epoch": 74.42506811989101, + "grad_norm": 2.410175323486328, + "learning_rate": 3.2387770612147562e-06, + "loss": 0.0258, + "step": 27314 + }, + { + "epoch": 74.42779291553134, + "grad_norm": 2.3826498985290527, + "learning_rate": 3.238126874836325e-06, + "loss": 0.0595, + "step": 27315 + }, + { + "epoch": 74.43051771117166, + "grad_norm": 2.6610512733459473, + "learning_rate": 3.2374767411191468e-06, + "loss": 0.0374, + "step": 27316 + }, + { + "epoch": 74.433242506812, + "grad_norm": 2.922426223754883, + "learning_rate": 3.2368266600682817e-06, + "loss": 0.0337, + "step": 27317 + }, + { + "epoch": 74.43596730245231, + "grad_norm": 2.367076873779297, + "learning_rate": 3.23617663168879e-06, + "loss": 0.0326, + "step": 27318 + }, + { + "epoch": 74.43869209809264, + "grad_norm": 3.080042600631714, + "learning_rate": 3.23552665598574e-06, + "loss": 0.0982, + "step": 27319 + }, + { + "epoch": 74.44141689373296, + "grad_norm": 2.814044952392578, + "learning_rate": 3.2348767329641908e-06, + "loss": 0.096, + "step": 27320 + }, + { + "epoch": 74.4441416893733, + "grad_norm": 3.0666403770446777, + "learning_rate": 3.2342268626292037e-06, + "loss": 0.1051, + "step": 27321 + }, + { + "epoch": 74.44686648501363, + "grad_norm": 2.8949360847473145, + "learning_rate": 3.233577044985837e-06, + "loss": 0.0424, + "step": 27322 + }, + { + "epoch": 74.44959128065395, + "grad_norm": 3.484898090362549, + "learning_rate": 3.2329272800391586e-06, + "loss": 0.0908, + "step": 27323 + }, + { + "epoch": 74.45231607629428, + "grad_norm": 3.0054502487182617, + "learning_rate": 3.232277567794223e-06, + "loss": 0.0566, + "step": 27324 + }, + { + "epoch": 74.4550408719346, + "grad_norm": 3.1153807640075684, + "learning_rate": 3.231627908256093e-06, + "loss": 0.0953, + "step": 27325 + }, + { + "epoch": 74.45776566757493, + "grad_norm": 2.3662543296813965, + "learning_rate": 3.2309783014298235e-06, + "loss": 0.0504, + "step": 27326 + }, + { + "epoch": 74.46049046321527, + "grad_norm": 2.445415496826172, + "learning_rate": 3.2303287473204813e-06, + "loss": 0.0424, + "step": 27327 + }, + { + "epoch": 74.46321525885558, + "grad_norm": 12.313671112060547, + "learning_rate": 3.2296792459331196e-06, + "loss": 0.0485, + "step": 27328 + }, + { + "epoch": 74.46594005449592, + "grad_norm": 3.2492637634277344, + "learning_rate": 3.229029797272799e-06, + "loss": 0.2021, + "step": 27329 + }, + { + "epoch": 74.46866485013624, + "grad_norm": 6.003134250640869, + "learning_rate": 3.228380401344573e-06, + "loss": 0.0459, + "step": 27330 + }, + { + "epoch": 74.47138964577657, + "grad_norm": 4.572073936462402, + "learning_rate": 3.2277310581535046e-06, + "loss": 0.0863, + "step": 27331 + }, + { + "epoch": 74.47411444141689, + "grad_norm": 2.737095832824707, + "learning_rate": 3.2270817677046463e-06, + "loss": 0.16, + "step": 27332 + }, + { + "epoch": 74.47683923705722, + "grad_norm": 1.6207386255264282, + "learning_rate": 3.226432530003061e-06, + "loss": 0.0238, + "step": 27333 + }, + { + "epoch": 74.47956403269755, + "grad_norm": 4.511898994445801, + "learning_rate": 3.225783345053797e-06, + "loss": 0.031, + "step": 27334 + }, + { + "epoch": 74.48228882833787, + "grad_norm": 2.6669580936431885, + "learning_rate": 3.2251342128619177e-06, + "loss": 0.0255, + "step": 27335 + }, + { + "epoch": 74.4850136239782, + "grad_norm": 2.2407360076904297, + "learning_rate": 3.2244851334324755e-06, + "loss": 0.0307, + "step": 27336 + }, + { + "epoch": 74.48773841961852, + "grad_norm": 1.9477989673614502, + "learning_rate": 3.223836106770525e-06, + "loss": 0.0255, + "step": 27337 + }, + { + "epoch": 74.49046321525886, + "grad_norm": 2.5379209518432617, + "learning_rate": 3.2231871328811182e-06, + "loss": 0.0577, + "step": 27338 + }, + { + "epoch": 74.49318801089919, + "grad_norm": 2.7109456062316895, + "learning_rate": 3.2225382117693137e-06, + "loss": 0.0258, + "step": 27339 + }, + { + "epoch": 74.49591280653951, + "grad_norm": 3.679842233657837, + "learning_rate": 3.2218893434401645e-06, + "loss": 0.0432, + "step": 27340 + }, + { + "epoch": 74.49863760217984, + "grad_norm": 4.106472015380859, + "learning_rate": 3.2212405278987226e-06, + "loss": 0.07, + "step": 27341 + }, + { + "epoch": 74.50136239782016, + "grad_norm": 2.846247911453247, + "learning_rate": 3.2205917651500373e-06, + "loss": 0.0514, + "step": 27342 + }, + { + "epoch": 74.50408719346049, + "grad_norm": 3.2952558994293213, + "learning_rate": 3.2199430551991695e-06, + "loss": 0.0911, + "step": 27343 + }, + { + "epoch": 74.50681198910081, + "grad_norm": 3.331434965133667, + "learning_rate": 3.219294398051167e-06, + "loss": 0.1626, + "step": 27344 + }, + { + "epoch": 74.50953678474114, + "grad_norm": 2.7207252979278564, + "learning_rate": 3.2186457937110803e-06, + "loss": 0.0487, + "step": 27345 + }, + { + "epoch": 74.51226158038148, + "grad_norm": 5.137471675872803, + "learning_rate": 3.21799724218396e-06, + "loss": 0.0723, + "step": 27346 + }, + { + "epoch": 74.5149863760218, + "grad_norm": 3.6339457035064697, + "learning_rate": 3.217348743474862e-06, + "loss": 0.1025, + "step": 27347 + }, + { + "epoch": 74.51771117166213, + "grad_norm": 2.727165937423706, + "learning_rate": 3.216700297588833e-06, + "loss": 0.109, + "step": 27348 + }, + { + "epoch": 74.52043596730245, + "grad_norm": 2.7108774185180664, + "learning_rate": 3.2160519045309203e-06, + "loss": 0.1641, + "step": 27349 + }, + { + "epoch": 74.52316076294278, + "grad_norm": 3.9313526153564453, + "learning_rate": 3.2154035643061808e-06, + "loss": 0.2677, + "step": 27350 + }, + { + "epoch": 74.52588555858311, + "grad_norm": 3.4737322330474854, + "learning_rate": 3.214755276919657e-06, + "loss": 0.0931, + "step": 27351 + }, + { + "epoch": 74.52861035422343, + "grad_norm": 3.3170359134674072, + "learning_rate": 3.2141070423764043e-06, + "loss": 0.0443, + "step": 27352 + }, + { + "epoch": 74.53133514986376, + "grad_norm": 2.8323776721954346, + "learning_rate": 3.2134588606814665e-06, + "loss": 0.0626, + "step": 27353 + }, + { + "epoch": 74.53405994550408, + "grad_norm": 2.4754843711853027, + "learning_rate": 3.2128107318398925e-06, + "loss": 0.0316, + "step": 27354 + }, + { + "epoch": 74.53678474114442, + "grad_norm": 4.48448371887207, + "learning_rate": 3.2121626558567277e-06, + "loss": 0.0392, + "step": 27355 + }, + { + "epoch": 74.53950953678473, + "grad_norm": 2.2643465995788574, + "learning_rate": 3.211514632737025e-06, + "loss": 0.0391, + "step": 27356 + }, + { + "epoch": 74.54223433242507, + "grad_norm": 1.680436134338379, + "learning_rate": 3.2108666624858276e-06, + "loss": 0.0253, + "step": 27357 + }, + { + "epoch": 74.5449591280654, + "grad_norm": 2.255134344100952, + "learning_rate": 3.210218745108179e-06, + "loss": 0.0316, + "step": 27358 + }, + { + "epoch": 74.54768392370572, + "grad_norm": 2.986950635910034, + "learning_rate": 3.2095708806091306e-06, + "loss": 0.0462, + "step": 27359 + }, + { + "epoch": 74.55040871934605, + "grad_norm": 2.898524522781372, + "learning_rate": 3.208923068993727e-06, + "loss": 0.0457, + "step": 27360 + }, + { + "epoch": 74.55313351498637, + "grad_norm": 4.367632865905762, + "learning_rate": 3.2082753102670105e-06, + "loss": 0.0928, + "step": 27361 + }, + { + "epoch": 74.5558583106267, + "grad_norm": 2.7649285793304443, + "learning_rate": 3.207627604434025e-06, + "loss": 0.075, + "step": 27362 + }, + { + "epoch": 74.55858310626704, + "grad_norm": 8.433934211730957, + "learning_rate": 3.20697995149982e-06, + "loss": 0.0453, + "step": 27363 + }, + { + "epoch": 74.56130790190736, + "grad_norm": 2.8349850177764893, + "learning_rate": 3.2063323514694365e-06, + "loss": 0.0472, + "step": 27364 + }, + { + "epoch": 74.56403269754769, + "grad_norm": 2.8618035316467285, + "learning_rate": 3.2056848043479184e-06, + "loss": 0.1002, + "step": 27365 + }, + { + "epoch": 74.566757493188, + "grad_norm": 3.4427757263183594, + "learning_rate": 3.2050373101403053e-06, + "loss": 0.1556, + "step": 27366 + }, + { + "epoch": 74.56948228882834, + "grad_norm": 5.154320240020752, + "learning_rate": 3.2043898688516428e-06, + "loss": 0.0816, + "step": 27367 + }, + { + "epoch": 74.57220708446866, + "grad_norm": 2.4975204467773438, + "learning_rate": 3.2037424804869765e-06, + "loss": 0.0421, + "step": 27368 + }, + { + "epoch": 74.57493188010899, + "grad_norm": 2.318462610244751, + "learning_rate": 3.203095145051345e-06, + "loss": 0.0351, + "step": 27369 + }, + { + "epoch": 74.57765667574932, + "grad_norm": 4.079827308654785, + "learning_rate": 3.202447862549789e-06, + "loss": 0.0742, + "step": 27370 + }, + { + "epoch": 74.58038147138964, + "grad_norm": 3.9023802280426025, + "learning_rate": 3.2018006329873475e-06, + "loss": 0.0985, + "step": 27371 + }, + { + "epoch": 74.58310626702998, + "grad_norm": 3.151120185852051, + "learning_rate": 3.201153456369067e-06, + "loss": 0.0608, + "step": 27372 + }, + { + "epoch": 74.5858310626703, + "grad_norm": 7.027402877807617, + "learning_rate": 3.2005063326999853e-06, + "loss": 0.1259, + "step": 27373 + }, + { + "epoch": 74.58855585831063, + "grad_norm": 1.838041067123413, + "learning_rate": 3.199859261985141e-06, + "loss": 0.0264, + "step": 27374 + }, + { + "epoch": 74.59128065395096, + "grad_norm": 1.8210034370422363, + "learning_rate": 3.1992122442295702e-06, + "loss": 0.0347, + "step": 27375 + }, + { + "epoch": 74.59400544959128, + "grad_norm": 3.0615527629852295, + "learning_rate": 3.1985652794383193e-06, + "loss": 0.0963, + "step": 27376 + }, + { + "epoch": 74.59673024523161, + "grad_norm": 4.979789733886719, + "learning_rate": 3.197918367616423e-06, + "loss": 0.0697, + "step": 27377 + }, + { + "epoch": 74.59945504087193, + "grad_norm": 2.7697553634643555, + "learning_rate": 3.197271508768919e-06, + "loss": 0.0279, + "step": 27378 + }, + { + "epoch": 74.60217983651226, + "grad_norm": 2.101897716522217, + "learning_rate": 3.1966247029008433e-06, + "loss": 0.0374, + "step": 27379 + }, + { + "epoch": 74.60490463215258, + "grad_norm": 2.0909366607666016, + "learning_rate": 3.1959779500172382e-06, + "loss": 0.039, + "step": 27380 + }, + { + "epoch": 74.60762942779292, + "grad_norm": 2.7853620052337646, + "learning_rate": 3.195331250123138e-06, + "loss": 0.1248, + "step": 27381 + }, + { + "epoch": 74.61035422343325, + "grad_norm": 2.994997262954712, + "learning_rate": 3.1946846032235754e-06, + "loss": 0.0518, + "step": 27382 + }, + { + "epoch": 74.61307901907357, + "grad_norm": 2.473146677017212, + "learning_rate": 3.1940380093235932e-06, + "loss": 0.0805, + "step": 27383 + }, + { + "epoch": 74.6158038147139, + "grad_norm": 4.3801093101501465, + "learning_rate": 3.1933914684282206e-06, + "loss": 0.0557, + "step": 27384 + }, + { + "epoch": 74.61852861035422, + "grad_norm": 2.473504066467285, + "learning_rate": 3.1927449805425005e-06, + "loss": 0.064, + "step": 27385 + }, + { + "epoch": 74.62125340599455, + "grad_norm": 3.362474203109741, + "learning_rate": 3.1920985456714625e-06, + "loss": 0.0344, + "step": 27386 + }, + { + "epoch": 74.62397820163488, + "grad_norm": 2.301248550415039, + "learning_rate": 3.191452163820139e-06, + "loss": 0.0992, + "step": 27387 + }, + { + "epoch": 74.6267029972752, + "grad_norm": 3.087402820587158, + "learning_rate": 3.19080583499357e-06, + "loss": 0.0502, + "step": 27388 + }, + { + "epoch": 74.62942779291554, + "grad_norm": 2.3167479038238525, + "learning_rate": 3.190159559196786e-06, + "loss": 0.0351, + "step": 27389 + }, + { + "epoch": 74.63215258855585, + "grad_norm": 2.209955930709839, + "learning_rate": 3.1895133364348208e-06, + "loss": 0.0273, + "step": 27390 + }, + { + "epoch": 74.63487738419619, + "grad_norm": 2.4292988777160645, + "learning_rate": 3.1888671667127026e-06, + "loss": 0.0896, + "step": 27391 + }, + { + "epoch": 74.6376021798365, + "grad_norm": 3.015127420425415, + "learning_rate": 3.1882210500354705e-06, + "loss": 0.1085, + "step": 27392 + }, + { + "epoch": 74.64032697547684, + "grad_norm": 2.6956639289855957, + "learning_rate": 3.187574986408155e-06, + "loss": 0.1141, + "step": 27393 + }, + { + "epoch": 74.64305177111717, + "grad_norm": 4.860119342803955, + "learning_rate": 3.1869289758357845e-06, + "loss": 0.1346, + "step": 27394 + }, + { + "epoch": 74.64577656675749, + "grad_norm": 4.685331344604492, + "learning_rate": 3.1862830183233907e-06, + "loss": 0.0365, + "step": 27395 + }, + { + "epoch": 74.64850136239782, + "grad_norm": 2.2085535526275635, + "learning_rate": 3.185637113876007e-06, + "loss": 0.038, + "step": 27396 + }, + { + "epoch": 74.65122615803814, + "grad_norm": 2.1946418285369873, + "learning_rate": 3.184991262498662e-06, + "loss": 0.0293, + "step": 27397 + }, + { + "epoch": 74.65395095367847, + "grad_norm": 4.102278709411621, + "learning_rate": 3.1843454641963866e-06, + "loss": 0.1202, + "step": 27398 + }, + { + "epoch": 74.65667574931881, + "grad_norm": 2.386718273162842, + "learning_rate": 3.183699718974207e-06, + "loss": 0.0411, + "step": 27399 + }, + { + "epoch": 74.65940054495913, + "grad_norm": 3.3451311588287354, + "learning_rate": 3.183054026837157e-06, + "loss": 0.0872, + "step": 27400 + }, + { + "epoch": 74.66212534059946, + "grad_norm": 4.495838165283203, + "learning_rate": 3.182408387790259e-06, + "loss": 0.049, + "step": 27401 + }, + { + "epoch": 74.66485013623978, + "grad_norm": 2.089571475982666, + "learning_rate": 3.181762801838548e-06, + "loss": 0.0252, + "step": 27402 + }, + { + "epoch": 74.66757493188011, + "grad_norm": 2.0634653568267822, + "learning_rate": 3.181117268987046e-06, + "loss": 0.0289, + "step": 27403 + }, + { + "epoch": 74.67029972752043, + "grad_norm": 3.0624613761901855, + "learning_rate": 3.1804717892407877e-06, + "loss": 0.1385, + "step": 27404 + }, + { + "epoch": 74.67302452316076, + "grad_norm": 3.4951775074005127, + "learning_rate": 3.1798263626047944e-06, + "loss": 0.1402, + "step": 27405 + }, + { + "epoch": 74.6757493188011, + "grad_norm": 5.737732410430908, + "learning_rate": 3.1791809890840942e-06, + "loss": 0.0913, + "step": 27406 + }, + { + "epoch": 74.67847411444141, + "grad_norm": 2.3680155277252197, + "learning_rate": 3.1785356686837097e-06, + "loss": 0.1333, + "step": 27407 + }, + { + "epoch": 74.68119891008175, + "grad_norm": 3.2178423404693604, + "learning_rate": 3.177890401408673e-06, + "loss": 0.0432, + "step": 27408 + }, + { + "epoch": 74.68392370572207, + "grad_norm": 3.593608856201172, + "learning_rate": 3.1772451872640066e-06, + "loss": 0.0455, + "step": 27409 + }, + { + "epoch": 74.6866485013624, + "grad_norm": 2.4788355827331543, + "learning_rate": 3.1766000262547347e-06, + "loss": 0.135, + "step": 27410 + }, + { + "epoch": 74.68937329700273, + "grad_norm": 3.574361562728882, + "learning_rate": 3.1759549183858797e-06, + "loss": 0.1343, + "step": 27411 + }, + { + "epoch": 74.69209809264305, + "grad_norm": 2.709545373916626, + "learning_rate": 3.17530986366247e-06, + "loss": 0.0407, + "step": 27412 + }, + { + "epoch": 74.69482288828338, + "grad_norm": 5.369472980499268, + "learning_rate": 3.174664862089528e-06, + "loss": 0.0397, + "step": 27413 + }, + { + "epoch": 74.6975476839237, + "grad_norm": 4.344054222106934, + "learning_rate": 3.174019913672077e-06, + "loss": 0.1633, + "step": 27414 + }, + { + "epoch": 74.70027247956403, + "grad_norm": 2.938528537750244, + "learning_rate": 3.1733750184151357e-06, + "loss": 0.0618, + "step": 27415 + }, + { + "epoch": 74.70299727520435, + "grad_norm": 2.4566922187805176, + "learning_rate": 3.172730176323733e-06, + "loss": 0.0391, + "step": 27416 + }, + { + "epoch": 74.70572207084469, + "grad_norm": 3.157243251800537, + "learning_rate": 3.172085387402888e-06, + "loss": 0.0467, + "step": 27417 + }, + { + "epoch": 74.70844686648502, + "grad_norm": 6.23567008972168, + "learning_rate": 3.171440651657619e-06, + "loss": 0.0554, + "step": 27418 + }, + { + "epoch": 74.71117166212534, + "grad_norm": 2.5095317363739014, + "learning_rate": 3.1707959690929545e-06, + "loss": 0.0399, + "step": 27419 + }, + { + "epoch": 74.71389645776567, + "grad_norm": 2.690309524536133, + "learning_rate": 3.1701513397139072e-06, + "loss": 0.0354, + "step": 27420 + }, + { + "epoch": 74.71662125340599, + "grad_norm": 2.5978381633758545, + "learning_rate": 3.169506763525505e-06, + "loss": 0.0376, + "step": 27421 + }, + { + "epoch": 74.71934604904632, + "grad_norm": 3.6311593055725098, + "learning_rate": 3.168862240532764e-06, + "loss": 0.0861, + "step": 27422 + }, + { + "epoch": 74.72207084468666, + "grad_norm": 3.008673906326294, + "learning_rate": 3.1682177707407e-06, + "loss": 0.1461, + "step": 27423 + }, + { + "epoch": 74.72479564032697, + "grad_norm": 3.299814462661743, + "learning_rate": 3.167573354154341e-06, + "loss": 0.0843, + "step": 27424 + }, + { + "epoch": 74.7275204359673, + "grad_norm": 3.0510849952697754, + "learning_rate": 3.1669289907786994e-06, + "loss": 0.0392, + "step": 27425 + }, + { + "epoch": 74.73024523160763, + "grad_norm": 3.5574769973754883, + "learning_rate": 3.1662846806187952e-06, + "loss": 0.1855, + "step": 27426 + }, + { + "epoch": 74.73297002724796, + "grad_norm": 2.4356772899627686, + "learning_rate": 3.1656404236796436e-06, + "loss": 0.0417, + "step": 27427 + }, + { + "epoch": 74.73569482288828, + "grad_norm": 3.1003222465515137, + "learning_rate": 3.1649962199662665e-06, + "loss": 0.1738, + "step": 27428 + }, + { + "epoch": 74.73841961852861, + "grad_norm": 3.6968743801116943, + "learning_rate": 3.1643520694836793e-06, + "loss": 0.1928, + "step": 27429 + }, + { + "epoch": 74.74114441416894, + "grad_norm": 2.2422289848327637, + "learning_rate": 3.163707972236899e-06, + "loss": 0.0593, + "step": 27430 + }, + { + "epoch": 74.74386920980926, + "grad_norm": 2.408618450164795, + "learning_rate": 3.163063928230937e-06, + "loss": 0.104, + "step": 27431 + }, + { + "epoch": 74.7465940054496, + "grad_norm": 3.220341444015503, + "learning_rate": 3.1624199374708163e-06, + "loss": 0.1713, + "step": 27432 + }, + { + "epoch": 74.74931880108991, + "grad_norm": 3.2058322429656982, + "learning_rate": 3.1617759999615495e-06, + "loss": 0.041, + "step": 27433 + }, + { + "epoch": 74.75204359673025, + "grad_norm": 2.603969097137451, + "learning_rate": 3.161132115708151e-06, + "loss": 0.0929, + "step": 27434 + }, + { + "epoch": 74.75476839237058, + "grad_norm": 3.143913507461548, + "learning_rate": 3.1604882847156314e-06, + "loss": 0.1677, + "step": 27435 + }, + { + "epoch": 74.7574931880109, + "grad_norm": 4.815069198608398, + "learning_rate": 3.1598445069890093e-06, + "loss": 0.0504, + "step": 27436 + }, + { + "epoch": 74.76021798365123, + "grad_norm": 2.8605568408966064, + "learning_rate": 3.1592007825333015e-06, + "loss": 0.0369, + "step": 27437 + }, + { + "epoch": 74.76294277929155, + "grad_norm": 2.512197732925415, + "learning_rate": 3.1585571113535186e-06, + "loss": 0.1017, + "step": 27438 + }, + { + "epoch": 74.76566757493188, + "grad_norm": 3.2640180587768555, + "learning_rate": 3.1579134934546716e-06, + "loss": 0.1161, + "step": 27439 + }, + { + "epoch": 74.7683923705722, + "grad_norm": 2.781555652618408, + "learning_rate": 3.1572699288417708e-06, + "loss": 0.1141, + "step": 27440 + }, + { + "epoch": 74.77111716621253, + "grad_norm": 3.1150054931640625, + "learning_rate": 3.156626417519836e-06, + "loss": 0.0651, + "step": 27441 + }, + { + "epoch": 74.77384196185287, + "grad_norm": 3.060635805130005, + "learning_rate": 3.1559829594938728e-06, + "loss": 0.2373, + "step": 27442 + }, + { + "epoch": 74.77656675749319, + "grad_norm": 5.093193531036377, + "learning_rate": 3.1553395547688914e-06, + "loss": 0.1321, + "step": 27443 + }, + { + "epoch": 74.77929155313352, + "grad_norm": 3.535568952560425, + "learning_rate": 3.1546962033499084e-06, + "loss": 0.0812, + "step": 27444 + }, + { + "epoch": 74.78201634877384, + "grad_norm": 2.840769052505493, + "learning_rate": 3.1540529052419323e-06, + "loss": 0.0421, + "step": 27445 + }, + { + "epoch": 74.78474114441417, + "grad_norm": 3.9191110134124756, + "learning_rate": 3.153409660449971e-06, + "loss": 0.2843, + "step": 27446 + }, + { + "epoch": 74.7874659400545, + "grad_norm": 3.4338719844818115, + "learning_rate": 3.1527664689790316e-06, + "loss": 0.0596, + "step": 27447 + }, + { + "epoch": 74.79019073569482, + "grad_norm": 2.8352816104888916, + "learning_rate": 3.1521233308341292e-06, + "loss": 0.041, + "step": 27448 + }, + { + "epoch": 74.79291553133515, + "grad_norm": 3.671628952026367, + "learning_rate": 3.1514802460202707e-06, + "loss": 0.0803, + "step": 27449 + }, + { + "epoch": 74.79564032697547, + "grad_norm": 6.532846450805664, + "learning_rate": 3.1508372145424637e-06, + "loss": 0.0462, + "step": 27450 + }, + { + "epoch": 74.7983651226158, + "grad_norm": 2.7748310565948486, + "learning_rate": 3.1501942364057116e-06, + "loss": 0.082, + "step": 27451 + }, + { + "epoch": 74.80108991825612, + "grad_norm": 3.0477004051208496, + "learning_rate": 3.1495513116150276e-06, + "loss": 0.0637, + "step": 27452 + }, + { + "epoch": 74.80381471389646, + "grad_norm": 3.5865554809570312, + "learning_rate": 3.14890844017542e-06, + "loss": 0.0871, + "step": 27453 + }, + { + "epoch": 74.80653950953679, + "grad_norm": 3.582667112350464, + "learning_rate": 3.1482656220918938e-06, + "loss": 0.0389, + "step": 27454 + }, + { + "epoch": 74.80926430517711, + "grad_norm": 2.5279176235198975, + "learning_rate": 3.1476228573694533e-06, + "loss": 0.0623, + "step": 27455 + }, + { + "epoch": 74.81198910081744, + "grad_norm": 3.823660373687744, + "learning_rate": 3.1469801460131035e-06, + "loss": 0.1617, + "step": 27456 + }, + { + "epoch": 74.81471389645776, + "grad_norm": 2.192878007888794, + "learning_rate": 3.146337488027854e-06, + "loss": 0.0431, + "step": 27457 + }, + { + "epoch": 74.8174386920981, + "grad_norm": 2.2675254344940186, + "learning_rate": 3.1456948834187083e-06, + "loss": 0.0314, + "step": 27458 + }, + { + "epoch": 74.82016348773843, + "grad_norm": 6.254118919372559, + "learning_rate": 3.14505233219067e-06, + "loss": 0.0462, + "step": 27459 + }, + { + "epoch": 74.82288828337875, + "grad_norm": 3.756660223007202, + "learning_rate": 3.1444098343487394e-06, + "loss": 0.1437, + "step": 27460 + }, + { + "epoch": 74.82561307901908, + "grad_norm": 3.801999092102051, + "learning_rate": 3.1437673898979282e-06, + "loss": 0.0514, + "step": 27461 + }, + { + "epoch": 74.8283378746594, + "grad_norm": 3.2751238346099854, + "learning_rate": 3.143124998843237e-06, + "loss": 0.0385, + "step": 27462 + }, + { + "epoch": 74.83106267029973, + "grad_norm": 3.086588144302368, + "learning_rate": 3.1424826611896664e-06, + "loss": 0.2446, + "step": 27463 + }, + { + "epoch": 74.83378746594005, + "grad_norm": 3.3873214721679688, + "learning_rate": 3.1418403769422166e-06, + "loss": 0.0282, + "step": 27464 + }, + { + "epoch": 74.83651226158038, + "grad_norm": 3.4134676456451416, + "learning_rate": 3.1411981461058973e-06, + "loss": 0.1302, + "step": 27465 + }, + { + "epoch": 74.83923705722071, + "grad_norm": 2.2357282638549805, + "learning_rate": 3.1405559686857058e-06, + "loss": 0.0338, + "step": 27466 + }, + { + "epoch": 74.84196185286103, + "grad_norm": 3.2296764850616455, + "learning_rate": 3.1399138446866405e-06, + "loss": 0.0518, + "step": 27467 + }, + { + "epoch": 74.84468664850137, + "grad_norm": 3.764432191848755, + "learning_rate": 3.139271774113708e-06, + "loss": 0.0755, + "step": 27468 + }, + { + "epoch": 74.84741144414168, + "grad_norm": 1.9802919626235962, + "learning_rate": 3.138629756971907e-06, + "loss": 0.0351, + "step": 27469 + }, + { + "epoch": 74.85013623978202, + "grad_norm": 2.98422908782959, + "learning_rate": 3.137987793266233e-06, + "loss": 0.0886, + "step": 27470 + }, + { + "epoch": 74.85286103542235, + "grad_norm": 3.518028736114502, + "learning_rate": 3.1373458830016925e-06, + "loss": 0.0994, + "step": 27471 + }, + { + "epoch": 74.85558583106267, + "grad_norm": 9.135181427001953, + "learning_rate": 3.136704026183278e-06, + "loss": 0.0541, + "step": 27472 + }, + { + "epoch": 74.858310626703, + "grad_norm": 5.177651405334473, + "learning_rate": 3.136062222815994e-06, + "loss": 0.0259, + "step": 27473 + }, + { + "epoch": 74.86103542234332, + "grad_norm": 3.1518969535827637, + "learning_rate": 3.135420472904839e-06, + "loss": 0.2288, + "step": 27474 + }, + { + "epoch": 74.86376021798365, + "grad_norm": 4.267491340637207, + "learning_rate": 3.1347787764548064e-06, + "loss": 0.0771, + "step": 27475 + }, + { + "epoch": 74.86648501362397, + "grad_norm": 2.849985122680664, + "learning_rate": 3.1341371334708924e-06, + "loss": 0.0856, + "step": 27476 + }, + { + "epoch": 74.8692098092643, + "grad_norm": 2.889461040496826, + "learning_rate": 3.1334955439581016e-06, + "loss": 0.0764, + "step": 27477 + }, + { + "epoch": 74.87193460490464, + "grad_norm": 3.2429332733154297, + "learning_rate": 3.1328540079214264e-06, + "loss": 0.0383, + "step": 27478 + }, + { + "epoch": 74.87465940054496, + "grad_norm": 4.318110942840576, + "learning_rate": 3.132212525365863e-06, + "loss": 0.1022, + "step": 27479 + }, + { + "epoch": 74.87738419618529, + "grad_norm": 3.088435173034668, + "learning_rate": 3.131571096296404e-06, + "loss": 0.1602, + "step": 27480 + }, + { + "epoch": 74.88010899182561, + "grad_norm": 3.6335043907165527, + "learning_rate": 3.130929720718051e-06, + "loss": 0.0867, + "step": 27481 + }, + { + "epoch": 74.88283378746594, + "grad_norm": 2.422663688659668, + "learning_rate": 3.130288398635797e-06, + "loss": 0.0382, + "step": 27482 + }, + { + "epoch": 74.88555858310627, + "grad_norm": 2.0690314769744873, + "learning_rate": 3.129647130054636e-06, + "loss": 0.0944, + "step": 27483 + }, + { + "epoch": 74.88828337874659, + "grad_norm": 2.035308599472046, + "learning_rate": 3.129005914979558e-06, + "loss": 0.0386, + "step": 27484 + }, + { + "epoch": 74.89100817438693, + "grad_norm": 4.204923629760742, + "learning_rate": 3.128364753415565e-06, + "loss": 0.1086, + "step": 27485 + }, + { + "epoch": 74.89373297002724, + "grad_norm": 2.8162553310394287, + "learning_rate": 3.127723645367645e-06, + "loss": 0.1143, + "step": 27486 + }, + { + "epoch": 74.89645776566758, + "grad_norm": 5.131668567657471, + "learning_rate": 3.1270825908407897e-06, + "loss": 0.0968, + "step": 27487 + }, + { + "epoch": 74.8991825613079, + "grad_norm": 2.573620319366455, + "learning_rate": 3.1264415898399935e-06, + "loss": 0.0359, + "step": 27488 + }, + { + "epoch": 74.90190735694823, + "grad_norm": 2.7319297790527344, + "learning_rate": 3.1258006423702536e-06, + "loss": 0.0433, + "step": 27489 + }, + { + "epoch": 74.90463215258856, + "grad_norm": 5.500871181488037, + "learning_rate": 3.125159748436556e-06, + "loss": 0.1917, + "step": 27490 + }, + { + "epoch": 74.90735694822888, + "grad_norm": 2.8717222213745117, + "learning_rate": 3.124518908043892e-06, + "loss": 0.0293, + "step": 27491 + }, + { + "epoch": 74.91008174386921, + "grad_norm": 2.114720582962036, + "learning_rate": 3.123878121197251e-06, + "loss": 0.0366, + "step": 27492 + }, + { + "epoch": 74.91280653950953, + "grad_norm": 2.324105978012085, + "learning_rate": 3.12323738790163e-06, + "loss": 0.0734, + "step": 27493 + }, + { + "epoch": 74.91553133514986, + "grad_norm": 5.976681232452393, + "learning_rate": 3.1225967081620136e-06, + "loss": 0.0399, + "step": 27494 + }, + { + "epoch": 74.9182561307902, + "grad_norm": 2.522785186767578, + "learning_rate": 3.121956081983394e-06, + "loss": 0.0262, + "step": 27495 + }, + { + "epoch": 74.92098092643052, + "grad_norm": 2.162013292312622, + "learning_rate": 3.1213155093707547e-06, + "loss": 0.0357, + "step": 27496 + }, + { + "epoch": 74.92370572207085, + "grad_norm": 2.9040699005126953, + "learning_rate": 3.1206749903290924e-06, + "loss": 0.2002, + "step": 27497 + }, + { + "epoch": 74.92643051771117, + "grad_norm": 2.6344516277313232, + "learning_rate": 3.120034524863392e-06, + "loss": 0.0361, + "step": 27498 + }, + { + "epoch": 74.9291553133515, + "grad_norm": 4.292081832885742, + "learning_rate": 3.119394112978641e-06, + "loss": 0.1328, + "step": 27499 + }, + { + "epoch": 74.93188010899182, + "grad_norm": 2.953303575515747, + "learning_rate": 3.1187537546798243e-06, + "loss": 0.0359, + "step": 27500 + }, + { + "epoch": 74.93460490463215, + "grad_norm": 2.4193108081817627, + "learning_rate": 3.1181134499719346e-06, + "loss": 0.0311, + "step": 27501 + }, + { + "epoch": 74.93732970027249, + "grad_norm": 3.2863755226135254, + "learning_rate": 3.117473198859957e-06, + "loss": 0.0691, + "step": 27502 + }, + { + "epoch": 74.9400544959128, + "grad_norm": 3.368201971054077, + "learning_rate": 3.1168330013488756e-06, + "loss": 0.1171, + "step": 27503 + }, + { + "epoch": 74.94277929155314, + "grad_norm": 2.8241043090820312, + "learning_rate": 3.116192857443674e-06, + "loss": 0.1456, + "step": 27504 + }, + { + "epoch": 74.94550408719346, + "grad_norm": 4.0922040939331055, + "learning_rate": 3.1155527671493414e-06, + "loss": 0.0755, + "step": 27505 + }, + { + "epoch": 74.94822888283379, + "grad_norm": 3.2033066749572754, + "learning_rate": 3.114912730470865e-06, + "loss": 0.0304, + "step": 27506 + }, + { + "epoch": 74.95095367847412, + "grad_norm": 4.60787296295166, + "learning_rate": 3.1142727474132275e-06, + "loss": 0.0421, + "step": 27507 + }, + { + "epoch": 74.95367847411444, + "grad_norm": 2.8809895515441895, + "learning_rate": 3.113632817981408e-06, + "loss": 0.0502, + "step": 27508 + }, + { + "epoch": 74.95640326975477, + "grad_norm": 3.216729164123535, + "learning_rate": 3.1129929421803982e-06, + "loss": 0.0675, + "step": 27509 + }, + { + "epoch": 74.95912806539509, + "grad_norm": 2.9025216102600098, + "learning_rate": 3.112353120015178e-06, + "loss": 0.0555, + "step": 27510 + }, + { + "epoch": 74.96185286103542, + "grad_norm": 3.4627859592437744, + "learning_rate": 3.1117133514907294e-06, + "loss": 0.0776, + "step": 27511 + }, + { + "epoch": 74.96457765667574, + "grad_norm": 2.72674298286438, + "learning_rate": 3.111073636612032e-06, + "loss": 0.0797, + "step": 27512 + }, + { + "epoch": 74.96730245231608, + "grad_norm": 2.8152270317077637, + "learning_rate": 3.1104339753840752e-06, + "loss": 0.0518, + "step": 27513 + }, + { + "epoch": 74.97002724795641, + "grad_norm": 3.045332670211792, + "learning_rate": 3.109794367811837e-06, + "loss": 0.1923, + "step": 27514 + }, + { + "epoch": 74.97275204359673, + "grad_norm": 4.088866233825684, + "learning_rate": 3.109154813900298e-06, + "loss": 0.0596, + "step": 27515 + }, + { + "epoch": 74.97547683923706, + "grad_norm": 3.0625717639923096, + "learning_rate": 3.108515313654438e-06, + "loss": 0.1124, + "step": 27516 + }, + { + "epoch": 74.97820163487738, + "grad_norm": 2.966005325317383, + "learning_rate": 3.1078758670792397e-06, + "loss": 0.1448, + "step": 27517 + }, + { + "epoch": 74.98092643051771, + "grad_norm": 2.499295234680176, + "learning_rate": 3.1072364741796833e-06, + "loss": 0.0385, + "step": 27518 + }, + { + "epoch": 74.98365122615803, + "grad_norm": 2.7400944232940674, + "learning_rate": 3.1065971349607484e-06, + "loss": 0.0467, + "step": 27519 + }, + { + "epoch": 74.98637602179836, + "grad_norm": 3.302360773086548, + "learning_rate": 3.105957849427409e-06, + "loss": 0.0998, + "step": 27520 + }, + { + "epoch": 74.9891008174387, + "grad_norm": 2.534291982650757, + "learning_rate": 3.1053186175846474e-06, + "loss": 0.0341, + "step": 27521 + }, + { + "epoch": 74.99182561307902, + "grad_norm": 3.326748847961426, + "learning_rate": 3.104679439437447e-06, + "loss": 0.1436, + "step": 27522 + }, + { + "epoch": 74.99455040871935, + "grad_norm": 2.6939988136291504, + "learning_rate": 3.1040403149907805e-06, + "loss": 0.1331, + "step": 27523 + }, + { + "epoch": 74.99727520435967, + "grad_norm": 3.131129264831543, + "learning_rate": 3.1034012442496253e-06, + "loss": 0.0787, + "step": 27524 + }, + { + "epoch": 75.0, + "grad_norm": 2.8523824214935303, + "learning_rate": 3.1027622272189572e-06, + "loss": 0.1013, + "step": 27525 + }, + { + "epoch": 75.00272479564033, + "grad_norm": 3.311145782470703, + "learning_rate": 3.102123263903758e-06, + "loss": 0.0655, + "step": 27526 + }, + { + "epoch": 75.00544959128065, + "grad_norm": 2.3888118267059326, + "learning_rate": 3.1014843543090002e-06, + "loss": 0.0348, + "step": 27527 + }, + { + "epoch": 75.00817438692098, + "grad_norm": 3.0262041091918945, + "learning_rate": 3.1008454984396606e-06, + "loss": 0.0293, + "step": 27528 + }, + { + "epoch": 75.0108991825613, + "grad_norm": 2.7091064453125, + "learning_rate": 3.1002066963007116e-06, + "loss": 0.05, + "step": 27529 + }, + { + "epoch": 75.01362397820164, + "grad_norm": 2.9500162601470947, + "learning_rate": 3.099567947897133e-06, + "loss": 0.0561, + "step": 27530 + }, + { + "epoch": 75.01634877384195, + "grad_norm": 2.945417642593384, + "learning_rate": 3.0989292532338978e-06, + "loss": 0.0326, + "step": 27531 + }, + { + "epoch": 75.01907356948229, + "grad_norm": 2.4412946701049805, + "learning_rate": 3.098290612315976e-06, + "loss": 0.051, + "step": 27532 + }, + { + "epoch": 75.02179836512262, + "grad_norm": 3.124022960662842, + "learning_rate": 3.0976520251483476e-06, + "loss": 0.1109, + "step": 27533 + }, + { + "epoch": 75.02452316076294, + "grad_norm": 2.738534927368164, + "learning_rate": 3.097013491735984e-06, + "loss": 0.0518, + "step": 27534 + }, + { + "epoch": 75.02724795640327, + "grad_norm": 5.542792797088623, + "learning_rate": 3.0963750120838564e-06, + "loss": 0.0744, + "step": 27535 + }, + { + "epoch": 75.02997275204359, + "grad_norm": 4.510857105255127, + "learning_rate": 3.0957365861969345e-06, + "loss": 0.2035, + "step": 27536 + }, + { + "epoch": 75.03269754768392, + "grad_norm": 4.250611782073975, + "learning_rate": 3.095098214080198e-06, + "loss": 0.0578, + "step": 27537 + }, + { + "epoch": 75.03542234332426, + "grad_norm": 1.8988556861877441, + "learning_rate": 3.0944598957386107e-06, + "loss": 0.1159, + "step": 27538 + }, + { + "epoch": 75.03814713896458, + "grad_norm": 3.1393895149230957, + "learning_rate": 3.0938216311771507e-06, + "loss": 0.0352, + "step": 27539 + }, + { + "epoch": 75.04087193460491, + "grad_norm": 1.4722155332565308, + "learning_rate": 3.0931834204007862e-06, + "loss": 0.0173, + "step": 27540 + }, + { + "epoch": 75.04359673024523, + "grad_norm": 2.404116630554199, + "learning_rate": 3.0925452634144825e-06, + "loss": 0.0752, + "step": 27541 + }, + { + "epoch": 75.04632152588556, + "grad_norm": 2.586320161819458, + "learning_rate": 3.0919071602232175e-06, + "loss": 0.0381, + "step": 27542 + }, + { + "epoch": 75.04904632152588, + "grad_norm": 9.841873168945312, + "learning_rate": 3.0912691108319582e-06, + "loss": 0.0425, + "step": 27543 + }, + { + "epoch": 75.05177111716621, + "grad_norm": 2.585761308670044, + "learning_rate": 3.0906311152456713e-06, + "loss": 0.0844, + "step": 27544 + }, + { + "epoch": 75.05449591280654, + "grad_norm": 2.6232521533966064, + "learning_rate": 3.0899931734693246e-06, + "loss": 0.1565, + "step": 27545 + }, + { + "epoch": 75.05722070844686, + "grad_norm": 2.5462450981140137, + "learning_rate": 3.089355285507891e-06, + "loss": 0.0682, + "step": 27546 + }, + { + "epoch": 75.0599455040872, + "grad_norm": 3.3379335403442383, + "learning_rate": 3.0887174513663376e-06, + "loss": 0.2347, + "step": 27547 + }, + { + "epoch": 75.06267029972751, + "grad_norm": 2.2917251586914062, + "learning_rate": 3.0880796710496287e-06, + "loss": 0.0336, + "step": 27548 + }, + { + "epoch": 75.06539509536785, + "grad_norm": 3.615720748901367, + "learning_rate": 3.08744194456273e-06, + "loss": 0.2591, + "step": 27549 + }, + { + "epoch": 75.06811989100818, + "grad_norm": 3.1300547122955322, + "learning_rate": 3.0868042719106152e-06, + "loss": 0.0327, + "step": 27550 + }, + { + "epoch": 75.0708446866485, + "grad_norm": 2.6372008323669434, + "learning_rate": 3.086166653098246e-06, + "loss": 0.1014, + "step": 27551 + }, + { + "epoch": 75.07356948228883, + "grad_norm": 5.758232593536377, + "learning_rate": 3.0855290881305845e-06, + "loss": 0.1821, + "step": 27552 + }, + { + "epoch": 75.07629427792915, + "grad_norm": 4.68319034576416, + "learning_rate": 3.084891577012603e-06, + "loss": 0.1471, + "step": 27553 + }, + { + "epoch": 75.07901907356948, + "grad_norm": 7.116035461425781, + "learning_rate": 3.0842541197492637e-06, + "loss": 0.1569, + "step": 27554 + }, + { + "epoch": 75.0817438692098, + "grad_norm": 3.22837495803833, + "learning_rate": 3.08361671634553e-06, + "loss": 0.0503, + "step": 27555 + }, + { + "epoch": 75.08446866485014, + "grad_norm": 3.4298107624053955, + "learning_rate": 3.0829793668063646e-06, + "loss": 0.059, + "step": 27556 + }, + { + "epoch": 75.08719346049047, + "grad_norm": 2.6836814880371094, + "learning_rate": 3.0823420711367322e-06, + "loss": 0.0687, + "step": 27557 + }, + { + "epoch": 75.08991825613079, + "grad_norm": 2.5157830715179443, + "learning_rate": 3.0817048293416017e-06, + "loss": 0.1594, + "step": 27558 + }, + { + "epoch": 75.09264305177112, + "grad_norm": 2.5752265453338623, + "learning_rate": 3.08106764142593e-06, + "loss": 0.0341, + "step": 27559 + }, + { + "epoch": 75.09536784741144, + "grad_norm": 3.477228879928589, + "learning_rate": 3.0804305073946818e-06, + "loss": 0.1307, + "step": 27560 + }, + { + "epoch": 75.09809264305177, + "grad_norm": 2.9757039546966553, + "learning_rate": 3.079793427252814e-06, + "loss": 0.1973, + "step": 27561 + }, + { + "epoch": 75.1008174386921, + "grad_norm": 2.4333109855651855, + "learning_rate": 3.0791564010052967e-06, + "loss": 0.0641, + "step": 27562 + }, + { + "epoch": 75.10354223433242, + "grad_norm": 6.196342468261719, + "learning_rate": 3.0785194286570854e-06, + "loss": 0.095, + "step": 27563 + }, + { + "epoch": 75.10626702997276, + "grad_norm": 2.131510019302368, + "learning_rate": 3.077882510213143e-06, + "loss": 0.0516, + "step": 27564 + }, + { + "epoch": 75.10899182561307, + "grad_norm": 3.1831939220428467, + "learning_rate": 3.077245645678425e-06, + "loss": 0.0906, + "step": 27565 + }, + { + "epoch": 75.11171662125341, + "grad_norm": 2.7010202407836914, + "learning_rate": 3.0766088350578984e-06, + "loss": 0.173, + "step": 27566 + }, + { + "epoch": 75.11444141689373, + "grad_norm": 4.274178504943848, + "learning_rate": 3.0759720783565196e-06, + "loss": 0.1548, + "step": 27567 + }, + { + "epoch": 75.11716621253406, + "grad_norm": 3.5782458782196045, + "learning_rate": 3.075335375579247e-06, + "loss": 0.0499, + "step": 27568 + }, + { + "epoch": 75.11989100817439, + "grad_norm": 2.65104079246521, + "learning_rate": 3.074698726731036e-06, + "loss": 0.2272, + "step": 27569 + }, + { + "epoch": 75.12261580381471, + "grad_norm": 3.3322086334228516, + "learning_rate": 3.074062131816853e-06, + "loss": 0.0595, + "step": 27570 + }, + { + "epoch": 75.12534059945504, + "grad_norm": 3.812431812286377, + "learning_rate": 3.07342559084165e-06, + "loss": 0.1319, + "step": 27571 + }, + { + "epoch": 75.12806539509536, + "grad_norm": 2.5226943492889404, + "learning_rate": 3.0727891038103865e-06, + "loss": 0.0484, + "step": 27572 + }, + { + "epoch": 75.1307901907357, + "grad_norm": 3.453836441040039, + "learning_rate": 3.0721526707280113e-06, + "loss": 0.0654, + "step": 27573 + }, + { + "epoch": 75.13351498637603, + "grad_norm": 2.5528485774993896, + "learning_rate": 3.0715162915994944e-06, + "loss": 0.0306, + "step": 27574 + }, + { + "epoch": 75.13623978201635, + "grad_norm": 2.835279703140259, + "learning_rate": 3.0708799664297863e-06, + "loss": 0.1264, + "step": 27575 + }, + { + "epoch": 75.13896457765668, + "grad_norm": 3.1006345748901367, + "learning_rate": 3.0702436952238412e-06, + "loss": 0.0411, + "step": 27576 + }, + { + "epoch": 75.141689373297, + "grad_norm": 4.25516414642334, + "learning_rate": 3.0696074779866127e-06, + "loss": 0.1298, + "step": 27577 + }, + { + "epoch": 75.14441416893733, + "grad_norm": 3.170030355453491, + "learning_rate": 3.0689713147230617e-06, + "loss": 0.0373, + "step": 27578 + }, + { + "epoch": 75.14713896457765, + "grad_norm": 2.772905111312866, + "learning_rate": 3.068335205438139e-06, + "loss": 0.0337, + "step": 27579 + }, + { + "epoch": 75.14986376021798, + "grad_norm": 2.9926319122314453, + "learning_rate": 3.067699150136797e-06, + "loss": 0.037, + "step": 27580 + }, + { + "epoch": 75.15258855585832, + "grad_norm": 5.851269245147705, + "learning_rate": 3.067063148823989e-06, + "loss": 0.0896, + "step": 27581 + }, + { + "epoch": 75.15531335149863, + "grad_norm": 3.1910886764526367, + "learning_rate": 3.0664272015046735e-06, + "loss": 0.0748, + "step": 27582 + }, + { + "epoch": 75.15803814713897, + "grad_norm": 2.5612995624542236, + "learning_rate": 3.0657913081837987e-06, + "loss": 0.0662, + "step": 27583 + }, + { + "epoch": 75.16076294277929, + "grad_norm": 2.8816475868225098, + "learning_rate": 3.0651554688663188e-06, + "loss": 0.0505, + "step": 27584 + }, + { + "epoch": 75.16348773841962, + "grad_norm": 3.678269624710083, + "learning_rate": 3.064519683557182e-06, + "loss": 0.0569, + "step": 27585 + }, + { + "epoch": 75.16621253405995, + "grad_norm": 3.733116626739502, + "learning_rate": 3.063883952261345e-06, + "loss": 0.1498, + "step": 27586 + }, + { + "epoch": 75.16893732970027, + "grad_norm": 2.7683281898498535, + "learning_rate": 3.0632482749837578e-06, + "loss": 0.1222, + "step": 27587 + }, + { + "epoch": 75.1716621253406, + "grad_norm": 3.418689012527466, + "learning_rate": 3.0626126517293686e-06, + "loss": 0.1271, + "step": 27588 + }, + { + "epoch": 75.17438692098092, + "grad_norm": 2.2630598545074463, + "learning_rate": 3.061977082503126e-06, + "loss": 0.0248, + "step": 27589 + }, + { + "epoch": 75.17711171662125, + "grad_norm": 3.1087136268615723, + "learning_rate": 3.0613415673099822e-06, + "loss": 0.0364, + "step": 27590 + }, + { + "epoch": 75.17983651226157, + "grad_norm": 2.079453945159912, + "learning_rate": 3.0607061061548902e-06, + "loss": 0.0803, + "step": 27591 + }, + { + "epoch": 75.1825613079019, + "grad_norm": 2.0259814262390137, + "learning_rate": 3.0600706990427966e-06, + "loss": 0.0543, + "step": 27592 + }, + { + "epoch": 75.18528610354224, + "grad_norm": 3.862144947052002, + "learning_rate": 3.0594353459786484e-06, + "loss": 0.1582, + "step": 27593 + }, + { + "epoch": 75.18801089918256, + "grad_norm": 3.890875816345215, + "learning_rate": 3.058800046967392e-06, + "loss": 0.0651, + "step": 27594 + }, + { + "epoch": 75.19073569482289, + "grad_norm": 3.464887857437134, + "learning_rate": 3.058164802013979e-06, + "loss": 0.0947, + "step": 27595 + }, + { + "epoch": 75.19346049046321, + "grad_norm": 4.630736827850342, + "learning_rate": 3.0575296111233567e-06, + "loss": 0.1276, + "step": 27596 + }, + { + "epoch": 75.19618528610354, + "grad_norm": 5.1742844581604, + "learning_rate": 3.056894474300466e-06, + "loss": 0.0518, + "step": 27597 + }, + { + "epoch": 75.19891008174388, + "grad_norm": 3.2487473487854004, + "learning_rate": 3.0562593915502614e-06, + "loss": 0.068, + "step": 27598 + }, + { + "epoch": 75.2016348773842, + "grad_norm": 2.2730767726898193, + "learning_rate": 3.055624362877685e-06, + "loss": 0.037, + "step": 27599 + }, + { + "epoch": 75.20435967302453, + "grad_norm": 2.942718982696533, + "learning_rate": 3.0549893882876825e-06, + "loss": 0.0358, + "step": 27600 + }, + { + "epoch": 75.20708446866485, + "grad_norm": 3.3944926261901855, + "learning_rate": 3.0543544677851953e-06, + "loss": 0.0327, + "step": 27601 + }, + { + "epoch": 75.20980926430518, + "grad_norm": 2.9558629989624023, + "learning_rate": 3.0537196013751767e-06, + "loss": 0.1034, + "step": 27602 + }, + { + "epoch": 75.2125340599455, + "grad_norm": 2.820882558822632, + "learning_rate": 3.0530847890625646e-06, + "loss": 0.0258, + "step": 27603 + }, + { + "epoch": 75.21525885558583, + "grad_norm": 2.4985244274139404, + "learning_rate": 3.0524500308523064e-06, + "loss": 0.0382, + "step": 27604 + }, + { + "epoch": 75.21798365122616, + "grad_norm": 2.783466339111328, + "learning_rate": 3.0518153267493388e-06, + "loss": 0.1242, + "step": 27605 + }, + { + "epoch": 75.22070844686648, + "grad_norm": 2.2642557621002197, + "learning_rate": 3.051180676758614e-06, + "loss": 0.0503, + "step": 27606 + }, + { + "epoch": 75.22343324250681, + "grad_norm": 3.5770883560180664, + "learning_rate": 3.0505460808850674e-06, + "loss": 0.046, + "step": 27607 + }, + { + "epoch": 75.22615803814713, + "grad_norm": 2.408412456512451, + "learning_rate": 3.0499115391336464e-06, + "loss": 0.0304, + "step": 27608 + }, + { + "epoch": 75.22888283378747, + "grad_norm": 3.0149154663085938, + "learning_rate": 3.0492770515092917e-06, + "loss": 0.083, + "step": 27609 + }, + { + "epoch": 75.2316076294278, + "grad_norm": 1.9410196542739868, + "learning_rate": 3.0486426180169404e-06, + "loss": 0.0279, + "step": 27610 + }, + { + "epoch": 75.23433242506812, + "grad_norm": 2.15051007270813, + "learning_rate": 3.0480082386615394e-06, + "loss": 0.0249, + "step": 27611 + }, + { + "epoch": 75.23705722070845, + "grad_norm": 2.653397560119629, + "learning_rate": 3.047373913448026e-06, + "loss": 0.0563, + "step": 27612 + }, + { + "epoch": 75.23978201634877, + "grad_norm": 2.4434974193573, + "learning_rate": 3.0467396423813423e-06, + "loss": 0.0385, + "step": 27613 + }, + { + "epoch": 75.2425068119891, + "grad_norm": 4.21658992767334, + "learning_rate": 3.0461054254664225e-06, + "loss": 0.0706, + "step": 27614 + }, + { + "epoch": 75.24523160762942, + "grad_norm": 2.064725875854492, + "learning_rate": 3.0454712627082128e-06, + "loss": 0.0735, + "step": 27615 + }, + { + "epoch": 75.24795640326975, + "grad_norm": 3.525247573852539, + "learning_rate": 3.044837154111648e-06, + "loss": 0.0584, + "step": 27616 + }, + { + "epoch": 75.25068119891009, + "grad_norm": 2.2720861434936523, + "learning_rate": 3.044203099681666e-06, + "loss": 0.0968, + "step": 27617 + }, + { + "epoch": 75.2534059945504, + "grad_norm": 3.067094326019287, + "learning_rate": 3.043569099423209e-06, + "loss": 0.0601, + "step": 27618 + }, + { + "epoch": 75.25613079019074, + "grad_norm": 5.3943772315979, + "learning_rate": 3.042935153341212e-06, + "loss": 0.0832, + "step": 27619 + }, + { + "epoch": 75.25885558583106, + "grad_norm": 4.334679126739502, + "learning_rate": 3.042301261440612e-06, + "loss": 0.1378, + "step": 27620 + }, + { + "epoch": 75.26158038147139, + "grad_norm": 2.4944615364074707, + "learning_rate": 3.041667423726343e-06, + "loss": 0.031, + "step": 27621 + }, + { + "epoch": 75.26430517711172, + "grad_norm": 5.525595188140869, + "learning_rate": 3.041033640203348e-06, + "loss": 0.0374, + "step": 27622 + }, + { + "epoch": 75.26702997275204, + "grad_norm": 3.597632646560669, + "learning_rate": 3.040399910876558e-06, + "loss": 0.0563, + "step": 27623 + }, + { + "epoch": 75.26975476839237, + "grad_norm": 2.9683830738067627, + "learning_rate": 3.039766235750907e-06, + "loss": 0.1118, + "step": 27624 + }, + { + "epoch": 75.2724795640327, + "grad_norm": 3.4934754371643066, + "learning_rate": 3.039132614831335e-06, + "loss": 0.0343, + "step": 27625 + }, + { + "epoch": 75.27520435967303, + "grad_norm": 2.8926949501037598, + "learning_rate": 3.0384990481227716e-06, + "loss": 0.0251, + "step": 27626 + }, + { + "epoch": 75.27792915531334, + "grad_norm": 2.601649045944214, + "learning_rate": 3.0378655356301554e-06, + "loss": 0.1234, + "step": 27627 + }, + { + "epoch": 75.28065395095368, + "grad_norm": 3.4047579765319824, + "learning_rate": 3.0372320773584196e-06, + "loss": 0.1368, + "step": 27628 + }, + { + "epoch": 75.28337874659401, + "grad_norm": 3.0398342609405518, + "learning_rate": 3.0365986733124963e-06, + "loss": 0.0831, + "step": 27629 + }, + { + "epoch": 75.28610354223433, + "grad_norm": 2.6498756408691406, + "learning_rate": 3.0359653234973154e-06, + "loss": 0.0872, + "step": 27630 + }, + { + "epoch": 75.28882833787466, + "grad_norm": 2.3392951488494873, + "learning_rate": 3.0353320279178146e-06, + "loss": 0.026, + "step": 27631 + }, + { + "epoch": 75.29155313351498, + "grad_norm": 3.178831100463867, + "learning_rate": 3.0346987865789245e-06, + "loss": 0.0377, + "step": 27632 + }, + { + "epoch": 75.29427792915531, + "grad_norm": 2.388498544692993, + "learning_rate": 3.034065599485576e-06, + "loss": 0.0193, + "step": 27633 + }, + { + "epoch": 75.29700272479565, + "grad_norm": 2.380526304244995, + "learning_rate": 3.033432466642697e-06, + "loss": 0.0348, + "step": 27634 + }, + { + "epoch": 75.29972752043597, + "grad_norm": 3.2772305011749268, + "learning_rate": 3.032799388055225e-06, + "loss": 0.0394, + "step": 27635 + }, + { + "epoch": 75.3024523160763, + "grad_norm": 2.7993104457855225, + "learning_rate": 3.0321663637280875e-06, + "loss": 0.1427, + "step": 27636 + }, + { + "epoch": 75.30517711171662, + "grad_norm": 1.7309693098068237, + "learning_rate": 3.031533393666214e-06, + "loss": 0.0159, + "step": 27637 + }, + { + "epoch": 75.30790190735695, + "grad_norm": 2.8570635318756104, + "learning_rate": 3.030900477874531e-06, + "loss": 0.0799, + "step": 27638 + }, + { + "epoch": 75.31062670299727, + "grad_norm": 4.14675235748291, + "learning_rate": 3.0302676163579738e-06, + "loss": 0.0627, + "step": 27639 + }, + { + "epoch": 75.3133514986376, + "grad_norm": 2.1780340671539307, + "learning_rate": 3.0296348091214676e-06, + "loss": 0.0623, + "step": 27640 + }, + { + "epoch": 75.31607629427793, + "grad_norm": 2.5636348724365234, + "learning_rate": 3.0290020561699385e-06, + "loss": 0.054, + "step": 27641 + }, + { + "epoch": 75.31880108991825, + "grad_norm": 2.5974178314208984, + "learning_rate": 3.0283693575083174e-06, + "loss": 0.0677, + "step": 27642 + }, + { + "epoch": 75.32152588555859, + "grad_norm": 1.8714269399642944, + "learning_rate": 3.0277367131415336e-06, + "loss": 0.0333, + "step": 27643 + }, + { + "epoch": 75.3242506811989, + "grad_norm": 3.2616562843322754, + "learning_rate": 3.0271041230745122e-06, + "loss": 0.0676, + "step": 27644 + }, + { + "epoch": 75.32697547683924, + "grad_norm": 2.9135024547576904, + "learning_rate": 3.0264715873121796e-06, + "loss": 0.1273, + "step": 27645 + }, + { + "epoch": 75.32970027247957, + "grad_norm": 2.4170942306518555, + "learning_rate": 3.0258391058594595e-06, + "loss": 0.031, + "step": 27646 + }, + { + "epoch": 75.33242506811989, + "grad_norm": 2.555218458175659, + "learning_rate": 3.0252066787212817e-06, + "loss": 0.0245, + "step": 27647 + }, + { + "epoch": 75.33514986376022, + "grad_norm": 3.3662526607513428, + "learning_rate": 3.0245743059025713e-06, + "loss": 0.0355, + "step": 27648 + }, + { + "epoch": 75.33787465940054, + "grad_norm": 3.288583517074585, + "learning_rate": 3.023941987408251e-06, + "loss": 0.0867, + "step": 27649 + }, + { + "epoch": 75.34059945504087, + "grad_norm": 2.092853307723999, + "learning_rate": 3.0233097232432417e-06, + "loss": 0.0334, + "step": 27650 + }, + { + "epoch": 75.34332425068119, + "grad_norm": 2.833671808242798, + "learning_rate": 3.022677513412476e-06, + "loss": 0.0348, + "step": 27651 + }, + { + "epoch": 75.34604904632153, + "grad_norm": 2.574719190597534, + "learning_rate": 3.022045357920873e-06, + "loss": 0.0339, + "step": 27652 + }, + { + "epoch": 75.34877384196186, + "grad_norm": 2.987471342086792, + "learning_rate": 3.0214132567733565e-06, + "loss": 0.0458, + "step": 27653 + }, + { + "epoch": 75.35149863760218, + "grad_norm": 2.910118341445923, + "learning_rate": 3.020781209974846e-06, + "loss": 0.0943, + "step": 27654 + }, + { + "epoch": 75.35422343324251, + "grad_norm": 2.1420702934265137, + "learning_rate": 3.0201492175302695e-06, + "loss": 0.0319, + "step": 27655 + }, + { + "epoch": 75.35694822888283, + "grad_norm": 2.2705018520355225, + "learning_rate": 3.019517279444546e-06, + "loss": 0.038, + "step": 27656 + }, + { + "epoch": 75.35967302452316, + "grad_norm": 3.6899421215057373, + "learning_rate": 3.0188853957225984e-06, + "loss": 0.1614, + "step": 27657 + }, + { + "epoch": 75.3623978201635, + "grad_norm": 3.608517646789551, + "learning_rate": 3.0182535663693422e-06, + "loss": 0.0713, + "step": 27658 + }, + { + "epoch": 75.36512261580381, + "grad_norm": 4.432520389556885, + "learning_rate": 3.0176217913897034e-06, + "loss": 0.0383, + "step": 27659 + }, + { + "epoch": 75.36784741144415, + "grad_norm": 3.134857416152954, + "learning_rate": 3.0169900707886036e-06, + "loss": 0.0288, + "step": 27660 + }, + { + "epoch": 75.37057220708446, + "grad_norm": 2.952052116394043, + "learning_rate": 3.0163584045709615e-06, + "loss": 0.0445, + "step": 27661 + }, + { + "epoch": 75.3732970027248, + "grad_norm": 3.3065953254699707, + "learning_rate": 3.0157267927416912e-06, + "loss": 0.0955, + "step": 27662 + }, + { + "epoch": 75.37602179836512, + "grad_norm": 17.400815963745117, + "learning_rate": 3.0150952353057195e-06, + "loss": 0.038, + "step": 27663 + }, + { + "epoch": 75.37874659400545, + "grad_norm": 2.445208787918091, + "learning_rate": 3.0144637322679617e-06, + "loss": 0.0956, + "step": 27664 + }, + { + "epoch": 75.38147138964578, + "grad_norm": 3.191053867340088, + "learning_rate": 3.0138322836333343e-06, + "loss": 0.09, + "step": 27665 + }, + { + "epoch": 75.3841961852861, + "grad_norm": 3.7337753772735596, + "learning_rate": 3.0132008894067545e-06, + "loss": 0.0848, + "step": 27666 + }, + { + "epoch": 75.38692098092643, + "grad_norm": 14.248208045959473, + "learning_rate": 3.012569549593143e-06, + "loss": 0.062, + "step": 27667 + }, + { + "epoch": 75.38964577656675, + "grad_norm": 3.1568360328674316, + "learning_rate": 3.011938264197416e-06, + "loss": 0.052, + "step": 27668 + }, + { + "epoch": 75.39237057220708, + "grad_norm": 4.756346702575684, + "learning_rate": 3.0113070332244886e-06, + "loss": 0.0316, + "step": 27669 + }, + { + "epoch": 75.39509536784742, + "grad_norm": 3.052743673324585, + "learning_rate": 3.0106758566792737e-06, + "loss": 0.2044, + "step": 27670 + }, + { + "epoch": 75.39782016348774, + "grad_norm": 3.078798770904541, + "learning_rate": 3.0100447345666937e-06, + "loss": 0.0694, + "step": 27671 + }, + { + "epoch": 75.40054495912807, + "grad_norm": 2.136767864227295, + "learning_rate": 3.0094136668916607e-06, + "loss": 0.067, + "step": 27672 + }, + { + "epoch": 75.40326975476839, + "grad_norm": 3.910614490509033, + "learning_rate": 3.008782653659089e-06, + "loss": 0.0602, + "step": 27673 + }, + { + "epoch": 75.40599455040872, + "grad_norm": 2.9418959617614746, + "learning_rate": 3.0081516948738887e-06, + "loss": 0.0776, + "step": 27674 + }, + { + "epoch": 75.40871934604904, + "grad_norm": 3.3807084560394287, + "learning_rate": 3.007520790540982e-06, + "loss": 0.0402, + "step": 27675 + }, + { + "epoch": 75.41144414168937, + "grad_norm": 3.7821102142333984, + "learning_rate": 3.0068899406652752e-06, + "loss": 0.0484, + "step": 27676 + }, + { + "epoch": 75.4141689373297, + "grad_norm": 2.784954309463501, + "learning_rate": 3.0062591452516876e-06, + "loss": 0.0745, + "step": 27677 + }, + { + "epoch": 75.41689373297002, + "grad_norm": 2.7617006301879883, + "learning_rate": 3.0056284043051286e-06, + "loss": 0.0839, + "step": 27678 + }, + { + "epoch": 75.41961852861036, + "grad_norm": 6.001311779022217, + "learning_rate": 3.004997717830508e-06, + "loss": 0.0457, + "step": 27679 + }, + { + "epoch": 75.42234332425068, + "grad_norm": 3.061800241470337, + "learning_rate": 3.004367085832742e-06, + "loss": 0.0797, + "step": 27680 + }, + { + "epoch": 75.42506811989101, + "grad_norm": 2.0810399055480957, + "learning_rate": 3.0037365083167404e-06, + "loss": 0.0618, + "step": 27681 + }, + { + "epoch": 75.42779291553134, + "grad_norm": 2.682482957839966, + "learning_rate": 3.003105985287411e-06, + "loss": 0.0948, + "step": 27682 + }, + { + "epoch": 75.43051771117166, + "grad_norm": 3.283461570739746, + "learning_rate": 3.00247551674967e-06, + "loss": 0.0921, + "step": 27683 + }, + { + "epoch": 75.433242506812, + "grad_norm": 3.275836229324341, + "learning_rate": 3.0018451027084238e-06, + "loss": 0.0941, + "step": 27684 + }, + { + "epoch": 75.43596730245231, + "grad_norm": 2.952338218688965, + "learning_rate": 3.0012147431685832e-06, + "loss": 0.0492, + "step": 27685 + }, + { + "epoch": 75.43869209809264, + "grad_norm": 2.4903459548950195, + "learning_rate": 3.0005844381350545e-06, + "loss": 0.0975, + "step": 27686 + }, + { + "epoch": 75.44141689373296, + "grad_norm": 2.38456130027771, + "learning_rate": 2.9999541876127513e-06, + "loss": 0.0465, + "step": 27687 + }, + { + "epoch": 75.4441416893733, + "grad_norm": 2.847486972808838, + "learning_rate": 2.99932399160658e-06, + "loss": 0.2217, + "step": 27688 + }, + { + "epoch": 75.44686648501363, + "grad_norm": 2.646130323410034, + "learning_rate": 2.998693850121447e-06, + "loss": 0.1184, + "step": 27689 + }, + { + "epoch": 75.44959128065395, + "grad_norm": 2.516571044921875, + "learning_rate": 2.998063763162259e-06, + "loss": 0.0384, + "step": 27690 + }, + { + "epoch": 75.45231607629428, + "grad_norm": 2.517336368560791, + "learning_rate": 2.9974337307339274e-06, + "loss": 0.0426, + "step": 27691 + }, + { + "epoch": 75.4550408719346, + "grad_norm": 3.6232411861419678, + "learning_rate": 2.9968037528413573e-06, + "loss": 0.0533, + "step": 27692 + }, + { + "epoch": 75.45776566757493, + "grad_norm": 3.2437920570373535, + "learning_rate": 2.9961738294894504e-06, + "loss": 0.0405, + "step": 27693 + }, + { + "epoch": 75.46049046321527, + "grad_norm": 3.5633132457733154, + "learning_rate": 2.9955439606831195e-06, + "loss": 0.1422, + "step": 27694 + }, + { + "epoch": 75.46321525885558, + "grad_norm": 3.4561767578125, + "learning_rate": 2.9949141464272635e-06, + "loss": 0.0347, + "step": 27695 + }, + { + "epoch": 75.46594005449592, + "grad_norm": 3.184873580932617, + "learning_rate": 2.9942843867267947e-06, + "loss": 0.0481, + "step": 27696 + }, + { + "epoch": 75.46866485013624, + "grad_norm": 2.4604759216308594, + "learning_rate": 2.993654681586613e-06, + "loss": 0.0634, + "step": 27697 + }, + { + "epoch": 75.47138964577657, + "grad_norm": 2.241732120513916, + "learning_rate": 2.993025031011623e-06, + "loss": 0.0384, + "step": 27698 + }, + { + "epoch": 75.47411444141689, + "grad_norm": 2.451686382293701, + "learning_rate": 2.9923954350067263e-06, + "loss": 0.149, + "step": 27699 + }, + { + "epoch": 75.47683923705722, + "grad_norm": 2.762377977371216, + "learning_rate": 2.99176589357683e-06, + "loss": 0.1074, + "step": 27700 + }, + { + "epoch": 75.47956403269755, + "grad_norm": 3.2475740909576416, + "learning_rate": 2.9911364067268366e-06, + "loss": 0.027, + "step": 27701 + }, + { + "epoch": 75.48228882833787, + "grad_norm": 4.86683988571167, + "learning_rate": 2.9905069744616466e-06, + "loss": 0.0376, + "step": 27702 + }, + { + "epoch": 75.4850136239782, + "grad_norm": 1.99662446975708, + "learning_rate": 2.9898775967861605e-06, + "loss": 0.0282, + "step": 27703 + }, + { + "epoch": 75.48773841961852, + "grad_norm": 3.2977609634399414, + "learning_rate": 2.9892482737052843e-06, + "loss": 0.0354, + "step": 27704 + }, + { + "epoch": 75.49046321525886, + "grad_norm": 1.8643726110458374, + "learning_rate": 2.9886190052239173e-06, + "loss": 0.029, + "step": 27705 + }, + { + "epoch": 75.49318801089919, + "grad_norm": 2.6245758533477783, + "learning_rate": 2.987989791346957e-06, + "loss": 0.1093, + "step": 27706 + }, + { + "epoch": 75.49591280653951, + "grad_norm": 1.6000523567199707, + "learning_rate": 2.987360632079308e-06, + "loss": 0.0178, + "step": 27707 + }, + { + "epoch": 75.49863760217984, + "grad_norm": 2.616818428039551, + "learning_rate": 2.98673152742587e-06, + "loss": 0.0347, + "step": 27708 + }, + { + "epoch": 75.50136239782016, + "grad_norm": 2.732534408569336, + "learning_rate": 2.9861024773915415e-06, + "loss": 0.0381, + "step": 27709 + }, + { + "epoch": 75.50408719346049, + "grad_norm": 2.3392136096954346, + "learning_rate": 2.985473481981218e-06, + "loss": 0.0285, + "step": 27710 + }, + { + "epoch": 75.50681198910081, + "grad_norm": 2.6736907958984375, + "learning_rate": 2.9848445411998006e-06, + "loss": 0.0343, + "step": 27711 + }, + { + "epoch": 75.50953678474114, + "grad_norm": 4.17382287979126, + "learning_rate": 2.9842156550521915e-06, + "loss": 0.2088, + "step": 27712 + }, + { + "epoch": 75.51226158038148, + "grad_norm": 3.360193967819214, + "learning_rate": 2.983586823543285e-06, + "loss": 0.0765, + "step": 27713 + }, + { + "epoch": 75.5149863760218, + "grad_norm": 5.581449031829834, + "learning_rate": 2.9829580466779784e-06, + "loss": 0.1318, + "step": 27714 + }, + { + "epoch": 75.51771117166213, + "grad_norm": 2.783514976501465, + "learning_rate": 2.982329324461166e-06, + "loss": 0.0382, + "step": 27715 + }, + { + "epoch": 75.52043596730245, + "grad_norm": 5.091421604156494, + "learning_rate": 2.981700656897749e-06, + "loss": 0.1542, + "step": 27716 + }, + { + "epoch": 75.52316076294278, + "grad_norm": 2.9237117767333984, + "learning_rate": 2.981072043992623e-06, + "loss": 0.1121, + "step": 27717 + }, + { + "epoch": 75.52588555858311, + "grad_norm": 2.1351101398468018, + "learning_rate": 2.9804434857506816e-06, + "loss": 0.0408, + "step": 27718 + }, + { + "epoch": 75.52861035422343, + "grad_norm": 2.7612287998199463, + "learning_rate": 2.979814982176816e-06, + "loss": 0.0926, + "step": 27719 + }, + { + "epoch": 75.53133514986376, + "grad_norm": 3.3539750576019287, + "learning_rate": 2.9791865332759294e-06, + "loss": 0.1746, + "step": 27720 + }, + { + "epoch": 75.53405994550408, + "grad_norm": 3.053982734680176, + "learning_rate": 2.978558139052913e-06, + "loss": 0.0992, + "step": 27721 + }, + { + "epoch": 75.53678474114442, + "grad_norm": 2.8916139602661133, + "learning_rate": 2.9779297995126587e-06, + "loss": 0.1357, + "step": 27722 + }, + { + "epoch": 75.53950953678473, + "grad_norm": 3.015062093734741, + "learning_rate": 2.977301514660058e-06, + "loss": 0.049, + "step": 27723 + }, + { + "epoch": 75.54223433242507, + "grad_norm": 2.5487701892852783, + "learning_rate": 2.97667328450001e-06, + "loss": 0.0358, + "step": 27724 + }, + { + "epoch": 75.5449591280654, + "grad_norm": 2.8236160278320312, + "learning_rate": 2.9760451090374054e-06, + "loss": 0.1336, + "step": 27725 + }, + { + "epoch": 75.54768392370572, + "grad_norm": 2.3216240406036377, + "learning_rate": 2.9754169882771324e-06, + "loss": 0.0232, + "step": 27726 + }, + { + "epoch": 75.55040871934605, + "grad_norm": 2.9198029041290283, + "learning_rate": 2.9747889222240878e-06, + "loss": 0.1321, + "step": 27727 + }, + { + "epoch": 75.55313351498637, + "grad_norm": 2.4257829189300537, + "learning_rate": 2.974160910883158e-06, + "loss": 0.0457, + "step": 27728 + }, + { + "epoch": 75.5558583106267, + "grad_norm": 2.857954740524292, + "learning_rate": 2.9735329542592407e-06, + "loss": 0.0479, + "step": 27729 + }, + { + "epoch": 75.55858310626704, + "grad_norm": 2.7027206420898438, + "learning_rate": 2.9729050523572222e-06, + "loss": 0.0682, + "step": 27730 + }, + { + "epoch": 75.56130790190736, + "grad_norm": 3.273747205734253, + "learning_rate": 2.9722772051819902e-06, + "loss": 0.0833, + "step": 27731 + }, + { + "epoch": 75.56403269754769, + "grad_norm": 3.459521770477295, + "learning_rate": 2.9716494127384397e-06, + "loss": 0.2134, + "step": 27732 + }, + { + "epoch": 75.566757493188, + "grad_norm": 2.729978084564209, + "learning_rate": 2.971021675031458e-06, + "loss": 0.038, + "step": 27733 + }, + { + "epoch": 75.56948228882834, + "grad_norm": 3.5037550926208496, + "learning_rate": 2.9703939920659332e-06, + "loss": 0.0571, + "step": 27734 + }, + { + "epoch": 75.57220708446866, + "grad_norm": 2.6768691539764404, + "learning_rate": 2.96976636384675e-06, + "loss": 0.1088, + "step": 27735 + }, + { + "epoch": 75.57493188010899, + "grad_norm": 2.6828341484069824, + "learning_rate": 2.9691387903788037e-06, + "loss": 0.0492, + "step": 27736 + }, + { + "epoch": 75.57765667574932, + "grad_norm": 3.8994791507720947, + "learning_rate": 2.9685112716669783e-06, + "loss": 0.0544, + "step": 27737 + }, + { + "epoch": 75.58038147138964, + "grad_norm": 2.9792799949645996, + "learning_rate": 2.967883807716161e-06, + "loss": 0.1784, + "step": 27738 + }, + { + "epoch": 75.58310626702998, + "grad_norm": 3.3979854583740234, + "learning_rate": 2.967256398531234e-06, + "loss": 0.1164, + "step": 27739 + }, + { + "epoch": 75.5858310626703, + "grad_norm": 3.6894583702087402, + "learning_rate": 2.966629044117092e-06, + "loss": 0.137, + "step": 27740 + }, + { + "epoch": 75.58855585831063, + "grad_norm": 3.2741520404815674, + "learning_rate": 2.966001744478616e-06, + "loss": 0.0805, + "step": 27741 + }, + { + "epoch": 75.59128065395096, + "grad_norm": 2.296541690826416, + "learning_rate": 2.9653744996206926e-06, + "loss": 0.0402, + "step": 27742 + }, + { + "epoch": 75.59400544959128, + "grad_norm": 4.692990779876709, + "learning_rate": 2.964747309548203e-06, + "loss": 0.0397, + "step": 27743 + }, + { + "epoch": 75.59673024523161, + "grad_norm": 3.9447741508483887, + "learning_rate": 2.9641201742660376e-06, + "loss": 0.1126, + "step": 27744 + }, + { + "epoch": 75.59945504087193, + "grad_norm": 2.402883529663086, + "learning_rate": 2.963493093779075e-06, + "loss": 0.105, + "step": 27745 + }, + { + "epoch": 75.60217983651226, + "grad_norm": 8.863261222839355, + "learning_rate": 2.962866068092205e-06, + "loss": 0.057, + "step": 27746 + }, + { + "epoch": 75.60490463215258, + "grad_norm": 2.721849203109741, + "learning_rate": 2.9622390972103043e-06, + "loss": 0.0706, + "step": 27747 + }, + { + "epoch": 75.60762942779292, + "grad_norm": 2.285156726837158, + "learning_rate": 2.9616121811382626e-06, + "loss": 0.0397, + "step": 27748 + }, + { + "epoch": 75.61035422343325, + "grad_norm": 2.971112012863159, + "learning_rate": 2.9609853198809578e-06, + "loss": 0.0477, + "step": 27749 + }, + { + "epoch": 75.61307901907357, + "grad_norm": 3.614335536956787, + "learning_rate": 2.9603585134432733e-06, + "loss": 0.1705, + "step": 27750 + }, + { + "epoch": 75.6158038147139, + "grad_norm": 3.1232776641845703, + "learning_rate": 2.959731761830087e-06, + "loss": 0.0841, + "step": 27751 + }, + { + "epoch": 75.61852861035422, + "grad_norm": 1.7605881690979004, + "learning_rate": 2.959105065046286e-06, + "loss": 0.0292, + "step": 27752 + }, + { + "epoch": 75.62125340599455, + "grad_norm": 2.2683191299438477, + "learning_rate": 2.958478423096748e-06, + "loss": 0.0318, + "step": 27753 + }, + { + "epoch": 75.62397820163488, + "grad_norm": 2.2947306632995605, + "learning_rate": 2.9578518359863537e-06, + "loss": 0.0449, + "step": 27754 + }, + { + "epoch": 75.6267029972752, + "grad_norm": 2.4742581844329834, + "learning_rate": 2.9572253037199795e-06, + "loss": 0.0302, + "step": 27755 + }, + { + "epoch": 75.62942779291554, + "grad_norm": 2.044041633605957, + "learning_rate": 2.9565988263025114e-06, + "loss": 0.1055, + "step": 27756 + }, + { + "epoch": 75.63215258855585, + "grad_norm": 2.1931862831115723, + "learning_rate": 2.955972403738825e-06, + "loss": 0.0292, + "step": 27757 + }, + { + "epoch": 75.63487738419619, + "grad_norm": 2.2893283367156982, + "learning_rate": 2.9553460360337983e-06, + "loss": 0.0285, + "step": 27758 + }, + { + "epoch": 75.6376021798365, + "grad_norm": 3.866868734359741, + "learning_rate": 2.9547197231923065e-06, + "loss": 0.0428, + "step": 27759 + }, + { + "epoch": 75.64032697547684, + "grad_norm": 2.8351898193359375, + "learning_rate": 2.9540934652192343e-06, + "loss": 0.03, + "step": 27760 + }, + { + "epoch": 75.64305177111717, + "grad_norm": 3.13128399848938, + "learning_rate": 2.953467262119456e-06, + "loss": 0.1227, + "step": 27761 + }, + { + "epoch": 75.64577656675749, + "grad_norm": 2.306823492050171, + "learning_rate": 2.952841113897844e-06, + "loss": 0.0343, + "step": 27762 + }, + { + "epoch": 75.64850136239782, + "grad_norm": 3.6572632789611816, + "learning_rate": 2.9522150205592825e-06, + "loss": 0.0845, + "step": 27763 + }, + { + "epoch": 75.65122615803814, + "grad_norm": 3.499213457107544, + "learning_rate": 2.9515889821086395e-06, + "loss": 0.0363, + "step": 27764 + }, + { + "epoch": 75.65395095367847, + "grad_norm": 2.911710262298584, + "learning_rate": 2.950962998550798e-06, + "loss": 0.0303, + "step": 27765 + }, + { + "epoch": 75.65667574931881, + "grad_norm": 2.25347638130188, + "learning_rate": 2.9503370698906298e-06, + "loss": 0.026, + "step": 27766 + }, + { + "epoch": 75.65940054495913, + "grad_norm": 2.3659725189208984, + "learning_rate": 2.9497111961330103e-06, + "loss": 0.0445, + "step": 27767 + }, + { + "epoch": 75.66212534059946, + "grad_norm": 3.2874715328216553, + "learning_rate": 2.94908537728281e-06, + "loss": 0.0517, + "step": 27768 + }, + { + "epoch": 75.66485013623978, + "grad_norm": 4.073539733886719, + "learning_rate": 2.9484596133449086e-06, + "loss": 0.2055, + "step": 27769 + }, + { + "epoch": 75.66757493188011, + "grad_norm": 2.573126792907715, + "learning_rate": 2.9478339043241753e-06, + "loss": 0.1221, + "step": 27770 + }, + { + "epoch": 75.67029972752043, + "grad_norm": 4.630699157714844, + "learning_rate": 2.947208250225484e-06, + "loss": 0.2313, + "step": 27771 + }, + { + "epoch": 75.67302452316076, + "grad_norm": 2.453627109527588, + "learning_rate": 2.946582651053709e-06, + "loss": 0.0513, + "step": 27772 + }, + { + "epoch": 75.6757493188011, + "grad_norm": 5.062366008758545, + "learning_rate": 2.945957106813723e-06, + "loss": 0.1424, + "step": 27773 + }, + { + "epoch": 75.67847411444141, + "grad_norm": 2.7563202381134033, + "learning_rate": 2.945331617510394e-06, + "loss": 0.1469, + "step": 27774 + }, + { + "epoch": 75.68119891008175, + "grad_norm": 8.14344596862793, + "learning_rate": 2.9447061831485933e-06, + "loss": 0.0764, + "step": 27775 + }, + { + "epoch": 75.68392370572207, + "grad_norm": 2.9626362323760986, + "learning_rate": 2.944080803733197e-06, + "loss": 0.0455, + "step": 27776 + }, + { + "epoch": 75.6866485013624, + "grad_norm": 2.519667148590088, + "learning_rate": 2.943455479269073e-06, + "loss": 0.1069, + "step": 27777 + }, + { + "epoch": 75.68937329700273, + "grad_norm": 2.71968674659729, + "learning_rate": 2.9428302097610894e-06, + "loss": 0.0428, + "step": 27778 + }, + { + "epoch": 75.69209809264305, + "grad_norm": 2.561763286590576, + "learning_rate": 2.9422049952141142e-06, + "loss": 0.1014, + "step": 27779 + }, + { + "epoch": 75.69482288828338, + "grad_norm": 2.0596539974212646, + "learning_rate": 2.941579835633019e-06, + "loss": 0.032, + "step": 27780 + }, + { + "epoch": 75.6975476839237, + "grad_norm": 1.8910735845565796, + "learning_rate": 2.9409547310226773e-06, + "loss": 0.1788, + "step": 27781 + }, + { + "epoch": 75.70027247956403, + "grad_norm": 5.750277519226074, + "learning_rate": 2.9403296813879513e-06, + "loss": 0.0515, + "step": 27782 + }, + { + "epoch": 75.70299727520435, + "grad_norm": 1.9856802225112915, + "learning_rate": 2.939704686733711e-06, + "loss": 0.0274, + "step": 27783 + }, + { + "epoch": 75.70572207084469, + "grad_norm": 2.824207067489624, + "learning_rate": 2.939079747064821e-06, + "loss": 0.0716, + "step": 27784 + }, + { + "epoch": 75.70844686648502, + "grad_norm": 3.398721933364868, + "learning_rate": 2.9384548623861533e-06, + "loss": 0.1962, + "step": 27785 + }, + { + "epoch": 75.71117166212534, + "grad_norm": 3.622636318206787, + "learning_rate": 2.937830032702572e-06, + "loss": 0.0571, + "step": 27786 + }, + { + "epoch": 75.71389645776567, + "grad_norm": 4.732388019561768, + "learning_rate": 2.9372052580189424e-06, + "loss": 0.0569, + "step": 27787 + }, + { + "epoch": 75.71662125340599, + "grad_norm": 2.658836841583252, + "learning_rate": 2.936580538340129e-06, + "loss": 0.0514, + "step": 27788 + }, + { + "epoch": 75.71934604904632, + "grad_norm": 2.121434211730957, + "learning_rate": 2.9359558736710016e-06, + "loss": 0.0357, + "step": 27789 + }, + { + "epoch": 75.72207084468666, + "grad_norm": 3.747109889984131, + "learning_rate": 2.9353312640164223e-06, + "loss": 0.1473, + "step": 27790 + }, + { + "epoch": 75.72479564032697, + "grad_norm": 3.1915030479431152, + "learning_rate": 2.934706709381253e-06, + "loss": 0.2152, + "step": 27791 + }, + { + "epoch": 75.7275204359673, + "grad_norm": 2.266594886779785, + "learning_rate": 2.9340822097703626e-06, + "loss": 0.039, + "step": 27792 + }, + { + "epoch": 75.73024523160763, + "grad_norm": 4.012491226196289, + "learning_rate": 2.933457765188613e-06, + "loss": 0.0697, + "step": 27793 + }, + { + "epoch": 75.73297002724796, + "grad_norm": 3.757294178009033, + "learning_rate": 2.932833375640868e-06, + "loss": 0.1701, + "step": 27794 + }, + { + "epoch": 75.73569482288828, + "grad_norm": 4.026195526123047, + "learning_rate": 2.932209041131985e-06, + "loss": 0.0751, + "step": 27795 + }, + { + "epoch": 75.73841961852861, + "grad_norm": 3.2037413120269775, + "learning_rate": 2.9315847616668315e-06, + "loss": 0.0926, + "step": 27796 + }, + { + "epoch": 75.74114441416894, + "grad_norm": 2.414330005645752, + "learning_rate": 2.93096053725027e-06, + "loss": 0.0307, + "step": 27797 + }, + { + "epoch": 75.74386920980926, + "grad_norm": 2.8596391677856445, + "learning_rate": 2.930336367887161e-06, + "loss": 0.0864, + "step": 27798 + }, + { + "epoch": 75.7465940054496, + "grad_norm": 3.3420329093933105, + "learning_rate": 2.929712253582365e-06, + "loss": 0.0613, + "step": 27799 + }, + { + "epoch": 75.74931880108991, + "grad_norm": 2.1052417755126953, + "learning_rate": 2.929088194340739e-06, + "loss": 0.0838, + "step": 27800 + }, + { + "epoch": 75.75204359673025, + "grad_norm": 3.157144784927368, + "learning_rate": 2.928464190167151e-06, + "loss": 0.1619, + "step": 27801 + }, + { + "epoch": 75.75476839237058, + "grad_norm": 2.7051918506622314, + "learning_rate": 2.9278402410664543e-06, + "loss": 0.0595, + "step": 27802 + }, + { + "epoch": 75.7574931880109, + "grad_norm": 2.1615326404571533, + "learning_rate": 2.927216347043511e-06, + "loss": 0.0281, + "step": 27803 + }, + { + "epoch": 75.76021798365123, + "grad_norm": 4.368989944458008, + "learning_rate": 2.9265925081031767e-06, + "loss": 0.0499, + "step": 27804 + }, + { + "epoch": 75.76294277929155, + "grad_norm": 2.4406278133392334, + "learning_rate": 2.9259687242503144e-06, + "loss": 0.0515, + "step": 27805 + }, + { + "epoch": 75.76566757493188, + "grad_norm": 1.9840441942214966, + "learning_rate": 2.9253449954897807e-06, + "loss": 0.0221, + "step": 27806 + }, + { + "epoch": 75.7683923705722, + "grad_norm": 5.387057781219482, + "learning_rate": 2.9247213218264326e-06, + "loss": 0.1185, + "step": 27807 + }, + { + "epoch": 75.77111716621253, + "grad_norm": 3.386645555496216, + "learning_rate": 2.924097703265123e-06, + "loss": 0.15, + "step": 27808 + }, + { + "epoch": 75.77384196185287, + "grad_norm": 3.5044636726379395, + "learning_rate": 2.9234741398107168e-06, + "loss": 0.1477, + "step": 27809 + }, + { + "epoch": 75.77656675749319, + "grad_norm": 2.8873465061187744, + "learning_rate": 2.922850631468066e-06, + "loss": 0.0611, + "step": 27810 + }, + { + "epoch": 75.77929155313352, + "grad_norm": 5.114377975463867, + "learning_rate": 2.9222271782420264e-06, + "loss": 0.0489, + "step": 27811 + }, + { + "epoch": 75.78201634877384, + "grad_norm": 2.4986019134521484, + "learning_rate": 2.921603780137451e-06, + "loss": 0.0862, + "step": 27812 + }, + { + "epoch": 75.78474114441417, + "grad_norm": 10.487380981445312, + "learning_rate": 2.9209804371592e-06, + "loss": 0.0415, + "step": 27813 + }, + { + "epoch": 75.7874659400545, + "grad_norm": 2.6905405521392822, + "learning_rate": 2.920357149312123e-06, + "loss": 0.0858, + "step": 27814 + }, + { + "epoch": 75.79019073569482, + "grad_norm": 2.6635348796844482, + "learning_rate": 2.9197339166010795e-06, + "loss": 0.041, + "step": 27815 + }, + { + "epoch": 75.79291553133515, + "grad_norm": 2.844661235809326, + "learning_rate": 2.919110739030918e-06, + "loss": 0.0576, + "step": 27816 + }, + { + "epoch": 75.79564032697547, + "grad_norm": 3.05802583694458, + "learning_rate": 2.918487616606497e-06, + "loss": 0.0695, + "step": 27817 + }, + { + "epoch": 75.7983651226158, + "grad_norm": 3.6677818298339844, + "learning_rate": 2.9178645493326664e-06, + "loss": 0.0724, + "step": 27818 + }, + { + "epoch": 75.80108991825612, + "grad_norm": 2.994086980819702, + "learning_rate": 2.917241537214278e-06, + "loss": 0.04, + "step": 27819 + }, + { + "epoch": 75.80381471389646, + "grad_norm": 2.594191551208496, + "learning_rate": 2.916618580256182e-06, + "loss": 0.0652, + "step": 27820 + }, + { + "epoch": 75.80653950953679, + "grad_norm": 3.1373801231384277, + "learning_rate": 2.915995678463236e-06, + "loss": 0.0761, + "step": 27821 + }, + { + "epoch": 75.80926430517711, + "grad_norm": 2.3345096111297607, + "learning_rate": 2.9153728318402875e-06, + "loss": 0.0311, + "step": 27822 + }, + { + "epoch": 75.81198910081744, + "grad_norm": 2.6505022048950195, + "learning_rate": 2.914750040392187e-06, + "loss": 0.0343, + "step": 27823 + }, + { + "epoch": 75.81471389645776, + "grad_norm": 2.4502649307250977, + "learning_rate": 2.9141273041237817e-06, + "loss": 0.0377, + "step": 27824 + }, + { + "epoch": 75.8174386920981, + "grad_norm": 2.3624539375305176, + "learning_rate": 2.9135046230399288e-06, + "loss": 0.0392, + "step": 27825 + }, + { + "epoch": 75.82016348773843, + "grad_norm": 5.040776252746582, + "learning_rate": 2.9128819971454736e-06, + "loss": 0.0507, + "step": 27826 + }, + { + "epoch": 75.82288828337875, + "grad_norm": 1.5148581266403198, + "learning_rate": 2.9122594264452654e-06, + "loss": 0.0234, + "step": 27827 + }, + { + "epoch": 75.82561307901908, + "grad_norm": 3.950441360473633, + "learning_rate": 2.9116369109441487e-06, + "loss": 0.1785, + "step": 27828 + }, + { + "epoch": 75.8283378746594, + "grad_norm": 16.9500675201416, + "learning_rate": 2.9110144506469806e-06, + "loss": 0.0715, + "step": 27829 + }, + { + "epoch": 75.83106267029973, + "grad_norm": 2.742633819580078, + "learning_rate": 2.910392045558602e-06, + "loss": 0.1761, + "step": 27830 + }, + { + "epoch": 75.83378746594005, + "grad_norm": 2.607189655303955, + "learning_rate": 2.9097696956838596e-06, + "loss": 0.0296, + "step": 27831 + }, + { + "epoch": 75.83651226158038, + "grad_norm": 2.5312812328338623, + "learning_rate": 2.9091474010276024e-06, + "loss": 0.0247, + "step": 27832 + }, + { + "epoch": 75.83923705722071, + "grad_norm": 4.3888630867004395, + "learning_rate": 2.908525161594681e-06, + "loss": 0.0471, + "step": 27833 + }, + { + "epoch": 75.84196185286103, + "grad_norm": 3.578895092010498, + "learning_rate": 2.9079029773899357e-06, + "loss": 0.0296, + "step": 27834 + }, + { + "epoch": 75.84468664850137, + "grad_norm": 1.764914870262146, + "learning_rate": 2.9072808484182146e-06, + "loss": 0.0236, + "step": 27835 + }, + { + "epoch": 75.84741144414168, + "grad_norm": 4.9986419677734375, + "learning_rate": 2.90665877468436e-06, + "loss": 0.0736, + "step": 27836 + }, + { + "epoch": 75.85013623978202, + "grad_norm": 3.350407361984253, + "learning_rate": 2.9060367561932202e-06, + "loss": 0.0569, + "step": 27837 + }, + { + "epoch": 75.85286103542235, + "grad_norm": 2.895502805709839, + "learning_rate": 2.905414792949638e-06, + "loss": 0.059, + "step": 27838 + }, + { + "epoch": 75.85558583106267, + "grad_norm": 2.3329083919525146, + "learning_rate": 2.9047928849584573e-06, + "loss": 0.0486, + "step": 27839 + }, + { + "epoch": 75.858310626703, + "grad_norm": 2.8299543857574463, + "learning_rate": 2.904171032224519e-06, + "loss": 0.1994, + "step": 27840 + }, + { + "epoch": 75.86103542234332, + "grad_norm": 2.45097017288208, + "learning_rate": 2.9035492347526704e-06, + "loss": 0.0972, + "step": 27841 + }, + { + "epoch": 75.86376021798365, + "grad_norm": 2.9409539699554443, + "learning_rate": 2.902927492547751e-06, + "loss": 0.1533, + "step": 27842 + }, + { + "epoch": 75.86648501362397, + "grad_norm": 2.9123213291168213, + "learning_rate": 2.9023058056146058e-06, + "loss": 0.0451, + "step": 27843 + }, + { + "epoch": 75.8692098092643, + "grad_norm": 3.152182102203369, + "learning_rate": 2.9016841739580703e-06, + "loss": 0.0314, + "step": 27844 + }, + { + "epoch": 75.87193460490464, + "grad_norm": 6.103669166564941, + "learning_rate": 2.9010625975829944e-06, + "loss": 0.092, + "step": 27845 + }, + { + "epoch": 75.87465940054496, + "grad_norm": 2.2012038230895996, + "learning_rate": 2.9004410764942125e-06, + "loss": 0.0655, + "step": 27846 + }, + { + "epoch": 75.87738419618529, + "grad_norm": 2.2651119232177734, + "learning_rate": 2.8998196106965693e-06, + "loss": 0.0396, + "step": 27847 + }, + { + "epoch": 75.88010899182561, + "grad_norm": 2.6364383697509766, + "learning_rate": 2.899198200194897e-06, + "loss": 0.036, + "step": 27848 + }, + { + "epoch": 75.88283378746594, + "grad_norm": 1.9506982564926147, + "learning_rate": 2.8985768449940422e-06, + "loss": 0.0258, + "step": 27849 + }, + { + "epoch": 75.88555858310627, + "grad_norm": 2.8842601776123047, + "learning_rate": 2.897955545098845e-06, + "loss": 0.0325, + "step": 27850 + }, + { + "epoch": 75.88828337874659, + "grad_norm": 2.7214174270629883, + "learning_rate": 2.897334300514142e-06, + "loss": 0.082, + "step": 27851 + }, + { + "epoch": 75.89100817438693, + "grad_norm": 3.42515230178833, + "learning_rate": 2.89671311124477e-06, + "loss": 0.0865, + "step": 27852 + }, + { + "epoch": 75.89373297002724, + "grad_norm": 2.3143978118896484, + "learning_rate": 2.8960919772955642e-06, + "loss": 0.0284, + "step": 27853 + }, + { + "epoch": 75.89645776566758, + "grad_norm": 3.6452369689941406, + "learning_rate": 2.89547089867137e-06, + "loss": 0.0711, + "step": 27854 + }, + { + "epoch": 75.8991825613079, + "grad_norm": 3.0343549251556396, + "learning_rate": 2.894849875377018e-06, + "loss": 0.1123, + "step": 27855 + }, + { + "epoch": 75.90190735694823, + "grad_norm": 2.7725486755371094, + "learning_rate": 2.8942289074173447e-06, + "loss": 0.0851, + "step": 27856 + }, + { + "epoch": 75.90463215258856, + "grad_norm": 3.272948980331421, + "learning_rate": 2.8936079947971907e-06, + "loss": 0.115, + "step": 27857 + }, + { + "epoch": 75.90735694822888, + "grad_norm": 2.96177077293396, + "learning_rate": 2.8929871375213893e-06, + "loss": 0.0474, + "step": 27858 + }, + { + "epoch": 75.91008174386921, + "grad_norm": 2.71899151802063, + "learning_rate": 2.892366335594775e-06, + "loss": 0.0421, + "step": 27859 + }, + { + "epoch": 75.91280653950953, + "grad_norm": 2.39719557762146, + "learning_rate": 2.8917455890221803e-06, + "loss": 0.0221, + "step": 27860 + }, + { + "epoch": 75.91553133514986, + "grad_norm": 3.4639968872070312, + "learning_rate": 2.891124897808445e-06, + "loss": 0.0678, + "step": 27861 + }, + { + "epoch": 75.9182561307902, + "grad_norm": 3.6853580474853516, + "learning_rate": 2.890504261958399e-06, + "loss": 0.0255, + "step": 27862 + }, + { + "epoch": 75.92098092643052, + "grad_norm": 3.5848002433776855, + "learning_rate": 2.8898836814768783e-06, + "loss": 0.0842, + "step": 27863 + }, + { + "epoch": 75.92370572207085, + "grad_norm": 3.7451703548431396, + "learning_rate": 2.889263156368711e-06, + "loss": 0.1634, + "step": 27864 + }, + { + "epoch": 75.92643051771117, + "grad_norm": 2.401470184326172, + "learning_rate": 2.8886426866387342e-06, + "loss": 0.0686, + "step": 27865 + }, + { + "epoch": 75.9291553133515, + "grad_norm": 5.314740180969238, + "learning_rate": 2.8880222722917817e-06, + "loss": 0.0775, + "step": 27866 + }, + { + "epoch": 75.93188010899182, + "grad_norm": 2.852182149887085, + "learning_rate": 2.8874019133326825e-06, + "loss": 0.0278, + "step": 27867 + }, + { + "epoch": 75.93460490463215, + "grad_norm": 3.7330596446990967, + "learning_rate": 2.8867816097662693e-06, + "loss": 0.0779, + "step": 27868 + }, + { + "epoch": 75.93732970027249, + "grad_norm": 3.6809818744659424, + "learning_rate": 2.886161361597368e-06, + "loss": 0.1212, + "step": 27869 + }, + { + "epoch": 75.9400544959128, + "grad_norm": 2.729417324066162, + "learning_rate": 2.8855411688308165e-06, + "loss": 0.0404, + "step": 27870 + }, + { + "epoch": 75.94277929155314, + "grad_norm": 4.025170803070068, + "learning_rate": 2.8849210314714414e-06, + "loss": 0.0796, + "step": 27871 + }, + { + "epoch": 75.94550408719346, + "grad_norm": 3.068633556365967, + "learning_rate": 2.8843009495240724e-06, + "loss": 0.0654, + "step": 27872 + }, + { + "epoch": 75.94822888283379, + "grad_norm": 2.7954258918762207, + "learning_rate": 2.883680922993536e-06, + "loss": 0.1775, + "step": 27873 + }, + { + "epoch": 75.95095367847412, + "grad_norm": 2.1981656551361084, + "learning_rate": 2.8830609518846652e-06, + "loss": 0.0327, + "step": 27874 + }, + { + "epoch": 75.95367847411444, + "grad_norm": 4.070340156555176, + "learning_rate": 2.882441036202288e-06, + "loss": 0.0748, + "step": 27875 + }, + { + "epoch": 75.95640326975477, + "grad_norm": 4.704790115356445, + "learning_rate": 2.8818211759512306e-06, + "loss": 0.0441, + "step": 27876 + }, + { + "epoch": 75.95912806539509, + "grad_norm": 2.5818374156951904, + "learning_rate": 2.8812013711363173e-06, + "loss": 0.0647, + "step": 27877 + }, + { + "epoch": 75.96185286103542, + "grad_norm": 2.595198154449463, + "learning_rate": 2.8805816217623815e-06, + "loss": 0.0374, + "step": 27878 + }, + { + "epoch": 75.96457765667574, + "grad_norm": 2.841723680496216, + "learning_rate": 2.8799619278342474e-06, + "loss": 0.2167, + "step": 27879 + }, + { + "epoch": 75.96730245231608, + "grad_norm": 3.9617176055908203, + "learning_rate": 2.879342289356737e-06, + "loss": 0.1075, + "step": 27880 + }, + { + "epoch": 75.97002724795641, + "grad_norm": 2.281709909439087, + "learning_rate": 2.8787227063346835e-06, + "loss": 0.1604, + "step": 27881 + }, + { + "epoch": 75.97275204359673, + "grad_norm": 2.5206027030944824, + "learning_rate": 2.878103178772905e-06, + "loss": 0.0326, + "step": 27882 + }, + { + "epoch": 75.97547683923706, + "grad_norm": 2.060612916946411, + "learning_rate": 2.877483706676233e-06, + "loss": 0.0428, + "step": 27883 + }, + { + "epoch": 75.97820163487738, + "grad_norm": 3.6709465980529785, + "learning_rate": 2.876864290049488e-06, + "loss": 0.0366, + "step": 27884 + }, + { + "epoch": 75.98092643051771, + "grad_norm": 3.077700138092041, + "learning_rate": 2.8762449288974924e-06, + "loss": 0.0332, + "step": 27885 + }, + { + "epoch": 75.98365122615803, + "grad_norm": 3.304319381713867, + "learning_rate": 2.8756256232250744e-06, + "loss": 0.0729, + "step": 27886 + }, + { + "epoch": 75.98637602179836, + "grad_norm": 2.5324795246124268, + "learning_rate": 2.875006373037055e-06, + "loss": 0.0511, + "step": 27887 + }, + { + "epoch": 75.9891008174387, + "grad_norm": 3.1744704246520996, + "learning_rate": 2.874387178338257e-06, + "loss": 0.0573, + "step": 27888 + }, + { + "epoch": 75.99182561307902, + "grad_norm": 3.301844835281372, + "learning_rate": 2.873768039133499e-06, + "loss": 0.0862, + "step": 27889 + }, + { + "epoch": 75.99455040871935, + "grad_norm": 2.8942222595214844, + "learning_rate": 2.8731489554276092e-06, + "loss": 0.0601, + "step": 27890 + }, + { + "epoch": 75.99727520435967, + "grad_norm": 4.084033966064453, + "learning_rate": 2.872529927225406e-06, + "loss": 0.0986, + "step": 27891 + }, + { + "epoch": 76.0, + "grad_norm": 3.195117950439453, + "learning_rate": 2.8719109545317102e-06, + "loss": 0.0686, + "step": 27892 + }, + { + "epoch": 76.00272479564033, + "grad_norm": 2.6047229766845703, + "learning_rate": 2.871292037351339e-06, + "loss": 0.0732, + "step": 27893 + }, + { + "epoch": 76.00544959128065, + "grad_norm": 3.359541416168213, + "learning_rate": 2.8706731756891194e-06, + "loss": 0.0746, + "step": 27894 + }, + { + "epoch": 76.00817438692098, + "grad_norm": 2.1447629928588867, + "learning_rate": 2.870054369549868e-06, + "loss": 0.0314, + "step": 27895 + }, + { + "epoch": 76.0108991825613, + "grad_norm": 3.1212072372436523, + "learning_rate": 2.869435618938403e-06, + "loss": 0.0592, + "step": 27896 + }, + { + "epoch": 76.01362397820164, + "grad_norm": 4.256537437438965, + "learning_rate": 2.868816923859542e-06, + "loss": 0.1006, + "step": 27897 + }, + { + "epoch": 76.01634877384195, + "grad_norm": 4.424111366271973, + "learning_rate": 2.868198284318108e-06, + "loss": 0.0366, + "step": 27898 + }, + { + "epoch": 76.01907356948229, + "grad_norm": 2.855241298675537, + "learning_rate": 2.8675797003189155e-06, + "loss": 0.071, + "step": 27899 + }, + { + "epoch": 76.02179836512262, + "grad_norm": 2.134061336517334, + "learning_rate": 2.86696117186678e-06, + "loss": 0.0453, + "step": 27900 + }, + { + "epoch": 76.02452316076294, + "grad_norm": 3.598741054534912, + "learning_rate": 2.866342698966521e-06, + "loss": 0.0938, + "step": 27901 + }, + { + "epoch": 76.02724795640327, + "grad_norm": 2.796027898788452, + "learning_rate": 2.865724281622959e-06, + "loss": 0.0489, + "step": 27902 + }, + { + "epoch": 76.02997275204359, + "grad_norm": 2.716315746307373, + "learning_rate": 2.865105919840906e-06, + "loss": 0.0393, + "step": 27903 + }, + { + "epoch": 76.03269754768392, + "grad_norm": 3.5865912437438965, + "learning_rate": 2.86448761362518e-06, + "loss": 0.1215, + "step": 27904 + }, + { + "epoch": 76.03542234332426, + "grad_norm": 2.713700771331787, + "learning_rate": 2.8638693629805904e-06, + "loss": 0.1316, + "step": 27905 + }, + { + "epoch": 76.03814713896458, + "grad_norm": 2.532438039779663, + "learning_rate": 2.8632511679119603e-06, + "loss": 0.0276, + "step": 27906 + }, + { + "epoch": 76.04087193460491, + "grad_norm": 1.9082499742507935, + "learning_rate": 2.8626330284241e-06, + "loss": 0.0623, + "step": 27907 + }, + { + "epoch": 76.04359673024523, + "grad_norm": 2.3191237449645996, + "learning_rate": 2.862014944521824e-06, + "loss": 0.1041, + "step": 27908 + }, + { + "epoch": 76.04632152588556, + "grad_norm": 3.031367301940918, + "learning_rate": 2.861396916209942e-06, + "loss": 0.1075, + "step": 27909 + }, + { + "epoch": 76.04904632152588, + "grad_norm": 2.3648593425750732, + "learning_rate": 2.8607789434932753e-06, + "loss": 0.0485, + "step": 27910 + }, + { + "epoch": 76.05177111716621, + "grad_norm": 2.374833583831787, + "learning_rate": 2.8601610263766324e-06, + "loss": 0.0395, + "step": 27911 + }, + { + "epoch": 76.05449591280654, + "grad_norm": 2.5501208305358887, + "learning_rate": 2.8595431648648255e-06, + "loss": 0.0316, + "step": 27912 + }, + { + "epoch": 76.05722070844686, + "grad_norm": 2.2800769805908203, + "learning_rate": 2.8589253589626633e-06, + "loss": 0.2246, + "step": 27913 + }, + { + "epoch": 76.0599455040872, + "grad_norm": 2.5565056800842285, + "learning_rate": 2.8583076086749627e-06, + "loss": 0.0528, + "step": 27914 + }, + { + "epoch": 76.06267029972751, + "grad_norm": 8.033062934875488, + "learning_rate": 2.857689914006534e-06, + "loss": 0.1059, + "step": 27915 + }, + { + "epoch": 76.06539509536785, + "grad_norm": 2.8080556392669678, + "learning_rate": 2.857072274962186e-06, + "loss": 0.0694, + "step": 27916 + }, + { + "epoch": 76.06811989100818, + "grad_norm": 2.6445555686950684, + "learning_rate": 2.856454691546726e-06, + "loss": 0.042, + "step": 27917 + }, + { + "epoch": 76.0708446866485, + "grad_norm": 3.4859976768493652, + "learning_rate": 2.8558371637649674e-06, + "loss": 0.0708, + "step": 27918 + }, + { + "epoch": 76.07356948228883, + "grad_norm": 3.230778217315674, + "learning_rate": 2.855219691621721e-06, + "loss": 0.0956, + "step": 27919 + }, + { + "epoch": 76.07629427792915, + "grad_norm": 2.596186399459839, + "learning_rate": 2.854602275121795e-06, + "loss": 0.0324, + "step": 27920 + }, + { + "epoch": 76.07901907356948, + "grad_norm": 2.370415210723877, + "learning_rate": 2.853984914269993e-06, + "loss": 0.2181, + "step": 27921 + }, + { + "epoch": 76.0817438692098, + "grad_norm": 2.104543447494507, + "learning_rate": 2.8533676090711294e-06, + "loss": 0.0369, + "step": 27922 + }, + { + "epoch": 76.08446866485014, + "grad_norm": 2.1844191551208496, + "learning_rate": 2.852750359530009e-06, + "loss": 0.0964, + "step": 27923 + }, + { + "epoch": 76.08719346049047, + "grad_norm": 2.8125557899475098, + "learning_rate": 2.8521331656514383e-06, + "loss": 0.2011, + "step": 27924 + }, + { + "epoch": 76.08991825613079, + "grad_norm": 2.3025074005126953, + "learning_rate": 2.851516027440222e-06, + "loss": 0.028, + "step": 27925 + }, + { + "epoch": 76.09264305177112, + "grad_norm": 3.783123731613159, + "learning_rate": 2.8508989449011716e-06, + "loss": 0.1999, + "step": 27926 + }, + { + "epoch": 76.09536784741144, + "grad_norm": 9.983528137207031, + "learning_rate": 2.8502819180390905e-06, + "loss": 0.0537, + "step": 27927 + }, + { + "epoch": 76.09809264305177, + "grad_norm": 3.5010738372802734, + "learning_rate": 2.8496649468587835e-06, + "loss": 0.0777, + "step": 27928 + }, + { + "epoch": 76.1008174386921, + "grad_norm": 1.9456828832626343, + "learning_rate": 2.8490480313650526e-06, + "loss": 0.0508, + "step": 27929 + }, + { + "epoch": 76.10354223433242, + "grad_norm": 1.8603999614715576, + "learning_rate": 2.848431171562708e-06, + "loss": 0.0305, + "step": 27930 + }, + { + "epoch": 76.10626702997276, + "grad_norm": 1.9711729288101196, + "learning_rate": 2.847814367456552e-06, + "loss": 0.0224, + "step": 27931 + }, + { + "epoch": 76.10899182561307, + "grad_norm": 2.993370771408081, + "learning_rate": 2.8471976190513873e-06, + "loss": 0.1023, + "step": 27932 + }, + { + "epoch": 76.11171662125341, + "grad_norm": 1.6494911909103394, + "learning_rate": 2.846580926352014e-06, + "loss": 0.0245, + "step": 27933 + }, + { + "epoch": 76.11444141689373, + "grad_norm": 2.5368120670318604, + "learning_rate": 2.845964289363239e-06, + "loss": 0.0825, + "step": 27934 + }, + { + "epoch": 76.11716621253406, + "grad_norm": 2.156525135040283, + "learning_rate": 2.8453477080898663e-06, + "loss": 0.0362, + "step": 27935 + }, + { + "epoch": 76.11989100817439, + "grad_norm": 3.1506590843200684, + "learning_rate": 2.844731182536695e-06, + "loss": 0.0372, + "step": 27936 + }, + { + "epoch": 76.12261580381471, + "grad_norm": 2.9435369968414307, + "learning_rate": 2.844114712708528e-06, + "loss": 0.0659, + "step": 27937 + }, + { + "epoch": 76.12534059945504, + "grad_norm": 2.2656257152557373, + "learning_rate": 2.843498298610161e-06, + "loss": 0.0573, + "step": 27938 + }, + { + "epoch": 76.12806539509536, + "grad_norm": 2.793180465698242, + "learning_rate": 2.8428819402464024e-06, + "loss": 0.0764, + "step": 27939 + }, + { + "epoch": 76.1307901907357, + "grad_norm": 2.548090934753418, + "learning_rate": 2.842265637622049e-06, + "loss": 0.0552, + "step": 27940 + }, + { + "epoch": 76.13351498637603, + "grad_norm": 1.7717152833938599, + "learning_rate": 2.8416493907418986e-06, + "loss": 0.06, + "step": 27941 + }, + { + "epoch": 76.13623978201635, + "grad_norm": 2.3561151027679443, + "learning_rate": 2.841033199610754e-06, + "loss": 0.1106, + "step": 27942 + }, + { + "epoch": 76.13896457765668, + "grad_norm": 1.8871134519577026, + "learning_rate": 2.8404170642334126e-06, + "loss": 0.1241, + "step": 27943 + }, + { + "epoch": 76.141689373297, + "grad_norm": 2.2275400161743164, + "learning_rate": 2.8398009846146733e-06, + "loss": 0.0392, + "step": 27944 + }, + { + "epoch": 76.14441416893733, + "grad_norm": 2.4605019092559814, + "learning_rate": 2.839184960759329e-06, + "loss": 0.0312, + "step": 27945 + }, + { + "epoch": 76.14713896457765, + "grad_norm": 2.262267589569092, + "learning_rate": 2.838568992672186e-06, + "loss": 0.0595, + "step": 27946 + }, + { + "epoch": 76.14986376021798, + "grad_norm": 1.9158697128295898, + "learning_rate": 2.837953080358038e-06, + "loss": 0.0305, + "step": 27947 + }, + { + "epoch": 76.15258855585832, + "grad_norm": 3.2195372581481934, + "learning_rate": 2.837337223821679e-06, + "loss": 0.0617, + "step": 27948 + }, + { + "epoch": 76.15531335149863, + "grad_norm": 3.519857406616211, + "learning_rate": 2.836721423067905e-06, + "loss": 0.0342, + "step": 27949 + }, + { + "epoch": 76.15803814713897, + "grad_norm": 2.3365373611450195, + "learning_rate": 2.836105678101517e-06, + "loss": 0.0415, + "step": 27950 + }, + { + "epoch": 76.16076294277929, + "grad_norm": 2.3643312454223633, + "learning_rate": 2.8354899889273045e-06, + "loss": 0.0693, + "step": 27951 + }, + { + "epoch": 76.16348773841962, + "grad_norm": 2.281914234161377, + "learning_rate": 2.834874355550069e-06, + "loss": 0.0739, + "step": 27952 + }, + { + "epoch": 76.16621253405995, + "grad_norm": 2.2375946044921875, + "learning_rate": 2.8342587779746e-06, + "loss": 0.045, + "step": 27953 + }, + { + "epoch": 76.16893732970027, + "grad_norm": 3.7037556171417236, + "learning_rate": 2.8336432562056914e-06, + "loss": 0.1268, + "step": 27954 + }, + { + "epoch": 76.1716621253406, + "grad_norm": 3.3654592037200928, + "learning_rate": 2.833027790248141e-06, + "loss": 0.0493, + "step": 27955 + }, + { + "epoch": 76.17438692098092, + "grad_norm": 2.998358964920044, + "learning_rate": 2.8324123801067395e-06, + "loss": 0.1388, + "step": 27956 + }, + { + "epoch": 76.17711171662125, + "grad_norm": 2.6205263137817383, + "learning_rate": 2.8317970257862793e-06, + "loss": 0.1454, + "step": 27957 + }, + { + "epoch": 76.17983651226157, + "grad_norm": 2.7314774990081787, + "learning_rate": 2.83118172729155e-06, + "loss": 0.0678, + "step": 27958 + }, + { + "epoch": 76.1825613079019, + "grad_norm": 3.8011600971221924, + "learning_rate": 2.8305664846273507e-06, + "loss": 0.1158, + "step": 27959 + }, + { + "epoch": 76.18528610354224, + "grad_norm": 2.4972071647644043, + "learning_rate": 2.8299512977984677e-06, + "loss": 0.0309, + "step": 27960 + }, + { + "epoch": 76.18801089918256, + "grad_norm": 3.224722385406494, + "learning_rate": 2.8293361668096943e-06, + "loss": 0.144, + "step": 27961 + }, + { + "epoch": 76.19073569482289, + "grad_norm": 2.707001209259033, + "learning_rate": 2.828721091665816e-06, + "loss": 0.0603, + "step": 27962 + }, + { + "epoch": 76.19346049046321, + "grad_norm": 2.6368777751922607, + "learning_rate": 2.8281060723716303e-06, + "loss": 0.1009, + "step": 27963 + }, + { + "epoch": 76.19618528610354, + "grad_norm": 3.2318313121795654, + "learning_rate": 2.8274911089319247e-06, + "loss": 0.1747, + "step": 27964 + }, + { + "epoch": 76.19891008174388, + "grad_norm": 1.9589316844940186, + "learning_rate": 2.8268762013514826e-06, + "loss": 0.1039, + "step": 27965 + }, + { + "epoch": 76.2016348773842, + "grad_norm": 3.561958074569702, + "learning_rate": 2.826261349635102e-06, + "loss": 0.1214, + "step": 27966 + }, + { + "epoch": 76.20435967302453, + "grad_norm": 2.2904269695281982, + "learning_rate": 2.8256465537875677e-06, + "loss": 0.0497, + "step": 27967 + }, + { + "epoch": 76.20708446866485, + "grad_norm": 6.865897178649902, + "learning_rate": 2.8250318138136655e-06, + "loss": 0.0824, + "step": 27968 + }, + { + "epoch": 76.20980926430518, + "grad_norm": 2.350994348526001, + "learning_rate": 2.8244171297181834e-06, + "loss": 0.0295, + "step": 27969 + }, + { + "epoch": 76.2125340599455, + "grad_norm": 2.612551689147949, + "learning_rate": 2.823802501505909e-06, + "loss": 0.0493, + "step": 27970 + }, + { + "epoch": 76.21525885558583, + "grad_norm": 2.6668803691864014, + "learning_rate": 2.8231879291816323e-06, + "loss": 0.1468, + "step": 27971 + }, + { + "epoch": 76.21798365122616, + "grad_norm": 1.4058564901351929, + "learning_rate": 2.822573412750137e-06, + "loss": 0.0191, + "step": 27972 + }, + { + "epoch": 76.22070844686648, + "grad_norm": 4.3451409339904785, + "learning_rate": 2.8219589522162094e-06, + "loss": 0.0678, + "step": 27973 + }, + { + "epoch": 76.22343324250681, + "grad_norm": 3.9595370292663574, + "learning_rate": 2.8213445475846314e-06, + "loss": 0.061, + "step": 27974 + }, + { + "epoch": 76.22615803814713, + "grad_norm": 2.8853468894958496, + "learning_rate": 2.820730198860194e-06, + "loss": 0.0319, + "step": 27975 + }, + { + "epoch": 76.22888283378747, + "grad_norm": 2.830885648727417, + "learning_rate": 2.820115906047679e-06, + "loss": 0.056, + "step": 27976 + }, + { + "epoch": 76.2316076294278, + "grad_norm": 3.3954076766967773, + "learning_rate": 2.8195016691518708e-06, + "loss": 0.0363, + "step": 27977 + }, + { + "epoch": 76.23433242506812, + "grad_norm": 2.9091482162475586, + "learning_rate": 2.8188874881775484e-06, + "loss": 0.1156, + "step": 27978 + }, + { + "epoch": 76.23705722070845, + "grad_norm": 2.5474894046783447, + "learning_rate": 2.8182733631295023e-06, + "loss": 0.0461, + "step": 27979 + }, + { + "epoch": 76.23978201634877, + "grad_norm": 3.0233871936798096, + "learning_rate": 2.8176592940125124e-06, + "loss": 0.0463, + "step": 27980 + }, + { + "epoch": 76.2425068119891, + "grad_norm": 2.699345350265503, + "learning_rate": 2.8170452808313597e-06, + "loss": 0.0485, + "step": 27981 + }, + { + "epoch": 76.24523160762942, + "grad_norm": 2.619124174118042, + "learning_rate": 2.816431323590826e-06, + "loss": 0.0411, + "step": 27982 + }, + { + "epoch": 76.24795640326975, + "grad_norm": 2.5384392738342285, + "learning_rate": 2.815817422295696e-06, + "loss": 0.0391, + "step": 27983 + }, + { + "epoch": 76.25068119891009, + "grad_norm": 3.0800857543945312, + "learning_rate": 2.815203576950748e-06, + "loss": 0.1152, + "step": 27984 + }, + { + "epoch": 76.2534059945504, + "grad_norm": 3.9242215156555176, + "learning_rate": 2.8145897875607642e-06, + "loss": 0.0888, + "step": 27985 + }, + { + "epoch": 76.25613079019074, + "grad_norm": 2.9212911128997803, + "learning_rate": 2.813976054130517e-06, + "loss": 0.0359, + "step": 27986 + }, + { + "epoch": 76.25885558583106, + "grad_norm": 2.257206678390503, + "learning_rate": 2.8133623766648e-06, + "loss": 0.0341, + "step": 27987 + }, + { + "epoch": 76.26158038147139, + "grad_norm": 2.452134370803833, + "learning_rate": 2.812748755168385e-06, + "loss": 0.0352, + "step": 27988 + }, + { + "epoch": 76.26430517711172, + "grad_norm": 4.033824920654297, + "learning_rate": 2.8121351896460526e-06, + "loss": 0.0509, + "step": 27989 + }, + { + "epoch": 76.26702997275204, + "grad_norm": 3.3400137424468994, + "learning_rate": 2.8115216801025757e-06, + "loss": 0.0494, + "step": 27990 + }, + { + "epoch": 76.26975476839237, + "grad_norm": 2.57417631149292, + "learning_rate": 2.81090822654274e-06, + "loss": 0.0645, + "step": 27991 + }, + { + "epoch": 76.2724795640327, + "grad_norm": 3.750145435333252, + "learning_rate": 2.8102948289713192e-06, + "loss": 0.0961, + "step": 27992 + }, + { + "epoch": 76.27520435967303, + "grad_norm": 2.211428165435791, + "learning_rate": 2.8096814873930913e-06, + "loss": 0.0286, + "step": 27993 + }, + { + "epoch": 76.27792915531334, + "grad_norm": 5.707901954650879, + "learning_rate": 2.809068201812829e-06, + "loss": 0.0414, + "step": 27994 + }, + { + "epoch": 76.28065395095368, + "grad_norm": 2.3994359970092773, + "learning_rate": 2.808454972235316e-06, + "loss": 0.0437, + "step": 27995 + }, + { + "epoch": 76.28337874659401, + "grad_norm": 2.9409661293029785, + "learning_rate": 2.807841798665324e-06, + "loss": 0.0636, + "step": 27996 + }, + { + "epoch": 76.28610354223433, + "grad_norm": 3.0790517330169678, + "learning_rate": 2.8072286811076276e-06, + "loss": 0.0868, + "step": 27997 + }, + { + "epoch": 76.28882833787466, + "grad_norm": 3.28312349319458, + "learning_rate": 2.8066156195670013e-06, + "loss": 0.0531, + "step": 27998 + }, + { + "epoch": 76.29155313351498, + "grad_norm": 4.68637228012085, + "learning_rate": 2.806002614048223e-06, + "loss": 0.181, + "step": 27999 + }, + { + "epoch": 76.29427792915531, + "grad_norm": 2.338714361190796, + "learning_rate": 2.8053896645560653e-06, + "loss": 0.0722, + "step": 28000 + }, + { + "epoch": 76.29700272479565, + "grad_norm": 2.7918925285339355, + "learning_rate": 2.8047767710953013e-06, + "loss": 0.0634, + "step": 28001 + }, + { + "epoch": 76.29972752043597, + "grad_norm": 2.9978299140930176, + "learning_rate": 2.8041639336707007e-06, + "loss": 0.0465, + "step": 28002 + }, + { + "epoch": 76.3024523160763, + "grad_norm": 2.5506551265716553, + "learning_rate": 2.8035511522870395e-06, + "loss": 0.1142, + "step": 28003 + }, + { + "epoch": 76.30517711171662, + "grad_norm": 2.7005417346954346, + "learning_rate": 2.8029384269490946e-06, + "loss": 0.0645, + "step": 28004 + }, + { + "epoch": 76.30790190735695, + "grad_norm": 2.3669233322143555, + "learning_rate": 2.8023257576616327e-06, + "loss": 0.0862, + "step": 28005 + }, + { + "epoch": 76.31062670299727, + "grad_norm": 2.5922515392303467, + "learning_rate": 2.8017131444294233e-06, + "loss": 0.1133, + "step": 28006 + }, + { + "epoch": 76.3133514986376, + "grad_norm": 2.9336061477661133, + "learning_rate": 2.801100587257243e-06, + "loss": 0.0842, + "step": 28007 + }, + { + "epoch": 76.31607629427793, + "grad_norm": 2.012657642364502, + "learning_rate": 2.8004880861498595e-06, + "loss": 0.0312, + "step": 28008 + }, + { + "epoch": 76.31880108991825, + "grad_norm": 2.521577835083008, + "learning_rate": 2.7998756411120444e-06, + "loss": 0.0452, + "step": 28009 + }, + { + "epoch": 76.32152588555859, + "grad_norm": 1.3363769054412842, + "learning_rate": 2.7992632521485617e-06, + "loss": 0.0178, + "step": 28010 + }, + { + "epoch": 76.3242506811989, + "grad_norm": 3.8090527057647705, + "learning_rate": 2.7986509192641887e-06, + "loss": 0.2722, + "step": 28011 + }, + { + "epoch": 76.32697547683924, + "grad_norm": 2.51955246925354, + "learning_rate": 2.7980386424636895e-06, + "loss": 0.0662, + "step": 28012 + }, + { + "epoch": 76.32970027247957, + "grad_norm": 2.5476555824279785, + "learning_rate": 2.7974264217518355e-06, + "loss": 0.0414, + "step": 28013 + }, + { + "epoch": 76.33242506811989, + "grad_norm": 2.8338663578033447, + "learning_rate": 2.7968142571333878e-06, + "loss": 0.0899, + "step": 28014 + }, + { + "epoch": 76.33514986376022, + "grad_norm": 2.1845476627349854, + "learning_rate": 2.796202148613123e-06, + "loss": 0.0297, + "step": 28015 + }, + { + "epoch": 76.33787465940054, + "grad_norm": 4.120614051818848, + "learning_rate": 2.795590096195804e-06, + "loss": 0.062, + "step": 28016 + }, + { + "epoch": 76.34059945504087, + "grad_norm": 2.4877171516418457, + "learning_rate": 2.7949780998861966e-06, + "loss": 0.0369, + "step": 28017 + }, + { + "epoch": 76.34332425068119, + "grad_norm": 2.8294050693511963, + "learning_rate": 2.794366159689066e-06, + "loss": 0.0565, + "step": 28018 + }, + { + "epoch": 76.34604904632153, + "grad_norm": 2.469412088394165, + "learning_rate": 2.793754275609182e-06, + "loss": 0.0534, + "step": 28019 + }, + { + "epoch": 76.34877384196186, + "grad_norm": 3.135049819946289, + "learning_rate": 2.7931424476513047e-06, + "loss": 0.026, + "step": 28020 + }, + { + "epoch": 76.35149863760218, + "grad_norm": 2.621840476989746, + "learning_rate": 2.7925306758202052e-06, + "loss": 0.032, + "step": 28021 + }, + { + "epoch": 76.35422343324251, + "grad_norm": 2.8926784992218018, + "learning_rate": 2.7919189601206455e-06, + "loss": 0.0618, + "step": 28022 + }, + { + "epoch": 76.35694822888283, + "grad_norm": 2.510206460952759, + "learning_rate": 2.7913073005573854e-06, + "loss": 0.073, + "step": 28023 + }, + { + "epoch": 76.35967302452316, + "grad_norm": 3.0854604244232178, + "learning_rate": 2.790695697135195e-06, + "loss": 0.0657, + "step": 28024 + }, + { + "epoch": 76.3623978201635, + "grad_norm": 4.972815036773682, + "learning_rate": 2.790084149858835e-06, + "loss": 0.0562, + "step": 28025 + }, + { + "epoch": 76.36512261580381, + "grad_norm": 2.648543357849121, + "learning_rate": 2.7894726587330666e-06, + "loss": 0.0404, + "step": 28026 + }, + { + "epoch": 76.36784741144415, + "grad_norm": 2.186492681503296, + "learning_rate": 2.7888612237626512e-06, + "loss": 0.1184, + "step": 28027 + }, + { + "epoch": 76.37057220708446, + "grad_norm": 3.8680977821350098, + "learning_rate": 2.788249844952354e-06, + "loss": 0.1279, + "step": 28028 + }, + { + "epoch": 76.3732970027248, + "grad_norm": 2.42016339302063, + "learning_rate": 2.787638522306936e-06, + "loss": 0.0575, + "step": 28029 + }, + { + "epoch": 76.37602179836512, + "grad_norm": 2.315438747406006, + "learning_rate": 2.787027255831154e-06, + "loss": 0.1398, + "step": 28030 + }, + { + "epoch": 76.37874659400545, + "grad_norm": 3.082136392593384, + "learning_rate": 2.7864160455297753e-06, + "loss": 0.0778, + "step": 28031 + }, + { + "epoch": 76.38147138964578, + "grad_norm": 2.4704718589782715, + "learning_rate": 2.7858048914075543e-06, + "loss": 0.0338, + "step": 28032 + }, + { + "epoch": 76.3841961852861, + "grad_norm": 3.232985258102417, + "learning_rate": 2.785193793469254e-06, + "loss": 0.0452, + "step": 28033 + }, + { + "epoch": 76.38692098092643, + "grad_norm": 2.485524892807007, + "learning_rate": 2.784582751719629e-06, + "loss": 0.0645, + "step": 28034 + }, + { + "epoch": 76.38964577656675, + "grad_norm": 3.575551986694336, + "learning_rate": 2.7839717661634446e-06, + "loss": 0.033, + "step": 28035 + }, + { + "epoch": 76.39237057220708, + "grad_norm": 4.037444114685059, + "learning_rate": 2.7833608368054556e-06, + "loss": 0.0912, + "step": 28036 + }, + { + "epoch": 76.39509536784742, + "grad_norm": 2.73028564453125, + "learning_rate": 2.7827499636504164e-06, + "loss": 0.0389, + "step": 28037 + }, + { + "epoch": 76.39782016348774, + "grad_norm": 2.976391077041626, + "learning_rate": 2.7821391467030923e-06, + "loss": 0.073, + "step": 28038 + }, + { + "epoch": 76.40054495912807, + "grad_norm": 2.569194793701172, + "learning_rate": 2.781528385968233e-06, + "loss": 0.0475, + "step": 28039 + }, + { + "epoch": 76.40326975476839, + "grad_norm": 2.133589267730713, + "learning_rate": 2.780917681450601e-06, + "loss": 0.0782, + "step": 28040 + }, + { + "epoch": 76.40599455040872, + "grad_norm": 2.573448419570923, + "learning_rate": 2.7803070331549497e-06, + "loss": 0.041, + "step": 28041 + }, + { + "epoch": 76.40871934604904, + "grad_norm": 8.486881256103516, + "learning_rate": 2.7796964410860348e-06, + "loss": 0.0852, + "step": 28042 + }, + { + "epoch": 76.41144414168937, + "grad_norm": 2.282289981842041, + "learning_rate": 2.7790859052486086e-06, + "loss": 0.0532, + "step": 28043 + }, + { + "epoch": 76.4141689373297, + "grad_norm": 2.2929494380950928, + "learning_rate": 2.778475425647432e-06, + "loss": 0.0283, + "step": 28044 + }, + { + "epoch": 76.41689373297002, + "grad_norm": 2.257180690765381, + "learning_rate": 2.777865002287257e-06, + "loss": 0.028, + "step": 28045 + }, + { + "epoch": 76.41961852861036, + "grad_norm": 3.966956377029419, + "learning_rate": 2.777254635172837e-06, + "loss": 0.1017, + "step": 28046 + }, + { + "epoch": 76.42234332425068, + "grad_norm": 3.150528907775879, + "learning_rate": 2.7766443243089215e-06, + "loss": 0.0626, + "step": 28047 + }, + { + "epoch": 76.42506811989101, + "grad_norm": 2.919949531555176, + "learning_rate": 2.776034069700271e-06, + "loss": 0.0627, + "step": 28048 + }, + { + "epoch": 76.42779291553134, + "grad_norm": 4.475660800933838, + "learning_rate": 2.7754238713516347e-06, + "loss": 0.0263, + "step": 28049 + }, + { + "epoch": 76.43051771117166, + "grad_norm": 4.334867000579834, + "learning_rate": 2.7748137292677647e-06, + "loss": 0.0891, + "step": 28050 + }, + { + "epoch": 76.433242506812, + "grad_norm": 2.3135111331939697, + "learning_rate": 2.7742036434534094e-06, + "loss": 0.0327, + "step": 28051 + }, + { + "epoch": 76.43596730245231, + "grad_norm": 2.878211736679077, + "learning_rate": 2.773593613913327e-06, + "loss": 0.0934, + "step": 28052 + }, + { + "epoch": 76.43869209809264, + "grad_norm": 3.610713243484497, + "learning_rate": 2.772983640652265e-06, + "loss": 0.0512, + "step": 28053 + }, + { + "epoch": 76.44141689373296, + "grad_norm": 2.4285902976989746, + "learning_rate": 2.7723737236749705e-06, + "loss": 0.0773, + "step": 28054 + }, + { + "epoch": 76.4441416893733, + "grad_norm": 8.0861177444458, + "learning_rate": 2.7717638629861965e-06, + "loss": 0.1366, + "step": 28055 + }, + { + "epoch": 76.44686648501363, + "grad_norm": 2.8861968517303467, + "learning_rate": 2.771154058590697e-06, + "loss": 0.0925, + "step": 28056 + }, + { + "epoch": 76.44959128065395, + "grad_norm": 1.7526333332061768, + "learning_rate": 2.7705443104932163e-06, + "loss": 0.0517, + "step": 28057 + }, + { + "epoch": 76.45231607629428, + "grad_norm": 3.7791574001312256, + "learning_rate": 2.7699346186985044e-06, + "loss": 0.0516, + "step": 28058 + }, + { + "epoch": 76.4550408719346, + "grad_norm": 3.859914541244507, + "learning_rate": 2.7693249832113055e-06, + "loss": 0.0406, + "step": 28059 + }, + { + "epoch": 76.45776566757493, + "grad_norm": 2.121925115585327, + "learning_rate": 2.768715404036374e-06, + "loss": 0.0477, + "step": 28060 + }, + { + "epoch": 76.46049046321527, + "grad_norm": 2.7566285133361816, + "learning_rate": 2.7681058811784545e-06, + "loss": 0.0475, + "step": 28061 + }, + { + "epoch": 76.46321525885558, + "grad_norm": 6.3780837059021, + "learning_rate": 2.7674964146422933e-06, + "loss": 0.0175, + "step": 28062 + }, + { + "epoch": 76.46594005449592, + "grad_norm": 2.3032732009887695, + "learning_rate": 2.7668870044326335e-06, + "loss": 0.033, + "step": 28063 + }, + { + "epoch": 76.46866485013624, + "grad_norm": 3.9634287357330322, + "learning_rate": 2.7662776505542286e-06, + "loss": 0.0636, + "step": 28064 + }, + { + "epoch": 76.47138964577657, + "grad_norm": 2.698305368423462, + "learning_rate": 2.765668353011821e-06, + "loss": 0.1124, + "step": 28065 + }, + { + "epoch": 76.47411444141689, + "grad_norm": 1.495788812637329, + "learning_rate": 2.7650591118101557e-06, + "loss": 0.0204, + "step": 28066 + }, + { + "epoch": 76.47683923705722, + "grad_norm": 3.5963215827941895, + "learning_rate": 2.7644499269539728e-06, + "loss": 0.033, + "step": 28067 + }, + { + "epoch": 76.47956403269755, + "grad_norm": 2.6007676124572754, + "learning_rate": 2.7638407984480255e-06, + "loss": 0.04, + "step": 28068 + }, + { + "epoch": 76.48228882833787, + "grad_norm": 2.2179477214813232, + "learning_rate": 2.763231726297052e-06, + "loss": 0.1683, + "step": 28069 + }, + { + "epoch": 76.4850136239782, + "grad_norm": 3.5508370399475098, + "learning_rate": 2.762622710505797e-06, + "loss": 0.0412, + "step": 28070 + }, + { + "epoch": 76.48773841961852, + "grad_norm": 3.038764476776123, + "learning_rate": 2.762013751079001e-06, + "loss": 0.1343, + "step": 28071 + }, + { + "epoch": 76.49046321525886, + "grad_norm": 3.583001136779785, + "learning_rate": 2.7614048480214085e-06, + "loss": 0.1194, + "step": 28072 + }, + { + "epoch": 76.49318801089919, + "grad_norm": 2.5639359951019287, + "learning_rate": 2.7607960013377655e-06, + "loss": 0.0358, + "step": 28073 + }, + { + "epoch": 76.49591280653951, + "grad_norm": 2.9354007244110107, + "learning_rate": 2.76018721103281e-06, + "loss": 0.1409, + "step": 28074 + }, + { + "epoch": 76.49863760217984, + "grad_norm": 4.090127468109131, + "learning_rate": 2.7595784771112798e-06, + "loss": 0.053, + "step": 28075 + }, + { + "epoch": 76.50136239782016, + "grad_norm": 2.726362466812134, + "learning_rate": 2.758969799577923e-06, + "loss": 0.0317, + "step": 28076 + }, + { + "epoch": 76.50408719346049, + "grad_norm": 2.5246667861938477, + "learning_rate": 2.7583611784374766e-06, + "loss": 0.0327, + "step": 28077 + }, + { + "epoch": 76.50681198910081, + "grad_norm": 4.658145427703857, + "learning_rate": 2.7577526136946797e-06, + "loss": 0.027, + "step": 28078 + }, + { + "epoch": 76.50953678474114, + "grad_norm": 3.1911253929138184, + "learning_rate": 2.7571441053542703e-06, + "loss": 0.0586, + "step": 28079 + }, + { + "epoch": 76.51226158038148, + "grad_norm": 1.6940730810165405, + "learning_rate": 2.756535653420992e-06, + "loss": 0.0263, + "step": 28080 + }, + { + "epoch": 76.5149863760218, + "grad_norm": 2.7947118282318115, + "learning_rate": 2.755927257899581e-06, + "loss": 0.1399, + "step": 28081 + }, + { + "epoch": 76.51771117166213, + "grad_norm": 2.8880624771118164, + "learning_rate": 2.7553189187947747e-06, + "loss": 0.0391, + "step": 28082 + }, + { + "epoch": 76.52043596730245, + "grad_norm": 2.8466579914093018, + "learning_rate": 2.7547106361113087e-06, + "loss": 0.034, + "step": 28083 + }, + { + "epoch": 76.52316076294278, + "grad_norm": 2.4123668670654297, + "learning_rate": 2.754102409853927e-06, + "loss": 0.0248, + "step": 28084 + }, + { + "epoch": 76.52588555858311, + "grad_norm": 2.8858022689819336, + "learning_rate": 2.753494240027361e-06, + "loss": 0.049, + "step": 28085 + }, + { + "epoch": 76.52861035422343, + "grad_norm": 3.041144609451294, + "learning_rate": 2.7528861266363507e-06, + "loss": 0.0863, + "step": 28086 + }, + { + "epoch": 76.53133514986376, + "grad_norm": 3.7189900875091553, + "learning_rate": 2.7522780696856256e-06, + "loss": 0.0559, + "step": 28087 + }, + { + "epoch": 76.53405994550408, + "grad_norm": 2.4244542121887207, + "learning_rate": 2.751670069179928e-06, + "loss": 0.0654, + "step": 28088 + }, + { + "epoch": 76.53678474114442, + "grad_norm": 2.1451120376586914, + "learning_rate": 2.751062125123989e-06, + "loss": 0.0377, + "step": 28089 + }, + { + "epoch": 76.53950953678473, + "grad_norm": 3.701094627380371, + "learning_rate": 2.7504542375225474e-06, + "loss": 0.0522, + "step": 28090 + }, + { + "epoch": 76.54223433242507, + "grad_norm": 2.5902910232543945, + "learning_rate": 2.7498464063803342e-06, + "loss": 0.0261, + "step": 28091 + }, + { + "epoch": 76.5449591280654, + "grad_norm": 3.0719902515411377, + "learning_rate": 2.7492386317020814e-06, + "loss": 0.0694, + "step": 28092 + }, + { + "epoch": 76.54768392370572, + "grad_norm": 3.1734306812286377, + "learning_rate": 2.748630913492528e-06, + "loss": 0.0366, + "step": 28093 + }, + { + "epoch": 76.55040871934605, + "grad_norm": 2.8310868740081787, + "learning_rate": 2.7480232517564033e-06, + "loss": 0.1542, + "step": 28094 + }, + { + "epoch": 76.55313351498637, + "grad_norm": 2.7298359870910645, + "learning_rate": 2.747415646498438e-06, + "loss": 0.049, + "step": 28095 + }, + { + "epoch": 76.5558583106267, + "grad_norm": 2.6002743244171143, + "learning_rate": 2.746808097723368e-06, + "loss": 0.137, + "step": 28096 + }, + { + "epoch": 76.55858310626704, + "grad_norm": 2.7242491245269775, + "learning_rate": 2.7462006054359234e-06, + "loss": 0.087, + "step": 28097 + }, + { + "epoch": 76.56130790190736, + "grad_norm": 2.934518575668335, + "learning_rate": 2.7455931696408356e-06, + "loss": 0.0244, + "step": 28098 + }, + { + "epoch": 76.56403269754769, + "grad_norm": 3.0216727256774902, + "learning_rate": 2.7449857903428314e-06, + "loss": 0.1071, + "step": 28099 + }, + { + "epoch": 76.566757493188, + "grad_norm": 2.2561445236206055, + "learning_rate": 2.7443784675466465e-06, + "loss": 0.0375, + "step": 28100 + }, + { + "epoch": 76.56948228882834, + "grad_norm": 6.173305511474609, + "learning_rate": 2.7437712012570105e-06, + "loss": 0.0829, + "step": 28101 + }, + { + "epoch": 76.57220708446866, + "grad_norm": 2.828070640563965, + "learning_rate": 2.7431639914786488e-06, + "loss": 0.1561, + "step": 28102 + }, + { + "epoch": 76.57493188010899, + "grad_norm": 4.874003887176514, + "learning_rate": 2.7425568382162904e-06, + "loss": 0.0374, + "step": 28103 + }, + { + "epoch": 76.57765667574932, + "grad_norm": 3.1307716369628906, + "learning_rate": 2.7419497414746687e-06, + "loss": 0.0495, + "step": 28104 + }, + { + "epoch": 76.58038147138964, + "grad_norm": 2.9444665908813477, + "learning_rate": 2.741342701258509e-06, + "loss": 0.0503, + "step": 28105 + }, + { + "epoch": 76.58310626702998, + "grad_norm": 3.124049186706543, + "learning_rate": 2.7407357175725356e-06, + "loss": 0.0382, + "step": 28106 + }, + { + "epoch": 76.5858310626703, + "grad_norm": 3.487481117248535, + "learning_rate": 2.7401287904214813e-06, + "loss": 0.1275, + "step": 28107 + }, + { + "epoch": 76.58855585831063, + "grad_norm": 2.9745378494262695, + "learning_rate": 2.7395219198100674e-06, + "loss": 0.1387, + "step": 28108 + }, + { + "epoch": 76.59128065395096, + "grad_norm": 3.164611577987671, + "learning_rate": 2.7389151057430272e-06, + "loss": 0.0644, + "step": 28109 + }, + { + "epoch": 76.59400544959128, + "grad_norm": 2.4915006160736084, + "learning_rate": 2.7383083482250815e-06, + "loss": 0.0702, + "step": 28110 + }, + { + "epoch": 76.59673024523161, + "grad_norm": 3.8384878635406494, + "learning_rate": 2.7377016472609562e-06, + "loss": 0.0516, + "step": 28111 + }, + { + "epoch": 76.59945504087193, + "grad_norm": 3.1336984634399414, + "learning_rate": 2.7370950028553744e-06, + "loss": 0.0435, + "step": 28112 + }, + { + "epoch": 76.60217983651226, + "grad_norm": 3.026506185531616, + "learning_rate": 2.7364884150130667e-06, + "loss": 0.0527, + "step": 28113 + }, + { + "epoch": 76.60490463215258, + "grad_norm": 2.474282741546631, + "learning_rate": 2.7358818837387525e-06, + "loss": 0.06, + "step": 28114 + }, + { + "epoch": 76.60762942779292, + "grad_norm": 2.46525502204895, + "learning_rate": 2.7352754090371538e-06, + "loss": 0.0275, + "step": 28115 + }, + { + "epoch": 76.61035422343325, + "grad_norm": 3.462277412414551, + "learning_rate": 2.734668990912999e-06, + "loss": 0.0523, + "step": 28116 + }, + { + "epoch": 76.61307901907357, + "grad_norm": 4.526456356048584, + "learning_rate": 2.734062629371008e-06, + "loss": 0.1228, + "step": 28117 + }, + { + "epoch": 76.6158038147139, + "grad_norm": 2.8008873462677, + "learning_rate": 2.733456324415904e-06, + "loss": 0.0318, + "step": 28118 + }, + { + "epoch": 76.61852861035422, + "grad_norm": 3.2150888442993164, + "learning_rate": 2.732850076052406e-06, + "loss": 0.0477, + "step": 28119 + }, + { + "epoch": 76.62125340599455, + "grad_norm": 3.417959213256836, + "learning_rate": 2.7322438842852394e-06, + "loss": 0.0276, + "step": 28120 + }, + { + "epoch": 76.62397820163488, + "grad_norm": 3.4848334789276123, + "learning_rate": 2.7316377491191236e-06, + "loss": 0.0489, + "step": 28121 + }, + { + "epoch": 76.6267029972752, + "grad_norm": 2.5796701908111572, + "learning_rate": 2.7310316705587793e-06, + "loss": 0.1577, + "step": 28122 + }, + { + "epoch": 76.62942779291554, + "grad_norm": 2.8394663333892822, + "learning_rate": 2.730425648608923e-06, + "loss": 0.065, + "step": 28123 + }, + { + "epoch": 76.63215258855585, + "grad_norm": 4.187651634216309, + "learning_rate": 2.7298196832742786e-06, + "loss": 0.2452, + "step": 28124 + }, + { + "epoch": 76.63487738419619, + "grad_norm": 2.425128936767578, + "learning_rate": 2.729213774559567e-06, + "loss": 0.0353, + "step": 28125 + }, + { + "epoch": 76.6376021798365, + "grad_norm": 1.9688972234725952, + "learning_rate": 2.728607922469505e-06, + "loss": 0.0743, + "step": 28126 + }, + { + "epoch": 76.64032697547684, + "grad_norm": 3.256420135498047, + "learning_rate": 2.728002127008811e-06, + "loss": 0.0281, + "step": 28127 + }, + { + "epoch": 76.64305177111717, + "grad_norm": 2.346224784851074, + "learning_rate": 2.7273963881821984e-06, + "loss": 0.1408, + "step": 28128 + }, + { + "epoch": 76.64577656675749, + "grad_norm": 2.3820855617523193, + "learning_rate": 2.726790705994391e-06, + "loss": 0.0971, + "step": 28129 + }, + { + "epoch": 76.64850136239782, + "grad_norm": 2.2366647720336914, + "learning_rate": 2.7261850804501043e-06, + "loss": 0.045, + "step": 28130 + }, + { + "epoch": 76.65122615803814, + "grad_norm": 2.996664524078369, + "learning_rate": 2.725579511554055e-06, + "loss": 0.1373, + "step": 28131 + }, + { + "epoch": 76.65395095367847, + "grad_norm": 2.155332565307617, + "learning_rate": 2.724973999310954e-06, + "loss": 0.0671, + "step": 28132 + }, + { + "epoch": 76.65667574931881, + "grad_norm": 3.2764053344726562, + "learning_rate": 2.7243685437255253e-06, + "loss": 0.1598, + "step": 28133 + }, + { + "epoch": 76.65940054495913, + "grad_norm": 1.984950065612793, + "learning_rate": 2.7237631448024792e-06, + "loss": 0.1516, + "step": 28134 + }, + { + "epoch": 76.66212534059946, + "grad_norm": 2.99607253074646, + "learning_rate": 2.723157802546532e-06, + "loss": 0.0355, + "step": 28135 + }, + { + "epoch": 76.66485013623978, + "grad_norm": 2.9442052841186523, + "learning_rate": 2.7225525169623947e-06, + "loss": 0.1218, + "step": 28136 + }, + { + "epoch": 76.66757493188011, + "grad_norm": 3.8162875175476074, + "learning_rate": 2.721947288054787e-06, + "loss": 0.0678, + "step": 28137 + }, + { + "epoch": 76.67029972752043, + "grad_norm": 1.9887125492095947, + "learning_rate": 2.7213421158284203e-06, + "loss": 0.091, + "step": 28138 + }, + { + "epoch": 76.67302452316076, + "grad_norm": 2.8055906295776367, + "learning_rate": 2.720737000288003e-06, + "loss": 0.1335, + "step": 28139 + }, + { + "epoch": 76.6757493188011, + "grad_norm": 2.4547324180603027, + "learning_rate": 2.7201319414382554e-06, + "loss": 0.0993, + "step": 28140 + }, + { + "epoch": 76.67847411444141, + "grad_norm": 2.761908769607544, + "learning_rate": 2.7195269392838818e-06, + "loss": 0.041, + "step": 28141 + }, + { + "epoch": 76.68119891008175, + "grad_norm": 3.926360607147217, + "learning_rate": 2.718921993829603e-06, + "loss": 0.0517, + "step": 28142 + }, + { + "epoch": 76.68392370572207, + "grad_norm": 2.480558395385742, + "learning_rate": 2.718317105080124e-06, + "loss": 0.1028, + "step": 28143 + }, + { + "epoch": 76.6866485013624, + "grad_norm": 2.091433525085449, + "learning_rate": 2.717712273040154e-06, + "loss": 0.0251, + "step": 28144 + }, + { + "epoch": 76.68937329700273, + "grad_norm": 2.3875463008880615, + "learning_rate": 2.71710749771441e-06, + "loss": 0.0562, + "step": 28145 + }, + { + "epoch": 76.69209809264305, + "grad_norm": 2.630124568939209, + "learning_rate": 2.7165027791075984e-06, + "loss": 0.1114, + "step": 28146 + }, + { + "epoch": 76.69482288828338, + "grad_norm": 2.8091511726379395, + "learning_rate": 2.715898117224428e-06, + "loss": 0.0477, + "step": 28147 + }, + { + "epoch": 76.6975476839237, + "grad_norm": 2.7866899967193604, + "learning_rate": 2.7152935120696056e-06, + "loss": 0.0769, + "step": 28148 + }, + { + "epoch": 76.70027247956403, + "grad_norm": 2.8136236667633057, + "learning_rate": 2.7146889636478467e-06, + "loss": 0.0573, + "step": 28149 + }, + { + "epoch": 76.70299727520435, + "grad_norm": 2.7409310340881348, + "learning_rate": 2.714084471963855e-06, + "loss": 0.1757, + "step": 28150 + }, + { + "epoch": 76.70572207084469, + "grad_norm": 2.173962354660034, + "learning_rate": 2.713480037022339e-06, + "loss": 0.0296, + "step": 28151 + }, + { + "epoch": 76.70844686648502, + "grad_norm": 2.338724374771118, + "learning_rate": 2.712875658828004e-06, + "loss": 0.0399, + "step": 28152 + }, + { + "epoch": 76.71117166212534, + "grad_norm": 2.862715244293213, + "learning_rate": 2.7122713373855605e-06, + "loss": 0.0353, + "step": 28153 + }, + { + "epoch": 76.71389645776567, + "grad_norm": 2.498589515686035, + "learning_rate": 2.7116670726997142e-06, + "loss": 0.0765, + "step": 28154 + }, + { + "epoch": 76.71662125340599, + "grad_norm": 2.568979024887085, + "learning_rate": 2.7110628647751704e-06, + "loss": 0.1366, + "step": 28155 + }, + { + "epoch": 76.71934604904632, + "grad_norm": 2.9421985149383545, + "learning_rate": 2.7104587136166304e-06, + "loss": 0.0272, + "step": 28156 + }, + { + "epoch": 76.72207084468666, + "grad_norm": 2.875525951385498, + "learning_rate": 2.709854619228807e-06, + "loss": 0.0487, + "step": 28157 + }, + { + "epoch": 76.72479564032697, + "grad_norm": 2.8808341026306152, + "learning_rate": 2.709250581616397e-06, + "loss": 0.0318, + "step": 28158 + }, + { + "epoch": 76.7275204359673, + "grad_norm": 2.8514723777770996, + "learning_rate": 2.7086466007841126e-06, + "loss": 0.1324, + "step": 28159 + }, + { + "epoch": 76.73024523160763, + "grad_norm": 3.5004167556762695, + "learning_rate": 2.708042676736651e-06, + "loss": 0.041, + "step": 28160 + }, + { + "epoch": 76.73297002724796, + "grad_norm": 1.74006986618042, + "learning_rate": 2.707438809478722e-06, + "loss": 0.0284, + "step": 28161 + }, + { + "epoch": 76.73569482288828, + "grad_norm": 2.246943950653076, + "learning_rate": 2.7068349990150235e-06, + "loss": 0.0215, + "step": 28162 + }, + { + "epoch": 76.73841961852861, + "grad_norm": 3.3550186157226562, + "learning_rate": 2.7062312453502606e-06, + "loss": 0.126, + "step": 28163 + }, + { + "epoch": 76.74114441416894, + "grad_norm": 3.6439809799194336, + "learning_rate": 2.70562754848913e-06, + "loss": 0.0873, + "step": 28164 + }, + { + "epoch": 76.74386920980926, + "grad_norm": 3.409364938735962, + "learning_rate": 2.7050239084363404e-06, + "loss": 0.2361, + "step": 28165 + }, + { + "epoch": 76.7465940054496, + "grad_norm": 3.3585925102233887, + "learning_rate": 2.7044203251965907e-06, + "loss": 0.0896, + "step": 28166 + }, + { + "epoch": 76.74931880108991, + "grad_norm": 2.680992841720581, + "learning_rate": 2.703816798774579e-06, + "loss": 0.0342, + "step": 28167 + }, + { + "epoch": 76.75204359673025, + "grad_norm": 3.4959325790405273, + "learning_rate": 2.703213329175006e-06, + "loss": 0.1762, + "step": 28168 + }, + { + "epoch": 76.75476839237058, + "grad_norm": 3.6395339965820312, + "learning_rate": 2.702609916402574e-06, + "loss": 0.1915, + "step": 28169 + }, + { + "epoch": 76.7574931880109, + "grad_norm": 3.4512598514556885, + "learning_rate": 2.7020065604619826e-06, + "loss": 0.1554, + "step": 28170 + }, + { + "epoch": 76.76021798365123, + "grad_norm": 3.1817307472229004, + "learning_rate": 2.701403261357929e-06, + "loss": 0.1507, + "step": 28171 + }, + { + "epoch": 76.76294277929155, + "grad_norm": 2.7833666801452637, + "learning_rate": 2.700800019095109e-06, + "loss": 0.0706, + "step": 28172 + }, + { + "epoch": 76.76566757493188, + "grad_norm": 2.8812572956085205, + "learning_rate": 2.700196833678226e-06, + "loss": 0.0998, + "step": 28173 + }, + { + "epoch": 76.7683923705722, + "grad_norm": 2.6217448711395264, + "learning_rate": 2.6995937051119747e-06, + "loss": 0.0408, + "step": 28174 + }, + { + "epoch": 76.77111716621253, + "grad_norm": 2.885335683822632, + "learning_rate": 2.6989906334010507e-06, + "loss": 0.0736, + "step": 28175 + }, + { + "epoch": 76.77384196185287, + "grad_norm": 2.695162057876587, + "learning_rate": 2.6983876185501556e-06, + "loss": 0.1038, + "step": 28176 + }, + { + "epoch": 76.77656675749319, + "grad_norm": 2.176483392715454, + "learning_rate": 2.697784660563979e-06, + "loss": 0.0552, + "step": 28177 + }, + { + "epoch": 76.77929155313352, + "grad_norm": 3.070734977722168, + "learning_rate": 2.697181759447224e-06, + "loss": 0.0683, + "step": 28178 + }, + { + "epoch": 76.78201634877384, + "grad_norm": 3.0700390338897705, + "learning_rate": 2.6965789152045818e-06, + "loss": 0.0523, + "step": 28179 + }, + { + "epoch": 76.78474114441417, + "grad_norm": 3.2693450450897217, + "learning_rate": 2.695976127840745e-06, + "loss": 0.0439, + "step": 28180 + }, + { + "epoch": 76.7874659400545, + "grad_norm": 3.124469041824341, + "learning_rate": 2.6953733973604147e-06, + "loss": 0.0341, + "step": 28181 + }, + { + "epoch": 76.79019073569482, + "grad_norm": 2.651022434234619, + "learning_rate": 2.6947707237682807e-06, + "loss": 0.0321, + "step": 28182 + }, + { + "epoch": 76.79291553133515, + "grad_norm": 2.7244935035705566, + "learning_rate": 2.6941681070690374e-06, + "loss": 0.1518, + "step": 28183 + }, + { + "epoch": 76.79564032697547, + "grad_norm": 2.6263954639434814, + "learning_rate": 2.693565547267375e-06, + "loss": 0.0666, + "step": 28184 + }, + { + "epoch": 76.7983651226158, + "grad_norm": 2.7580041885375977, + "learning_rate": 2.6929630443679923e-06, + "loss": 0.0497, + "step": 28185 + }, + { + "epoch": 76.80108991825612, + "grad_norm": 3.8143322467803955, + "learning_rate": 2.6923605983755772e-06, + "loss": 0.0467, + "step": 28186 + }, + { + "epoch": 76.80381471389646, + "grad_norm": 2.6981263160705566, + "learning_rate": 2.6917582092948235e-06, + "loss": 0.0385, + "step": 28187 + }, + { + "epoch": 76.80653950953679, + "grad_norm": 2.2770352363586426, + "learning_rate": 2.691155877130418e-06, + "loss": 0.097, + "step": 28188 + }, + { + "epoch": 76.80926430517711, + "grad_norm": 3.7626657485961914, + "learning_rate": 2.690553601887058e-06, + "loss": 0.0444, + "step": 28189 + }, + { + "epoch": 76.81198910081744, + "grad_norm": 3.5276734828948975, + "learning_rate": 2.6899513835694323e-06, + "loss": 0.0593, + "step": 28190 + }, + { + "epoch": 76.81471389645776, + "grad_norm": 3.3592352867126465, + "learning_rate": 2.6893492221822293e-06, + "loss": 0.062, + "step": 28191 + }, + { + "epoch": 76.8174386920981, + "grad_norm": 3.7183713912963867, + "learning_rate": 2.688747117730136e-06, + "loss": 0.1264, + "step": 28192 + }, + { + "epoch": 76.82016348773843, + "grad_norm": 2.527022123336792, + "learning_rate": 2.688145070217846e-06, + "loss": 0.0335, + "step": 28193 + }, + { + "epoch": 76.82288828337875, + "grad_norm": 1.935794711112976, + "learning_rate": 2.687543079650049e-06, + "loss": 0.0331, + "step": 28194 + }, + { + "epoch": 76.82561307901908, + "grad_norm": 3.119727611541748, + "learning_rate": 2.686941146031431e-06, + "loss": 0.0788, + "step": 28195 + }, + { + "epoch": 76.8283378746594, + "grad_norm": 1.7302227020263672, + "learning_rate": 2.68633926936668e-06, + "loss": 0.035, + "step": 28196 + }, + { + "epoch": 76.83106267029973, + "grad_norm": 1.9190800189971924, + "learning_rate": 2.6857374496604805e-06, + "loss": 0.0282, + "step": 28197 + }, + { + "epoch": 76.83378746594005, + "grad_norm": 3.658738136291504, + "learning_rate": 2.685135686917526e-06, + "loss": 0.1258, + "step": 28198 + }, + { + "epoch": 76.83651226158038, + "grad_norm": 4.712545394897461, + "learning_rate": 2.6845339811424987e-06, + "loss": 0.1422, + "step": 28199 + }, + { + "epoch": 76.83923705722071, + "grad_norm": 3.1784772872924805, + "learning_rate": 2.6839323323400856e-06, + "loss": 0.1382, + "step": 28200 + }, + { + "epoch": 76.84196185286103, + "grad_norm": 2.335515022277832, + "learning_rate": 2.683330740514969e-06, + "loss": 0.1429, + "step": 28201 + }, + { + "epoch": 76.84468664850137, + "grad_norm": 3.69903826713562, + "learning_rate": 2.682729205671839e-06, + "loss": 0.0551, + "step": 28202 + }, + { + "epoch": 76.84741144414168, + "grad_norm": 3.7585651874542236, + "learning_rate": 2.68212772781538e-06, + "loss": 0.0995, + "step": 28203 + }, + { + "epoch": 76.85013623978202, + "grad_norm": 2.2671399116516113, + "learning_rate": 2.6815263069502706e-06, + "loss": 0.142, + "step": 28204 + }, + { + "epoch": 76.85286103542235, + "grad_norm": 2.960724353790283, + "learning_rate": 2.6809249430812025e-06, + "loss": 0.1053, + "step": 28205 + }, + { + "epoch": 76.85558583106267, + "grad_norm": 2.2976996898651123, + "learning_rate": 2.680323636212856e-06, + "loss": 0.0359, + "step": 28206 + }, + { + "epoch": 76.858310626703, + "grad_norm": 2.176069974899292, + "learning_rate": 2.6797223863499123e-06, + "loss": 0.0302, + "step": 28207 + }, + { + "epoch": 76.86103542234332, + "grad_norm": 2.679279088973999, + "learning_rate": 2.6791211934970516e-06, + "loss": 0.0996, + "step": 28208 + }, + { + "epoch": 76.86376021798365, + "grad_norm": 2.479323625564575, + "learning_rate": 2.678520057658961e-06, + "loss": 0.1651, + "step": 28209 + }, + { + "epoch": 76.86648501362397, + "grad_norm": 3.211015224456787, + "learning_rate": 2.6779189788403226e-06, + "loss": 0.1225, + "step": 28210 + }, + { + "epoch": 76.8692098092643, + "grad_norm": 2.575972557067871, + "learning_rate": 2.677317957045815e-06, + "loss": 0.0479, + "step": 28211 + }, + { + "epoch": 76.87193460490464, + "grad_norm": 2.300093650817871, + "learning_rate": 2.6767169922801205e-06, + "loss": 0.0372, + "step": 28212 + }, + { + "epoch": 76.87465940054496, + "grad_norm": 3.722437858581543, + "learning_rate": 2.676116084547915e-06, + "loss": 0.0959, + "step": 28213 + }, + { + "epoch": 76.87738419618529, + "grad_norm": 2.495455741882324, + "learning_rate": 2.6755152338538847e-06, + "loss": 0.0296, + "step": 28214 + }, + { + "epoch": 76.88010899182561, + "grad_norm": 1.7627158164978027, + "learning_rate": 2.674914440202706e-06, + "loss": 0.0229, + "step": 28215 + }, + { + "epoch": 76.88283378746594, + "grad_norm": 1.7345685958862305, + "learning_rate": 2.6743137035990583e-06, + "loss": 0.0279, + "step": 28216 + }, + { + "epoch": 76.88555858310627, + "grad_norm": 3.9004459381103516, + "learning_rate": 2.673713024047616e-06, + "loss": 0.0658, + "step": 28217 + }, + { + "epoch": 76.88828337874659, + "grad_norm": 2.0879580974578857, + "learning_rate": 2.673112401553064e-06, + "loss": 0.0262, + "step": 28218 + }, + { + "epoch": 76.89100817438693, + "grad_norm": 2.071228504180908, + "learning_rate": 2.6725118361200775e-06, + "loss": 0.0816, + "step": 28219 + }, + { + "epoch": 76.89373297002724, + "grad_norm": 2.176243543624878, + "learning_rate": 2.6719113277533328e-06, + "loss": 0.0212, + "step": 28220 + }, + { + "epoch": 76.89645776566758, + "grad_norm": 3.3080270290374756, + "learning_rate": 2.6713108764575035e-06, + "loss": 0.2384, + "step": 28221 + }, + { + "epoch": 76.8991825613079, + "grad_norm": 1.9479093551635742, + "learning_rate": 2.670710482237272e-06, + "loss": 0.0732, + "step": 28222 + }, + { + "epoch": 76.90190735694823, + "grad_norm": 2.9821300506591797, + "learning_rate": 2.670110145097311e-06, + "loss": 0.0446, + "step": 28223 + }, + { + "epoch": 76.90463215258856, + "grad_norm": 2.207801580429077, + "learning_rate": 2.6695098650422967e-06, + "loss": 0.0363, + "step": 28224 + }, + { + "epoch": 76.90735694822888, + "grad_norm": 2.4613595008850098, + "learning_rate": 2.6689096420769013e-06, + "loss": 0.0281, + "step": 28225 + }, + { + "epoch": 76.91008174386921, + "grad_norm": 3.8711798191070557, + "learning_rate": 2.668309476205805e-06, + "loss": 0.0889, + "step": 28226 + }, + { + "epoch": 76.91280653950953, + "grad_norm": 2.2596654891967773, + "learning_rate": 2.667709367433674e-06, + "loss": 0.1087, + "step": 28227 + }, + { + "epoch": 76.91553133514986, + "grad_norm": 8.316119194030762, + "learning_rate": 2.6671093157651908e-06, + "loss": 0.0371, + "step": 28228 + }, + { + "epoch": 76.9182561307902, + "grad_norm": 2.0880208015441895, + "learning_rate": 2.6665093212050197e-06, + "loss": 0.1088, + "step": 28229 + }, + { + "epoch": 76.92098092643052, + "grad_norm": 3.546389102935791, + "learning_rate": 2.665909383757842e-06, + "loss": 0.0752, + "step": 28230 + }, + { + "epoch": 76.92370572207085, + "grad_norm": 2.2764501571655273, + "learning_rate": 2.665309503428326e-06, + "loss": 0.0328, + "step": 28231 + }, + { + "epoch": 76.92643051771117, + "grad_norm": 2.9497528076171875, + "learning_rate": 2.664709680221144e-06, + "loss": 0.0358, + "step": 28232 + }, + { + "epoch": 76.9291553133515, + "grad_norm": 2.4686737060546875, + "learning_rate": 2.664109914140963e-06, + "loss": 0.0261, + "step": 28233 + }, + { + "epoch": 76.93188010899182, + "grad_norm": 2.6861212253570557, + "learning_rate": 2.663510205192461e-06, + "loss": 0.1651, + "step": 28234 + }, + { + "epoch": 76.93460490463215, + "grad_norm": 2.74786376953125, + "learning_rate": 2.6629105533803055e-06, + "loss": 0.0352, + "step": 28235 + }, + { + "epoch": 76.93732970027249, + "grad_norm": 3.4205210208892822, + "learning_rate": 2.6623109587091665e-06, + "loss": 0.0706, + "step": 28236 + }, + { + "epoch": 76.9400544959128, + "grad_norm": 2.435868740081787, + "learning_rate": 2.66171142118371e-06, + "loss": 0.028, + "step": 28237 + }, + { + "epoch": 76.94277929155314, + "grad_norm": 2.9123997688293457, + "learning_rate": 2.6611119408086127e-06, + "loss": 0.1593, + "step": 28238 + }, + { + "epoch": 76.94550408719346, + "grad_norm": 2.951160192489624, + "learning_rate": 2.6605125175885394e-06, + "loss": 0.0507, + "step": 28239 + }, + { + "epoch": 76.94822888283379, + "grad_norm": 2.1408684253692627, + "learning_rate": 2.6599131515281586e-06, + "loss": 0.0346, + "step": 28240 + }, + { + "epoch": 76.95095367847412, + "grad_norm": 3.152165412902832, + "learning_rate": 2.659313842632134e-06, + "loss": 0.1153, + "step": 28241 + }, + { + "epoch": 76.95367847411444, + "grad_norm": 2.740638017654419, + "learning_rate": 2.6587145909051405e-06, + "loss": 0.0339, + "step": 28242 + }, + { + "epoch": 76.95640326975477, + "grad_norm": 2.587643623352051, + "learning_rate": 2.6581153963518413e-06, + "loss": 0.0314, + "step": 28243 + }, + { + "epoch": 76.95912806539509, + "grad_norm": 2.3162875175476074, + "learning_rate": 2.6575162589769e-06, + "loss": 0.0368, + "step": 28244 + }, + { + "epoch": 76.96185286103542, + "grad_norm": 2.167597770690918, + "learning_rate": 2.6569171787849867e-06, + "loss": 0.0902, + "step": 28245 + }, + { + "epoch": 76.96457765667574, + "grad_norm": 2.763551712036133, + "learning_rate": 2.656318155780768e-06, + "loss": 0.0383, + "step": 28246 + }, + { + "epoch": 76.96730245231608, + "grad_norm": 2.515599489212036, + "learning_rate": 2.6557191899689073e-06, + "loss": 0.0407, + "step": 28247 + }, + { + "epoch": 76.97002724795641, + "grad_norm": 3.3870689868927, + "learning_rate": 2.6551202813540686e-06, + "loss": 0.0601, + "step": 28248 + }, + { + "epoch": 76.97275204359673, + "grad_norm": 3.033858060836792, + "learning_rate": 2.654521429940915e-06, + "loss": 0.0531, + "step": 28249 + }, + { + "epoch": 76.97547683923706, + "grad_norm": 2.1676909923553467, + "learning_rate": 2.653922635734115e-06, + "loss": 0.0474, + "step": 28250 + }, + { + "epoch": 76.97820163487738, + "grad_norm": 2.9437270164489746, + "learning_rate": 2.6533238987383283e-06, + "loss": 0.0601, + "step": 28251 + }, + { + "epoch": 76.98092643051771, + "grad_norm": 2.319300413131714, + "learning_rate": 2.6527252189582185e-06, + "loss": 0.1809, + "step": 28252 + }, + { + "epoch": 76.98365122615803, + "grad_norm": 2.7304632663726807, + "learning_rate": 2.6521265963984467e-06, + "loss": 0.1882, + "step": 28253 + }, + { + "epoch": 76.98637602179836, + "grad_norm": 2.2285587787628174, + "learning_rate": 2.6515280310636783e-06, + "loss": 0.1317, + "step": 28254 + }, + { + "epoch": 76.9891008174387, + "grad_norm": 3.706568717956543, + "learning_rate": 2.650929522958573e-06, + "loss": 0.0984, + "step": 28255 + }, + { + "epoch": 76.99182561307902, + "grad_norm": 2.6711254119873047, + "learning_rate": 2.6503310720877928e-06, + "loss": 0.0777, + "step": 28256 + }, + { + "epoch": 76.99455040871935, + "grad_norm": 2.2969894409179688, + "learning_rate": 2.6497326784559942e-06, + "loss": 0.1066, + "step": 28257 + }, + { + "epoch": 76.99727520435967, + "grad_norm": 3.119093894958496, + "learning_rate": 2.649134342067844e-06, + "loss": 0.0731, + "step": 28258 + }, + { + "epoch": 77.0, + "grad_norm": 3.4760067462921143, + "learning_rate": 2.648536062927999e-06, + "loss": 0.0501, + "step": 28259 + }, + { + "epoch": 77.00272479564033, + "grad_norm": 2.6079323291778564, + "learning_rate": 2.6479378410411184e-06, + "loss": 0.0379, + "step": 28260 + }, + { + "epoch": 77.00544959128065, + "grad_norm": 2.5225589275360107, + "learning_rate": 2.6473396764118575e-06, + "loss": 0.0651, + "step": 28261 + }, + { + "epoch": 77.00817438692098, + "grad_norm": 2.607790231704712, + "learning_rate": 2.6467415690448795e-06, + "loss": 0.1128, + "step": 28262 + }, + { + "epoch": 77.0108991825613, + "grad_norm": 3.149742841720581, + "learning_rate": 2.646143518944845e-06, + "loss": 0.0402, + "step": 28263 + }, + { + "epoch": 77.01362397820164, + "grad_norm": 3.2176196575164795, + "learning_rate": 2.6455455261164066e-06, + "loss": 0.2326, + "step": 28264 + }, + { + "epoch": 77.01634877384195, + "grad_norm": 2.213528871536255, + "learning_rate": 2.6449475905642242e-06, + "loss": 0.0215, + "step": 28265 + }, + { + "epoch": 77.01907356948229, + "grad_norm": 2.8598074913024902, + "learning_rate": 2.6443497122929495e-06, + "loss": 0.0456, + "step": 28266 + }, + { + "epoch": 77.02179836512262, + "grad_norm": 2.2847464084625244, + "learning_rate": 2.6437518913072456e-06, + "loss": 0.0284, + "step": 28267 + }, + { + "epoch": 77.02452316076294, + "grad_norm": 3.0514705181121826, + "learning_rate": 2.6431541276117654e-06, + "loss": 0.0791, + "step": 28268 + }, + { + "epoch": 77.02724795640327, + "grad_norm": 2.536168098449707, + "learning_rate": 2.6425564212111608e-06, + "loss": 0.038, + "step": 28269 + }, + { + "epoch": 77.02997275204359, + "grad_norm": 2.7003395557403564, + "learning_rate": 2.6419587721100938e-06, + "loss": 0.0629, + "step": 28270 + }, + { + "epoch": 77.03269754768392, + "grad_norm": 2.958134412765503, + "learning_rate": 2.6413611803132146e-06, + "loss": 0.0738, + "step": 28271 + }, + { + "epoch": 77.03542234332426, + "grad_norm": 1.7861578464508057, + "learning_rate": 2.6407636458251773e-06, + "loss": 0.0308, + "step": 28272 + }, + { + "epoch": 77.03814713896458, + "grad_norm": 1.8519829511642456, + "learning_rate": 2.640166168650633e-06, + "loss": 0.1506, + "step": 28273 + }, + { + "epoch": 77.04087193460491, + "grad_norm": 2.518130302429199, + "learning_rate": 2.639568748794241e-06, + "loss": 0.043, + "step": 28274 + }, + { + "epoch": 77.04359673024523, + "grad_norm": 1.6704596281051636, + "learning_rate": 2.6389713862606513e-06, + "loss": 0.0183, + "step": 28275 + }, + { + "epoch": 77.04632152588556, + "grad_norm": 2.4765989780426025, + "learning_rate": 2.6383740810545145e-06, + "loss": 0.0365, + "step": 28276 + }, + { + "epoch": 77.04904632152588, + "grad_norm": 2.888434886932373, + "learning_rate": 2.637776833180481e-06, + "loss": 0.1115, + "step": 28277 + }, + { + "epoch": 77.05177111716621, + "grad_norm": 3.075648069381714, + "learning_rate": 2.6371796426432038e-06, + "loss": 0.0443, + "step": 28278 + }, + { + "epoch": 77.05449591280654, + "grad_norm": 2.9790425300598145, + "learning_rate": 2.6365825094473387e-06, + "loss": 0.1049, + "step": 28279 + }, + { + "epoch": 77.05722070844686, + "grad_norm": 1.9135756492614746, + "learning_rate": 2.635985433597531e-06, + "loss": 0.0471, + "step": 28280 + }, + { + "epoch": 77.0599455040872, + "grad_norm": 1.6832255125045776, + "learning_rate": 2.6353884150984322e-06, + "loss": 0.0177, + "step": 28281 + }, + { + "epoch": 77.06267029972751, + "grad_norm": 2.3960390090942383, + "learning_rate": 2.6347914539546883e-06, + "loss": 0.0945, + "step": 28282 + }, + { + "epoch": 77.06539509536785, + "grad_norm": 2.7573649883270264, + "learning_rate": 2.634194550170954e-06, + "loss": 0.0348, + "step": 28283 + }, + { + "epoch": 77.06811989100818, + "grad_norm": 2.5236833095550537, + "learning_rate": 2.6335977037518767e-06, + "loss": 0.0521, + "step": 28284 + }, + { + "epoch": 77.0708446866485, + "grad_norm": 2.3994863033294678, + "learning_rate": 2.633000914702103e-06, + "loss": 0.0568, + "step": 28285 + }, + { + "epoch": 77.07356948228883, + "grad_norm": 3.348933696746826, + "learning_rate": 2.632404183026277e-06, + "loss": 0.0605, + "step": 28286 + }, + { + "epoch": 77.07629427792915, + "grad_norm": 2.594438314437866, + "learning_rate": 2.631807508729054e-06, + "loss": 0.0686, + "step": 28287 + }, + { + "epoch": 77.07901907356948, + "grad_norm": 2.689310073852539, + "learning_rate": 2.631210891815077e-06, + "loss": 0.1564, + "step": 28288 + }, + { + "epoch": 77.0817438692098, + "grad_norm": 2.0371029376983643, + "learning_rate": 2.63061433228899e-06, + "loss": 0.029, + "step": 28289 + }, + { + "epoch": 77.08446866485014, + "grad_norm": 2.612265110015869, + "learning_rate": 2.6300178301554436e-06, + "loss": 0.029, + "step": 28290 + }, + { + "epoch": 77.08719346049047, + "grad_norm": 2.674476385116577, + "learning_rate": 2.6294213854190807e-06, + "loss": 0.0578, + "step": 28291 + }, + { + "epoch": 77.08991825613079, + "grad_norm": 2.713242292404175, + "learning_rate": 2.628824998084547e-06, + "loss": 0.057, + "step": 28292 + }, + { + "epoch": 77.09264305177112, + "grad_norm": 2.3643999099731445, + "learning_rate": 2.628228668156485e-06, + "loss": 0.0653, + "step": 28293 + }, + { + "epoch": 77.09536784741144, + "grad_norm": 2.3944807052612305, + "learning_rate": 2.6276323956395433e-06, + "loss": 0.0291, + "step": 28294 + }, + { + "epoch": 77.09809264305177, + "grad_norm": 1.9519646167755127, + "learning_rate": 2.6270361805383593e-06, + "loss": 0.0367, + "step": 28295 + }, + { + "epoch": 77.1008174386921, + "grad_norm": 2.5369083881378174, + "learning_rate": 2.626440022857585e-06, + "loss": 0.1256, + "step": 28296 + }, + { + "epoch": 77.10354223433242, + "grad_norm": 2.037079095840454, + "learning_rate": 2.6258439226018574e-06, + "loss": 0.0463, + "step": 28297 + }, + { + "epoch": 77.10626702997276, + "grad_norm": 3.5799801349639893, + "learning_rate": 2.625247879775816e-06, + "loss": 0.0837, + "step": 28298 + }, + { + "epoch": 77.10899182561307, + "grad_norm": 2.167036533355713, + "learning_rate": 2.6246518943841115e-06, + "loss": 0.0272, + "step": 28299 + }, + { + "epoch": 77.11171662125341, + "grad_norm": 1.9913524389266968, + "learning_rate": 2.6240559664313805e-06, + "loss": 0.1283, + "step": 28300 + }, + { + "epoch": 77.11444141689373, + "grad_norm": 3.5613033771514893, + "learning_rate": 2.623460095922263e-06, + "loss": 0.0795, + "step": 28301 + }, + { + "epoch": 77.11716621253406, + "grad_norm": 2.2153353691101074, + "learning_rate": 2.622864282861399e-06, + "loss": 0.0369, + "step": 28302 + }, + { + "epoch": 77.11989100817439, + "grad_norm": 6.166149616241455, + "learning_rate": 2.6222685272534333e-06, + "loss": 0.0724, + "step": 28303 + }, + { + "epoch": 77.12261580381471, + "grad_norm": 2.6389477252960205, + "learning_rate": 2.6216728291030024e-06, + "loss": 0.2047, + "step": 28304 + }, + { + "epoch": 77.12534059945504, + "grad_norm": 1.5879967212677002, + "learning_rate": 2.6210771884147468e-06, + "loss": 0.0274, + "step": 28305 + }, + { + "epoch": 77.12806539509536, + "grad_norm": 2.509934902191162, + "learning_rate": 2.620481605193301e-06, + "loss": 0.0383, + "step": 28306 + }, + { + "epoch": 77.1307901907357, + "grad_norm": 3.834446907043457, + "learning_rate": 2.61988607944331e-06, + "loss": 0.1499, + "step": 28307 + }, + { + "epoch": 77.13351498637603, + "grad_norm": 1.7610657215118408, + "learning_rate": 2.6192906111694095e-06, + "loss": 0.0284, + "step": 28308 + }, + { + "epoch": 77.13623978201635, + "grad_norm": 2.327150583267212, + "learning_rate": 2.6186952003762355e-06, + "loss": 0.0209, + "step": 28309 + }, + { + "epoch": 77.13896457765668, + "grad_norm": 3.574877977371216, + "learning_rate": 2.618099847068423e-06, + "loss": 0.0795, + "step": 28310 + }, + { + "epoch": 77.141689373297, + "grad_norm": 2.3875651359558105, + "learning_rate": 2.6175045512506138e-06, + "loss": 0.0315, + "step": 28311 + }, + { + "epoch": 77.14441416893733, + "grad_norm": 2.992039203643799, + "learning_rate": 2.6169093129274416e-06, + "loss": 0.0344, + "step": 28312 + }, + { + "epoch": 77.14713896457765, + "grad_norm": 3.4359548091888428, + "learning_rate": 2.616314132103539e-06, + "loss": 0.0569, + "step": 28313 + }, + { + "epoch": 77.14986376021798, + "grad_norm": 2.833533763885498, + "learning_rate": 2.6157190087835437e-06, + "loss": 0.0392, + "step": 28314 + }, + { + "epoch": 77.15258855585832, + "grad_norm": 2.8054587841033936, + "learning_rate": 2.6151239429720952e-06, + "loss": 0.0392, + "step": 28315 + }, + { + "epoch": 77.15531335149863, + "grad_norm": 2.4326376914978027, + "learning_rate": 2.6145289346738234e-06, + "loss": 0.057, + "step": 28316 + }, + { + "epoch": 77.15803814713897, + "grad_norm": 3.105372667312622, + "learning_rate": 2.613933983893363e-06, + "loss": 0.0458, + "step": 28317 + }, + { + "epoch": 77.16076294277929, + "grad_norm": 3.383669853210449, + "learning_rate": 2.613339090635343e-06, + "loss": 0.0524, + "step": 28318 + }, + { + "epoch": 77.16348773841962, + "grad_norm": 3.113739252090454, + "learning_rate": 2.612744254904405e-06, + "loss": 0.1057, + "step": 28319 + }, + { + "epoch": 77.16621253405995, + "grad_norm": 2.453718423843384, + "learning_rate": 2.612149476705176e-06, + "loss": 0.0477, + "step": 28320 + }, + { + "epoch": 77.16893732970027, + "grad_norm": 2.184514284133911, + "learning_rate": 2.6115547560422884e-06, + "loss": 0.0405, + "step": 28321 + }, + { + "epoch": 77.1716621253406, + "grad_norm": 3.3941001892089844, + "learning_rate": 2.6109600929203726e-06, + "loss": 0.0401, + "step": 28322 + }, + { + "epoch": 77.17438692098092, + "grad_norm": 2.4680778980255127, + "learning_rate": 2.6103654873440642e-06, + "loss": 0.124, + "step": 28323 + }, + { + "epoch": 77.17711171662125, + "grad_norm": 3.5254034996032715, + "learning_rate": 2.6097709393179915e-06, + "loss": 0.1141, + "step": 28324 + }, + { + "epoch": 77.17983651226157, + "grad_norm": 1.8669538497924805, + "learning_rate": 2.6091764488467852e-06, + "loss": 0.0264, + "step": 28325 + }, + { + "epoch": 77.1825613079019, + "grad_norm": 2.805007219314575, + "learning_rate": 2.608582015935072e-06, + "loss": 0.0604, + "step": 28326 + }, + { + "epoch": 77.18528610354224, + "grad_norm": 2.943263053894043, + "learning_rate": 2.607987640587487e-06, + "loss": 0.0502, + "step": 28327 + }, + { + "epoch": 77.18801089918256, + "grad_norm": 1.7465529441833496, + "learning_rate": 2.6073933228086568e-06, + "loss": 0.0792, + "step": 28328 + }, + { + "epoch": 77.19073569482289, + "grad_norm": 2.9444684982299805, + "learning_rate": 2.606799062603208e-06, + "loss": 0.0529, + "step": 28329 + }, + { + "epoch": 77.19346049046321, + "grad_norm": 3.38279128074646, + "learning_rate": 2.6062048599757685e-06, + "loss": 0.0979, + "step": 28330 + }, + { + "epoch": 77.19618528610354, + "grad_norm": 2.9587132930755615, + "learning_rate": 2.6056107149309673e-06, + "loss": 0.0893, + "step": 28331 + }, + { + "epoch": 77.19891008174388, + "grad_norm": 2.821481466293335, + "learning_rate": 2.6050166274734346e-06, + "loss": 0.1403, + "step": 28332 + }, + { + "epoch": 77.2016348773842, + "grad_norm": 2.5020580291748047, + "learning_rate": 2.6044225976077954e-06, + "loss": 0.0394, + "step": 28333 + }, + { + "epoch": 77.20435967302453, + "grad_norm": 2.6696362495422363, + "learning_rate": 2.6038286253386704e-06, + "loss": 0.0489, + "step": 28334 + }, + { + "epoch": 77.20708446866485, + "grad_norm": 3.003931760787964, + "learning_rate": 2.6032347106706945e-06, + "loss": 0.0685, + "step": 28335 + }, + { + "epoch": 77.20980926430518, + "grad_norm": 2.7271816730499268, + "learning_rate": 2.602640853608488e-06, + "loss": 0.0413, + "step": 28336 + }, + { + "epoch": 77.2125340599455, + "grad_norm": 2.33297061920166, + "learning_rate": 2.6020470541566757e-06, + "loss": 0.127, + "step": 28337 + }, + { + "epoch": 77.21525885558583, + "grad_norm": 2.468869924545288, + "learning_rate": 2.6014533123198803e-06, + "loss": 0.0863, + "step": 28338 + }, + { + "epoch": 77.21798365122616, + "grad_norm": 2.542198896408081, + "learning_rate": 2.600859628102732e-06, + "loss": 0.0531, + "step": 28339 + }, + { + "epoch": 77.22070844686648, + "grad_norm": 4.324550628662109, + "learning_rate": 2.60026600150985e-06, + "loss": 0.0866, + "step": 28340 + }, + { + "epoch": 77.22343324250681, + "grad_norm": 2.388823986053467, + "learning_rate": 2.5996724325458588e-06, + "loss": 0.0703, + "step": 28341 + }, + { + "epoch": 77.22615803814713, + "grad_norm": 2.9211771488189697, + "learning_rate": 2.599078921215378e-06, + "loss": 0.0849, + "step": 28342 + }, + { + "epoch": 77.22888283378747, + "grad_norm": 3.4782581329345703, + "learning_rate": 2.598485467523034e-06, + "loss": 0.1114, + "step": 28343 + }, + { + "epoch": 77.2316076294278, + "grad_norm": 2.142575263977051, + "learning_rate": 2.597892071473448e-06, + "loss": 0.0821, + "step": 28344 + }, + { + "epoch": 77.23433242506812, + "grad_norm": 2.9981675148010254, + "learning_rate": 2.5972987330712398e-06, + "loss": 0.0402, + "step": 28345 + }, + { + "epoch": 77.23705722070845, + "grad_norm": 2.780332565307617, + "learning_rate": 2.596705452321028e-06, + "loss": 0.0741, + "step": 28346 + }, + { + "epoch": 77.23978201634877, + "grad_norm": 2.5900814533233643, + "learning_rate": 2.5961122292274353e-06, + "loss": 0.0463, + "step": 28347 + }, + { + "epoch": 77.2425068119891, + "grad_norm": 3.1700220108032227, + "learning_rate": 2.5955190637950855e-06, + "loss": 0.0936, + "step": 28348 + }, + { + "epoch": 77.24523160762942, + "grad_norm": 3.501685619354248, + "learning_rate": 2.5949259560285955e-06, + "loss": 0.1122, + "step": 28349 + }, + { + "epoch": 77.24795640326975, + "grad_norm": 2.62182354927063, + "learning_rate": 2.594332905932584e-06, + "loss": 0.1405, + "step": 28350 + }, + { + "epoch": 77.25068119891009, + "grad_norm": 3.6526505947113037, + "learning_rate": 2.593739913511666e-06, + "loss": 0.0448, + "step": 28351 + }, + { + "epoch": 77.2534059945504, + "grad_norm": 1.768544316291809, + "learning_rate": 2.5931469787704656e-06, + "loss": 0.0274, + "step": 28352 + }, + { + "epoch": 77.25613079019074, + "grad_norm": 2.2839407920837402, + "learning_rate": 2.5925541017135992e-06, + "loss": 0.0411, + "step": 28353 + }, + { + "epoch": 77.25885558583106, + "grad_norm": 2.1834545135498047, + "learning_rate": 2.5919612823456795e-06, + "loss": 0.0223, + "step": 28354 + }, + { + "epoch": 77.26158038147139, + "grad_norm": 2.4900600910186768, + "learning_rate": 2.59136852067133e-06, + "loss": 0.1543, + "step": 28355 + }, + { + "epoch": 77.26430517711172, + "grad_norm": 1.9542450904846191, + "learning_rate": 2.5907758166951635e-06, + "loss": 0.026, + "step": 28356 + }, + { + "epoch": 77.26702997275204, + "grad_norm": 2.0919249057769775, + "learning_rate": 2.5901831704217973e-06, + "loss": 0.0234, + "step": 28357 + }, + { + "epoch": 77.26975476839237, + "grad_norm": 3.337462902069092, + "learning_rate": 2.589590581855843e-06, + "loss": 0.1082, + "step": 28358 + }, + { + "epoch": 77.2724795640327, + "grad_norm": 2.0865652561187744, + "learning_rate": 2.588998051001921e-06, + "loss": 0.0257, + "step": 28359 + }, + { + "epoch": 77.27520435967303, + "grad_norm": 2.4404172897338867, + "learning_rate": 2.5884055778646443e-06, + "loss": 0.1117, + "step": 28360 + }, + { + "epoch": 77.27792915531334, + "grad_norm": 2.837879180908203, + "learning_rate": 2.5878131624486256e-06, + "loss": 0.0444, + "step": 28361 + }, + { + "epoch": 77.28065395095368, + "grad_norm": 2.6554408073425293, + "learning_rate": 2.587220804758478e-06, + "loss": 0.0308, + "step": 28362 + }, + { + "epoch": 77.28337874659401, + "grad_norm": 2.34537935256958, + "learning_rate": 2.586628504798818e-06, + "loss": 0.0512, + "step": 28363 + }, + { + "epoch": 77.28610354223433, + "grad_norm": 3.424349546432495, + "learning_rate": 2.586036262574254e-06, + "loss": 0.0612, + "step": 28364 + }, + { + "epoch": 77.28882833787466, + "grad_norm": 3.2750487327575684, + "learning_rate": 2.585444078089404e-06, + "loss": 0.1182, + "step": 28365 + }, + { + "epoch": 77.29155313351498, + "grad_norm": 4.671356678009033, + "learning_rate": 2.5848519513488767e-06, + "loss": 0.1176, + "step": 28366 + }, + { + "epoch": 77.29427792915531, + "grad_norm": 1.9492790699005127, + "learning_rate": 2.5842598823572805e-06, + "loss": 0.1477, + "step": 28367 + }, + { + "epoch": 77.29700272479565, + "grad_norm": 2.4482572078704834, + "learning_rate": 2.583667871119233e-06, + "loss": 0.0818, + "step": 28368 + }, + { + "epoch": 77.29972752043597, + "grad_norm": 2.9148521423339844, + "learning_rate": 2.583075917639342e-06, + "loss": 0.091, + "step": 28369 + }, + { + "epoch": 77.3024523160763, + "grad_norm": 2.2485458850860596, + "learning_rate": 2.582484021922216e-06, + "loss": 0.0435, + "step": 28370 + }, + { + "epoch": 77.30517711171662, + "grad_norm": 2.246720790863037, + "learning_rate": 2.581892183972463e-06, + "loss": 0.0347, + "step": 28371 + }, + { + "epoch": 77.30790190735695, + "grad_norm": 2.415050506591797, + "learning_rate": 2.5813004037946986e-06, + "loss": 0.0427, + "step": 28372 + }, + { + "epoch": 77.31062670299727, + "grad_norm": 2.1264264583587646, + "learning_rate": 2.5807086813935266e-06, + "loss": 0.0243, + "step": 28373 + }, + { + "epoch": 77.3133514986376, + "grad_norm": 2.6624844074249268, + "learning_rate": 2.580117016773558e-06, + "loss": 0.0432, + "step": 28374 + }, + { + "epoch": 77.31607629427793, + "grad_norm": 3.3343701362609863, + "learning_rate": 2.5795254099393953e-06, + "loss": 0.2262, + "step": 28375 + }, + { + "epoch": 77.31880108991825, + "grad_norm": 3.9192686080932617, + "learning_rate": 2.5789338608956526e-06, + "loss": 0.0735, + "step": 28376 + }, + { + "epoch": 77.32152588555859, + "grad_norm": 2.675515651702881, + "learning_rate": 2.5783423696469356e-06, + "loss": 0.0828, + "step": 28377 + }, + { + "epoch": 77.3242506811989, + "grad_norm": 2.6446645259857178, + "learning_rate": 2.577750936197845e-06, + "loss": 0.0365, + "step": 28378 + }, + { + "epoch": 77.32697547683924, + "grad_norm": 2.8183844089508057, + "learning_rate": 2.577159560552995e-06, + "loss": 0.1491, + "step": 28379 + }, + { + "epoch": 77.32970027247957, + "grad_norm": 2.186535596847534, + "learning_rate": 2.576568242716987e-06, + "loss": 0.1011, + "step": 28380 + }, + { + "epoch": 77.33242506811989, + "grad_norm": 1.7282354831695557, + "learning_rate": 2.5759769826944236e-06, + "loss": 0.0212, + "step": 28381 + }, + { + "epoch": 77.33514986376022, + "grad_norm": 2.604694128036499, + "learning_rate": 2.5753857804899163e-06, + "loss": 0.0619, + "step": 28382 + }, + { + "epoch": 77.33787465940054, + "grad_norm": 2.528526544570923, + "learning_rate": 2.574794636108061e-06, + "loss": 0.0391, + "step": 28383 + }, + { + "epoch": 77.34059945504087, + "grad_norm": 2.8281095027923584, + "learning_rate": 2.574203549553471e-06, + "loss": 0.1655, + "step": 28384 + }, + { + "epoch": 77.34332425068119, + "grad_norm": 2.5194592475891113, + "learning_rate": 2.573612520830744e-06, + "loss": 0.0715, + "step": 28385 + }, + { + "epoch": 77.34604904632153, + "grad_norm": 2.8153131008148193, + "learning_rate": 2.573021549944483e-06, + "loss": 0.0998, + "step": 28386 + }, + { + "epoch": 77.34877384196186, + "grad_norm": 2.246671438217163, + "learning_rate": 2.5724306368992893e-06, + "loss": 0.0366, + "step": 28387 + }, + { + "epoch": 77.35149863760218, + "grad_norm": 2.389148473739624, + "learning_rate": 2.5718397816997685e-06, + "loss": 0.0414, + "step": 28388 + }, + { + "epoch": 77.35422343324251, + "grad_norm": 3.353811740875244, + "learning_rate": 2.5712489843505207e-06, + "loss": 0.0623, + "step": 28389 + }, + { + "epoch": 77.35694822888283, + "grad_norm": 1.9880976676940918, + "learning_rate": 2.570658244856147e-06, + "loss": 0.0815, + "step": 28390 + }, + { + "epoch": 77.35967302452316, + "grad_norm": 2.823745012283325, + "learning_rate": 2.5700675632212445e-06, + "loss": 0.044, + "step": 28391 + }, + { + "epoch": 77.3623978201635, + "grad_norm": 2.4052863121032715, + "learning_rate": 2.5694769394504204e-06, + "loss": 0.0336, + "step": 28392 + }, + { + "epoch": 77.36512261580381, + "grad_norm": 1.7629444599151611, + "learning_rate": 2.5688863735482706e-06, + "loss": 0.0214, + "step": 28393 + }, + { + "epoch": 77.36784741144415, + "grad_norm": 2.4777607917785645, + "learning_rate": 2.5682958655193936e-06, + "loss": 0.0639, + "step": 28394 + }, + { + "epoch": 77.37057220708446, + "grad_norm": 2.55159854888916, + "learning_rate": 2.5677054153683868e-06, + "loss": 0.0357, + "step": 28395 + }, + { + "epoch": 77.3732970027248, + "grad_norm": 1.5858360528945923, + "learning_rate": 2.567115023099854e-06, + "loss": 0.0222, + "step": 28396 + }, + { + "epoch": 77.37602179836512, + "grad_norm": 2.7543575763702393, + "learning_rate": 2.5665246887183903e-06, + "loss": 0.0491, + "step": 28397 + }, + { + "epoch": 77.37874659400545, + "grad_norm": 2.8959872722625732, + "learning_rate": 2.5659344122285902e-06, + "loss": 0.0356, + "step": 28398 + }, + { + "epoch": 77.38147138964578, + "grad_norm": 3.3684165477752686, + "learning_rate": 2.565344193635053e-06, + "loss": 0.0575, + "step": 28399 + }, + { + "epoch": 77.3841961852861, + "grad_norm": 2.763245105743408, + "learning_rate": 2.56475403294238e-06, + "loss": 0.0911, + "step": 28400 + }, + { + "epoch": 77.38692098092643, + "grad_norm": 3.3602499961853027, + "learning_rate": 2.5641639301551622e-06, + "loss": 0.0258, + "step": 28401 + }, + { + "epoch": 77.38964577656675, + "grad_norm": 2.2327897548675537, + "learning_rate": 2.563573885277998e-06, + "loss": 0.0354, + "step": 28402 + }, + { + "epoch": 77.39237057220708, + "grad_norm": 3.208909034729004, + "learning_rate": 2.5629838983154763e-06, + "loss": 0.0729, + "step": 28403 + }, + { + "epoch": 77.39509536784742, + "grad_norm": 3.959651231765747, + "learning_rate": 2.5623939692722e-06, + "loss": 0.0508, + "step": 28404 + }, + { + "epoch": 77.39782016348774, + "grad_norm": 3.821998357772827, + "learning_rate": 2.5618040981527603e-06, + "loss": 0.055, + "step": 28405 + }, + { + "epoch": 77.40054495912807, + "grad_norm": 3.2189230918884277, + "learning_rate": 2.5612142849617516e-06, + "loss": 0.2097, + "step": 28406 + }, + { + "epoch": 77.40326975476839, + "grad_norm": 2.05731201171875, + "learning_rate": 2.5606245297037624e-06, + "loss": 0.0259, + "step": 28407 + }, + { + "epoch": 77.40599455040872, + "grad_norm": 3.0733771324157715, + "learning_rate": 2.5600348323833936e-06, + "loss": 0.1019, + "step": 28408 + }, + { + "epoch": 77.40871934604904, + "grad_norm": 1.7058881521224976, + "learning_rate": 2.5594451930052346e-06, + "loss": 0.1188, + "step": 28409 + }, + { + "epoch": 77.41144414168937, + "grad_norm": 3.7195069789886475, + "learning_rate": 2.558855611573876e-06, + "loss": 0.0881, + "step": 28410 + }, + { + "epoch": 77.4141689373297, + "grad_norm": 2.2621467113494873, + "learning_rate": 2.558266088093907e-06, + "loss": 0.0548, + "step": 28411 + }, + { + "epoch": 77.41689373297002, + "grad_norm": 2.409527540206909, + "learning_rate": 2.5576766225699267e-06, + "loss": 0.0314, + "step": 28412 + }, + { + "epoch": 77.41961852861036, + "grad_norm": 2.0626375675201416, + "learning_rate": 2.557087215006521e-06, + "loss": 0.035, + "step": 28413 + }, + { + "epoch": 77.42234332425068, + "grad_norm": 3.906682252883911, + "learning_rate": 2.5564978654082794e-06, + "loss": 0.0733, + "step": 28414 + }, + { + "epoch": 77.42506811989101, + "grad_norm": 2.634202718734741, + "learning_rate": 2.5559085737797904e-06, + "loss": 0.0646, + "step": 28415 + }, + { + "epoch": 77.42779291553134, + "grad_norm": 2.1719534397125244, + "learning_rate": 2.555319340125646e-06, + "loss": 0.0753, + "step": 28416 + }, + { + "epoch": 77.43051771117166, + "grad_norm": 2.6878604888916016, + "learning_rate": 2.5547301644504386e-06, + "loss": 0.082, + "step": 28417 + }, + { + "epoch": 77.433242506812, + "grad_norm": 4.437887668609619, + "learning_rate": 2.5541410467587512e-06, + "loss": 0.0317, + "step": 28418 + }, + { + "epoch": 77.43596730245231, + "grad_norm": 2.2146847248077393, + "learning_rate": 2.5535519870551728e-06, + "loss": 0.0438, + "step": 28419 + }, + { + "epoch": 77.43869209809264, + "grad_norm": 5.827820301055908, + "learning_rate": 2.5529629853442937e-06, + "loss": 0.1261, + "step": 28420 + }, + { + "epoch": 77.44141689373296, + "grad_norm": 3.3244845867156982, + "learning_rate": 2.5523740416306995e-06, + "loss": 0.0577, + "step": 28421 + }, + { + "epoch": 77.4441416893733, + "grad_norm": 3.4202892780303955, + "learning_rate": 2.5517851559189764e-06, + "loss": 0.0662, + "step": 28422 + }, + { + "epoch": 77.44686648501363, + "grad_norm": 3.468672275543213, + "learning_rate": 2.5511963282137077e-06, + "loss": 0.0556, + "step": 28423 + }, + { + "epoch": 77.44959128065395, + "grad_norm": 2.372209072113037, + "learning_rate": 2.5506075585194856e-06, + "loss": 0.0378, + "step": 28424 + }, + { + "epoch": 77.45231607629428, + "grad_norm": 3.1423909664154053, + "learning_rate": 2.5500188468408917e-06, + "loss": 0.0616, + "step": 28425 + }, + { + "epoch": 77.4550408719346, + "grad_norm": 2.312046766281128, + "learning_rate": 2.5494301931825117e-06, + "loss": 0.0883, + "step": 28426 + }, + { + "epoch": 77.45776566757493, + "grad_norm": 2.011847496032715, + "learning_rate": 2.5488415975489266e-06, + "loss": 0.0862, + "step": 28427 + }, + { + "epoch": 77.46049046321527, + "grad_norm": 2.175135850906372, + "learning_rate": 2.5482530599447254e-06, + "loss": 0.0264, + "step": 28428 + }, + { + "epoch": 77.46321525885558, + "grad_norm": 3.052598714828491, + "learning_rate": 2.5476645803744902e-06, + "loss": 0.0904, + "step": 28429 + }, + { + "epoch": 77.46594005449592, + "grad_norm": 2.514087677001953, + "learning_rate": 2.547076158842804e-06, + "loss": 0.037, + "step": 28430 + }, + { + "epoch": 77.46866485013624, + "grad_norm": 3.4340426921844482, + "learning_rate": 2.5464877953542457e-06, + "loss": 0.0733, + "step": 28431 + }, + { + "epoch": 77.47138964577657, + "grad_norm": 2.293118476867676, + "learning_rate": 2.5458994899134024e-06, + "loss": 0.0403, + "step": 28432 + }, + { + "epoch": 77.47411444141689, + "grad_norm": 2.7532589435577393, + "learning_rate": 2.5453112425248516e-06, + "loss": 0.0716, + "step": 28433 + }, + { + "epoch": 77.47683923705722, + "grad_norm": 4.328482627868652, + "learning_rate": 2.54472305319318e-06, + "loss": 0.0523, + "step": 28434 + }, + { + "epoch": 77.47956403269755, + "grad_norm": 3.9203343391418457, + "learning_rate": 2.544134921922965e-06, + "loss": 0.0409, + "step": 28435 + }, + { + "epoch": 77.48228882833787, + "grad_norm": 2.15958571434021, + "learning_rate": 2.543546848718784e-06, + "loss": 0.0343, + "step": 28436 + }, + { + "epoch": 77.4850136239782, + "grad_norm": 2.3497140407562256, + "learning_rate": 2.542958833585224e-06, + "loss": 0.0417, + "step": 28437 + }, + { + "epoch": 77.48773841961852, + "grad_norm": 2.4433770179748535, + "learning_rate": 2.5423708765268607e-06, + "loss": 0.1215, + "step": 28438 + }, + { + "epoch": 77.49046321525886, + "grad_norm": 4.357604503631592, + "learning_rate": 2.541782977548273e-06, + "loss": 0.2337, + "step": 28439 + }, + { + "epoch": 77.49318801089919, + "grad_norm": 2.417895555496216, + "learning_rate": 2.5411951366540357e-06, + "loss": 0.0518, + "step": 28440 + }, + { + "epoch": 77.49591280653951, + "grad_norm": 2.396540403366089, + "learning_rate": 2.540607353848733e-06, + "loss": 0.0302, + "step": 28441 + }, + { + "epoch": 77.49863760217984, + "grad_norm": 5.14478874206543, + "learning_rate": 2.5400196291369417e-06, + "loss": 0.1045, + "step": 28442 + }, + { + "epoch": 77.50136239782016, + "grad_norm": 3.3471691608428955, + "learning_rate": 2.5394319625232333e-06, + "loss": 0.0754, + "step": 28443 + }, + { + "epoch": 77.50408719346049, + "grad_norm": 2.0748744010925293, + "learning_rate": 2.538844354012192e-06, + "loss": 0.056, + "step": 28444 + }, + { + "epoch": 77.50681198910081, + "grad_norm": 2.3002915382385254, + "learning_rate": 2.538256803608391e-06, + "loss": 0.1092, + "step": 28445 + }, + { + "epoch": 77.50953678474114, + "grad_norm": 2.032125234603882, + "learning_rate": 2.5376693113164062e-06, + "loss": 0.0223, + "step": 28446 + }, + { + "epoch": 77.51226158038148, + "grad_norm": 2.5156798362731934, + "learning_rate": 2.537081877140809e-06, + "loss": 0.0757, + "step": 28447 + }, + { + "epoch": 77.5149863760218, + "grad_norm": 2.4647250175476074, + "learning_rate": 2.536494501086181e-06, + "loss": 0.0571, + "step": 28448 + }, + { + "epoch": 77.51771117166213, + "grad_norm": 3.689142942428589, + "learning_rate": 2.5359071831570937e-06, + "loss": 0.1352, + "step": 28449 + }, + { + "epoch": 77.52043596730245, + "grad_norm": 2.561048984527588, + "learning_rate": 2.5353199233581184e-06, + "loss": 0.0277, + "step": 28450 + }, + { + "epoch": 77.52316076294278, + "grad_norm": 2.206209897994995, + "learning_rate": 2.534732721693833e-06, + "loss": 0.0263, + "step": 28451 + }, + { + "epoch": 77.52588555858311, + "grad_norm": 2.5610644817352295, + "learning_rate": 2.5341455781688073e-06, + "loss": 0.0652, + "step": 28452 + }, + { + "epoch": 77.52861035422343, + "grad_norm": 2.32920241355896, + "learning_rate": 2.5335584927876178e-06, + "loss": 0.101, + "step": 28453 + }, + { + "epoch": 77.53133514986376, + "grad_norm": 2.0175223350524902, + "learning_rate": 2.5329714655548352e-06, + "loss": 0.0839, + "step": 28454 + }, + { + "epoch": 77.53405994550408, + "grad_norm": 4.562267303466797, + "learning_rate": 2.53238449647503e-06, + "loss": 0.1799, + "step": 28455 + }, + { + "epoch": 77.53678474114442, + "grad_norm": 2.625113010406494, + "learning_rate": 2.531797585552771e-06, + "loss": 0.1283, + "step": 28456 + }, + { + "epoch": 77.53950953678473, + "grad_norm": 2.9678537845611572, + "learning_rate": 2.5312107327926348e-06, + "loss": 0.0218, + "step": 28457 + }, + { + "epoch": 77.54223433242507, + "grad_norm": 1.9777448177337646, + "learning_rate": 2.5306239381991893e-06, + "loss": 0.0483, + "step": 28458 + }, + { + "epoch": 77.5449591280654, + "grad_norm": 2.6387410163879395, + "learning_rate": 2.5300372017770046e-06, + "loss": 0.0432, + "step": 28459 + }, + { + "epoch": 77.54768392370572, + "grad_norm": 2.3963844776153564, + "learning_rate": 2.5294505235306465e-06, + "loss": 0.1325, + "step": 28460 + }, + { + "epoch": 77.55040871934605, + "grad_norm": 3.0688164234161377, + "learning_rate": 2.52886390346469e-06, + "loss": 0.085, + "step": 28461 + }, + { + "epoch": 77.55313351498637, + "grad_norm": 1.909074306488037, + "learning_rate": 2.5282773415837013e-06, + "loss": 0.0277, + "step": 28462 + }, + { + "epoch": 77.5558583106267, + "grad_norm": 2.116577625274658, + "learning_rate": 2.527690837892245e-06, + "loss": 0.0285, + "step": 28463 + }, + { + "epoch": 77.55858310626704, + "grad_norm": 3.282200336456299, + "learning_rate": 2.5271043923948946e-06, + "loss": 0.0984, + "step": 28464 + }, + { + "epoch": 77.56130790190736, + "grad_norm": 4.2497711181640625, + "learning_rate": 2.5265180050962147e-06, + "loss": 0.0449, + "step": 28465 + }, + { + "epoch": 77.56403269754769, + "grad_norm": 3.986081838607788, + "learning_rate": 2.5259316760007724e-06, + "loss": 0.0499, + "step": 28466 + }, + { + "epoch": 77.566757493188, + "grad_norm": 2.5657618045806885, + "learning_rate": 2.525345405113131e-06, + "loss": 0.0757, + "step": 28467 + }, + { + "epoch": 77.56948228882834, + "grad_norm": 6.001152038574219, + "learning_rate": 2.5247591924378577e-06, + "loss": 0.0677, + "step": 28468 + }, + { + "epoch": 77.57220708446866, + "grad_norm": 2.1566176414489746, + "learning_rate": 2.5241730379795235e-06, + "loss": 0.0281, + "step": 28469 + }, + { + "epoch": 77.57493188010899, + "grad_norm": 3.7497494220733643, + "learning_rate": 2.5235869417426885e-06, + "loss": 0.1297, + "step": 28470 + }, + { + "epoch": 77.57765667574932, + "grad_norm": 4.071877956390381, + "learning_rate": 2.523000903731918e-06, + "loss": 0.0648, + "step": 28471 + }, + { + "epoch": 77.58038147138964, + "grad_norm": 2.499847888946533, + "learning_rate": 2.522414923951774e-06, + "loss": 0.1004, + "step": 28472 + }, + { + "epoch": 77.58310626702998, + "grad_norm": 4.971376419067383, + "learning_rate": 2.5218290024068224e-06, + "loss": 0.0852, + "step": 28473 + }, + { + "epoch": 77.5858310626703, + "grad_norm": 3.4536664485931396, + "learning_rate": 2.521243139101628e-06, + "loss": 0.0426, + "step": 28474 + }, + { + "epoch": 77.58855585831063, + "grad_norm": 2.9197516441345215, + "learning_rate": 2.52065733404075e-06, + "loss": 0.0365, + "step": 28475 + }, + { + "epoch": 77.59128065395096, + "grad_norm": 2.83383846282959, + "learning_rate": 2.5200715872287495e-06, + "loss": 0.0608, + "step": 28476 + }, + { + "epoch": 77.59400544959128, + "grad_norm": 2.68898606300354, + "learning_rate": 2.5194858986701933e-06, + "loss": 0.0448, + "step": 28477 + }, + { + "epoch": 77.59673024523161, + "grad_norm": 2.6219491958618164, + "learning_rate": 2.5189002683696408e-06, + "loss": 0.0353, + "step": 28478 + }, + { + "epoch": 77.59945504087193, + "grad_norm": 2.5507733821868896, + "learning_rate": 2.518314696331652e-06, + "loss": 0.0954, + "step": 28479 + }, + { + "epoch": 77.60217983651226, + "grad_norm": 2.0204384326934814, + "learning_rate": 2.5177291825607843e-06, + "loss": 0.0526, + "step": 28480 + }, + { + "epoch": 77.60490463215258, + "grad_norm": 2.4395458698272705, + "learning_rate": 2.5171437270616038e-06, + "loss": 0.0817, + "step": 28481 + }, + { + "epoch": 77.60762942779292, + "grad_norm": 2.6209070682525635, + "learning_rate": 2.5165583298386673e-06, + "loss": 0.1323, + "step": 28482 + }, + { + "epoch": 77.61035422343325, + "grad_norm": 2.391087055206299, + "learning_rate": 2.5159729908965346e-06, + "loss": 0.222, + "step": 28483 + }, + { + "epoch": 77.61307901907357, + "grad_norm": 3.7429230213165283, + "learning_rate": 2.5153877102397596e-06, + "loss": 0.1582, + "step": 28484 + }, + { + "epoch": 77.6158038147139, + "grad_norm": 2.515198230743408, + "learning_rate": 2.5148024878729037e-06, + "loss": 0.124, + "step": 28485 + }, + { + "epoch": 77.61852861035422, + "grad_norm": 2.550065279006958, + "learning_rate": 2.5142173238005286e-06, + "loss": 0.1448, + "step": 28486 + }, + { + "epoch": 77.62125340599455, + "grad_norm": 2.8454697132110596, + "learning_rate": 2.5136322180271886e-06, + "loss": 0.0258, + "step": 28487 + }, + { + "epoch": 77.62397820163488, + "grad_norm": 3.082376003265381, + "learning_rate": 2.5130471705574367e-06, + "loss": 0.0619, + "step": 28488 + }, + { + "epoch": 77.6267029972752, + "grad_norm": 2.665174961090088, + "learning_rate": 2.512462181395835e-06, + "loss": 0.0304, + "step": 28489 + }, + { + "epoch": 77.62942779291554, + "grad_norm": 2.899925947189331, + "learning_rate": 2.5118772505469367e-06, + "loss": 0.0466, + "step": 28490 + }, + { + "epoch": 77.63215258855585, + "grad_norm": 2.897447347640991, + "learning_rate": 2.5112923780152975e-06, + "loss": 0.0399, + "step": 28491 + }, + { + "epoch": 77.63487738419619, + "grad_norm": 1.9452128410339355, + "learning_rate": 2.5107075638054703e-06, + "loss": 0.0993, + "step": 28492 + }, + { + "epoch": 77.6376021798365, + "grad_norm": 2.642165422439575, + "learning_rate": 2.510122807922013e-06, + "loss": 0.1071, + "step": 28493 + }, + { + "epoch": 77.64032697547684, + "grad_norm": 2.3399901390075684, + "learning_rate": 2.5095381103694794e-06, + "loss": 0.1992, + "step": 28494 + }, + { + "epoch": 77.64305177111717, + "grad_norm": 1.9544345140457153, + "learning_rate": 2.508953471152421e-06, + "loss": 0.0491, + "step": 28495 + }, + { + "epoch": 77.64577656675749, + "grad_norm": 2.452011823654175, + "learning_rate": 2.508368890275389e-06, + "loss": 0.0988, + "step": 28496 + }, + { + "epoch": 77.64850136239782, + "grad_norm": 2.419713258743286, + "learning_rate": 2.5077843677429424e-06, + "loss": 0.0252, + "step": 28497 + }, + { + "epoch": 77.65122615803814, + "grad_norm": 1.995934009552002, + "learning_rate": 2.5071999035596297e-06, + "loss": 0.031, + "step": 28498 + }, + { + "epoch": 77.65395095367847, + "grad_norm": 2.7805862426757812, + "learning_rate": 2.5066154977300027e-06, + "loss": 0.0597, + "step": 28499 + }, + { + "epoch": 77.65667574931881, + "grad_norm": 2.0950520038604736, + "learning_rate": 2.506031150258611e-06, + "loss": 0.0681, + "step": 28500 + }, + { + "epoch": 77.65940054495913, + "grad_norm": 2.8751299381256104, + "learning_rate": 2.5054468611500106e-06, + "loss": 0.1098, + "step": 28501 + }, + { + "epoch": 77.66212534059946, + "grad_norm": 1.9896756410598755, + "learning_rate": 2.5048626304087443e-06, + "loss": 0.051, + "step": 28502 + }, + { + "epoch": 77.66485013623978, + "grad_norm": 2.270315647125244, + "learning_rate": 2.504278458039371e-06, + "loss": 0.0659, + "step": 28503 + }, + { + "epoch": 77.66757493188011, + "grad_norm": 2.663672924041748, + "learning_rate": 2.5036943440464323e-06, + "loss": 0.0409, + "step": 28504 + }, + { + "epoch": 77.67029972752043, + "grad_norm": 2.6846094131469727, + "learning_rate": 2.5031102884344837e-06, + "loss": 0.1217, + "step": 28505 + }, + { + "epoch": 77.67302452316076, + "grad_norm": 2.4924800395965576, + "learning_rate": 2.5025262912080715e-06, + "loss": 0.0799, + "step": 28506 + }, + { + "epoch": 77.6757493188011, + "grad_norm": 3.586364507675171, + "learning_rate": 2.5019423523717425e-06, + "loss": 0.1618, + "step": 28507 + }, + { + "epoch": 77.67847411444141, + "grad_norm": 3.409531354904175, + "learning_rate": 2.5013584719300423e-06, + "loss": 0.1027, + "step": 28508 + }, + { + "epoch": 77.68119891008175, + "grad_norm": 2.3508975505828857, + "learning_rate": 2.500774649887524e-06, + "loss": 0.0678, + "step": 28509 + }, + { + "epoch": 77.68392370572207, + "grad_norm": 2.8088393211364746, + "learning_rate": 2.500190886248731e-06, + "loss": 0.0328, + "step": 28510 + }, + { + "epoch": 77.6866485013624, + "grad_norm": 2.0199978351593018, + "learning_rate": 2.499607181018211e-06, + "loss": 0.0927, + "step": 28511 + }, + { + "epoch": 77.68937329700273, + "grad_norm": 2.5782463550567627, + "learning_rate": 2.4990235342005056e-06, + "loss": 0.0284, + "step": 28512 + }, + { + "epoch": 77.69209809264305, + "grad_norm": 4.917638301849365, + "learning_rate": 2.4984399458001662e-06, + "loss": 0.14, + "step": 28513 + }, + { + "epoch": 77.69482288828338, + "grad_norm": 3.7573370933532715, + "learning_rate": 2.4978564158217344e-06, + "loss": 0.1011, + "step": 28514 + }, + { + "epoch": 77.6975476839237, + "grad_norm": 2.4647064208984375, + "learning_rate": 2.497272944269756e-06, + "loss": 0.0746, + "step": 28515 + }, + { + "epoch": 77.70027247956403, + "grad_norm": 2.724976062774658, + "learning_rate": 2.4966895311487716e-06, + "loss": 0.0434, + "step": 28516 + }, + { + "epoch": 77.70299727520435, + "grad_norm": 1.962424635887146, + "learning_rate": 2.496106176463331e-06, + "loss": 0.1256, + "step": 28517 + }, + { + "epoch": 77.70572207084469, + "grad_norm": 2.76932430267334, + "learning_rate": 2.495522880217973e-06, + "loss": 0.1447, + "step": 28518 + }, + { + "epoch": 77.70844686648502, + "grad_norm": 3.503516674041748, + "learning_rate": 2.494939642417239e-06, + "loss": 0.0959, + "step": 28519 + }, + { + "epoch": 77.71117166212534, + "grad_norm": 3.4417996406555176, + "learning_rate": 2.494356463065676e-06, + "loss": 0.1635, + "step": 28520 + }, + { + "epoch": 77.71389645776567, + "grad_norm": 2.597670316696167, + "learning_rate": 2.493773342167821e-06, + "loss": 0.0391, + "step": 28521 + }, + { + "epoch": 77.71662125340599, + "grad_norm": 2.055619955062866, + "learning_rate": 2.49319027972822e-06, + "loss": 0.03, + "step": 28522 + }, + { + "epoch": 77.71934604904632, + "grad_norm": 2.1465537548065186, + "learning_rate": 2.492607275751412e-06, + "loss": 0.059, + "step": 28523 + }, + { + "epoch": 77.72207084468666, + "grad_norm": 2.7853634357452393, + "learning_rate": 2.4920243302419367e-06, + "loss": 0.1247, + "step": 28524 + }, + { + "epoch": 77.72479564032697, + "grad_norm": 3.553372859954834, + "learning_rate": 2.491441443204331e-06, + "loss": 0.0993, + "step": 28525 + }, + { + "epoch": 77.7275204359673, + "grad_norm": 3.1164045333862305, + "learning_rate": 2.4908586146431413e-06, + "loss": 0.0721, + "step": 28526 + }, + { + "epoch": 77.73024523160763, + "grad_norm": 2.7990827560424805, + "learning_rate": 2.4902758445629027e-06, + "loss": 0.0696, + "step": 28527 + }, + { + "epoch": 77.73297002724796, + "grad_norm": 3.442732810974121, + "learning_rate": 2.4896931329681508e-06, + "loss": 0.079, + "step": 28528 + }, + { + "epoch": 77.73569482288828, + "grad_norm": 2.3545656204223633, + "learning_rate": 2.4891104798634303e-06, + "loss": 0.0855, + "step": 28529 + }, + { + "epoch": 77.73841961852861, + "grad_norm": 2.6045665740966797, + "learning_rate": 2.4885278852532758e-06, + "loss": 0.0456, + "step": 28530 + }, + { + "epoch": 77.74114441416894, + "grad_norm": 2.317164659500122, + "learning_rate": 2.4879453491422236e-06, + "loss": 0.0657, + "step": 28531 + }, + { + "epoch": 77.74386920980926, + "grad_norm": 3.0449130535125732, + "learning_rate": 2.4873628715348088e-06, + "loss": 0.106, + "step": 28532 + }, + { + "epoch": 77.7465940054496, + "grad_norm": 2.2596282958984375, + "learning_rate": 2.486780452435573e-06, + "loss": 0.0338, + "step": 28533 + }, + { + "epoch": 77.74931880108991, + "grad_norm": 2.0528342723846436, + "learning_rate": 2.48619809184905e-06, + "loss": 0.0239, + "step": 28534 + }, + { + "epoch": 77.75204359673025, + "grad_norm": 2.289703845977783, + "learning_rate": 2.485615789779774e-06, + "loss": 0.0353, + "step": 28535 + }, + { + "epoch": 77.75476839237058, + "grad_norm": 2.7122628688812256, + "learning_rate": 2.485033546232277e-06, + "loss": 0.0579, + "step": 28536 + }, + { + "epoch": 77.7574931880109, + "grad_norm": 3.519174575805664, + "learning_rate": 2.4844513612110977e-06, + "loss": 0.0473, + "step": 28537 + }, + { + "epoch": 77.76021798365123, + "grad_norm": 3.06754207611084, + "learning_rate": 2.4838692347207717e-06, + "loss": 0.0389, + "step": 28538 + }, + { + "epoch": 77.76294277929155, + "grad_norm": 2.3011691570281982, + "learning_rate": 2.48328716676583e-06, + "loss": 0.0808, + "step": 28539 + }, + { + "epoch": 77.76566757493188, + "grad_norm": 4.819763660430908, + "learning_rate": 2.4827051573508067e-06, + "loss": 0.1052, + "step": 28540 + }, + { + "epoch": 77.7683923705722, + "grad_norm": 2.2383973598480225, + "learning_rate": 2.482123206480229e-06, + "loss": 0.096, + "step": 28541 + }, + { + "epoch": 77.77111716621253, + "grad_norm": 3.0312654972076416, + "learning_rate": 2.4815413141586387e-06, + "loss": 0.2563, + "step": 28542 + }, + { + "epoch": 77.77384196185287, + "grad_norm": 4.265959739685059, + "learning_rate": 2.4809594803905614e-06, + "loss": 0.0585, + "step": 28543 + }, + { + "epoch": 77.77656675749319, + "grad_norm": 3.2749221324920654, + "learning_rate": 2.48037770518053e-06, + "loss": 0.1504, + "step": 28544 + }, + { + "epoch": 77.77929155313352, + "grad_norm": 2.5465848445892334, + "learning_rate": 2.4797959885330724e-06, + "loss": 0.0627, + "step": 28545 + }, + { + "epoch": 77.78201634877384, + "grad_norm": 3.44708514213562, + "learning_rate": 2.479214330452725e-06, + "loss": 0.255, + "step": 28546 + }, + { + "epoch": 77.78474114441417, + "grad_norm": 3.05719256401062, + "learning_rate": 2.4786327309440138e-06, + "loss": 0.1095, + "step": 28547 + }, + { + "epoch": 77.7874659400545, + "grad_norm": 3.280073642730713, + "learning_rate": 2.4780511900114678e-06, + "loss": 0.039, + "step": 28548 + }, + { + "epoch": 77.79019073569482, + "grad_norm": 3.0980327129364014, + "learning_rate": 2.4774697076596154e-06, + "loss": 0.0374, + "step": 28549 + }, + { + "epoch": 77.79291553133515, + "grad_norm": 2.5396461486816406, + "learning_rate": 2.47688828389299e-06, + "loss": 0.0234, + "step": 28550 + }, + { + "epoch": 77.79564032697547, + "grad_norm": 2.5326597690582275, + "learning_rate": 2.4763069187161158e-06, + "loss": 0.0935, + "step": 28551 + }, + { + "epoch": 77.7983651226158, + "grad_norm": 3.904620409011841, + "learning_rate": 2.4757256121335182e-06, + "loss": 0.0399, + "step": 28552 + }, + { + "epoch": 77.80108991825612, + "grad_norm": 2.865692615509033, + "learning_rate": 2.4751443641497307e-06, + "loss": 0.0881, + "step": 28553 + }, + { + "epoch": 77.80381471389646, + "grad_norm": 2.2848098278045654, + "learning_rate": 2.4745631747692732e-06, + "loss": 0.1282, + "step": 28554 + }, + { + "epoch": 77.80653950953679, + "grad_norm": 2.0827324390411377, + "learning_rate": 2.473982043996679e-06, + "loss": 0.0274, + "step": 28555 + }, + { + "epoch": 77.80926430517711, + "grad_norm": 4.4037652015686035, + "learning_rate": 2.4734009718364693e-06, + "loss": 0.0599, + "step": 28556 + }, + { + "epoch": 77.81198910081744, + "grad_norm": 3.0163779258728027, + "learning_rate": 2.4728199582931687e-06, + "loss": 0.0578, + "step": 28557 + }, + { + "epoch": 77.81471389645776, + "grad_norm": 2.8764543533325195, + "learning_rate": 2.4722390033713074e-06, + "loss": 0.1005, + "step": 28558 + }, + { + "epoch": 77.8174386920981, + "grad_norm": 3.6553354263305664, + "learning_rate": 2.471658107075405e-06, + "loss": 0.1354, + "step": 28559 + }, + { + "epoch": 77.82016348773843, + "grad_norm": 4.242199420928955, + "learning_rate": 2.4710772694099885e-06, + "loss": 0.0526, + "step": 28560 + }, + { + "epoch": 77.82288828337875, + "grad_norm": 2.175461769104004, + "learning_rate": 2.470496490379576e-06, + "loss": 0.2264, + "step": 28561 + }, + { + "epoch": 77.82561307901908, + "grad_norm": 2.97206974029541, + "learning_rate": 2.4699157699886977e-06, + "loss": 0.0428, + "step": 28562 + }, + { + "epoch": 77.8283378746594, + "grad_norm": 4.373528957366943, + "learning_rate": 2.4693351082418725e-06, + "loss": 0.1485, + "step": 28563 + }, + { + "epoch": 77.83106267029973, + "grad_norm": 2.3471200466156006, + "learning_rate": 2.4687545051436233e-06, + "loss": 0.0856, + "step": 28564 + }, + { + "epoch": 77.83378746594005, + "grad_norm": 4.146914958953857, + "learning_rate": 2.46817396069847e-06, + "loss": 0.2022, + "step": 28565 + }, + { + "epoch": 77.83651226158038, + "grad_norm": 2.7037479877471924, + "learning_rate": 2.4675934749109375e-06, + "loss": 0.0649, + "step": 28566 + }, + { + "epoch": 77.83923705722071, + "grad_norm": 2.6036858558654785, + "learning_rate": 2.4670130477855437e-06, + "loss": 0.0867, + "step": 28567 + }, + { + "epoch": 77.84196185286103, + "grad_norm": 3.4696624279022217, + "learning_rate": 2.466432679326811e-06, + "loss": 0.0988, + "step": 28568 + }, + { + "epoch": 77.84468664850137, + "grad_norm": 3.490933418273926, + "learning_rate": 2.4658523695392545e-06, + "loss": 0.1309, + "step": 28569 + }, + { + "epoch": 77.84741144414168, + "grad_norm": 4.492375373840332, + "learning_rate": 2.4652721184274008e-06, + "loss": 0.133, + "step": 28570 + }, + { + "epoch": 77.85013623978202, + "grad_norm": 3.200601577758789, + "learning_rate": 2.4646919259957623e-06, + "loss": 0.043, + "step": 28571 + }, + { + "epoch": 77.85286103542235, + "grad_norm": 2.435253143310547, + "learning_rate": 2.464111792248863e-06, + "loss": 0.0278, + "step": 28572 + }, + { + "epoch": 77.85558583106267, + "grad_norm": 3.9881691932678223, + "learning_rate": 2.4635317171912164e-06, + "loss": 0.0846, + "step": 28573 + }, + { + "epoch": 77.858310626703, + "grad_norm": 2.9328901767730713, + "learning_rate": 2.462951700827344e-06, + "loss": 0.051, + "step": 28574 + }, + { + "epoch": 77.86103542234332, + "grad_norm": 2.805507183074951, + "learning_rate": 2.462371743161762e-06, + "loss": 0.1161, + "step": 28575 + }, + { + "epoch": 77.86376021798365, + "grad_norm": 2.6177818775177, + "learning_rate": 2.461791844198986e-06, + "loss": 0.0343, + "step": 28576 + }, + { + "epoch": 77.86648501362397, + "grad_norm": 3.3624141216278076, + "learning_rate": 2.4612120039435306e-06, + "loss": 0.0402, + "step": 28577 + }, + { + "epoch": 77.8692098092643, + "grad_norm": 2.7366902828216553, + "learning_rate": 2.4606322223999147e-06, + "loss": 0.0373, + "step": 28578 + }, + { + "epoch": 77.87193460490464, + "grad_norm": 3.220646619796753, + "learning_rate": 2.4600524995726537e-06, + "loss": 0.063, + "step": 28579 + }, + { + "epoch": 77.87465940054496, + "grad_norm": 2.4427764415740967, + "learning_rate": 2.45947283546626e-06, + "loss": 0.0569, + "step": 28580 + }, + { + "epoch": 77.87738419618529, + "grad_norm": 2.1700329780578613, + "learning_rate": 2.4588932300852476e-06, + "loss": 0.0531, + "step": 28581 + }, + { + "epoch": 77.88010899182561, + "grad_norm": 3.691664457321167, + "learning_rate": 2.4583136834341336e-06, + "loss": 0.0465, + "step": 28582 + }, + { + "epoch": 77.88283378746594, + "grad_norm": 3.2681214809417725, + "learning_rate": 2.4577341955174307e-06, + "loss": 0.0373, + "step": 28583 + }, + { + "epoch": 77.88555858310627, + "grad_norm": 3.141700029373169, + "learning_rate": 2.4571547663396513e-06, + "loss": 0.0994, + "step": 28584 + }, + { + "epoch": 77.88828337874659, + "grad_norm": 2.2609872817993164, + "learning_rate": 2.456575395905304e-06, + "loss": 0.0366, + "step": 28585 + }, + { + "epoch": 77.89100817438693, + "grad_norm": 2.097759962081909, + "learning_rate": 2.455996084218909e-06, + "loss": 0.0322, + "step": 28586 + }, + { + "epoch": 77.89373297002724, + "grad_norm": 2.123995780944824, + "learning_rate": 2.4554168312849724e-06, + "loss": 0.0785, + "step": 28587 + }, + { + "epoch": 77.89645776566758, + "grad_norm": 2.2426674365997314, + "learning_rate": 2.454837637108004e-06, + "loss": 0.0409, + "step": 28588 + }, + { + "epoch": 77.8991825613079, + "grad_norm": 3.0533556938171387, + "learning_rate": 2.4542585016925215e-06, + "loss": 0.0635, + "step": 28589 + }, + { + "epoch": 77.90190735694823, + "grad_norm": 4.239056587219238, + "learning_rate": 2.4536794250430264e-06, + "loss": 0.0288, + "step": 28590 + }, + { + "epoch": 77.90463215258856, + "grad_norm": 2.0648422241210938, + "learning_rate": 2.453100407164036e-06, + "loss": 0.1212, + "step": 28591 + }, + { + "epoch": 77.90735694822888, + "grad_norm": 3.995161771774292, + "learning_rate": 2.4525214480600577e-06, + "loss": 0.0303, + "step": 28592 + }, + { + "epoch": 77.91008174386921, + "grad_norm": 2.431945323944092, + "learning_rate": 2.451942547735596e-06, + "loss": 0.0356, + "step": 28593 + }, + { + "epoch": 77.91280653950953, + "grad_norm": 2.9772019386291504, + "learning_rate": 2.4513637061951655e-06, + "loss": 0.0361, + "step": 28594 + }, + { + "epoch": 77.91553133514986, + "grad_norm": 2.962559461593628, + "learning_rate": 2.450784923443272e-06, + "loss": 0.0815, + "step": 28595 + }, + { + "epoch": 77.9182561307902, + "grad_norm": 2.871248960494995, + "learning_rate": 2.450206199484423e-06, + "loss": 0.0609, + "step": 28596 + }, + { + "epoch": 77.92098092643052, + "grad_norm": 2.7894411087036133, + "learning_rate": 2.4496275343231214e-06, + "loss": 0.0312, + "step": 28597 + }, + { + "epoch": 77.92370572207085, + "grad_norm": 2.7226953506469727, + "learning_rate": 2.4490489279638806e-06, + "loss": 0.0375, + "step": 28598 + }, + { + "epoch": 77.92643051771117, + "grad_norm": 4.2436699867248535, + "learning_rate": 2.448470380411204e-06, + "loss": 0.0745, + "step": 28599 + }, + { + "epoch": 77.9291553133515, + "grad_norm": 3.8377609252929688, + "learning_rate": 2.447891891669596e-06, + "loss": 0.0422, + "step": 28600 + }, + { + "epoch": 77.93188010899182, + "grad_norm": 4.173841953277588, + "learning_rate": 2.4473134617435614e-06, + "loss": 0.0461, + "step": 28601 + }, + { + "epoch": 77.93460490463215, + "grad_norm": 3.207427501678467, + "learning_rate": 2.4467350906376085e-06, + "loss": 0.0936, + "step": 28602 + }, + { + "epoch": 77.93732970027249, + "grad_norm": 3.2238423824310303, + "learning_rate": 2.44615677835624e-06, + "loss": 0.1035, + "step": 28603 + }, + { + "epoch": 77.9400544959128, + "grad_norm": 3.26841402053833, + "learning_rate": 2.44557852490396e-06, + "loss": 0.0754, + "step": 28604 + }, + { + "epoch": 77.94277929155314, + "grad_norm": 3.017800807952881, + "learning_rate": 2.4450003302852663e-06, + "loss": 0.1067, + "step": 28605 + }, + { + "epoch": 77.94550408719346, + "grad_norm": 2.6638243198394775, + "learning_rate": 2.4444221945046687e-06, + "loss": 0.0359, + "step": 28606 + }, + { + "epoch": 77.94822888283379, + "grad_norm": 3.491483449935913, + "learning_rate": 2.4438441175666706e-06, + "loss": 0.0686, + "step": 28607 + }, + { + "epoch": 77.95095367847412, + "grad_norm": 2.04025936126709, + "learning_rate": 2.4432660994757707e-06, + "loss": 0.0423, + "step": 28608 + }, + { + "epoch": 77.95367847411444, + "grad_norm": 2.4790706634521484, + "learning_rate": 2.4426881402364722e-06, + "loss": 0.0403, + "step": 28609 + }, + { + "epoch": 77.95640326975477, + "grad_norm": 1.964853286743164, + "learning_rate": 2.4421102398532716e-06, + "loss": 0.0282, + "step": 28610 + }, + { + "epoch": 77.95912806539509, + "grad_norm": 2.6440622806549072, + "learning_rate": 2.441532398330676e-06, + "loss": 0.1535, + "step": 28611 + }, + { + "epoch": 77.96185286103542, + "grad_norm": 2.9482619762420654, + "learning_rate": 2.4409546156731835e-06, + "loss": 0.0292, + "step": 28612 + }, + { + "epoch": 77.96457765667574, + "grad_norm": 1.9689563512802124, + "learning_rate": 2.4403768918852923e-06, + "loss": 0.0505, + "step": 28613 + }, + { + "epoch": 77.96730245231608, + "grad_norm": 3.476179361343384, + "learning_rate": 2.4397992269714996e-06, + "loss": 0.0635, + "step": 28614 + }, + { + "epoch": 77.97002724795641, + "grad_norm": 1.731796145439148, + "learning_rate": 2.4392216209363106e-06, + "loss": 0.0228, + "step": 28615 + }, + { + "epoch": 77.97275204359673, + "grad_norm": 1.4027667045593262, + "learning_rate": 2.438644073784221e-06, + "loss": 0.0183, + "step": 28616 + }, + { + "epoch": 77.97547683923706, + "grad_norm": 2.9973654747009277, + "learning_rate": 2.438066585519724e-06, + "loss": 0.0488, + "step": 28617 + }, + { + "epoch": 77.97820163487738, + "grad_norm": 2.85360050201416, + "learning_rate": 2.4374891561473236e-06, + "loss": 0.0324, + "step": 28618 + }, + { + "epoch": 77.98092643051771, + "grad_norm": 1.7630435228347778, + "learning_rate": 2.4369117856715152e-06, + "loss": 0.1123, + "step": 28619 + }, + { + "epoch": 77.98365122615803, + "grad_norm": 2.655789852142334, + "learning_rate": 2.436334474096794e-06, + "loss": 0.2556, + "step": 28620 + }, + { + "epoch": 77.98637602179836, + "grad_norm": 2.6451289653778076, + "learning_rate": 2.4357572214276536e-06, + "loss": 0.1174, + "step": 28621 + }, + { + "epoch": 77.9891008174387, + "grad_norm": 3.7719886302948, + "learning_rate": 2.4351800276685932e-06, + "loss": 0.0858, + "step": 28622 + }, + { + "epoch": 77.99182561307902, + "grad_norm": 4.808012962341309, + "learning_rate": 2.4346028928241095e-06, + "loss": 0.0458, + "step": 28623 + }, + { + "epoch": 77.99455040871935, + "grad_norm": 3.1198360919952393, + "learning_rate": 2.434025816898695e-06, + "loss": 0.0456, + "step": 28624 + }, + { + "epoch": 77.99727520435967, + "grad_norm": 2.0654773712158203, + "learning_rate": 2.4334487998968435e-06, + "loss": 0.0265, + "step": 28625 + }, + { + "epoch": 78.0, + "grad_norm": 3.193361520767212, + "learning_rate": 2.432871841823047e-06, + "loss": 0.056, + "step": 28626 + }, + { + "epoch": 78.00272479564033, + "grad_norm": 4.100928783416748, + "learning_rate": 2.432294942681803e-06, + "loss": 0.0728, + "step": 28627 + }, + { + "epoch": 78.00544959128065, + "grad_norm": 2.658005475997925, + "learning_rate": 2.431718102477604e-06, + "loss": 0.0624, + "step": 28628 + }, + { + "epoch": 78.00817438692098, + "grad_norm": 4.394220352172852, + "learning_rate": 2.4311413212149395e-06, + "loss": 0.0923, + "step": 28629 + }, + { + "epoch": 78.0108991825613, + "grad_norm": 4.086851596832275, + "learning_rate": 2.4305645988983007e-06, + "loss": 0.0847, + "step": 28630 + }, + { + "epoch": 78.01362397820164, + "grad_norm": 2.9714341163635254, + "learning_rate": 2.4299879355321844e-06, + "loss": 0.0385, + "step": 28631 + }, + { + "epoch": 78.01634877384195, + "grad_norm": 4.148153305053711, + "learning_rate": 2.4294113311210775e-06, + "loss": 0.0505, + "step": 28632 + }, + { + "epoch": 78.01907356948229, + "grad_norm": 3.036773920059204, + "learning_rate": 2.4288347856694718e-06, + "loss": 0.0606, + "step": 28633 + }, + { + "epoch": 78.02179836512262, + "grad_norm": 3.061009168624878, + "learning_rate": 2.428258299181854e-06, + "loss": 0.0309, + "step": 28634 + }, + { + "epoch": 78.02452316076294, + "grad_norm": 2.729743242263794, + "learning_rate": 2.4276818716627195e-06, + "loss": 0.0668, + "step": 28635 + }, + { + "epoch": 78.02724795640327, + "grad_norm": 2.4344239234924316, + "learning_rate": 2.4271055031165557e-06, + "loss": 0.0886, + "step": 28636 + }, + { + "epoch": 78.02997275204359, + "grad_norm": 4.145779132843018, + "learning_rate": 2.4265291935478472e-06, + "loss": 0.1251, + "step": 28637 + }, + { + "epoch": 78.03269754768392, + "grad_norm": 3.1622867584228516, + "learning_rate": 2.4259529429610884e-06, + "loss": 0.0432, + "step": 28638 + }, + { + "epoch": 78.03542234332426, + "grad_norm": 2.4364748001098633, + "learning_rate": 2.425376751360764e-06, + "loss": 0.0872, + "step": 28639 + }, + { + "epoch": 78.03814713896458, + "grad_norm": 2.948251724243164, + "learning_rate": 2.4248006187513597e-06, + "loss": 0.0499, + "step": 28640 + }, + { + "epoch": 78.04087193460491, + "grad_norm": 1.996466875076294, + "learning_rate": 2.4242245451373667e-06, + "loss": 0.0398, + "step": 28641 + }, + { + "epoch": 78.04359673024523, + "grad_norm": 3.166872262954712, + "learning_rate": 2.423648530523266e-06, + "loss": 0.1205, + "step": 28642 + }, + { + "epoch": 78.04632152588556, + "grad_norm": 2.3039448261260986, + "learning_rate": 2.4230725749135496e-06, + "loss": 0.0712, + "step": 28643 + }, + { + "epoch": 78.04904632152588, + "grad_norm": 1.8140027523040771, + "learning_rate": 2.4224966783127014e-06, + "loss": 0.0257, + "step": 28644 + }, + { + "epoch": 78.05177111716621, + "grad_norm": 3.5995044708251953, + "learning_rate": 2.4219208407252036e-06, + "loss": 0.1424, + "step": 28645 + }, + { + "epoch": 78.05449591280654, + "grad_norm": 2.4110090732574463, + "learning_rate": 2.42134506215554e-06, + "loss": 0.0586, + "step": 28646 + }, + { + "epoch": 78.05722070844686, + "grad_norm": 2.7712249755859375, + "learning_rate": 2.4207693426082003e-06, + "loss": 0.0375, + "step": 28647 + }, + { + "epoch": 78.0599455040872, + "grad_norm": 2.5217080116271973, + "learning_rate": 2.420193682087665e-06, + "loss": 0.0937, + "step": 28648 + }, + { + "epoch": 78.06267029972751, + "grad_norm": 2.138751268386841, + "learning_rate": 2.419618080598417e-06, + "loss": 0.0216, + "step": 28649 + }, + { + "epoch": 78.06539509536785, + "grad_norm": 2.249903917312622, + "learning_rate": 2.4190425381449366e-06, + "loss": 0.0235, + "step": 28650 + }, + { + "epoch": 78.06811989100818, + "grad_norm": 2.7832961082458496, + "learning_rate": 2.4184670547317123e-06, + "loss": 0.1426, + "step": 28651 + }, + { + "epoch": 78.0708446866485, + "grad_norm": 3.140596866607666, + "learning_rate": 2.417891630363222e-06, + "loss": 0.045, + "step": 28652 + }, + { + "epoch": 78.07356948228883, + "grad_norm": 3.63569712638855, + "learning_rate": 2.4173162650439485e-06, + "loss": 0.0302, + "step": 28653 + }, + { + "epoch": 78.07629427792915, + "grad_norm": 2.5194928646087646, + "learning_rate": 2.4167409587783676e-06, + "loss": 0.1044, + "step": 28654 + }, + { + "epoch": 78.07901907356948, + "grad_norm": 3.443791151046753, + "learning_rate": 2.416165711570968e-06, + "loss": 0.1248, + "step": 28655 + }, + { + "epoch": 78.0817438692098, + "grad_norm": 2.9317615032196045, + "learning_rate": 2.4155905234262255e-06, + "loss": 0.1934, + "step": 28656 + }, + { + "epoch": 78.08446866485014, + "grad_norm": 3.092083692550659, + "learning_rate": 2.4150153943486166e-06, + "loss": 0.0334, + "step": 28657 + }, + { + "epoch": 78.08719346049047, + "grad_norm": 1.6678235530853271, + "learning_rate": 2.414440324342624e-06, + "loss": 0.0247, + "step": 28658 + }, + { + "epoch": 78.08991825613079, + "grad_norm": 4.245721340179443, + "learning_rate": 2.413865313412729e-06, + "loss": 0.035, + "step": 28659 + }, + { + "epoch": 78.09264305177112, + "grad_norm": 2.952965021133423, + "learning_rate": 2.4132903615634073e-06, + "loss": 0.0525, + "step": 28660 + }, + { + "epoch": 78.09536784741144, + "grad_norm": 3.37847900390625, + "learning_rate": 2.412715468799135e-06, + "loss": 0.0291, + "step": 28661 + }, + { + "epoch": 78.09809264305177, + "grad_norm": 2.557279348373413, + "learning_rate": 2.412140635124388e-06, + "loss": 0.0285, + "step": 28662 + }, + { + "epoch": 78.1008174386921, + "grad_norm": 2.3011956214904785, + "learning_rate": 2.4115658605436488e-06, + "loss": 0.0356, + "step": 28663 + }, + { + "epoch": 78.10354223433242, + "grad_norm": 3.312464714050293, + "learning_rate": 2.41099114506139e-06, + "loss": 0.19, + "step": 28664 + }, + { + "epoch": 78.10626702997276, + "grad_norm": 3.0109522342681885, + "learning_rate": 2.410416488682088e-06, + "loss": 0.0625, + "step": 28665 + }, + { + "epoch": 78.10899182561307, + "grad_norm": 3.418283224105835, + "learning_rate": 2.409841891410215e-06, + "loss": 0.0352, + "step": 28666 + }, + { + "epoch": 78.11171662125341, + "grad_norm": 2.0435028076171875, + "learning_rate": 2.409267353250252e-06, + "loss": 0.0279, + "step": 28667 + }, + { + "epoch": 78.11444141689373, + "grad_norm": 3.5080766677856445, + "learning_rate": 2.408692874206672e-06, + "loss": 0.0999, + "step": 28668 + }, + { + "epoch": 78.11716621253406, + "grad_norm": 2.4358937740325928, + "learning_rate": 2.4081184542839455e-06, + "loss": 0.046, + "step": 28669 + }, + { + "epoch": 78.11989100817439, + "grad_norm": 2.2511494159698486, + "learning_rate": 2.407544093486546e-06, + "loss": 0.0417, + "step": 28670 + }, + { + "epoch": 78.12261580381471, + "grad_norm": 4.012392997741699, + "learning_rate": 2.4069697918189515e-06, + "loss": 0.0346, + "step": 28671 + }, + { + "epoch": 78.12534059945504, + "grad_norm": 2.87082839012146, + "learning_rate": 2.406395549285633e-06, + "loss": 0.1297, + "step": 28672 + }, + { + "epoch": 78.12806539509536, + "grad_norm": 2.527850866317749, + "learning_rate": 2.4058213658910602e-06, + "loss": 0.0732, + "step": 28673 + }, + { + "epoch": 78.1307901907357, + "grad_norm": 2.9530582427978516, + "learning_rate": 2.4052472416397034e-06, + "loss": 0.0562, + "step": 28674 + }, + { + "epoch": 78.13351498637603, + "grad_norm": 2.147108793258667, + "learning_rate": 2.4046731765360377e-06, + "loss": 0.0231, + "step": 28675 + }, + { + "epoch": 78.13623978201635, + "grad_norm": 3.0856306552886963, + "learning_rate": 2.404099170584534e-06, + "loss": 0.1795, + "step": 28676 + }, + { + "epoch": 78.13896457765668, + "grad_norm": 1.4786776304244995, + "learning_rate": 2.4035252237896635e-06, + "loss": 0.0247, + "step": 28677 + }, + { + "epoch": 78.141689373297, + "grad_norm": 2.742638111114502, + "learning_rate": 2.40295133615589e-06, + "loss": 0.0406, + "step": 28678 + }, + { + "epoch": 78.14441416893733, + "grad_norm": 1.8566851615905762, + "learning_rate": 2.40237750768769e-06, + "loss": 0.0573, + "step": 28679 + }, + { + "epoch": 78.14713896457765, + "grad_norm": 3.6054091453552246, + "learning_rate": 2.4018037383895287e-06, + "loss": 0.0728, + "step": 28680 + }, + { + "epoch": 78.14986376021798, + "grad_norm": 1.8873311281204224, + "learning_rate": 2.401230028265876e-06, + "loss": 0.0246, + "step": 28681 + }, + { + "epoch": 78.15258855585832, + "grad_norm": 2.6724722385406494, + "learning_rate": 2.400656377321197e-06, + "loss": 0.0229, + "step": 28682 + }, + { + "epoch": 78.15531335149863, + "grad_norm": 2.5824334621429443, + "learning_rate": 2.400082785559964e-06, + "loss": 0.1163, + "step": 28683 + }, + { + "epoch": 78.15803814713897, + "grad_norm": 2.8021554946899414, + "learning_rate": 2.3995092529866415e-06, + "loss": 0.0304, + "step": 28684 + }, + { + "epoch": 78.16076294277929, + "grad_norm": 2.497877359390259, + "learning_rate": 2.3989357796056966e-06, + "loss": 0.0562, + "step": 28685 + }, + { + "epoch": 78.16348773841962, + "grad_norm": 2.606130361557007, + "learning_rate": 2.398362365421593e-06, + "loss": 0.1258, + "step": 28686 + }, + { + "epoch": 78.16621253405995, + "grad_norm": 2.5798847675323486, + "learning_rate": 2.3977890104388002e-06, + "loss": 0.1724, + "step": 28687 + }, + { + "epoch": 78.16893732970027, + "grad_norm": 3.3414177894592285, + "learning_rate": 2.3972157146617823e-06, + "loss": 0.067, + "step": 28688 + }, + { + "epoch": 78.1716621253406, + "grad_norm": 2.186988592147827, + "learning_rate": 2.396642478095004e-06, + "loss": 0.0766, + "step": 28689 + }, + { + "epoch": 78.17438692098092, + "grad_norm": 3.304708480834961, + "learning_rate": 2.396069300742926e-06, + "loss": 0.0408, + "step": 28690 + }, + { + "epoch": 78.17711171662125, + "grad_norm": 2.2575109004974365, + "learning_rate": 2.3954961826100154e-06, + "loss": 0.0367, + "step": 28691 + }, + { + "epoch": 78.17983651226157, + "grad_norm": 3.3511736392974854, + "learning_rate": 2.3949231237007396e-06, + "loss": 0.0939, + "step": 28692 + }, + { + "epoch": 78.1825613079019, + "grad_norm": 2.3919754028320312, + "learning_rate": 2.3943501240195565e-06, + "loss": 0.0427, + "step": 28693 + }, + { + "epoch": 78.18528610354224, + "grad_norm": 2.78475022315979, + "learning_rate": 2.3937771835709313e-06, + "loss": 0.0657, + "step": 28694 + }, + { + "epoch": 78.18801089918256, + "grad_norm": 2.3260419368743896, + "learning_rate": 2.393204302359321e-06, + "loss": 0.0314, + "step": 28695 + }, + { + "epoch": 78.19073569482289, + "grad_norm": 3.031043767929077, + "learning_rate": 2.392631480389194e-06, + "loss": 0.1068, + "step": 28696 + }, + { + "epoch": 78.19346049046321, + "grad_norm": 2.7713918685913086, + "learning_rate": 2.3920587176650077e-06, + "loss": 0.0604, + "step": 28697 + }, + { + "epoch": 78.19618528610354, + "grad_norm": 2.4141011238098145, + "learning_rate": 2.3914860141912234e-06, + "loss": 0.0314, + "step": 28698 + }, + { + "epoch": 78.19891008174388, + "grad_norm": 2.8410580158233643, + "learning_rate": 2.3909133699722976e-06, + "loss": 0.1591, + "step": 28699 + }, + { + "epoch": 78.2016348773842, + "grad_norm": 2.6988158226013184, + "learning_rate": 2.390340785012697e-06, + "loss": 0.0617, + "step": 28700 + }, + { + "epoch": 78.20435967302453, + "grad_norm": 2.9085278511047363, + "learning_rate": 2.389768259316878e-06, + "loss": 0.1084, + "step": 28701 + }, + { + "epoch": 78.20708446866485, + "grad_norm": 2.911033868789673, + "learning_rate": 2.389195792889295e-06, + "loss": 0.0561, + "step": 28702 + }, + { + "epoch": 78.20980926430518, + "grad_norm": 3.393951892852783, + "learning_rate": 2.3886233857344143e-06, + "loss": 0.0407, + "step": 28703 + }, + { + "epoch": 78.2125340599455, + "grad_norm": 2.7640810012817383, + "learning_rate": 2.388051037856689e-06, + "loss": 0.0319, + "step": 28704 + }, + { + "epoch": 78.21525885558583, + "grad_norm": 3.228947401046753, + "learning_rate": 2.3874787492605765e-06, + "loss": 0.0586, + "step": 28705 + }, + { + "epoch": 78.21798365122616, + "grad_norm": 2.958425760269165, + "learning_rate": 2.3869065199505328e-06, + "loss": 0.1149, + "step": 28706 + }, + { + "epoch": 78.22070844686648, + "grad_norm": 2.5740206241607666, + "learning_rate": 2.3863343499310187e-06, + "loss": 0.072, + "step": 28707 + }, + { + "epoch": 78.22343324250681, + "grad_norm": 2.93585467338562, + "learning_rate": 2.385762239206485e-06, + "loss": 0.0311, + "step": 28708 + }, + { + "epoch": 78.22615803814713, + "grad_norm": 2.986391305923462, + "learning_rate": 2.3851901877813923e-06, + "loss": 0.0425, + "step": 28709 + }, + { + "epoch": 78.22888283378747, + "grad_norm": 3.4620413780212402, + "learning_rate": 2.384618195660193e-06, + "loss": 0.1551, + "step": 28710 + }, + { + "epoch": 78.2316076294278, + "grad_norm": 2.392394781112671, + "learning_rate": 2.3840462628473403e-06, + "loss": 0.1175, + "step": 28711 + }, + { + "epoch": 78.23433242506812, + "grad_norm": 2.5387089252471924, + "learning_rate": 2.3834743893472923e-06, + "loss": 0.1602, + "step": 28712 + }, + { + "epoch": 78.23705722070845, + "grad_norm": 2.3510639667510986, + "learning_rate": 2.382902575164501e-06, + "loss": 0.061, + "step": 28713 + }, + { + "epoch": 78.23978201634877, + "grad_norm": 2.9034781455993652, + "learning_rate": 2.382330820303419e-06, + "loss": 0.0475, + "step": 28714 + }, + { + "epoch": 78.2425068119891, + "grad_norm": 2.7706029415130615, + "learning_rate": 2.381759124768496e-06, + "loss": 0.0645, + "step": 28715 + }, + { + "epoch": 78.24523160762942, + "grad_norm": 2.5357940196990967, + "learning_rate": 2.381187488564192e-06, + "loss": 0.1157, + "step": 28716 + }, + { + "epoch": 78.24795640326975, + "grad_norm": 2.7941699028015137, + "learning_rate": 2.3806159116949536e-06, + "loss": 0.12, + "step": 28717 + }, + { + "epoch": 78.25068119891009, + "grad_norm": 2.7098867893218994, + "learning_rate": 2.380044394165233e-06, + "loss": 0.0565, + "step": 28718 + }, + { + "epoch": 78.2534059945504, + "grad_norm": 2.5567994117736816, + "learning_rate": 2.379472935979479e-06, + "loss": 0.0454, + "step": 28719 + }, + { + "epoch": 78.25613079019074, + "grad_norm": 2.509187698364258, + "learning_rate": 2.3789015371421476e-06, + "loss": 0.0357, + "step": 28720 + }, + { + "epoch": 78.25885558583106, + "grad_norm": 2.3222243785858154, + "learning_rate": 2.3783301976576854e-06, + "loss": 0.1334, + "step": 28721 + }, + { + "epoch": 78.26158038147139, + "grad_norm": 3.3466756343841553, + "learning_rate": 2.3777589175305428e-06, + "loss": 0.0579, + "step": 28722 + }, + { + "epoch": 78.26430517711172, + "grad_norm": 2.327862501144409, + "learning_rate": 2.3771876967651652e-06, + "loss": 0.02, + "step": 28723 + }, + { + "epoch": 78.26702997275204, + "grad_norm": 2.378955841064453, + "learning_rate": 2.3766165353660065e-06, + "loss": 0.0176, + "step": 28724 + }, + { + "epoch": 78.26975476839237, + "grad_norm": 3.090916156768799, + "learning_rate": 2.376045433337514e-06, + "loss": 0.084, + "step": 28725 + }, + { + "epoch": 78.2724795640327, + "grad_norm": 2.2813174724578857, + "learning_rate": 2.3754743906841316e-06, + "loss": 0.0248, + "step": 28726 + }, + { + "epoch": 78.27520435967303, + "grad_norm": 3.227043628692627, + "learning_rate": 2.3749034074103084e-06, + "loss": 0.0445, + "step": 28727 + }, + { + "epoch": 78.27792915531334, + "grad_norm": 3.2909417152404785, + "learning_rate": 2.374332483520495e-06, + "loss": 0.0624, + "step": 28728 + }, + { + "epoch": 78.28065395095368, + "grad_norm": 2.8302438259124756, + "learning_rate": 2.373761619019136e-06, + "loss": 0.0344, + "step": 28729 + }, + { + "epoch": 78.28337874659401, + "grad_norm": 2.969295024871826, + "learning_rate": 2.373190813910674e-06, + "loss": 0.1248, + "step": 28730 + }, + { + "epoch": 78.28610354223433, + "grad_norm": 4.589273452758789, + "learning_rate": 2.372620068199555e-06, + "loss": 0.042, + "step": 28731 + }, + { + "epoch": 78.28882833787466, + "grad_norm": 2.352987051010132, + "learning_rate": 2.372049381890228e-06, + "loss": 0.0339, + "step": 28732 + }, + { + "epoch": 78.29155313351498, + "grad_norm": 2.2704436779022217, + "learning_rate": 2.3714787549871355e-06, + "loss": 0.1835, + "step": 28733 + }, + { + "epoch": 78.29427792915531, + "grad_norm": 3.4268100261688232, + "learning_rate": 2.3709081874947204e-06, + "loss": 0.1952, + "step": 28734 + }, + { + "epoch": 78.29700272479565, + "grad_norm": 3.415231227874756, + "learning_rate": 2.3703376794174237e-06, + "loss": 0.0875, + "step": 28735 + }, + { + "epoch": 78.29972752043597, + "grad_norm": 2.6673519611358643, + "learning_rate": 2.3697672307596955e-06, + "loss": 0.1024, + "step": 28736 + }, + { + "epoch": 78.3024523160763, + "grad_norm": 2.4854893684387207, + "learning_rate": 2.3691968415259727e-06, + "loss": 0.0857, + "step": 28737 + }, + { + "epoch": 78.30517711171662, + "grad_norm": 2.290933609008789, + "learning_rate": 2.3686265117207007e-06, + "loss": 0.0839, + "step": 28738 + }, + { + "epoch": 78.30790190735695, + "grad_norm": 2.550001621246338, + "learning_rate": 2.3680562413483167e-06, + "loss": 0.0688, + "step": 28739 + }, + { + "epoch": 78.31062670299727, + "grad_norm": 2.604231119155884, + "learning_rate": 2.3674860304132675e-06, + "loss": 0.0317, + "step": 28740 + }, + { + "epoch": 78.3133514986376, + "grad_norm": 1.6347862482070923, + "learning_rate": 2.366915878919992e-06, + "loss": 0.0231, + "step": 28741 + }, + { + "epoch": 78.31607629427793, + "grad_norm": 3.765108585357666, + "learning_rate": 2.366345786872929e-06, + "loss": 0.0516, + "step": 28742 + }, + { + "epoch": 78.31880108991825, + "grad_norm": 3.561452627182007, + "learning_rate": 2.3657757542765145e-06, + "loss": 0.0322, + "step": 28743 + }, + { + "epoch": 78.32152588555859, + "grad_norm": 4.27000093460083, + "learning_rate": 2.3652057811351982e-06, + "loss": 0.0577, + "step": 28744 + }, + { + "epoch": 78.3242506811989, + "grad_norm": 2.3249168395996094, + "learning_rate": 2.364635867453414e-06, + "loss": 0.0946, + "step": 28745 + }, + { + "epoch": 78.32697547683924, + "grad_norm": 2.7798616886138916, + "learning_rate": 2.3640660132356e-06, + "loss": 0.035, + "step": 28746 + }, + { + "epoch": 78.32970027247957, + "grad_norm": 2.1884665489196777, + "learning_rate": 2.3634962184861897e-06, + "loss": 0.0337, + "step": 28747 + }, + { + "epoch": 78.33242506811989, + "grad_norm": 2.7179813385009766, + "learning_rate": 2.36292648320963e-06, + "loss": 0.0405, + "step": 28748 + }, + { + "epoch": 78.33514986376022, + "grad_norm": 2.6988346576690674, + "learning_rate": 2.362356807410352e-06, + "loss": 0.0359, + "step": 28749 + }, + { + "epoch": 78.33787465940054, + "grad_norm": 5.135148525238037, + "learning_rate": 2.3617871910927927e-06, + "loss": 0.0783, + "step": 28750 + }, + { + "epoch": 78.34059945504087, + "grad_norm": 2.046766519546509, + "learning_rate": 2.361217634261387e-06, + "loss": 0.0861, + "step": 28751 + }, + { + "epoch": 78.34332425068119, + "grad_norm": 3.113476514816284, + "learning_rate": 2.360648136920575e-06, + "loss": 0.0417, + "step": 28752 + }, + { + "epoch": 78.34604904632153, + "grad_norm": 3.2326583862304688, + "learning_rate": 2.360078699074789e-06, + "loss": 0.0532, + "step": 28753 + }, + { + "epoch": 78.34877384196186, + "grad_norm": 3.191349983215332, + "learning_rate": 2.3595093207284657e-06, + "loss": 0.2164, + "step": 28754 + }, + { + "epoch": 78.35149863760218, + "grad_norm": 2.1410105228424072, + "learning_rate": 2.3589400018860343e-06, + "loss": 0.0667, + "step": 28755 + }, + { + "epoch": 78.35422343324251, + "grad_norm": 2.7011985778808594, + "learning_rate": 2.3583707425519344e-06, + "loss": 0.0472, + "step": 28756 + }, + { + "epoch": 78.35694822888283, + "grad_norm": 2.3861894607543945, + "learning_rate": 2.3578015427305977e-06, + "loss": 0.0372, + "step": 28757 + }, + { + "epoch": 78.35967302452316, + "grad_norm": 2.214292049407959, + "learning_rate": 2.357232402426457e-06, + "loss": 0.0371, + "step": 28758 + }, + { + "epoch": 78.3623978201635, + "grad_norm": 2.59604811668396, + "learning_rate": 2.3566633216439416e-06, + "loss": 0.1263, + "step": 28759 + }, + { + "epoch": 78.36512261580381, + "grad_norm": 2.2566699981689453, + "learning_rate": 2.356094300387486e-06, + "loss": 0.0396, + "step": 28760 + }, + { + "epoch": 78.36784741144415, + "grad_norm": 3.471081256866455, + "learning_rate": 2.355525338661524e-06, + "loss": 0.0435, + "step": 28761 + }, + { + "epoch": 78.37057220708446, + "grad_norm": 2.0240402221679688, + "learning_rate": 2.3549564364704856e-06, + "loss": 0.0403, + "step": 28762 + }, + { + "epoch": 78.3732970027248, + "grad_norm": 3.4439470767974854, + "learning_rate": 2.3543875938187997e-06, + "loss": 0.1056, + "step": 28763 + }, + { + "epoch": 78.37602179836512, + "grad_norm": 10.956733703613281, + "learning_rate": 2.353818810710895e-06, + "loss": 0.1349, + "step": 28764 + }, + { + "epoch": 78.37874659400545, + "grad_norm": 2.729780435562134, + "learning_rate": 2.3532500871512054e-06, + "loss": 0.0398, + "step": 28765 + }, + { + "epoch": 78.38147138964578, + "grad_norm": 2.260324478149414, + "learning_rate": 2.3526814231441586e-06, + "loss": 0.032, + "step": 28766 + }, + { + "epoch": 78.3841961852861, + "grad_norm": 2.290607213973999, + "learning_rate": 2.35211281869418e-06, + "loss": 0.0474, + "step": 28767 + }, + { + "epoch": 78.38692098092643, + "grad_norm": 2.24245548248291, + "learning_rate": 2.3515442738057027e-06, + "loss": 0.0325, + "step": 28768 + }, + { + "epoch": 78.38964577656675, + "grad_norm": 2.8790132999420166, + "learning_rate": 2.350975788483153e-06, + "loss": 0.083, + "step": 28769 + }, + { + "epoch": 78.39237057220708, + "grad_norm": 3.1960229873657227, + "learning_rate": 2.3504073627309575e-06, + "loss": 0.0376, + "step": 28770 + }, + { + "epoch": 78.39509536784742, + "grad_norm": 2.145268440246582, + "learning_rate": 2.3498389965535406e-06, + "loss": 0.1345, + "step": 28771 + }, + { + "epoch": 78.39782016348774, + "grad_norm": 2.2832589149475098, + "learning_rate": 2.3492706899553354e-06, + "loss": 0.0894, + "step": 28772 + }, + { + "epoch": 78.40054495912807, + "grad_norm": 2.4074416160583496, + "learning_rate": 2.3487024429407625e-06, + "loss": 0.1127, + "step": 28773 + }, + { + "epoch": 78.40326975476839, + "grad_norm": 3.619366407394409, + "learning_rate": 2.3481342555142484e-06, + "loss": 0.1049, + "step": 28774 + }, + { + "epoch": 78.40599455040872, + "grad_norm": 2.3534491062164307, + "learning_rate": 2.3475661276802164e-06, + "loss": 0.0329, + "step": 28775 + }, + { + "epoch": 78.40871934604904, + "grad_norm": 3.1109061241149902, + "learning_rate": 2.346998059443095e-06, + "loss": 0.0492, + "step": 28776 + }, + { + "epoch": 78.41144414168937, + "grad_norm": 2.226891279220581, + "learning_rate": 2.3464300508073046e-06, + "loss": 0.1112, + "step": 28777 + }, + { + "epoch": 78.4141689373297, + "grad_norm": 3.561785936355591, + "learning_rate": 2.3458621017772733e-06, + "loss": 0.111, + "step": 28778 + }, + { + "epoch": 78.41689373297002, + "grad_norm": 1.934870719909668, + "learning_rate": 2.3452942123574208e-06, + "loss": 0.1072, + "step": 28779 + }, + { + "epoch": 78.41961852861036, + "grad_norm": 3.1643896102905273, + "learning_rate": 2.344726382552168e-06, + "loss": 0.0567, + "step": 28780 + }, + { + "epoch": 78.42234332425068, + "grad_norm": 2.6465632915496826, + "learning_rate": 2.3441586123659434e-06, + "loss": 0.3397, + "step": 28781 + }, + { + "epoch": 78.42506811989101, + "grad_norm": 2.2327096462249756, + "learning_rate": 2.3435909018031645e-06, + "loss": 0.0273, + "step": 28782 + }, + { + "epoch": 78.42779291553134, + "grad_norm": 2.1167855262756348, + "learning_rate": 2.3430232508682525e-06, + "loss": 0.0499, + "step": 28783 + }, + { + "epoch": 78.43051771117166, + "grad_norm": 2.2226626873016357, + "learning_rate": 2.3424556595656276e-06, + "loss": 0.0219, + "step": 28784 + }, + { + "epoch": 78.433242506812, + "grad_norm": 1.781945824623108, + "learning_rate": 2.341888127899714e-06, + "loss": 0.0151, + "step": 28785 + }, + { + "epoch": 78.43596730245231, + "grad_norm": 2.4531352519989014, + "learning_rate": 2.341320655874929e-06, + "loss": 0.0362, + "step": 28786 + }, + { + "epoch": 78.43869209809264, + "grad_norm": 5.346907138824463, + "learning_rate": 2.3407532434956913e-06, + "loss": 0.0654, + "step": 28787 + }, + { + "epoch": 78.44141689373296, + "grad_norm": 2.3232154846191406, + "learning_rate": 2.34018589076642e-06, + "loss": 0.1128, + "step": 28788 + }, + { + "epoch": 78.4441416893733, + "grad_norm": 2.272002696990967, + "learning_rate": 2.3396185976915355e-06, + "loss": 0.0318, + "step": 28789 + }, + { + "epoch": 78.44686648501363, + "grad_norm": 2.511538028717041, + "learning_rate": 2.3390513642754555e-06, + "loss": 0.0739, + "step": 28790 + }, + { + "epoch": 78.44959128065395, + "grad_norm": 5.701254367828369, + "learning_rate": 2.338484190522594e-06, + "loss": 0.0444, + "step": 28791 + }, + { + "epoch": 78.45231607629428, + "grad_norm": 3.599649429321289, + "learning_rate": 2.3379170764373737e-06, + "loss": 0.0984, + "step": 28792 + }, + { + "epoch": 78.4550408719346, + "grad_norm": 3.17618989944458, + "learning_rate": 2.3373500220242095e-06, + "loss": 0.0459, + "step": 28793 + }, + { + "epoch": 78.45776566757493, + "grad_norm": 2.0977768898010254, + "learning_rate": 2.3367830272875136e-06, + "loss": 0.1065, + "step": 28794 + }, + { + "epoch": 78.46049046321527, + "grad_norm": 2.5540215969085693, + "learning_rate": 2.336216092231707e-06, + "loss": 0.0894, + "step": 28795 + }, + { + "epoch": 78.46321525885558, + "grad_norm": 2.071661949157715, + "learning_rate": 2.3356492168612e-06, + "loss": 0.1047, + "step": 28796 + }, + { + "epoch": 78.46594005449592, + "grad_norm": 6.077733516693115, + "learning_rate": 2.335082401180413e-06, + "loss": 0.0467, + "step": 28797 + }, + { + "epoch": 78.46866485013624, + "grad_norm": 3.6167330741882324, + "learning_rate": 2.3345156451937577e-06, + "loss": 0.0438, + "step": 28798 + }, + { + "epoch": 78.47138964577657, + "grad_norm": 2.4257559776306152, + "learning_rate": 2.333948948905649e-06, + "loss": 0.0466, + "step": 28799 + }, + { + "epoch": 78.47411444141689, + "grad_norm": 2.514841318130493, + "learning_rate": 2.3333823123204946e-06, + "loss": 0.0828, + "step": 28800 + }, + { + "epoch": 78.47683923705722, + "grad_norm": 2.6107676029205322, + "learning_rate": 2.332815735442716e-06, + "loss": 0.1185, + "step": 28801 + }, + { + "epoch": 78.47956403269755, + "grad_norm": 4.774962425231934, + "learning_rate": 2.332249218276721e-06, + "loss": 0.1953, + "step": 28802 + }, + { + "epoch": 78.48228882833787, + "grad_norm": 2.341609477996826, + "learning_rate": 2.3316827608269233e-06, + "loss": 0.0344, + "step": 28803 + }, + { + "epoch": 78.4850136239782, + "grad_norm": 2.3848965167999268, + "learning_rate": 2.3311163630977296e-06, + "loss": 0.0329, + "step": 28804 + }, + { + "epoch": 78.48773841961852, + "grad_norm": 2.820605993270874, + "learning_rate": 2.3305500250935574e-06, + "loss": 0.1103, + "step": 28805 + }, + { + "epoch": 78.49046321525886, + "grad_norm": 3.5609471797943115, + "learning_rate": 2.3299837468188156e-06, + "loss": 0.0772, + "step": 28806 + }, + { + "epoch": 78.49318801089919, + "grad_norm": 2.606863498687744, + "learning_rate": 2.329417528277914e-06, + "loss": 0.0339, + "step": 28807 + }, + { + "epoch": 78.49591280653951, + "grad_norm": 2.2633886337280273, + "learning_rate": 2.328851369475258e-06, + "loss": 0.0802, + "step": 28808 + }, + { + "epoch": 78.49863760217984, + "grad_norm": 2.9578235149383545, + "learning_rate": 2.3282852704152638e-06, + "loss": 0.0504, + "step": 28809 + }, + { + "epoch": 78.50136239782016, + "grad_norm": 4.267442226409912, + "learning_rate": 2.3277192311023366e-06, + "loss": 0.0799, + "step": 28810 + }, + { + "epoch": 78.50408719346049, + "grad_norm": 2.333279848098755, + "learning_rate": 2.3271532515408825e-06, + "loss": 0.062, + "step": 28811 + }, + { + "epoch": 78.50681198910081, + "grad_norm": 2.689195394515991, + "learning_rate": 2.326587331735313e-06, + "loss": 0.2114, + "step": 28812 + }, + { + "epoch": 78.50953678474114, + "grad_norm": 2.947387218475342, + "learning_rate": 2.3260214716900353e-06, + "loss": 0.1225, + "step": 28813 + }, + { + "epoch": 78.51226158038148, + "grad_norm": 2.5247998237609863, + "learning_rate": 2.325455671409457e-06, + "loss": 0.1136, + "step": 28814 + }, + { + "epoch": 78.5149863760218, + "grad_norm": 3.2816948890686035, + "learning_rate": 2.324889930897982e-06, + "loss": 0.1286, + "step": 28815 + }, + { + "epoch": 78.51771117166213, + "grad_norm": 3.0933926105499268, + "learning_rate": 2.324324250160015e-06, + "loss": 0.2823, + "step": 28816 + }, + { + "epoch": 78.52043596730245, + "grad_norm": 3.2287774085998535, + "learning_rate": 2.3237586291999657e-06, + "loss": 0.0517, + "step": 28817 + }, + { + "epoch": 78.52316076294278, + "grad_norm": 2.898211717605591, + "learning_rate": 2.323193068022238e-06, + "loss": 0.0798, + "step": 28818 + }, + { + "epoch": 78.52588555858311, + "grad_norm": 3.3788342475891113, + "learning_rate": 2.3226275666312346e-06, + "loss": 0.0695, + "step": 28819 + }, + { + "epoch": 78.52861035422343, + "grad_norm": 2.0427491664886475, + "learning_rate": 2.322062125031359e-06, + "loss": 0.0794, + "step": 28820 + }, + { + "epoch": 78.53133514986376, + "grad_norm": 4.412542343139648, + "learning_rate": 2.3214967432270187e-06, + "loss": 0.0426, + "step": 28821 + }, + { + "epoch": 78.53405994550408, + "grad_norm": 3.6098456382751465, + "learning_rate": 2.3209314212226143e-06, + "loss": 0.0804, + "step": 28822 + }, + { + "epoch": 78.53678474114442, + "grad_norm": 3.7335867881774902, + "learning_rate": 2.320366159022549e-06, + "loss": 0.0569, + "step": 28823 + }, + { + "epoch": 78.53950953678473, + "grad_norm": 2.3873815536499023, + "learning_rate": 2.319800956631222e-06, + "loss": 0.1644, + "step": 28824 + }, + { + "epoch": 78.54223433242507, + "grad_norm": 2.321789503097534, + "learning_rate": 2.3192358140530415e-06, + "loss": 0.0952, + "step": 28825 + }, + { + "epoch": 78.5449591280654, + "grad_norm": 3.5240705013275146, + "learning_rate": 2.3186707312924053e-06, + "loss": 0.0321, + "step": 28826 + }, + { + "epoch": 78.54768392370572, + "grad_norm": 2.644545078277588, + "learning_rate": 2.3181057083537127e-06, + "loss": 0.1152, + "step": 28827 + }, + { + "epoch": 78.55040871934605, + "grad_norm": 3.6151700019836426, + "learning_rate": 2.3175407452413647e-06, + "loss": 0.1202, + "step": 28828 + }, + { + "epoch": 78.55313351498637, + "grad_norm": 10.351760864257812, + "learning_rate": 2.316975841959761e-06, + "loss": 0.0574, + "step": 28829 + }, + { + "epoch": 78.5558583106267, + "grad_norm": 3.1691505908966064, + "learning_rate": 2.3164109985133043e-06, + "loss": 0.0472, + "step": 28830 + }, + { + "epoch": 78.55858310626704, + "grad_norm": 1.7434918880462646, + "learning_rate": 2.315846214906393e-06, + "loss": 0.0239, + "step": 28831 + }, + { + "epoch": 78.56130790190736, + "grad_norm": 2.751307487487793, + "learning_rate": 2.315281491143421e-06, + "loss": 0.1578, + "step": 28832 + }, + { + "epoch": 78.56403269754769, + "grad_norm": 2.538161039352417, + "learning_rate": 2.314716827228791e-06, + "loss": 0.1006, + "step": 28833 + }, + { + "epoch": 78.566757493188, + "grad_norm": 2.3712387084960938, + "learning_rate": 2.3141522231669e-06, + "loss": 0.0345, + "step": 28834 + }, + { + "epoch": 78.56948228882834, + "grad_norm": 4.287030220031738, + "learning_rate": 2.3135876789621436e-06, + "loss": 0.1119, + "step": 28835 + }, + { + "epoch": 78.57220708446866, + "grad_norm": 2.3746984004974365, + "learning_rate": 2.313023194618916e-06, + "loss": 0.1901, + "step": 28836 + }, + { + "epoch": 78.57493188010899, + "grad_norm": 2.118539810180664, + "learning_rate": 2.31245877014162e-06, + "loss": 0.0384, + "step": 28837 + }, + { + "epoch": 78.57765667574932, + "grad_norm": 2.6033174991607666, + "learning_rate": 2.3118944055346482e-06, + "loss": 0.0305, + "step": 28838 + }, + { + "epoch": 78.58038147138964, + "grad_norm": 1.9644960165023804, + "learning_rate": 2.3113301008023936e-06, + "loss": 0.0574, + "step": 28839 + }, + { + "epoch": 78.58310626702998, + "grad_norm": 3.0274219512939453, + "learning_rate": 2.3107658559492506e-06, + "loss": 0.0731, + "step": 28840 + }, + { + "epoch": 78.5858310626703, + "grad_norm": 3.726154088973999, + "learning_rate": 2.3102016709796193e-06, + "loss": 0.0348, + "step": 28841 + }, + { + "epoch": 78.58855585831063, + "grad_norm": 3.710953712463379, + "learning_rate": 2.3096375458978892e-06, + "loss": 0.0619, + "step": 28842 + }, + { + "epoch": 78.59128065395096, + "grad_norm": 3.5191240310668945, + "learning_rate": 2.3090734807084545e-06, + "loss": 0.0454, + "step": 28843 + }, + { + "epoch": 78.59400544959128, + "grad_norm": 2.173923969268799, + "learning_rate": 2.3085094754157045e-06, + "loss": 0.0251, + "step": 28844 + }, + { + "epoch": 78.59673024523161, + "grad_norm": 2.0286457538604736, + "learning_rate": 2.3079455300240394e-06, + "loss": 0.0334, + "step": 28845 + }, + { + "epoch": 78.59945504087193, + "grad_norm": 3.141050338745117, + "learning_rate": 2.3073816445378427e-06, + "loss": 0.0636, + "step": 28846 + }, + { + "epoch": 78.60217983651226, + "grad_norm": 3.3132381439208984, + "learning_rate": 2.3068178189615142e-06, + "loss": 0.035, + "step": 28847 + }, + { + "epoch": 78.60490463215258, + "grad_norm": 2.5420422554016113, + "learning_rate": 2.306254053299439e-06, + "loss": 0.0612, + "step": 28848 + }, + { + "epoch": 78.60762942779292, + "grad_norm": 2.8048555850982666, + "learning_rate": 2.305690347556009e-06, + "loss": 0.054, + "step": 28849 + }, + { + "epoch": 78.61035422343325, + "grad_norm": 2.628035545349121, + "learning_rate": 2.305126701735617e-06, + "loss": 0.0912, + "step": 28850 + }, + { + "epoch": 78.61307901907357, + "grad_norm": 2.939763307571411, + "learning_rate": 2.304563115842651e-06, + "loss": 0.0539, + "step": 28851 + }, + { + "epoch": 78.6158038147139, + "grad_norm": 3.509037733078003, + "learning_rate": 2.303999589881496e-06, + "loss": 0.1482, + "step": 28852 + }, + { + "epoch": 78.61852861035422, + "grad_norm": 2.390042543411255, + "learning_rate": 2.3034361238565474e-06, + "loss": 0.026, + "step": 28853 + }, + { + "epoch": 78.62125340599455, + "grad_norm": 2.847133159637451, + "learning_rate": 2.302872717772191e-06, + "loss": 0.0264, + "step": 28854 + }, + { + "epoch": 78.62397820163488, + "grad_norm": 2.7450544834136963, + "learning_rate": 2.302309371632814e-06, + "loss": 0.0334, + "step": 28855 + }, + { + "epoch": 78.6267029972752, + "grad_norm": 2.1127185821533203, + "learning_rate": 2.301746085442801e-06, + "loss": 0.0891, + "step": 28856 + }, + { + "epoch": 78.62942779291554, + "grad_norm": 3.734999895095825, + "learning_rate": 2.301182859206544e-06, + "loss": 0.0828, + "step": 28857 + }, + { + "epoch": 78.63215258855585, + "grad_norm": 1.8150416612625122, + "learning_rate": 2.3006196929284276e-06, + "loss": 0.0191, + "step": 28858 + }, + { + "epoch": 78.63487738419619, + "grad_norm": 4.945652008056641, + "learning_rate": 2.3000565866128377e-06, + "loss": 0.1195, + "step": 28859 + }, + { + "epoch": 78.6376021798365, + "grad_norm": 2.6597771644592285, + "learning_rate": 2.299493540264156e-06, + "loss": 0.1091, + "step": 28860 + }, + { + "epoch": 78.64032697547684, + "grad_norm": 2.7733194828033447, + "learning_rate": 2.2989305538867735e-06, + "loss": 0.1298, + "step": 28861 + }, + { + "epoch": 78.64305177111717, + "grad_norm": 10.696962356567383, + "learning_rate": 2.298367627485072e-06, + "loss": 0.0415, + "step": 28862 + }, + { + "epoch": 78.64577656675749, + "grad_norm": 2.93894100189209, + "learning_rate": 2.2978047610634335e-06, + "loss": 0.051, + "step": 28863 + }, + { + "epoch": 78.64850136239782, + "grad_norm": 3.761629343032837, + "learning_rate": 2.297241954626246e-06, + "loss": 0.1012, + "step": 28864 + }, + { + "epoch": 78.65122615803814, + "grad_norm": 3.8135571479797363, + "learning_rate": 2.2966792081778866e-06, + "loss": 0.0323, + "step": 28865 + }, + { + "epoch": 78.65395095367847, + "grad_norm": 2.2769131660461426, + "learning_rate": 2.2961165217227453e-06, + "loss": 0.0677, + "step": 28866 + }, + { + "epoch": 78.65667574931881, + "grad_norm": 3.278449058532715, + "learning_rate": 2.2955538952652e-06, + "loss": 0.1002, + "step": 28867 + }, + { + "epoch": 78.65940054495913, + "grad_norm": 2.091280221939087, + "learning_rate": 2.294991328809634e-06, + "loss": 0.0965, + "step": 28868 + }, + { + "epoch": 78.66212534059946, + "grad_norm": 3.919696092605591, + "learning_rate": 2.2944288223604237e-06, + "loss": 0.1999, + "step": 28869 + }, + { + "epoch": 78.66485013623978, + "grad_norm": 3.111398935317993, + "learning_rate": 2.293866375921957e-06, + "loss": 0.0377, + "step": 28870 + }, + { + "epoch": 78.66757493188011, + "grad_norm": 2.956389904022217, + "learning_rate": 2.2933039894986107e-06, + "loss": 0.0689, + "step": 28871 + }, + { + "epoch": 78.67029972752043, + "grad_norm": 1.9143258333206177, + "learning_rate": 2.2927416630947653e-06, + "loss": 0.029, + "step": 28872 + }, + { + "epoch": 78.67302452316076, + "grad_norm": 1.934957504272461, + "learning_rate": 2.2921793967147963e-06, + "loss": 0.0273, + "step": 28873 + }, + { + "epoch": 78.6757493188011, + "grad_norm": 3.2638096809387207, + "learning_rate": 2.2916171903630892e-06, + "loss": 0.1178, + "step": 28874 + }, + { + "epoch": 78.67847411444141, + "grad_norm": 2.8287012577056885, + "learning_rate": 2.2910550440440194e-06, + "loss": 0.0563, + "step": 28875 + }, + { + "epoch": 78.68119891008175, + "grad_norm": 4.911534786224365, + "learning_rate": 2.290492957761963e-06, + "loss": 0.0741, + "step": 28876 + }, + { + "epoch": 78.68392370572207, + "grad_norm": 3.7542495727539062, + "learning_rate": 2.2899309315213005e-06, + "loss": 0.0554, + "step": 28877 + }, + { + "epoch": 78.6866485013624, + "grad_norm": 1.7778617143630981, + "learning_rate": 2.2893689653264084e-06, + "loss": 0.0217, + "step": 28878 + }, + { + "epoch": 78.68937329700273, + "grad_norm": 2.246203660964966, + "learning_rate": 2.2888070591816626e-06, + "loss": 0.0799, + "step": 28879 + }, + { + "epoch": 78.69209809264305, + "grad_norm": 2.1796176433563232, + "learning_rate": 2.2882452130914367e-06, + "loss": 0.0411, + "step": 28880 + }, + { + "epoch": 78.69482288828338, + "grad_norm": 2.6442768573760986, + "learning_rate": 2.287683427060109e-06, + "loss": 0.0713, + "step": 28881 + }, + { + "epoch": 78.6975476839237, + "grad_norm": 2.0072710514068604, + "learning_rate": 2.2871217010920567e-06, + "loss": 0.0303, + "step": 28882 + }, + { + "epoch": 78.70027247956403, + "grad_norm": 2.3387610912323, + "learning_rate": 2.286560035191653e-06, + "loss": 0.0906, + "step": 28883 + }, + { + "epoch": 78.70299727520435, + "grad_norm": 3.0095784664154053, + "learning_rate": 2.2859984293632708e-06, + "loss": 0.0347, + "step": 28884 + }, + { + "epoch": 78.70572207084469, + "grad_norm": 3.653873920440674, + "learning_rate": 2.285436883611282e-06, + "loss": 0.0792, + "step": 28885 + }, + { + "epoch": 78.70844686648502, + "grad_norm": 2.7108097076416016, + "learning_rate": 2.284875397940065e-06, + "loss": 0.088, + "step": 28886 + }, + { + "epoch": 78.71117166212534, + "grad_norm": 16.79184341430664, + "learning_rate": 2.284313972353991e-06, + "loss": 0.0313, + "step": 28887 + }, + { + "epoch": 78.71389645776567, + "grad_norm": 2.76053786277771, + "learning_rate": 2.28375260685743e-06, + "loss": 0.0315, + "step": 28888 + }, + { + "epoch": 78.71662125340599, + "grad_norm": 2.97222900390625, + "learning_rate": 2.2831913014547535e-06, + "loss": 0.0624, + "step": 28889 + }, + { + "epoch": 78.71934604904632, + "grad_norm": 1.5932461023330688, + "learning_rate": 2.282630056150338e-06, + "loss": 0.0219, + "step": 28890 + }, + { + "epoch": 78.72207084468666, + "grad_norm": 2.40366530418396, + "learning_rate": 2.2820688709485504e-06, + "loss": 0.1016, + "step": 28891 + }, + { + "epoch": 78.72479564032697, + "grad_norm": 3.8289735317230225, + "learning_rate": 2.2815077458537628e-06, + "loss": 0.0452, + "step": 28892 + }, + { + "epoch": 78.7275204359673, + "grad_norm": 4.441797256469727, + "learning_rate": 2.2809466808703416e-06, + "loss": 0.0864, + "step": 28893 + }, + { + "epoch": 78.73024523160763, + "grad_norm": 4.0520782470703125, + "learning_rate": 2.280385676002661e-06, + "loss": 0.0794, + "step": 28894 + }, + { + "epoch": 78.73297002724796, + "grad_norm": 3.905402421951294, + "learning_rate": 2.2798247312550893e-06, + "loss": 0.0434, + "step": 28895 + }, + { + "epoch": 78.73569482288828, + "grad_norm": 3.881347894668579, + "learning_rate": 2.279263846631994e-06, + "loss": 0.0519, + "step": 28896 + }, + { + "epoch": 78.73841961852861, + "grad_norm": 2.0655436515808105, + "learning_rate": 2.2787030221377403e-06, + "loss": 0.0297, + "step": 28897 + }, + { + "epoch": 78.74114441416894, + "grad_norm": 2.325296401977539, + "learning_rate": 2.278142257776699e-06, + "loss": 0.0238, + "step": 28898 + }, + { + "epoch": 78.74386920980926, + "grad_norm": 2.9133946895599365, + "learning_rate": 2.27758155355324e-06, + "loss": 0.0555, + "step": 28899 + }, + { + "epoch": 78.7465940054496, + "grad_norm": 2.1299450397491455, + "learning_rate": 2.277020909471728e-06, + "loss": 0.0423, + "step": 28900 + }, + { + "epoch": 78.74931880108991, + "grad_norm": 1.8782014846801758, + "learning_rate": 2.2764603255365248e-06, + "loss": 0.0676, + "step": 28901 + }, + { + "epoch": 78.75204359673025, + "grad_norm": 3.7080154418945312, + "learning_rate": 2.2758998017520027e-06, + "loss": 0.1151, + "step": 28902 + }, + { + "epoch": 78.75476839237058, + "grad_norm": 2.812624931335449, + "learning_rate": 2.2753393381225252e-06, + "loss": 0.1553, + "step": 28903 + }, + { + "epoch": 78.7574931880109, + "grad_norm": 2.258704900741577, + "learning_rate": 2.274778934652456e-06, + "loss": 0.0679, + "step": 28904 + }, + { + "epoch": 78.76021798365123, + "grad_norm": 2.920022964477539, + "learning_rate": 2.274218591346157e-06, + "loss": 0.0438, + "step": 28905 + }, + { + "epoch": 78.76294277929155, + "grad_norm": 2.488492727279663, + "learning_rate": 2.2736583082079977e-06, + "loss": 0.0528, + "step": 28906 + }, + { + "epoch": 78.76566757493188, + "grad_norm": 3.3354389667510986, + "learning_rate": 2.273098085242339e-06, + "loss": 0.1207, + "step": 28907 + }, + { + "epoch": 78.7683923705722, + "grad_norm": 1.8576667308807373, + "learning_rate": 2.2725379224535438e-06, + "loss": 0.0341, + "step": 28908 + }, + { + "epoch": 78.77111716621253, + "grad_norm": 3.292917490005493, + "learning_rate": 2.271977819845971e-06, + "loss": 0.086, + "step": 28909 + }, + { + "epoch": 78.77384196185287, + "grad_norm": 3.809830665588379, + "learning_rate": 2.27141777742399e-06, + "loss": 0.1056, + "step": 28910 + }, + { + "epoch": 78.77656675749319, + "grad_norm": 3.4294378757476807, + "learning_rate": 2.2708577951919585e-06, + "loss": 0.1242, + "step": 28911 + }, + { + "epoch": 78.77929155313352, + "grad_norm": 2.9975271224975586, + "learning_rate": 2.270297873154237e-06, + "loss": 0.0297, + "step": 28912 + }, + { + "epoch": 78.78201634877384, + "grad_norm": 1.738965630531311, + "learning_rate": 2.2697380113151848e-06, + "loss": 0.0307, + "step": 28913 + }, + { + "epoch": 78.78474114441417, + "grad_norm": 1.7738715410232544, + "learning_rate": 2.269178209679166e-06, + "loss": 0.0169, + "step": 28914 + }, + { + "epoch": 78.7874659400545, + "grad_norm": 2.0331978797912598, + "learning_rate": 2.2686184682505365e-06, + "loss": 0.0319, + "step": 28915 + }, + { + "epoch": 78.79019073569482, + "grad_norm": 1.8429347276687622, + "learning_rate": 2.2680587870336603e-06, + "loss": 0.1209, + "step": 28916 + }, + { + "epoch": 78.79291553133515, + "grad_norm": 4.196180820465088, + "learning_rate": 2.2674991660328903e-06, + "loss": 0.0637, + "step": 28917 + }, + { + "epoch": 78.79564032697547, + "grad_norm": 2.5511345863342285, + "learning_rate": 2.2669396052525914e-06, + "loss": 0.0232, + "step": 28918 + }, + { + "epoch": 78.7983651226158, + "grad_norm": 3.883326530456543, + "learning_rate": 2.266380104697117e-06, + "loss": 0.3365, + "step": 28919 + }, + { + "epoch": 78.80108991825612, + "grad_norm": 2.1199047565460205, + "learning_rate": 2.265820664370826e-06, + "loss": 0.1337, + "step": 28920 + }, + { + "epoch": 78.80381471389646, + "grad_norm": 1.7725870609283447, + "learning_rate": 2.265261284278072e-06, + "loss": 0.0318, + "step": 28921 + }, + { + "epoch": 78.80653950953679, + "grad_norm": 2.95277738571167, + "learning_rate": 2.264701964423217e-06, + "loss": 0.0561, + "step": 28922 + }, + { + "epoch": 78.80926430517711, + "grad_norm": 3.0791056156158447, + "learning_rate": 2.2641427048106135e-06, + "loss": 0.0705, + "step": 28923 + }, + { + "epoch": 78.81198910081744, + "grad_norm": 3.029740333557129, + "learning_rate": 2.2635835054446186e-06, + "loss": 0.0813, + "step": 28924 + }, + { + "epoch": 78.81471389645776, + "grad_norm": 6.212014198303223, + "learning_rate": 2.2630243663295825e-06, + "loss": 0.0645, + "step": 28925 + }, + { + "epoch": 78.8174386920981, + "grad_norm": 3.0743587017059326, + "learning_rate": 2.2624652874698673e-06, + "loss": 0.0417, + "step": 28926 + }, + { + "epoch": 78.82016348773843, + "grad_norm": 3.5916972160339355, + "learning_rate": 2.2619062688698234e-06, + "loss": 0.1351, + "step": 28927 + }, + { + "epoch": 78.82288828337875, + "grad_norm": 1.8293107748031616, + "learning_rate": 2.2613473105338046e-06, + "loss": 0.0368, + "step": 28928 + }, + { + "epoch": 78.82561307901908, + "grad_norm": 2.0689969062805176, + "learning_rate": 2.2607884124661607e-06, + "loss": 0.0322, + "step": 28929 + }, + { + "epoch": 78.8283378746594, + "grad_norm": 3.2180821895599365, + "learning_rate": 2.2602295746712498e-06, + "loss": 0.1061, + "step": 28930 + }, + { + "epoch": 78.83106267029973, + "grad_norm": 3.7344260215759277, + "learning_rate": 2.2596707971534226e-06, + "loss": 0.0838, + "step": 28931 + }, + { + "epoch": 78.83378746594005, + "grad_norm": 3.4283828735351562, + "learning_rate": 2.2591120799170262e-06, + "loss": 0.1491, + "step": 28932 + }, + { + "epoch": 78.83651226158038, + "grad_norm": 2.585704803466797, + "learning_rate": 2.25855342296642e-06, + "loss": 0.0347, + "step": 28933 + }, + { + "epoch": 78.83923705722071, + "grad_norm": 1.3932832479476929, + "learning_rate": 2.257994826305947e-06, + "loss": 0.0202, + "step": 28934 + }, + { + "epoch": 78.84196185286103, + "grad_norm": 2.4599039554595947, + "learning_rate": 2.2574362899399648e-06, + "loss": 0.0593, + "step": 28935 + }, + { + "epoch": 78.84468664850137, + "grad_norm": 3.06209659576416, + "learning_rate": 2.2568778138728186e-06, + "loss": 0.0655, + "step": 28936 + }, + { + "epoch": 78.84741144414168, + "grad_norm": 3.4642419815063477, + "learning_rate": 2.256319398108859e-06, + "loss": 0.0354, + "step": 28937 + }, + { + "epoch": 78.85013623978202, + "grad_norm": 2.160891532897949, + "learning_rate": 2.255761042652432e-06, + "loss": 0.0268, + "step": 28938 + }, + { + "epoch": 78.85286103542235, + "grad_norm": 2.034299612045288, + "learning_rate": 2.255202747507892e-06, + "loss": 0.0544, + "step": 28939 + }, + { + "epoch": 78.85558583106267, + "grad_norm": 1.9354496002197266, + "learning_rate": 2.2546445126795822e-06, + "loss": 0.1085, + "step": 28940 + }, + { + "epoch": 78.858310626703, + "grad_norm": 2.530433177947998, + "learning_rate": 2.2540863381718502e-06, + "loss": 0.0381, + "step": 28941 + }, + { + "epoch": 78.86103542234332, + "grad_norm": 3.1374988555908203, + "learning_rate": 2.253528223989048e-06, + "loss": 0.095, + "step": 28942 + }, + { + "epoch": 78.86376021798365, + "grad_norm": 2.735203504562378, + "learning_rate": 2.2529701701355167e-06, + "loss": 0.0299, + "step": 28943 + }, + { + "epoch": 78.86648501362397, + "grad_norm": 2.352241039276123, + "learning_rate": 2.252412176615606e-06, + "loss": 0.0291, + "step": 28944 + }, + { + "epoch": 78.8692098092643, + "grad_norm": 2.0535550117492676, + "learning_rate": 2.2518542434336564e-06, + "loss": 0.0235, + "step": 28945 + }, + { + "epoch": 78.87193460490464, + "grad_norm": 2.4184505939483643, + "learning_rate": 2.2512963705940192e-06, + "loss": 0.0378, + "step": 28946 + }, + { + "epoch": 78.87465940054496, + "grad_norm": 2.285931348800659, + "learning_rate": 2.2507385581010364e-06, + "loss": 0.0204, + "step": 28947 + }, + { + "epoch": 78.87738419618529, + "grad_norm": 2.4018497467041016, + "learning_rate": 2.2501808059590537e-06, + "loss": 0.0522, + "step": 28948 + }, + { + "epoch": 78.88010899182561, + "grad_norm": 3.8832502365112305, + "learning_rate": 2.249623114172409e-06, + "loss": 0.0292, + "step": 28949 + }, + { + "epoch": 78.88283378746594, + "grad_norm": 3.2039356231689453, + "learning_rate": 2.2490654827454505e-06, + "loss": 0.1085, + "step": 28950 + }, + { + "epoch": 78.88555858310627, + "grad_norm": 4.351308822631836, + "learning_rate": 2.2485079116825236e-06, + "loss": 0.0428, + "step": 28951 + }, + { + "epoch": 78.88828337874659, + "grad_norm": 2.8200180530548096, + "learning_rate": 2.247950400987968e-06, + "loss": 0.0406, + "step": 28952 + }, + { + "epoch": 78.89100817438693, + "grad_norm": 8.28785228729248, + "learning_rate": 2.247392950666124e-06, + "loss": 0.13, + "step": 28953 + }, + { + "epoch": 78.89373297002724, + "grad_norm": 2.1097002029418945, + "learning_rate": 2.246835560721332e-06, + "loss": 0.0656, + "step": 28954 + }, + { + "epoch": 78.89645776566758, + "grad_norm": 2.7372913360595703, + "learning_rate": 2.246278231157939e-06, + "loss": 0.0768, + "step": 28955 + }, + { + "epoch": 78.8991825613079, + "grad_norm": 2.5888876914978027, + "learning_rate": 2.24572096198028e-06, + "loss": 0.0391, + "step": 28956 + }, + { + "epoch": 78.90190735694823, + "grad_norm": 3.376915216445923, + "learning_rate": 2.2451637531926973e-06, + "loss": 0.0305, + "step": 28957 + }, + { + "epoch": 78.90463215258856, + "grad_norm": 3.2022457122802734, + "learning_rate": 2.244606604799526e-06, + "loss": 0.1114, + "step": 28958 + }, + { + "epoch": 78.90735694822888, + "grad_norm": 2.461902379989624, + "learning_rate": 2.2440495168051134e-06, + "loss": 0.0431, + "step": 28959 + }, + { + "epoch": 78.91008174386921, + "grad_norm": 2.7596118450164795, + "learning_rate": 2.2434924892137923e-06, + "loss": 0.0619, + "step": 28960 + }, + { + "epoch": 78.91280653950953, + "grad_norm": 2.351466178894043, + "learning_rate": 2.2429355220299e-06, + "loss": 0.0379, + "step": 28961 + }, + { + "epoch": 78.91553133514986, + "grad_norm": 1.9727129936218262, + "learning_rate": 2.2423786152577788e-06, + "loss": 0.0273, + "step": 28962 + }, + { + "epoch": 78.9182561307902, + "grad_norm": 3.642521619796753, + "learning_rate": 2.241821768901762e-06, + "loss": 0.111, + "step": 28963 + }, + { + "epoch": 78.92098092643052, + "grad_norm": 2.45471453666687, + "learning_rate": 2.241264982966189e-06, + "loss": 0.0566, + "step": 28964 + }, + { + "epoch": 78.92370572207085, + "grad_norm": 3.0651931762695312, + "learning_rate": 2.2407082574553905e-06, + "loss": 0.0501, + "step": 28965 + }, + { + "epoch": 78.92643051771117, + "grad_norm": 3.414696455001831, + "learning_rate": 2.2401515923737083e-06, + "loss": 0.0405, + "step": 28966 + }, + { + "epoch": 78.9291553133515, + "grad_norm": 4.019133567810059, + "learning_rate": 2.2395949877254776e-06, + "loss": 0.1029, + "step": 28967 + }, + { + "epoch": 78.93188010899182, + "grad_norm": 3.0019774436950684, + "learning_rate": 2.23903844351503e-06, + "loss": 0.083, + "step": 28968 + }, + { + "epoch": 78.93460490463215, + "grad_norm": 2.116072416305542, + "learning_rate": 2.2384819597467033e-06, + "loss": 0.0295, + "step": 28969 + }, + { + "epoch": 78.93732970027249, + "grad_norm": 3.3626227378845215, + "learning_rate": 2.2379255364248252e-06, + "loss": 0.0462, + "step": 28970 + }, + { + "epoch": 78.9400544959128, + "grad_norm": 2.790712356567383, + "learning_rate": 2.237369173553736e-06, + "loss": 0.1157, + "step": 28971 + }, + { + "epoch": 78.94277929155314, + "grad_norm": 2.7577567100524902, + "learning_rate": 2.2368128711377666e-06, + "loss": 0.0585, + "step": 28972 + }, + { + "epoch": 78.94550408719346, + "grad_norm": 2.1706457138061523, + "learning_rate": 2.2362566291812483e-06, + "loss": 0.0237, + "step": 28973 + }, + { + "epoch": 78.94822888283379, + "grad_norm": 2.6240735054016113, + "learning_rate": 2.2357004476885112e-06, + "loss": 0.0548, + "step": 28974 + }, + { + "epoch": 78.95095367847412, + "grad_norm": 4.908451080322266, + "learning_rate": 2.2351443266638918e-06, + "loss": 0.1023, + "step": 28975 + }, + { + "epoch": 78.95367847411444, + "grad_norm": 2.3655176162719727, + "learning_rate": 2.234588266111718e-06, + "loss": 0.065, + "step": 28976 + }, + { + "epoch": 78.95640326975477, + "grad_norm": 2.5295188426971436, + "learning_rate": 2.2340322660363213e-06, + "loss": 0.081, + "step": 28977 + }, + { + "epoch": 78.95912806539509, + "grad_norm": 3.583195686340332, + "learning_rate": 2.2334763264420277e-06, + "loss": 0.0237, + "step": 28978 + }, + { + "epoch": 78.96185286103542, + "grad_norm": 2.523772716522217, + "learning_rate": 2.2329204473331745e-06, + "loss": 0.043, + "step": 28979 + }, + { + "epoch": 78.96457765667574, + "grad_norm": 3.4741899967193604, + "learning_rate": 2.2323646287140856e-06, + "loss": 0.1255, + "step": 28980 + }, + { + "epoch": 78.96730245231608, + "grad_norm": 3.007777214050293, + "learning_rate": 2.2318088705890917e-06, + "loss": 0.0346, + "step": 28981 + }, + { + "epoch": 78.97002724795641, + "grad_norm": 2.4841318130493164, + "learning_rate": 2.2312531729625175e-06, + "loss": 0.0412, + "step": 28982 + }, + { + "epoch": 78.97275204359673, + "grad_norm": 3.2065043449401855, + "learning_rate": 2.230697535838696e-06, + "loss": 0.0738, + "step": 28983 + }, + { + "epoch": 78.97547683923706, + "grad_norm": 2.92630672454834, + "learning_rate": 2.2301419592219496e-06, + "loss": 0.0562, + "step": 28984 + }, + { + "epoch": 78.97820163487738, + "grad_norm": 3.4912874698638916, + "learning_rate": 2.2295864431166105e-06, + "loss": 0.0916, + "step": 28985 + }, + { + "epoch": 78.98092643051771, + "grad_norm": 2.434004783630371, + "learning_rate": 2.229030987526999e-06, + "loss": 0.0305, + "step": 28986 + }, + { + "epoch": 78.98365122615803, + "grad_norm": 2.8450632095336914, + "learning_rate": 2.2284755924574477e-06, + "loss": 0.0804, + "step": 28987 + }, + { + "epoch": 78.98637602179836, + "grad_norm": 3.7656378746032715, + "learning_rate": 2.2279202579122773e-06, + "loss": 0.0881, + "step": 28988 + }, + { + "epoch": 78.9891008174387, + "grad_norm": 4.203093528747559, + "learning_rate": 2.2273649838958133e-06, + "loss": 0.1142, + "step": 28989 + }, + { + "epoch": 78.99182561307902, + "grad_norm": 2.87361478805542, + "learning_rate": 2.2268097704123793e-06, + "loss": 0.0602, + "step": 28990 + }, + { + "epoch": 78.99455040871935, + "grad_norm": 2.962855815887451, + "learning_rate": 2.2262546174663024e-06, + "loss": 0.0651, + "step": 28991 + }, + { + "epoch": 78.99727520435967, + "grad_norm": 2.7653558254241943, + "learning_rate": 2.225699525061905e-06, + "loss": 0.0336, + "step": 28992 + }, + { + "epoch": 79.0, + "grad_norm": 3.1838862895965576, + "learning_rate": 2.2251444932035094e-06, + "loss": 0.0642, + "step": 28993 + }, + { + "epoch": 79.00272479564033, + "grad_norm": 2.9148108959198, + "learning_rate": 2.224589521895435e-06, + "loss": 0.1426, + "step": 28994 + }, + { + "epoch": 79.00544959128065, + "grad_norm": 3.782153844833374, + "learning_rate": 2.22403461114201e-06, + "loss": 0.1301, + "step": 28995 + }, + { + "epoch": 79.00817438692098, + "grad_norm": 4.163833141326904, + "learning_rate": 2.2234797609475536e-06, + "loss": 0.0725, + "step": 28996 + }, + { + "epoch": 79.0108991825613, + "grad_norm": 3.2145962715148926, + "learning_rate": 2.222924971316386e-06, + "loss": 0.0449, + "step": 28997 + }, + { + "epoch": 79.01362397820164, + "grad_norm": 6.8873467445373535, + "learning_rate": 2.222370242252826e-06, + "loss": 0.067, + "step": 28998 + }, + { + "epoch": 79.01634877384195, + "grad_norm": 3.1379776000976562, + "learning_rate": 2.221815573761199e-06, + "loss": 0.0405, + "step": 28999 + }, + { + "epoch": 79.01907356948229, + "grad_norm": 2.1184167861938477, + "learning_rate": 2.2212609658458217e-06, + "loss": 0.0313, + "step": 29000 + }, + { + "epoch": 79.02179836512262, + "grad_norm": 2.5771548748016357, + "learning_rate": 2.2207064185110107e-06, + "loss": 0.0705, + "step": 29001 + }, + { + "epoch": 79.02452316076294, + "grad_norm": 2.5136120319366455, + "learning_rate": 2.220151931761091e-06, + "loss": 0.1279, + "step": 29002 + }, + { + "epoch": 79.02724795640327, + "grad_norm": 1.5938818454742432, + "learning_rate": 2.219597505600375e-06, + "loss": 0.03, + "step": 29003 + }, + { + "epoch": 79.02997275204359, + "grad_norm": 2.7952795028686523, + "learning_rate": 2.219043140033186e-06, + "loss": 0.0843, + "step": 29004 + }, + { + "epoch": 79.03269754768392, + "grad_norm": 2.659262180328369, + "learning_rate": 2.2184888350638378e-06, + "loss": 0.1777, + "step": 29005 + }, + { + "epoch": 79.03542234332426, + "grad_norm": 2.468482494354248, + "learning_rate": 2.2179345906966464e-06, + "loss": 0.0318, + "step": 29006 + }, + { + "epoch": 79.03814713896458, + "grad_norm": 2.700657844543457, + "learning_rate": 2.2173804069359316e-06, + "loss": 0.0941, + "step": 29007 + }, + { + "epoch": 79.04087193460491, + "grad_norm": 1.6931849718093872, + "learning_rate": 2.2168262837860087e-06, + "loss": 0.0305, + "step": 29008 + }, + { + "epoch": 79.04359673024523, + "grad_norm": 2.511362314224243, + "learning_rate": 2.216272221251192e-06, + "loss": 0.0315, + "step": 29009 + }, + { + "epoch": 79.04632152588556, + "grad_norm": 2.1316440105438232, + "learning_rate": 2.215718219335794e-06, + "loss": 0.0325, + "step": 29010 + }, + { + "epoch": 79.04904632152588, + "grad_norm": 2.4834442138671875, + "learning_rate": 2.215164278044134e-06, + "loss": 0.0383, + "step": 29011 + }, + { + "epoch": 79.05177111716621, + "grad_norm": 3.0480587482452393, + "learning_rate": 2.2146103973805243e-06, + "loss": 0.0398, + "step": 29012 + }, + { + "epoch": 79.05449591280654, + "grad_norm": 2.2068545818328857, + "learning_rate": 2.2140565773492783e-06, + "loss": 0.0871, + "step": 29013 + }, + { + "epoch": 79.05722070844686, + "grad_norm": 4.302914142608643, + "learning_rate": 2.213502817954707e-06, + "loss": 0.0996, + "step": 29014 + }, + { + "epoch": 79.0599455040872, + "grad_norm": 2.7306058406829834, + "learning_rate": 2.2129491192011276e-06, + "loss": 0.0247, + "step": 29015 + }, + { + "epoch": 79.06267029972751, + "grad_norm": 4.0557074546813965, + "learning_rate": 2.2123954810928494e-06, + "loss": 0.0666, + "step": 29016 + }, + { + "epoch": 79.06539509536785, + "grad_norm": 2.2466578483581543, + "learning_rate": 2.2118419036341852e-06, + "loss": 0.0856, + "step": 29017 + }, + { + "epoch": 79.06811989100818, + "grad_norm": 3.5039384365081787, + "learning_rate": 2.211288386829442e-06, + "loss": 0.0369, + "step": 29018 + }, + { + "epoch": 79.0708446866485, + "grad_norm": 2.205421209335327, + "learning_rate": 2.2107349306829353e-06, + "loss": 0.0284, + "step": 29019 + }, + { + "epoch": 79.07356948228883, + "grad_norm": 4.472661972045898, + "learning_rate": 2.2101815351989766e-06, + "loss": 0.0522, + "step": 29020 + }, + { + "epoch": 79.07629427792915, + "grad_norm": 3.3279480934143066, + "learning_rate": 2.2096282003818727e-06, + "loss": 0.1035, + "step": 29021 + }, + { + "epoch": 79.07901907356948, + "grad_norm": 3.8901562690734863, + "learning_rate": 2.2090749262359335e-06, + "loss": 0.0403, + "step": 29022 + }, + { + "epoch": 79.0817438692098, + "grad_norm": 1.69046950340271, + "learning_rate": 2.2085217127654667e-06, + "loss": 0.0228, + "step": 29023 + }, + { + "epoch": 79.08446866485014, + "grad_norm": 2.8504533767700195, + "learning_rate": 2.2079685599747836e-06, + "loss": 0.0438, + "step": 29024 + }, + { + "epoch": 79.08719346049047, + "grad_norm": 2.222036838531494, + "learning_rate": 2.2074154678681915e-06, + "loss": 0.0285, + "step": 29025 + }, + { + "epoch": 79.08991825613079, + "grad_norm": 2.6852304935455322, + "learning_rate": 2.2068624364499923e-06, + "loss": 0.0382, + "step": 29026 + }, + { + "epoch": 79.09264305177112, + "grad_norm": 4.05474328994751, + "learning_rate": 2.2063094657245023e-06, + "loss": 0.1143, + "step": 29027 + }, + { + "epoch": 79.09536784741144, + "grad_norm": 1.4751938581466675, + "learning_rate": 2.2057565556960224e-06, + "loss": 0.0177, + "step": 29028 + }, + { + "epoch": 79.09809264305177, + "grad_norm": 2.09287428855896, + "learning_rate": 2.20520370636886e-06, + "loss": 0.0433, + "step": 29029 + }, + { + "epoch": 79.1008174386921, + "grad_norm": 2.2168161869049072, + "learning_rate": 2.2046509177473172e-06, + "loss": 0.0314, + "step": 29030 + }, + { + "epoch": 79.10354223433242, + "grad_norm": 3.78035831451416, + "learning_rate": 2.204098189835705e-06, + "loss": 0.0625, + "step": 29031 + }, + { + "epoch": 79.10626702997276, + "grad_norm": 3.029510498046875, + "learning_rate": 2.203545522638326e-06, + "loss": 0.0353, + "step": 29032 + }, + { + "epoch": 79.10899182561307, + "grad_norm": 2.7755277156829834, + "learning_rate": 2.2029929161594832e-06, + "loss": 0.0292, + "step": 29033 + }, + { + "epoch": 79.11171662125341, + "grad_norm": 3.479027271270752, + "learning_rate": 2.202440370403477e-06, + "loss": 0.0337, + "step": 29034 + }, + { + "epoch": 79.11444141689373, + "grad_norm": 2.9710240364074707, + "learning_rate": 2.201887885374615e-06, + "loss": 0.0308, + "step": 29035 + }, + { + "epoch": 79.11716621253406, + "grad_norm": 2.7454752922058105, + "learning_rate": 2.201335461077201e-06, + "loss": 0.0461, + "step": 29036 + }, + { + "epoch": 79.11989100817439, + "grad_norm": 2.8812928199768066, + "learning_rate": 2.2007830975155366e-06, + "loss": 0.0292, + "step": 29037 + }, + { + "epoch": 79.12261580381471, + "grad_norm": 2.9671459197998047, + "learning_rate": 2.200230794693922e-06, + "loss": 0.0419, + "step": 29038 + }, + { + "epoch": 79.12534059945504, + "grad_norm": 2.3303415775299072, + "learning_rate": 2.1996785526166565e-06, + "loss": 0.0708, + "step": 29039 + }, + { + "epoch": 79.12806539509536, + "grad_norm": 3.224896192550659, + "learning_rate": 2.199126371288045e-06, + "loss": 0.0468, + "step": 29040 + }, + { + "epoch": 79.1307901907357, + "grad_norm": 2.227735996246338, + "learning_rate": 2.1985742507123873e-06, + "loss": 0.0241, + "step": 29041 + }, + { + "epoch": 79.13351498637603, + "grad_norm": 2.878380060195923, + "learning_rate": 2.1980221908939812e-06, + "loss": 0.0379, + "step": 29042 + }, + { + "epoch": 79.13623978201635, + "grad_norm": 2.451493501663208, + "learning_rate": 2.1974701918371253e-06, + "loss": 0.0975, + "step": 29043 + }, + { + "epoch": 79.13896457765668, + "grad_norm": 3.162177085876465, + "learning_rate": 2.196918253546123e-06, + "loss": 0.0339, + "step": 29044 + }, + { + "epoch": 79.141689373297, + "grad_norm": 2.534670829772949, + "learning_rate": 2.1963663760252706e-06, + "loss": 0.0399, + "step": 29045 + }, + { + "epoch": 79.14441416893733, + "grad_norm": 2.1600096225738525, + "learning_rate": 2.195814559278866e-06, + "loss": 0.063, + "step": 29046 + }, + { + "epoch": 79.14713896457765, + "grad_norm": 2.6848669052124023, + "learning_rate": 2.1952628033112023e-06, + "loss": 0.0931, + "step": 29047 + }, + { + "epoch": 79.14986376021798, + "grad_norm": 3.757939100265503, + "learning_rate": 2.194711108126585e-06, + "loss": 0.0976, + "step": 29048 + }, + { + "epoch": 79.15258855585832, + "grad_norm": 2.2765674591064453, + "learning_rate": 2.1941594737293046e-06, + "loss": 0.0368, + "step": 29049 + }, + { + "epoch": 79.15531335149863, + "grad_norm": 2.605943202972412, + "learning_rate": 2.193607900123658e-06, + "loss": 0.0335, + "step": 29050 + }, + { + "epoch": 79.15803814713897, + "grad_norm": 4.46356725692749, + "learning_rate": 2.193056387313943e-06, + "loss": 0.0785, + "step": 29051 + }, + { + "epoch": 79.16076294277929, + "grad_norm": 2.3422508239746094, + "learning_rate": 2.1925049353044516e-06, + "loss": 0.0585, + "step": 29052 + }, + { + "epoch": 79.16348773841962, + "grad_norm": 3.4779980182647705, + "learning_rate": 2.191953544099483e-06, + "loss": 0.1004, + "step": 29053 + }, + { + "epoch": 79.16621253405995, + "grad_norm": 3.1119022369384766, + "learning_rate": 2.1914022137033298e-06, + "loss": 0.1381, + "step": 29054 + }, + { + "epoch": 79.16893732970027, + "grad_norm": 3.0909368991851807, + "learning_rate": 2.1908509441202808e-06, + "loss": 0.0669, + "step": 29055 + }, + { + "epoch": 79.1716621253406, + "grad_norm": 2.227065324783325, + "learning_rate": 2.1902997353546375e-06, + "loss": 0.2358, + "step": 29056 + }, + { + "epoch": 79.17438692098092, + "grad_norm": 2.804032325744629, + "learning_rate": 2.189748587410687e-06, + "loss": 0.0848, + "step": 29057 + }, + { + "epoch": 79.17711171662125, + "grad_norm": 3.4174256324768066, + "learning_rate": 2.1891975002927235e-06, + "loss": 0.0597, + "step": 29058 + }, + { + "epoch": 79.17983651226157, + "grad_norm": 2.1053144931793213, + "learning_rate": 2.188646474005036e-06, + "loss": 0.0192, + "step": 29059 + }, + { + "epoch": 79.1825613079019, + "grad_norm": 2.635653018951416, + "learning_rate": 2.1880955085519217e-06, + "loss": 0.0849, + "step": 29060 + }, + { + "epoch": 79.18528610354224, + "grad_norm": 2.9646215438842773, + "learning_rate": 2.187544603937668e-06, + "loss": 0.0521, + "step": 29061 + }, + { + "epoch": 79.18801089918256, + "grad_norm": 2.1120166778564453, + "learning_rate": 2.1869937601665646e-06, + "loss": 0.0343, + "step": 29062 + }, + { + "epoch": 79.19073569482289, + "grad_norm": 4.583893299102783, + "learning_rate": 2.1864429772428997e-06, + "loss": 0.0392, + "step": 29063 + }, + { + "epoch": 79.19346049046321, + "grad_norm": 3.6696221828460693, + "learning_rate": 2.1858922551709694e-06, + "loss": 0.0763, + "step": 29064 + }, + { + "epoch": 79.19618528610354, + "grad_norm": 4.0118794441223145, + "learning_rate": 2.1853415939550572e-06, + "loss": 0.0663, + "step": 29065 + }, + { + "epoch": 79.19891008174388, + "grad_norm": 3.1027932167053223, + "learning_rate": 2.1847909935994538e-06, + "loss": 0.2138, + "step": 29066 + }, + { + "epoch": 79.2016348773842, + "grad_norm": 2.924137592315674, + "learning_rate": 2.1842404541084437e-06, + "loss": 0.1047, + "step": 29067 + }, + { + "epoch": 79.20435967302453, + "grad_norm": 2.2442281246185303, + "learning_rate": 2.1836899754863207e-06, + "loss": 0.0331, + "step": 29068 + }, + { + "epoch": 79.20708446866485, + "grad_norm": 2.7856338024139404, + "learning_rate": 2.183139557737368e-06, + "loss": 0.1887, + "step": 29069 + }, + { + "epoch": 79.20980926430518, + "grad_norm": 3.261448860168457, + "learning_rate": 2.18258920086587e-06, + "loss": 0.0935, + "step": 29070 + }, + { + "epoch": 79.2125340599455, + "grad_norm": 3.122056007385254, + "learning_rate": 2.1820389048761172e-06, + "loss": 0.0446, + "step": 29071 + }, + { + "epoch": 79.21525885558583, + "grad_norm": 3.940288782119751, + "learning_rate": 2.1814886697723946e-06, + "loss": 0.0401, + "step": 29072 + }, + { + "epoch": 79.21798365122616, + "grad_norm": 1.80351722240448, + "learning_rate": 2.1809384955589873e-06, + "loss": 0.0308, + "step": 29073 + }, + { + "epoch": 79.22070844686648, + "grad_norm": 3.1186141967773438, + "learning_rate": 2.1803883822401795e-06, + "loss": 0.0462, + "step": 29074 + }, + { + "epoch": 79.22343324250681, + "grad_norm": 2.8939812183380127, + "learning_rate": 2.1798383298202518e-06, + "loss": 0.0986, + "step": 29075 + }, + { + "epoch": 79.22615803814713, + "grad_norm": 2.034874677658081, + "learning_rate": 2.1792883383034956e-06, + "loss": 0.0211, + "step": 29076 + }, + { + "epoch": 79.22888283378747, + "grad_norm": 2.3820343017578125, + "learning_rate": 2.1787384076941897e-06, + "loss": 0.1199, + "step": 29077 + }, + { + "epoch": 79.2316076294278, + "grad_norm": 3.194413185119629, + "learning_rate": 2.1781885379966173e-06, + "loss": 0.0778, + "step": 29078 + }, + { + "epoch": 79.23433242506812, + "grad_norm": 2.6934423446655273, + "learning_rate": 2.177638729215057e-06, + "loss": 0.0881, + "step": 29079 + }, + { + "epoch": 79.23705722070845, + "grad_norm": 2.2399747371673584, + "learning_rate": 2.177088981353799e-06, + "loss": 0.0457, + "step": 29080 + }, + { + "epoch": 79.23978201634877, + "grad_norm": 2.8372128009796143, + "learning_rate": 2.1765392944171183e-06, + "loss": 0.0607, + "step": 29081 + }, + { + "epoch": 79.2425068119891, + "grad_norm": 2.8705480098724365, + "learning_rate": 2.1759896684092997e-06, + "loss": 0.0499, + "step": 29082 + }, + { + "epoch": 79.24523160762942, + "grad_norm": 2.626051187515259, + "learning_rate": 2.1754401033346172e-06, + "loss": 0.1157, + "step": 29083 + }, + { + "epoch": 79.24795640326975, + "grad_norm": 2.2016239166259766, + "learning_rate": 2.174890599197359e-06, + "loss": 0.0901, + "step": 29084 + }, + { + "epoch": 79.25068119891009, + "grad_norm": 2.451127290725708, + "learning_rate": 2.174341156001801e-06, + "loss": 0.0398, + "step": 29085 + }, + { + "epoch": 79.2534059945504, + "grad_norm": 2.5305445194244385, + "learning_rate": 2.173791773752223e-06, + "loss": 0.0375, + "step": 29086 + }, + { + "epoch": 79.25613079019074, + "grad_norm": 3.7565362453460693, + "learning_rate": 2.1732424524528984e-06, + "loss": 0.088, + "step": 29087 + }, + { + "epoch": 79.25885558583106, + "grad_norm": 4.2690534591674805, + "learning_rate": 2.172693192108111e-06, + "loss": 0.0655, + "step": 29088 + }, + { + "epoch": 79.26158038147139, + "grad_norm": 3.4888193607330322, + "learning_rate": 2.1721439927221386e-06, + "loss": 0.0292, + "step": 29089 + }, + { + "epoch": 79.26430517711172, + "grad_norm": 2.0520920753479004, + "learning_rate": 2.1715948542992583e-06, + "loss": 0.0201, + "step": 29090 + }, + { + "epoch": 79.26702997275204, + "grad_norm": 2.751879930496216, + "learning_rate": 2.171045776843742e-06, + "loss": 0.0403, + "step": 29091 + }, + { + "epoch": 79.26975476839237, + "grad_norm": 2.667137861251831, + "learning_rate": 2.1704967603598716e-06, + "loss": 0.1036, + "step": 29092 + }, + { + "epoch": 79.2724795640327, + "grad_norm": 2.8200252056121826, + "learning_rate": 2.1699478048519207e-06, + "loss": 0.033, + "step": 29093 + }, + { + "epoch": 79.27520435967303, + "grad_norm": 2.055072069168091, + "learning_rate": 2.169398910324164e-06, + "loss": 0.0403, + "step": 29094 + }, + { + "epoch": 79.27792915531334, + "grad_norm": 2.743004560470581, + "learning_rate": 2.168850076780874e-06, + "loss": 0.0383, + "step": 29095 + }, + { + "epoch": 79.28065395095368, + "grad_norm": 3.5729358196258545, + "learning_rate": 2.1683013042263303e-06, + "loss": 0.0657, + "step": 29096 + }, + { + "epoch": 79.28337874659401, + "grad_norm": 2.585911273956299, + "learning_rate": 2.1677525926648046e-06, + "loss": 0.0852, + "step": 29097 + }, + { + "epoch": 79.28610354223433, + "grad_norm": 2.3793601989746094, + "learning_rate": 2.1672039421005685e-06, + "loss": 0.0654, + "step": 29098 + }, + { + "epoch": 79.28882833787466, + "grad_norm": 4.038046836853027, + "learning_rate": 2.166655352537894e-06, + "loss": 0.0373, + "step": 29099 + }, + { + "epoch": 79.29155313351498, + "grad_norm": 2.678459644317627, + "learning_rate": 2.166106823981058e-06, + "loss": 0.109, + "step": 29100 + }, + { + "epoch": 79.29427792915531, + "grad_norm": 1.7455143928527832, + "learning_rate": 2.1655583564343295e-06, + "loss": 0.0164, + "step": 29101 + }, + { + "epoch": 79.29700272479565, + "grad_norm": 3.4639203548431396, + "learning_rate": 2.1650099499019817e-06, + "loss": 0.1119, + "step": 29102 + }, + { + "epoch": 79.29972752043597, + "grad_norm": 2.804391384124756, + "learning_rate": 2.1644616043882806e-06, + "loss": 0.0621, + "step": 29103 + }, + { + "epoch": 79.3024523160763, + "grad_norm": 2.591519594192505, + "learning_rate": 2.1639133198975003e-06, + "loss": 0.146, + "step": 29104 + }, + { + "epoch": 79.30517711171662, + "grad_norm": 3.3030831813812256, + "learning_rate": 2.1633650964339137e-06, + "loss": 0.032, + "step": 29105 + }, + { + "epoch": 79.30790190735695, + "grad_norm": 2.8341338634490967, + "learning_rate": 2.162816934001787e-06, + "loss": 0.0371, + "step": 29106 + }, + { + "epoch": 79.31062670299727, + "grad_norm": 2.3924429416656494, + "learning_rate": 2.162268832605391e-06, + "loss": 0.1243, + "step": 29107 + }, + { + "epoch": 79.3133514986376, + "grad_norm": 1.8220769166946411, + "learning_rate": 2.161720792248989e-06, + "loss": 0.0221, + "step": 29108 + }, + { + "epoch": 79.31607629427793, + "grad_norm": 2.4537875652313232, + "learning_rate": 2.161172812936857e-06, + "loss": 0.0321, + "step": 29109 + }, + { + "epoch": 79.31880108991825, + "grad_norm": 2.5680668354034424, + "learning_rate": 2.1606248946732578e-06, + "loss": 0.1026, + "step": 29110 + }, + { + "epoch": 79.32152588555859, + "grad_norm": 2.7012076377868652, + "learning_rate": 2.1600770374624604e-06, + "loss": 0.1166, + "step": 29111 + }, + { + "epoch": 79.3242506811989, + "grad_norm": 2.6602818965911865, + "learning_rate": 2.1595292413087277e-06, + "loss": 0.1375, + "step": 29112 + }, + { + "epoch": 79.32697547683924, + "grad_norm": 2.554255247116089, + "learning_rate": 2.1589815062163323e-06, + "loss": 0.0615, + "step": 29113 + }, + { + "epoch": 79.32970027247957, + "grad_norm": 2.9622340202331543, + "learning_rate": 2.1584338321895358e-06, + "loss": 0.0338, + "step": 29114 + }, + { + "epoch": 79.33242506811989, + "grad_norm": 2.0364558696746826, + "learning_rate": 2.157886219232601e-06, + "loss": 0.1146, + "step": 29115 + }, + { + "epoch": 79.33514986376022, + "grad_norm": 2.6309211254119873, + "learning_rate": 2.1573386673498e-06, + "loss": 0.039, + "step": 29116 + }, + { + "epoch": 79.33787465940054, + "grad_norm": 2.2014896869659424, + "learning_rate": 2.156791176545392e-06, + "loss": 0.027, + "step": 29117 + }, + { + "epoch": 79.34059945504087, + "grad_norm": 2.404651165008545, + "learning_rate": 2.156243746823643e-06, + "loss": 0.1221, + "step": 29118 + }, + { + "epoch": 79.34332425068119, + "grad_norm": 3.56484055519104, + "learning_rate": 2.155696378188812e-06, + "loss": 0.0547, + "step": 29119 + }, + { + "epoch": 79.34604904632153, + "grad_norm": 3.12198543548584, + "learning_rate": 2.155149070645167e-06, + "loss": 0.0602, + "step": 29120 + }, + { + "epoch": 79.34877384196186, + "grad_norm": 3.3931684494018555, + "learning_rate": 2.154601824196967e-06, + "loss": 0.1492, + "step": 29121 + }, + { + "epoch": 79.35149863760218, + "grad_norm": 2.0469658374786377, + "learning_rate": 2.1540546388484774e-06, + "loss": 0.0331, + "step": 29122 + }, + { + "epoch": 79.35422343324251, + "grad_norm": 2.0167696475982666, + "learning_rate": 2.1535075146039575e-06, + "loss": 0.1011, + "step": 29123 + }, + { + "epoch": 79.35694822888283, + "grad_norm": 2.6373302936553955, + "learning_rate": 2.152960451467667e-06, + "loss": 0.0665, + "step": 29124 + }, + { + "epoch": 79.35967302452316, + "grad_norm": 3.410719394683838, + "learning_rate": 2.1524134494438697e-06, + "loss": 0.0636, + "step": 29125 + }, + { + "epoch": 79.3623978201635, + "grad_norm": 3.731895923614502, + "learning_rate": 2.151866508536824e-06, + "loss": 0.0741, + "step": 29126 + }, + { + "epoch": 79.36512261580381, + "grad_norm": 4.988549709320068, + "learning_rate": 2.1513196287507898e-06, + "loss": 0.1301, + "step": 29127 + }, + { + "epoch": 79.36784741144415, + "grad_norm": 2.221756935119629, + "learning_rate": 2.1507728100900227e-06, + "loss": 0.0324, + "step": 29128 + }, + { + "epoch": 79.37057220708446, + "grad_norm": 2.468036413192749, + "learning_rate": 2.150226052558787e-06, + "loss": 0.0732, + "step": 29129 + }, + { + "epoch": 79.3732970027248, + "grad_norm": 2.1339199542999268, + "learning_rate": 2.149679356161338e-06, + "loss": 0.0281, + "step": 29130 + }, + { + "epoch": 79.37602179836512, + "grad_norm": 3.1965534687042236, + "learning_rate": 2.1491327209019342e-06, + "loss": 0.0666, + "step": 29131 + }, + { + "epoch": 79.37874659400545, + "grad_norm": 2.404315710067749, + "learning_rate": 2.148586146784829e-06, + "loss": 0.03, + "step": 29132 + }, + { + "epoch": 79.38147138964578, + "grad_norm": 2.7038164138793945, + "learning_rate": 2.148039633814285e-06, + "loss": 0.055, + "step": 29133 + }, + { + "epoch": 79.3841961852861, + "grad_norm": 4.145355701446533, + "learning_rate": 2.1474931819945555e-06, + "loss": 0.1405, + "step": 29134 + }, + { + "epoch": 79.38692098092643, + "grad_norm": 3.433864116668701, + "learning_rate": 2.1469467913298937e-06, + "loss": 0.0691, + "step": 29135 + }, + { + "epoch": 79.38964577656675, + "grad_norm": 3.0650908946990967, + "learning_rate": 2.1464004618245605e-06, + "loss": 0.0622, + "step": 29136 + }, + { + "epoch": 79.39237057220708, + "grad_norm": 4.756199359893799, + "learning_rate": 2.145854193482807e-06, + "loss": 0.1613, + "step": 29137 + }, + { + "epoch": 79.39509536784742, + "grad_norm": 3.309528350830078, + "learning_rate": 2.1453079863088888e-06, + "loss": 0.0246, + "step": 29138 + }, + { + "epoch": 79.39782016348774, + "grad_norm": 2.56789231300354, + "learning_rate": 2.144761840307057e-06, + "loss": 0.0788, + "step": 29139 + }, + { + "epoch": 79.40054495912807, + "grad_norm": 2.227259397506714, + "learning_rate": 2.1442157554815656e-06, + "loss": 0.0305, + "step": 29140 + }, + { + "epoch": 79.40326975476839, + "grad_norm": 3.5943763256073, + "learning_rate": 2.143669731836673e-06, + "loss": 0.0455, + "step": 29141 + }, + { + "epoch": 79.40599455040872, + "grad_norm": 2.7709333896636963, + "learning_rate": 2.1431237693766273e-06, + "loss": 0.0406, + "step": 29142 + }, + { + "epoch": 79.40871934604904, + "grad_norm": 3.2980639934539795, + "learning_rate": 2.1425778681056807e-06, + "loss": 0.0305, + "step": 29143 + }, + { + "epoch": 79.41144414168937, + "grad_norm": 2.189328908920288, + "learning_rate": 2.1420320280280827e-06, + "loss": 0.0328, + "step": 29144 + }, + { + "epoch": 79.4141689373297, + "grad_norm": 2.6904215812683105, + "learning_rate": 2.141486249148089e-06, + "loss": 0.1377, + "step": 29145 + }, + { + "epoch": 79.41689373297002, + "grad_norm": 2.8595118522644043, + "learning_rate": 2.1409405314699473e-06, + "loss": 0.0589, + "step": 29146 + }, + { + "epoch": 79.41961852861036, + "grad_norm": 4.642414569854736, + "learning_rate": 2.1403948749979074e-06, + "loss": 0.1823, + "step": 29147 + }, + { + "epoch": 79.42234332425068, + "grad_norm": 2.5312201976776123, + "learning_rate": 2.139849279736217e-06, + "loss": 0.0408, + "step": 29148 + }, + { + "epoch": 79.42506811989101, + "grad_norm": 5.1673054695129395, + "learning_rate": 2.13930374568913e-06, + "loss": 0.0455, + "step": 29149 + }, + { + "epoch": 79.42779291553134, + "grad_norm": 3.4629383087158203, + "learning_rate": 2.1387582728608913e-06, + "loss": 0.1931, + "step": 29150 + }, + { + "epoch": 79.43051771117166, + "grad_norm": 4.233945369720459, + "learning_rate": 2.138212861255752e-06, + "loss": 0.0495, + "step": 29151 + }, + { + "epoch": 79.433242506812, + "grad_norm": 2.226323366165161, + "learning_rate": 2.1376675108779543e-06, + "loss": 0.0334, + "step": 29152 + }, + { + "epoch": 79.43596730245231, + "grad_norm": 2.4665186405181885, + "learning_rate": 2.137122221731751e-06, + "loss": 0.0258, + "step": 29153 + }, + { + "epoch": 79.43869209809264, + "grad_norm": 3.466925859451294, + "learning_rate": 2.1365769938213876e-06, + "loss": 0.082, + "step": 29154 + }, + { + "epoch": 79.44141689373296, + "grad_norm": 3.4934182167053223, + "learning_rate": 2.1360318271511093e-06, + "loss": 0.0447, + "step": 29155 + }, + { + "epoch": 79.4441416893733, + "grad_norm": 2.2688581943511963, + "learning_rate": 2.1354867217251573e-06, + "loss": 0.0279, + "step": 29156 + }, + { + "epoch": 79.44686648501363, + "grad_norm": 3.084193468093872, + "learning_rate": 2.134941677547786e-06, + "loss": 0.2089, + "step": 29157 + }, + { + "epoch": 79.44959128065395, + "grad_norm": 3.214845895767212, + "learning_rate": 2.1343966946232366e-06, + "loss": 0.1284, + "step": 29158 + }, + { + "epoch": 79.45231607629428, + "grad_norm": 3.1596949100494385, + "learning_rate": 2.1338517729557517e-06, + "loss": 0.0695, + "step": 29159 + }, + { + "epoch": 79.4550408719346, + "grad_norm": 3.507193088531494, + "learning_rate": 2.133306912549574e-06, + "loss": 0.0547, + "step": 29160 + }, + { + "epoch": 79.45776566757493, + "grad_norm": 2.546586275100708, + "learning_rate": 2.1327621134089516e-06, + "loss": 0.0667, + "step": 29161 + }, + { + "epoch": 79.46049046321527, + "grad_norm": 2.6235101222991943, + "learning_rate": 2.132217375538125e-06, + "loss": 0.0511, + "step": 29162 + }, + { + "epoch": 79.46321525885558, + "grad_norm": 2.8926868438720703, + "learning_rate": 2.131672698941335e-06, + "loss": 0.0505, + "step": 29163 + }, + { + "epoch": 79.46594005449592, + "grad_norm": 2.8754851818084717, + "learning_rate": 2.131128083622823e-06, + "loss": 0.1188, + "step": 29164 + }, + { + "epoch": 79.46866485013624, + "grad_norm": 3.165276288986206, + "learning_rate": 2.130583529586835e-06, + "loss": 0.0711, + "step": 29165 + }, + { + "epoch": 79.47138964577657, + "grad_norm": 2.14923095703125, + "learning_rate": 2.130039036837609e-06, + "loss": 0.0497, + "step": 29166 + }, + { + "epoch": 79.47411444141689, + "grad_norm": 3.854116916656494, + "learning_rate": 2.129494605379385e-06, + "loss": 0.0619, + "step": 29167 + }, + { + "epoch": 79.47683923705722, + "grad_norm": 3.4426791667938232, + "learning_rate": 2.1289502352164015e-06, + "loss": 0.0559, + "step": 29168 + }, + { + "epoch": 79.47956403269755, + "grad_norm": 2.8873674869537354, + "learning_rate": 2.1284059263529035e-06, + "loss": 0.1437, + "step": 29169 + }, + { + "epoch": 79.48228882833787, + "grad_norm": 5.089114665985107, + "learning_rate": 2.127861678793126e-06, + "loss": 0.0796, + "step": 29170 + }, + { + "epoch": 79.4850136239782, + "grad_norm": 3.037562847137451, + "learning_rate": 2.1273174925413086e-06, + "loss": 0.0414, + "step": 29171 + }, + { + "epoch": 79.48773841961852, + "grad_norm": 1.9644275903701782, + "learning_rate": 2.126773367601688e-06, + "loss": 0.0197, + "step": 29172 + }, + { + "epoch": 79.49046321525886, + "grad_norm": 4.938040733337402, + "learning_rate": 2.126229303978501e-06, + "loss": 0.0354, + "step": 29173 + }, + { + "epoch": 79.49318801089919, + "grad_norm": 3.319546699523926, + "learning_rate": 2.1256853016759905e-06, + "loss": 0.0453, + "step": 29174 + }, + { + "epoch": 79.49591280653951, + "grad_norm": 1.9399495124816895, + "learning_rate": 2.1251413606983883e-06, + "loss": 0.0294, + "step": 29175 + }, + { + "epoch": 79.49863760217984, + "grad_norm": 3.333191394805908, + "learning_rate": 2.1245974810499326e-06, + "loss": 0.0894, + "step": 29176 + }, + { + "epoch": 79.50136239782016, + "grad_norm": 3.9922356605529785, + "learning_rate": 2.1240536627348553e-06, + "loss": 0.0325, + "step": 29177 + }, + { + "epoch": 79.50408719346049, + "grad_norm": 5.769985675811768, + "learning_rate": 2.1235099057573973e-06, + "loss": 0.0434, + "step": 29178 + }, + { + "epoch": 79.50681198910081, + "grad_norm": 2.921860933303833, + "learning_rate": 2.122966210121791e-06, + "loss": 0.0347, + "step": 29179 + }, + { + "epoch": 79.50953678474114, + "grad_norm": 2.8392391204833984, + "learning_rate": 2.122422575832267e-06, + "loss": 0.1007, + "step": 29180 + }, + { + "epoch": 79.51226158038148, + "grad_norm": 1.9620262384414673, + "learning_rate": 2.1218790028930656e-06, + "loss": 0.0259, + "step": 29181 + }, + { + "epoch": 79.5149863760218, + "grad_norm": 3.7188425064086914, + "learning_rate": 2.121335491308417e-06, + "loss": 0.2629, + "step": 29182 + }, + { + "epoch": 79.51771117166213, + "grad_norm": 2.0695464611053467, + "learning_rate": 2.1207920410825543e-06, + "loss": 0.2256, + "step": 29183 + }, + { + "epoch": 79.52043596730245, + "grad_norm": 1.73047935962677, + "learning_rate": 2.1202486522197063e-06, + "loss": 0.0408, + "step": 29184 + }, + { + "epoch": 79.52316076294278, + "grad_norm": 3.2469305992126465, + "learning_rate": 2.1197053247241116e-06, + "loss": 0.0928, + "step": 29185 + }, + { + "epoch": 79.52588555858311, + "grad_norm": 2.568074941635132, + "learning_rate": 2.1191620585999973e-06, + "loss": 0.0375, + "step": 29186 + }, + { + "epoch": 79.52861035422343, + "grad_norm": 3.095752000808716, + "learning_rate": 2.1186188538515964e-06, + "loss": 0.055, + "step": 29187 + }, + { + "epoch": 79.53133514986376, + "grad_norm": 1.5512783527374268, + "learning_rate": 2.118075710483134e-06, + "loss": 0.0317, + "step": 29188 + }, + { + "epoch": 79.53405994550408, + "grad_norm": 5.7658491134643555, + "learning_rate": 2.117532628498847e-06, + "loss": 0.0593, + "step": 29189 + }, + { + "epoch": 79.53678474114442, + "grad_norm": 4.0881028175354, + "learning_rate": 2.1169896079029607e-06, + "loss": 0.1097, + "step": 29190 + }, + { + "epoch": 79.53950953678473, + "grad_norm": 2.010342597961426, + "learning_rate": 2.116446648699708e-06, + "loss": 0.0211, + "step": 29191 + }, + { + "epoch": 79.54223433242507, + "grad_norm": 3.401838779449463, + "learning_rate": 2.1159037508933154e-06, + "loss": 0.1001, + "step": 29192 + }, + { + "epoch": 79.5449591280654, + "grad_norm": 4.027714252471924, + "learning_rate": 2.115360914488007e-06, + "loss": 0.3034, + "step": 29193 + }, + { + "epoch": 79.54768392370572, + "grad_norm": 3.6595537662506104, + "learning_rate": 2.1148181394880175e-06, + "loss": 0.106, + "step": 29194 + }, + { + "epoch": 79.55040871934605, + "grad_norm": 2.499828577041626, + "learning_rate": 2.1142754258975707e-06, + "loss": 0.0348, + "step": 29195 + }, + { + "epoch": 79.55313351498637, + "grad_norm": 1.8060368299484253, + "learning_rate": 2.1137327737208923e-06, + "loss": 0.034, + "step": 29196 + }, + { + "epoch": 79.5558583106267, + "grad_norm": 3.0636634826660156, + "learning_rate": 2.113190182962207e-06, + "loss": 0.0957, + "step": 29197 + }, + { + "epoch": 79.55858310626704, + "grad_norm": 2.7108492851257324, + "learning_rate": 2.1126476536257446e-06, + "loss": 0.0936, + "step": 29198 + }, + { + "epoch": 79.56130790190736, + "grad_norm": 2.1519253253936768, + "learning_rate": 2.1121051857157294e-06, + "loss": 0.0663, + "step": 29199 + }, + { + "epoch": 79.56403269754769, + "grad_norm": 5.154918193817139, + "learning_rate": 2.1115627792363823e-06, + "loss": 0.0338, + "step": 29200 + }, + { + "epoch": 79.566757493188, + "grad_norm": 2.4038360118865967, + "learning_rate": 2.1110204341919326e-06, + "loss": 0.0319, + "step": 29201 + }, + { + "epoch": 79.56948228882834, + "grad_norm": 2.6924593448638916, + "learning_rate": 2.110478150586602e-06, + "loss": 0.0351, + "step": 29202 + }, + { + "epoch": 79.57220708446866, + "grad_norm": 3.1435282230377197, + "learning_rate": 2.1099359284246144e-06, + "loss": 0.1325, + "step": 29203 + }, + { + "epoch": 79.57493188010899, + "grad_norm": 2.6756949424743652, + "learning_rate": 2.1093937677101884e-06, + "loss": 0.0564, + "step": 29204 + }, + { + "epoch": 79.57765667574932, + "grad_norm": 2.745969295501709, + "learning_rate": 2.1088516684475526e-06, + "loss": 0.0586, + "step": 29205 + }, + { + "epoch": 79.58038147138964, + "grad_norm": 1.9606775045394897, + "learning_rate": 2.1083096306409255e-06, + "loss": 0.0497, + "step": 29206 + }, + { + "epoch": 79.58310626702998, + "grad_norm": 4.065126895904541, + "learning_rate": 2.107767654294528e-06, + "loss": 0.1034, + "step": 29207 + }, + { + "epoch": 79.5858310626703, + "grad_norm": 3.9425268173217773, + "learning_rate": 2.1072257394125828e-06, + "loss": 0.0369, + "step": 29208 + }, + { + "epoch": 79.58855585831063, + "grad_norm": 2.6867868900299072, + "learning_rate": 2.106683885999308e-06, + "loss": 0.0343, + "step": 29209 + }, + { + "epoch": 79.59128065395096, + "grad_norm": 2.64862322807312, + "learning_rate": 2.1061420940589273e-06, + "loss": 0.1393, + "step": 29210 + }, + { + "epoch": 79.59400544959128, + "grad_norm": 4.8482985496521, + "learning_rate": 2.105600363595658e-06, + "loss": 0.1981, + "step": 29211 + }, + { + "epoch": 79.59673024523161, + "grad_norm": 3.8815159797668457, + "learning_rate": 2.1050586946137184e-06, + "loss": 0.0601, + "step": 29212 + }, + { + "epoch": 79.59945504087193, + "grad_norm": 2.8104629516601562, + "learning_rate": 2.104517087117326e-06, + "loss": 0.0347, + "step": 29213 + }, + { + "epoch": 79.60217983651226, + "grad_norm": 7.704208850860596, + "learning_rate": 2.1039755411107023e-06, + "loss": 0.0697, + "step": 29214 + }, + { + "epoch": 79.60490463215258, + "grad_norm": 2.3880417346954346, + "learning_rate": 2.1034340565980636e-06, + "loss": 0.0347, + "step": 29215 + }, + { + "epoch": 79.60762942779292, + "grad_norm": 3.6737351417541504, + "learning_rate": 2.1028926335836253e-06, + "loss": 0.0532, + "step": 29216 + }, + { + "epoch": 79.61035422343325, + "grad_norm": 2.6531341075897217, + "learning_rate": 2.1023512720716033e-06, + "loss": 0.046, + "step": 29217 + }, + { + "epoch": 79.61307901907357, + "grad_norm": 4.844764232635498, + "learning_rate": 2.1018099720662178e-06, + "loss": 0.0858, + "step": 29218 + }, + { + "epoch": 79.6158038147139, + "grad_norm": 2.7919328212738037, + "learning_rate": 2.101268733571682e-06, + "loss": 0.1226, + "step": 29219 + }, + { + "epoch": 79.61852861035422, + "grad_norm": 3.199812173843384, + "learning_rate": 2.100727556592211e-06, + "loss": 0.0742, + "step": 29220 + }, + { + "epoch": 79.62125340599455, + "grad_norm": 2.56154465675354, + "learning_rate": 2.1001864411320174e-06, + "loss": 0.0378, + "step": 29221 + }, + { + "epoch": 79.62397820163488, + "grad_norm": 2.337373733520508, + "learning_rate": 2.0996453871953192e-06, + "loss": 0.1088, + "step": 29222 + }, + { + "epoch": 79.6267029972752, + "grad_norm": 3.0385773181915283, + "learning_rate": 2.0991043947863286e-06, + "loss": 0.1082, + "step": 29223 + }, + { + "epoch": 79.62942779291554, + "grad_norm": 2.6796576976776123, + "learning_rate": 2.0985634639092567e-06, + "loss": 0.0307, + "step": 29224 + }, + { + "epoch": 79.63215258855585, + "grad_norm": 1.8098124265670776, + "learning_rate": 2.0980225945683185e-06, + "loss": 0.0279, + "step": 29225 + }, + { + "epoch": 79.63487738419619, + "grad_norm": 3.3715479373931885, + "learning_rate": 2.097481786767728e-06, + "loss": 0.1815, + "step": 29226 + }, + { + "epoch": 79.6376021798365, + "grad_norm": 2.9014835357666016, + "learning_rate": 2.096941040511695e-06, + "loss": 0.0264, + "step": 29227 + }, + { + "epoch": 79.64032697547684, + "grad_norm": 3.4781887531280518, + "learning_rate": 2.096400355804431e-06, + "loss": 0.0574, + "step": 29228 + }, + { + "epoch": 79.64305177111717, + "grad_norm": 2.586890459060669, + "learning_rate": 2.095859732650144e-06, + "loss": 0.1218, + "step": 29229 + }, + { + "epoch": 79.64577656675749, + "grad_norm": 2.3006093502044678, + "learning_rate": 2.0953191710530495e-06, + "loss": 0.1917, + "step": 29230 + }, + { + "epoch": 79.64850136239782, + "grad_norm": 2.843937873840332, + "learning_rate": 2.0947786710173545e-06, + "loss": 0.074, + "step": 29231 + }, + { + "epoch": 79.65122615803814, + "grad_norm": 3.1083977222442627, + "learning_rate": 2.09423823254727e-06, + "loss": 0.0379, + "step": 29232 + }, + { + "epoch": 79.65395095367847, + "grad_norm": 2.344449043273926, + "learning_rate": 2.093697855647e-06, + "loss": 0.0771, + "step": 29233 + }, + { + "epoch": 79.65667574931881, + "grad_norm": 2.2525219917297363, + "learning_rate": 2.0931575403207594e-06, + "loss": 0.0841, + "step": 29234 + }, + { + "epoch": 79.65940054495913, + "grad_norm": 3.596081256866455, + "learning_rate": 2.0926172865727534e-06, + "loss": 0.0388, + "step": 29235 + }, + { + "epoch": 79.66212534059946, + "grad_norm": 2.5542967319488525, + "learning_rate": 2.09207709440719e-06, + "loss": 0.1207, + "step": 29236 + }, + { + "epoch": 79.66485013623978, + "grad_norm": 3.693990468978882, + "learning_rate": 2.091536963828272e-06, + "loss": 0.0352, + "step": 29237 + }, + { + "epoch": 79.66757493188011, + "grad_norm": 2.903559923171997, + "learning_rate": 2.090996894840214e-06, + "loss": 0.0234, + "step": 29238 + }, + { + "epoch": 79.67029972752043, + "grad_norm": 4.205155849456787, + "learning_rate": 2.0904568874472166e-06, + "loss": 0.0396, + "step": 29239 + }, + { + "epoch": 79.67302452316076, + "grad_norm": 3.108189344406128, + "learning_rate": 2.089916941653486e-06, + "loss": 0.0636, + "step": 29240 + }, + { + "epoch": 79.6757493188011, + "grad_norm": 3.3302626609802246, + "learning_rate": 2.0893770574632253e-06, + "loss": 0.0412, + "step": 29241 + }, + { + "epoch": 79.67847411444141, + "grad_norm": 4.701046466827393, + "learning_rate": 2.088837234880642e-06, + "loss": 0.052, + "step": 29242 + }, + { + "epoch": 79.68119891008175, + "grad_norm": 3.134046792984009, + "learning_rate": 2.0882974739099417e-06, + "loss": 0.0562, + "step": 29243 + }, + { + "epoch": 79.68392370572207, + "grad_norm": 3.2510342597961426, + "learning_rate": 2.087757774555326e-06, + "loss": 0.0754, + "step": 29244 + }, + { + "epoch": 79.6866485013624, + "grad_norm": 3.2784006595611572, + "learning_rate": 2.0872181368209954e-06, + "loss": 0.0261, + "step": 29245 + }, + { + "epoch": 79.68937329700273, + "grad_norm": 3.756096124649048, + "learning_rate": 2.0866785607111583e-06, + "loss": 0.0578, + "step": 29246 + }, + { + "epoch": 79.69209809264305, + "grad_norm": 2.896062135696411, + "learning_rate": 2.0861390462300137e-06, + "loss": 0.0862, + "step": 29247 + }, + { + "epoch": 79.69482288828338, + "grad_norm": 4.018967628479004, + "learning_rate": 2.085599593381764e-06, + "loss": 0.0763, + "step": 29248 + }, + { + "epoch": 79.6975476839237, + "grad_norm": 2.785836696624756, + "learning_rate": 2.085060202170607e-06, + "loss": 0.0802, + "step": 29249 + }, + { + "epoch": 79.70027247956403, + "grad_norm": 3.413893461227417, + "learning_rate": 2.0845208726007484e-06, + "loss": 0.0738, + "step": 29250 + }, + { + "epoch": 79.70299727520435, + "grad_norm": 2.3878374099731445, + "learning_rate": 2.083981604676387e-06, + "loss": 0.0389, + "step": 29251 + }, + { + "epoch": 79.70572207084469, + "grad_norm": 5.857513427734375, + "learning_rate": 2.083442398401723e-06, + "loss": 0.058, + "step": 29252 + }, + { + "epoch": 79.70844686648502, + "grad_norm": 2.4599688053131104, + "learning_rate": 2.082903253780951e-06, + "loss": 0.0212, + "step": 29253 + }, + { + "epoch": 79.71117166212534, + "grad_norm": 2.517099380493164, + "learning_rate": 2.082364170818276e-06, + "loss": 0.0488, + "step": 29254 + }, + { + "epoch": 79.71389645776567, + "grad_norm": 2.4274439811706543, + "learning_rate": 2.081825149517895e-06, + "loss": 0.0428, + "step": 29255 + }, + { + "epoch": 79.71662125340599, + "grad_norm": 2.7039241790771484, + "learning_rate": 2.0812861898840043e-06, + "loss": 0.0368, + "step": 29256 + }, + { + "epoch": 79.71934604904632, + "grad_norm": 3.2438275814056396, + "learning_rate": 2.0807472919207993e-06, + "loss": 0.1247, + "step": 29257 + }, + { + "epoch": 79.72207084468666, + "grad_norm": 3.6895644664764404, + "learning_rate": 2.080208455632482e-06, + "loss": 0.1358, + "step": 29258 + }, + { + "epoch": 79.72479564032697, + "grad_norm": 2.9256253242492676, + "learning_rate": 2.079669681023244e-06, + "loss": 0.0249, + "step": 29259 + }, + { + "epoch": 79.7275204359673, + "grad_norm": 2.9980931282043457, + "learning_rate": 2.079130968097287e-06, + "loss": 0.0327, + "step": 29260 + }, + { + "epoch": 79.73024523160763, + "grad_norm": 2.4223766326904297, + "learning_rate": 2.078592316858802e-06, + "loss": 0.034, + "step": 29261 + }, + { + "epoch": 79.73297002724796, + "grad_norm": 2.9649951457977295, + "learning_rate": 2.0780537273119826e-06, + "loss": 0.0315, + "step": 29262 + }, + { + "epoch": 79.73569482288828, + "grad_norm": 2.3366172313690186, + "learning_rate": 2.077515199461029e-06, + "loss": 0.0314, + "step": 29263 + }, + { + "epoch": 79.73841961852861, + "grad_norm": 5.506527900695801, + "learning_rate": 2.076976733310131e-06, + "loss": 0.1247, + "step": 29264 + }, + { + "epoch": 79.74114441416894, + "grad_norm": 3.715538263320923, + "learning_rate": 2.0764383288634813e-06, + "loss": 0.0854, + "step": 29265 + }, + { + "epoch": 79.74386920980926, + "grad_norm": 3.026465892791748, + "learning_rate": 2.0758999861252783e-06, + "loss": 0.0353, + "step": 29266 + }, + { + "epoch": 79.7465940054496, + "grad_norm": 2.029677391052246, + "learning_rate": 2.0753617050997097e-06, + "loss": 0.0363, + "step": 29267 + }, + { + "epoch": 79.74931880108991, + "grad_norm": 2.721902370452881, + "learning_rate": 2.07482348579097e-06, + "loss": 0.0254, + "step": 29268 + }, + { + "epoch": 79.75204359673025, + "grad_norm": 2.84169340133667, + "learning_rate": 2.074285328203247e-06, + "loss": 0.0557, + "step": 29269 + }, + { + "epoch": 79.75476839237058, + "grad_norm": 2.6797447204589844, + "learning_rate": 2.073747232340737e-06, + "loss": 0.0977, + "step": 29270 + }, + { + "epoch": 79.7574931880109, + "grad_norm": 3.6222918033599854, + "learning_rate": 2.0732091982076286e-06, + "loss": 0.0863, + "step": 29271 + }, + { + "epoch": 79.76021798365123, + "grad_norm": 2.777568817138672, + "learning_rate": 2.072671225808113e-06, + "loss": 0.0815, + "step": 29272 + }, + { + "epoch": 79.76294277929155, + "grad_norm": 2.5429670810699463, + "learning_rate": 2.072133315146375e-06, + "loss": 0.094, + "step": 29273 + }, + { + "epoch": 79.76566757493188, + "grad_norm": 3.273588180541992, + "learning_rate": 2.07159546622661e-06, + "loss": 0.1388, + "step": 29274 + }, + { + "epoch": 79.7683923705722, + "grad_norm": 2.2256669998168945, + "learning_rate": 2.0710576790530046e-06, + "loss": 0.1327, + "step": 29275 + }, + { + "epoch": 79.77111716621253, + "grad_norm": 2.7126142978668213, + "learning_rate": 2.070519953629745e-06, + "loss": 0.0632, + "step": 29276 + }, + { + "epoch": 79.77384196185287, + "grad_norm": 3.8536276817321777, + "learning_rate": 2.069982289961022e-06, + "loss": 0.0495, + "step": 29277 + }, + { + "epoch": 79.77656675749319, + "grad_norm": 2.4987895488739014, + "learning_rate": 2.06944468805102e-06, + "loss": 0.1387, + "step": 29278 + }, + { + "epoch": 79.77929155313352, + "grad_norm": 3.027650833129883, + "learning_rate": 2.0689071479039303e-06, + "loss": 0.1404, + "step": 29279 + }, + { + "epoch": 79.78201634877384, + "grad_norm": 2.678555488586426, + "learning_rate": 2.0683696695239364e-06, + "loss": 0.0637, + "step": 29280 + }, + { + "epoch": 79.78474114441417, + "grad_norm": 3.3591952323913574, + "learning_rate": 2.0678322529152238e-06, + "loss": 0.0582, + "step": 29281 + }, + { + "epoch": 79.7874659400545, + "grad_norm": 1.6419581174850464, + "learning_rate": 2.067294898081975e-06, + "loss": 0.0224, + "step": 29282 + }, + { + "epoch": 79.79019073569482, + "grad_norm": 2.1855525970458984, + "learning_rate": 2.066757605028382e-06, + "loss": 0.0407, + "step": 29283 + }, + { + "epoch": 79.79291553133515, + "grad_norm": 4.04316520690918, + "learning_rate": 2.066220373758625e-06, + "loss": 0.0691, + "step": 29284 + }, + { + "epoch": 79.79564032697547, + "grad_norm": 3.079613208770752, + "learning_rate": 2.065683204276889e-06, + "loss": 0.079, + "step": 29285 + }, + { + "epoch": 79.7983651226158, + "grad_norm": 2.6407501697540283, + "learning_rate": 2.0651460965873537e-06, + "loss": 0.0751, + "step": 29286 + }, + { + "epoch": 79.80108991825612, + "grad_norm": 6.0405964851379395, + "learning_rate": 2.0646090506942084e-06, + "loss": 0.1496, + "step": 29287 + }, + { + "epoch": 79.80381471389646, + "grad_norm": 2.920759439468384, + "learning_rate": 2.0640720666016314e-06, + "loss": 0.0316, + "step": 29288 + }, + { + "epoch": 79.80653950953679, + "grad_norm": 2.829606056213379, + "learning_rate": 2.063535144313804e-06, + "loss": 0.0553, + "step": 29289 + }, + { + "epoch": 79.80926430517711, + "grad_norm": 2.013718605041504, + "learning_rate": 2.0629982838349117e-06, + "loss": 0.0366, + "step": 29290 + }, + { + "epoch": 79.81198910081744, + "grad_norm": 2.5959970951080322, + "learning_rate": 2.0624614851691327e-06, + "loss": 0.0788, + "step": 29291 + }, + { + "epoch": 79.81471389645776, + "grad_norm": 2.969374895095825, + "learning_rate": 2.0619247483206495e-06, + "loss": 0.0889, + "step": 29292 + }, + { + "epoch": 79.8174386920981, + "grad_norm": 2.5356993675231934, + "learning_rate": 2.0613880732936376e-06, + "loss": 0.0347, + "step": 29293 + }, + { + "epoch": 79.82016348773843, + "grad_norm": 4.257425308227539, + "learning_rate": 2.0608514600922793e-06, + "loss": 0.0497, + "step": 29294 + }, + { + "epoch": 79.82288828337875, + "grad_norm": 2.892382860183716, + "learning_rate": 2.0603149087207576e-06, + "loss": 0.0562, + "step": 29295 + }, + { + "epoch": 79.82561307901908, + "grad_norm": 2.452202558517456, + "learning_rate": 2.0597784191832483e-06, + "loss": 0.1419, + "step": 29296 + }, + { + "epoch": 79.8283378746594, + "grad_norm": 2.9188475608825684, + "learning_rate": 2.059241991483928e-06, + "loss": 0.197, + "step": 29297 + }, + { + "epoch": 79.83106267029973, + "grad_norm": 2.675443649291992, + "learning_rate": 2.058705625626973e-06, + "loss": 0.0813, + "step": 29298 + }, + { + "epoch": 79.83378746594005, + "grad_norm": 2.5195724964141846, + "learning_rate": 2.0581693216165668e-06, + "loss": 0.0344, + "step": 29299 + }, + { + "epoch": 79.83651226158038, + "grad_norm": 2.4789111614227295, + "learning_rate": 2.057633079456881e-06, + "loss": 0.0412, + "step": 29300 + }, + { + "epoch": 79.83923705722071, + "grad_norm": 3.065528631210327, + "learning_rate": 2.0570968991520933e-06, + "loss": 0.0346, + "step": 29301 + }, + { + "epoch": 79.84196185286103, + "grad_norm": 3.8140010833740234, + "learning_rate": 2.056560780706377e-06, + "loss": 0.0971, + "step": 29302 + }, + { + "epoch": 79.84468664850137, + "grad_norm": 2.497077465057373, + "learning_rate": 2.0560247241239127e-06, + "loss": 0.0477, + "step": 29303 + }, + { + "epoch": 79.84741144414168, + "grad_norm": 3.2433173656463623, + "learning_rate": 2.0554887294088723e-06, + "loss": 0.078, + "step": 29304 + }, + { + "epoch": 79.85013623978202, + "grad_norm": 2.877556800842285, + "learning_rate": 2.0549527965654293e-06, + "loss": 0.1024, + "step": 29305 + }, + { + "epoch": 79.85286103542235, + "grad_norm": 2.370661973953247, + "learning_rate": 2.0544169255977563e-06, + "loss": 0.0335, + "step": 29306 + }, + { + "epoch": 79.85558583106267, + "grad_norm": 4.0430378913879395, + "learning_rate": 2.0538811165100303e-06, + "loss": 0.0735, + "step": 29307 + }, + { + "epoch": 79.858310626703, + "grad_norm": 3.651853322982788, + "learning_rate": 2.053345369306423e-06, + "loss": 0.1569, + "step": 29308 + }, + { + "epoch": 79.86103542234332, + "grad_norm": 1.9985288381576538, + "learning_rate": 2.052809683991103e-06, + "loss": 0.1131, + "step": 29309 + }, + { + "epoch": 79.86376021798365, + "grad_norm": 2.669971466064453, + "learning_rate": 2.052274060568249e-06, + "loss": 0.0338, + "step": 29310 + }, + { + "epoch": 79.86648501362397, + "grad_norm": 1.5900779962539673, + "learning_rate": 2.0517384990420253e-06, + "loss": 0.0246, + "step": 29311 + }, + { + "epoch": 79.8692098092643, + "grad_norm": 2.7960777282714844, + "learning_rate": 2.0512029994166093e-06, + "loss": 0.045, + "step": 29312 + }, + { + "epoch": 79.87193460490464, + "grad_norm": 3.1913352012634277, + "learning_rate": 2.050667561696168e-06, + "loss": 0.089, + "step": 29313 + }, + { + "epoch": 79.87465940054496, + "grad_norm": 3.306302070617676, + "learning_rate": 2.05013218588487e-06, + "loss": 0.0621, + "step": 29314 + }, + { + "epoch": 79.87738419618529, + "grad_norm": 2.8709847927093506, + "learning_rate": 2.0495968719868895e-06, + "loss": 0.0439, + "step": 29315 + }, + { + "epoch": 79.88010899182561, + "grad_norm": 2.6839709281921387, + "learning_rate": 2.049061620006392e-06, + "loss": 0.1548, + "step": 29316 + }, + { + "epoch": 79.88283378746594, + "grad_norm": 2.072481155395508, + "learning_rate": 2.048526429947547e-06, + "loss": 0.0543, + "step": 29317 + }, + { + "epoch": 79.88555858310627, + "grad_norm": 2.4812171459198, + "learning_rate": 2.0479913018145194e-06, + "loss": 0.027, + "step": 29318 + }, + { + "epoch": 79.88828337874659, + "grad_norm": 3.2204062938690186, + "learning_rate": 2.0474562356114824e-06, + "loss": 0.0632, + "step": 29319 + }, + { + "epoch": 79.89100817438693, + "grad_norm": 4.5732879638671875, + "learning_rate": 2.0469212313426e-06, + "loss": 0.0529, + "step": 29320 + }, + { + "epoch": 79.89373297002724, + "grad_norm": 1.547419548034668, + "learning_rate": 2.04638628901204e-06, + "loss": 0.0858, + "step": 29321 + }, + { + "epoch": 79.89645776566758, + "grad_norm": 2.4170684814453125, + "learning_rate": 2.0458514086239644e-06, + "loss": 0.0456, + "step": 29322 + }, + { + "epoch": 79.8991825613079, + "grad_norm": 3.026855707168579, + "learning_rate": 2.0453165901825445e-06, + "loss": 0.1024, + "step": 29323 + }, + { + "epoch": 79.90190735694823, + "grad_norm": 2.3698346614837646, + "learning_rate": 2.0447818336919433e-06, + "loss": 0.0729, + "step": 29324 + }, + { + "epoch": 79.90463215258856, + "grad_norm": 2.5736029148101807, + "learning_rate": 2.0442471391563244e-06, + "loss": 0.031, + "step": 29325 + }, + { + "epoch": 79.90735694822888, + "grad_norm": 2.27970290184021, + "learning_rate": 2.0437125065798515e-06, + "loss": 0.0251, + "step": 29326 + }, + { + "epoch": 79.91008174386921, + "grad_norm": 1.7866114377975464, + "learning_rate": 2.04317793596669e-06, + "loss": 0.0338, + "step": 29327 + }, + { + "epoch": 79.91280653950953, + "grad_norm": 2.945972442626953, + "learning_rate": 2.0426434273210016e-06, + "loss": 0.0314, + "step": 29328 + }, + { + "epoch": 79.91553133514986, + "grad_norm": 2.1935908794403076, + "learning_rate": 2.042108980646953e-06, + "loss": 0.2351, + "step": 29329 + }, + { + "epoch": 79.9182561307902, + "grad_norm": 2.1854188442230225, + "learning_rate": 2.0415745959486997e-06, + "loss": 0.0354, + "step": 29330 + }, + { + "epoch": 79.92098092643052, + "grad_norm": 2.4516072273254395, + "learning_rate": 2.0410402732304115e-06, + "loss": 0.0598, + "step": 29331 + }, + { + "epoch": 79.92370572207085, + "grad_norm": 2.6645407676696777, + "learning_rate": 2.040506012496244e-06, + "loss": 0.1124, + "step": 29332 + }, + { + "epoch": 79.92643051771117, + "grad_norm": 3.365372896194458, + "learning_rate": 2.03997181375036e-06, + "loss": 0.0555, + "step": 29333 + }, + { + "epoch": 79.9291553133515, + "grad_norm": 2.762101173400879, + "learning_rate": 2.039437676996917e-06, + "loss": 0.0393, + "step": 29334 + }, + { + "epoch": 79.93188010899182, + "grad_norm": 2.4632163047790527, + "learning_rate": 2.0389036022400786e-06, + "loss": 0.1255, + "step": 29335 + }, + { + "epoch": 79.93460490463215, + "grad_norm": 3.0442001819610596, + "learning_rate": 2.038369589484004e-06, + "loss": 0.0764, + "step": 29336 + }, + { + "epoch": 79.93732970027249, + "grad_norm": 1.5549694299697876, + "learning_rate": 2.03783563873285e-06, + "loss": 0.0329, + "step": 29337 + }, + { + "epoch": 79.9400544959128, + "grad_norm": 2.3120741844177246, + "learning_rate": 2.0373017499907743e-06, + "loss": 0.1115, + "step": 29338 + }, + { + "epoch": 79.94277929155314, + "grad_norm": 2.2634379863739014, + "learning_rate": 2.0367679232619385e-06, + "loss": 0.0767, + "step": 29339 + }, + { + "epoch": 79.94550408719346, + "grad_norm": 2.465524435043335, + "learning_rate": 2.0362341585504974e-06, + "loss": 0.1215, + "step": 29340 + }, + { + "epoch": 79.94822888283379, + "grad_norm": 2.9260036945343018, + "learning_rate": 2.0357004558606087e-06, + "loss": 0.028, + "step": 29341 + }, + { + "epoch": 79.95095367847412, + "grad_norm": 2.66758394241333, + "learning_rate": 2.0351668151964253e-06, + "loss": 0.0246, + "step": 29342 + }, + { + "epoch": 79.95367847411444, + "grad_norm": 2.967787027359009, + "learning_rate": 2.034633236562109e-06, + "loss": 0.0928, + "step": 29343 + }, + { + "epoch": 79.95640326975477, + "grad_norm": 1.8456788063049316, + "learning_rate": 2.0340997199618128e-06, + "loss": 0.0205, + "step": 29344 + }, + { + "epoch": 79.95912806539509, + "grad_norm": 2.21388840675354, + "learning_rate": 2.03356626539969e-06, + "loss": 0.0667, + "step": 29345 + }, + { + "epoch": 79.96185286103542, + "grad_norm": 2.046415090560913, + "learning_rate": 2.0330328728798988e-06, + "loss": 0.0266, + "step": 29346 + }, + { + "epoch": 79.96457765667574, + "grad_norm": 4.012266635894775, + "learning_rate": 2.0324995424065884e-06, + "loss": 0.0406, + "step": 29347 + }, + { + "epoch": 79.96730245231608, + "grad_norm": 3.13988995552063, + "learning_rate": 2.0319662739839174e-06, + "loss": 0.0963, + "step": 29348 + }, + { + "epoch": 79.97002724795641, + "grad_norm": 3.302042245864868, + "learning_rate": 2.0314330676160364e-06, + "loss": 0.0347, + "step": 29349 + }, + { + "epoch": 79.97275204359673, + "grad_norm": 2.4337568283081055, + "learning_rate": 2.030899923307097e-06, + "loss": 0.0348, + "step": 29350 + }, + { + "epoch": 79.97547683923706, + "grad_norm": 3.118250608444214, + "learning_rate": 2.0303668410612544e-06, + "loss": 0.1335, + "step": 29351 + }, + { + "epoch": 79.97820163487738, + "grad_norm": 2.537001132965088, + "learning_rate": 2.0298338208826574e-06, + "loss": 0.1521, + "step": 29352 + }, + { + "epoch": 79.98092643051771, + "grad_norm": 3.249803066253662, + "learning_rate": 2.0293008627754597e-06, + "loss": 0.1485, + "step": 29353 + }, + { + "epoch": 79.98365122615803, + "grad_norm": 2.459155321121216, + "learning_rate": 2.0287679667438063e-06, + "loss": 0.0662, + "step": 29354 + }, + { + "epoch": 79.98637602179836, + "grad_norm": 3.170015573501587, + "learning_rate": 2.028235132791855e-06, + "loss": 0.056, + "step": 29355 + }, + { + "epoch": 79.9891008174387, + "grad_norm": 3.1561808586120605, + "learning_rate": 2.027702360923751e-06, + "loss": 0.0354, + "step": 29356 + }, + { + "epoch": 79.99182561307902, + "grad_norm": 3.056755542755127, + "learning_rate": 2.0271696511436457e-06, + "loss": 0.065, + "step": 29357 + }, + { + "epoch": 79.99455040871935, + "grad_norm": 2.7098047733306885, + "learning_rate": 2.0266370034556824e-06, + "loss": 0.1533, + "step": 29358 + }, + { + "epoch": 79.99727520435967, + "grad_norm": 3.2575576305389404, + "learning_rate": 2.0261044178640166e-06, + "loss": 0.1153, + "step": 29359 + }, + { + "epoch": 80.0, + "grad_norm": 3.2451682090759277, + "learning_rate": 2.025571894372794e-06, + "loss": 0.2123, + "step": 29360 + }, + { + "epoch": 80.00272479564033, + "grad_norm": 5.603143215179443, + "learning_rate": 2.02503943298616e-06, + "loss": 0.1196, + "step": 29361 + }, + { + "epoch": 80.00544959128065, + "grad_norm": 2.9784491062164307, + "learning_rate": 2.0245070337082596e-06, + "loss": 0.0473, + "step": 29362 + }, + { + "epoch": 80.00817438692098, + "grad_norm": 12.486374855041504, + "learning_rate": 2.0239746965432417e-06, + "loss": 0.0385, + "step": 29363 + }, + { + "epoch": 80.0108991825613, + "grad_norm": 2.0977165699005127, + "learning_rate": 2.023442421495255e-06, + "loss": 0.099, + "step": 29364 + }, + { + "epoch": 80.01362397820164, + "grad_norm": 1.9674521684646606, + "learning_rate": 2.0229102085684416e-06, + "loss": 0.1507, + "step": 29365 + }, + { + "epoch": 80.01634877384195, + "grad_norm": 2.7131857872009277, + "learning_rate": 2.022378057766947e-06, + "loss": 0.0457, + "step": 29366 + }, + { + "epoch": 80.01907356948229, + "grad_norm": 3.055431604385376, + "learning_rate": 2.021845969094913e-06, + "loss": 0.0425, + "step": 29367 + }, + { + "epoch": 80.02179836512262, + "grad_norm": 3.1296238899230957, + "learning_rate": 2.0213139425564888e-06, + "loss": 0.0586, + "step": 29368 + }, + { + "epoch": 80.02452316076294, + "grad_norm": 2.3376431465148926, + "learning_rate": 2.0207819781558137e-06, + "loss": 0.1063, + "step": 29369 + }, + { + "epoch": 80.02724795640327, + "grad_norm": 1.8747031688690186, + "learning_rate": 2.0202500758970323e-06, + "loss": 0.0199, + "step": 29370 + }, + { + "epoch": 80.02997275204359, + "grad_norm": 2.9020087718963623, + "learning_rate": 2.0197182357842836e-06, + "loss": 0.0577, + "step": 29371 + }, + { + "epoch": 80.03269754768392, + "grad_norm": 2.2700018882751465, + "learning_rate": 2.0191864578217155e-06, + "loss": 0.0366, + "step": 29372 + }, + { + "epoch": 80.03542234332426, + "grad_norm": 2.2061479091644287, + "learning_rate": 2.0186547420134663e-06, + "loss": 0.0298, + "step": 29373 + }, + { + "epoch": 80.03814713896458, + "grad_norm": 2.363985061645508, + "learning_rate": 2.018123088363675e-06, + "loss": 0.0339, + "step": 29374 + }, + { + "epoch": 80.04087193460491, + "grad_norm": 2.4737119674682617, + "learning_rate": 2.017591496876485e-06, + "loss": 0.0684, + "step": 29375 + }, + { + "epoch": 80.04359673024523, + "grad_norm": 2.2740232944488525, + "learning_rate": 2.0170599675560376e-06, + "loss": 0.0408, + "step": 29376 + }, + { + "epoch": 80.04632152588556, + "grad_norm": 2.1201000213623047, + "learning_rate": 2.0165285004064692e-06, + "loss": 0.033, + "step": 29377 + }, + { + "epoch": 80.04904632152588, + "grad_norm": 1.6579976081848145, + "learning_rate": 2.0159970954319173e-06, + "loss": 0.0203, + "step": 29378 + }, + { + "epoch": 80.05177111716621, + "grad_norm": 1.8335825204849243, + "learning_rate": 2.0154657526365227e-06, + "loss": 0.0234, + "step": 29379 + }, + { + "epoch": 80.05449591280654, + "grad_norm": 3.6377949714660645, + "learning_rate": 2.014934472024427e-06, + "loss": 0.038, + "step": 29380 + }, + { + "epoch": 80.05722070844686, + "grad_norm": 4.581460475921631, + "learning_rate": 2.014403253599765e-06, + "loss": 0.197, + "step": 29381 + }, + { + "epoch": 80.0599455040872, + "grad_norm": 1.6591564416885376, + "learning_rate": 2.0138720973666727e-06, + "loss": 0.0246, + "step": 29382 + }, + { + "epoch": 80.06267029972751, + "grad_norm": 3.421288251876831, + "learning_rate": 2.0133410033292854e-06, + "loss": 0.0461, + "step": 29383 + }, + { + "epoch": 80.06539509536785, + "grad_norm": 1.9600965976715088, + "learning_rate": 2.0128099714917436e-06, + "loss": 0.1076, + "step": 29384 + }, + { + "epoch": 80.06811989100818, + "grad_norm": 2.0340168476104736, + "learning_rate": 2.0122790018581805e-06, + "loss": 0.1289, + "step": 29385 + }, + { + "epoch": 80.0708446866485, + "grad_norm": 2.848813056945801, + "learning_rate": 2.0117480944327317e-06, + "loss": 0.059, + "step": 29386 + }, + { + "epoch": 80.07356948228883, + "grad_norm": 1.989477276802063, + "learning_rate": 2.011217249219529e-06, + "loss": 0.0154, + "step": 29387 + }, + { + "epoch": 80.07629427792915, + "grad_norm": 2.7358896732330322, + "learning_rate": 2.010686466222712e-06, + "loss": 0.0796, + "step": 29388 + }, + { + "epoch": 80.07901907356948, + "grad_norm": 2.944010019302368, + "learning_rate": 2.0101557454464115e-06, + "loss": 0.108, + "step": 29389 + }, + { + "epoch": 80.0817438692098, + "grad_norm": 2.212073802947998, + "learning_rate": 2.009625086894761e-06, + "loss": 0.0466, + "step": 29390 + }, + { + "epoch": 80.08446866485014, + "grad_norm": 2.7997961044311523, + "learning_rate": 2.0090944905718913e-06, + "loss": 0.1205, + "step": 29391 + }, + { + "epoch": 80.08719346049047, + "grad_norm": 3.7996926307678223, + "learning_rate": 2.0085639564819383e-06, + "loss": 0.1322, + "step": 29392 + }, + { + "epoch": 80.08991825613079, + "grad_norm": 3.034207582473755, + "learning_rate": 2.0080334846290317e-06, + "loss": 0.0531, + "step": 29393 + }, + { + "epoch": 80.09264305177112, + "grad_norm": 2.514934539794922, + "learning_rate": 2.007503075017303e-06, + "loss": 0.0628, + "step": 29394 + }, + { + "epoch": 80.09536784741144, + "grad_norm": 2.12790584564209, + "learning_rate": 2.006972727650881e-06, + "loss": 0.0301, + "step": 29395 + }, + { + "epoch": 80.09809264305177, + "grad_norm": 5.728973865509033, + "learning_rate": 2.0064424425339014e-06, + "loss": 0.0709, + "step": 29396 + }, + { + "epoch": 80.1008174386921, + "grad_norm": 2.994800329208374, + "learning_rate": 2.0059122196704872e-06, + "loss": 0.0362, + "step": 29397 + }, + { + "epoch": 80.10354223433242, + "grad_norm": 2.195781946182251, + "learning_rate": 2.0053820590647744e-06, + "loss": 0.064, + "step": 29398 + }, + { + "epoch": 80.10626702997276, + "grad_norm": 2.763132333755493, + "learning_rate": 2.004851960720886e-06, + "loss": 0.0763, + "step": 29399 + }, + { + "epoch": 80.10899182561307, + "grad_norm": 2.22554612159729, + "learning_rate": 2.0043219246429555e-06, + "loss": 0.0471, + "step": 29400 + }, + { + "epoch": 80.11171662125341, + "grad_norm": 2.436314821243286, + "learning_rate": 2.003791950835109e-06, + "loss": 0.0404, + "step": 29401 + }, + { + "epoch": 80.11444141689373, + "grad_norm": 2.6080710887908936, + "learning_rate": 2.0032620393014734e-06, + "loss": 0.0383, + "step": 29402 + }, + { + "epoch": 80.11716621253406, + "grad_norm": 3.8651154041290283, + "learning_rate": 2.0027321900461726e-06, + "loss": 0.0282, + "step": 29403 + }, + { + "epoch": 80.11989100817439, + "grad_norm": 3.0691099166870117, + "learning_rate": 2.002202403073339e-06, + "loss": 0.0568, + "step": 29404 + }, + { + "epoch": 80.12261580381471, + "grad_norm": 2.3447935581207275, + "learning_rate": 2.0016726783870966e-06, + "loss": 0.0899, + "step": 29405 + }, + { + "epoch": 80.12534059945504, + "grad_norm": 3.291969060897827, + "learning_rate": 2.001143015991569e-06, + "loss": 0.1161, + "step": 29406 + }, + { + "epoch": 80.12806539509536, + "grad_norm": 3.1843996047973633, + "learning_rate": 2.0006134158908796e-06, + "loss": 0.1323, + "step": 29407 + }, + { + "epoch": 80.1307901907357, + "grad_norm": 3.0894100666046143, + "learning_rate": 2.0000838780891573e-06, + "loss": 0.0523, + "step": 29408 + }, + { + "epoch": 80.13351498637603, + "grad_norm": 2.975862503051758, + "learning_rate": 1.9995544025905254e-06, + "loss": 0.0464, + "step": 29409 + }, + { + "epoch": 80.13623978201635, + "grad_norm": 2.842663288116455, + "learning_rate": 1.9990249893991064e-06, + "loss": 0.0436, + "step": 29410 + }, + { + "epoch": 80.13896457765668, + "grad_norm": 2.7382287979125977, + "learning_rate": 1.9984956385190204e-06, + "loss": 0.1006, + "step": 29411 + }, + { + "epoch": 80.141689373297, + "grad_norm": 2.1449384689331055, + "learning_rate": 1.9979663499543956e-06, + "loss": 0.0441, + "step": 29412 + }, + { + "epoch": 80.14441416893733, + "grad_norm": 1.671662449836731, + "learning_rate": 1.9974371237093505e-06, + "loss": 0.021, + "step": 29413 + }, + { + "epoch": 80.14713896457765, + "grad_norm": 3.9940028190612793, + "learning_rate": 1.996907959788006e-06, + "loss": 0.13, + "step": 29414 + }, + { + "epoch": 80.14986376021798, + "grad_norm": 2.6534218788146973, + "learning_rate": 1.9963788581944832e-06, + "loss": 0.0688, + "step": 29415 + }, + { + "epoch": 80.15258855585832, + "grad_norm": 2.4782872200012207, + "learning_rate": 1.995849818932908e-06, + "loss": 0.0342, + "step": 29416 + }, + { + "epoch": 80.15531335149863, + "grad_norm": 2.70391845703125, + "learning_rate": 1.9953208420073965e-06, + "loss": 0.0345, + "step": 29417 + }, + { + "epoch": 80.15803814713897, + "grad_norm": 1.8681391477584839, + "learning_rate": 1.9947919274220693e-06, + "loss": 0.0328, + "step": 29418 + }, + { + "epoch": 80.16076294277929, + "grad_norm": 2.7991154193878174, + "learning_rate": 1.994263075181042e-06, + "loss": 0.0431, + "step": 29419 + }, + { + "epoch": 80.16348773841962, + "grad_norm": 3.968597173690796, + "learning_rate": 1.993734285288439e-06, + "loss": 0.1206, + "step": 29420 + }, + { + "epoch": 80.16621253405995, + "grad_norm": 3.151745080947876, + "learning_rate": 1.9932055577483743e-06, + "loss": 0.0595, + "step": 29421 + }, + { + "epoch": 80.16893732970027, + "grad_norm": 3.6714539527893066, + "learning_rate": 1.9926768925649685e-06, + "loss": 0.1386, + "step": 29422 + }, + { + "epoch": 80.1716621253406, + "grad_norm": 2.5412685871124268, + "learning_rate": 1.992148289742334e-06, + "loss": 0.1026, + "step": 29423 + }, + { + "epoch": 80.17438692098092, + "grad_norm": 2.7091026306152344, + "learning_rate": 1.9916197492845947e-06, + "loss": 0.0359, + "step": 29424 + }, + { + "epoch": 80.17711171662125, + "grad_norm": 2.3547556400299072, + "learning_rate": 1.991091271195862e-06, + "loss": 0.0682, + "step": 29425 + }, + { + "epoch": 80.17983651226157, + "grad_norm": 3.9136271476745605, + "learning_rate": 1.9905628554802525e-06, + "loss": 0.0985, + "step": 29426 + }, + { + "epoch": 80.1825613079019, + "grad_norm": 2.6397290229797363, + "learning_rate": 1.9900345021418797e-06, + "loss": 0.0194, + "step": 29427 + }, + { + "epoch": 80.18528610354224, + "grad_norm": 2.6623542308807373, + "learning_rate": 1.9895062111848628e-06, + "loss": 0.0303, + "step": 29428 + }, + { + "epoch": 80.18801089918256, + "grad_norm": 3.0329337120056152, + "learning_rate": 1.9889779826133136e-06, + "loss": 0.0453, + "step": 29429 + }, + { + "epoch": 80.19073569482289, + "grad_norm": 3.3232171535491943, + "learning_rate": 1.9884498164313458e-06, + "loss": 0.125, + "step": 29430 + }, + { + "epoch": 80.19346049046321, + "grad_norm": 2.496865749359131, + "learning_rate": 1.9879217126430704e-06, + "loss": 0.0364, + "step": 29431 + }, + { + "epoch": 80.19618528610354, + "grad_norm": 2.626728057861328, + "learning_rate": 1.9873936712526033e-06, + "loss": 0.0434, + "step": 29432 + }, + { + "epoch": 80.19891008174388, + "grad_norm": 2.1771438121795654, + "learning_rate": 1.9868656922640596e-06, + "loss": 0.0249, + "step": 29433 + }, + { + "epoch": 80.2016348773842, + "grad_norm": 2.1724393367767334, + "learning_rate": 1.986337775681546e-06, + "loss": 0.0338, + "step": 29434 + }, + { + "epoch": 80.20435967302453, + "grad_norm": 2.520867347717285, + "learning_rate": 1.9858099215091773e-06, + "loss": 0.1075, + "step": 29435 + }, + { + "epoch": 80.20708446866485, + "grad_norm": 2.6357574462890625, + "learning_rate": 1.9852821297510605e-06, + "loss": 0.0428, + "step": 29436 + }, + { + "epoch": 80.20980926430518, + "grad_norm": 2.61205792427063, + "learning_rate": 1.9847544004113105e-06, + "loss": 0.1401, + "step": 29437 + }, + { + "epoch": 80.2125340599455, + "grad_norm": 2.8970611095428467, + "learning_rate": 1.9842267334940357e-06, + "loss": 0.0986, + "step": 29438 + }, + { + "epoch": 80.21525885558583, + "grad_norm": 2.5879549980163574, + "learning_rate": 1.9836991290033427e-06, + "loss": 0.1085, + "step": 29439 + }, + { + "epoch": 80.21798365122616, + "grad_norm": 3.0536818504333496, + "learning_rate": 1.9831715869433456e-06, + "loss": 0.1055, + "step": 29440 + }, + { + "epoch": 80.22070844686648, + "grad_norm": 3.0303287506103516, + "learning_rate": 1.982644107318149e-06, + "loss": 0.0795, + "step": 29441 + }, + { + "epoch": 80.22343324250681, + "grad_norm": 3.1025660037994385, + "learning_rate": 1.9821166901318634e-06, + "loss": 0.1188, + "step": 29442 + }, + { + "epoch": 80.22615803814713, + "grad_norm": 2.673023223876953, + "learning_rate": 1.981589335388592e-06, + "loss": 0.0362, + "step": 29443 + }, + { + "epoch": 80.22888283378747, + "grad_norm": 3.098051071166992, + "learning_rate": 1.9810620430924465e-06, + "loss": 0.0554, + "step": 29444 + }, + { + "epoch": 80.2316076294278, + "grad_norm": 3.2103559970855713, + "learning_rate": 1.980534813247532e-06, + "loss": 0.0276, + "step": 29445 + }, + { + "epoch": 80.23433242506812, + "grad_norm": 2.42803955078125, + "learning_rate": 1.9800076458579552e-06, + "loss": 0.0573, + "step": 29446 + }, + { + "epoch": 80.23705722070845, + "grad_norm": 8.295357704162598, + "learning_rate": 1.9794805409278174e-06, + "loss": 0.0739, + "step": 29447 + }, + { + "epoch": 80.23978201634877, + "grad_norm": 2.6432881355285645, + "learning_rate": 1.978953498461227e-06, + "loss": 0.0654, + "step": 29448 + }, + { + "epoch": 80.2425068119891, + "grad_norm": 2.679471492767334, + "learning_rate": 1.978426518462291e-06, + "loss": 0.042, + "step": 29449 + }, + { + "epoch": 80.24523160762942, + "grad_norm": 2.8455731868743896, + "learning_rate": 1.9778996009351116e-06, + "loss": 0.0489, + "step": 29450 + }, + { + "epoch": 80.24795640326975, + "grad_norm": 1.6808359622955322, + "learning_rate": 1.977372745883792e-06, + "loss": 0.0202, + "step": 29451 + }, + { + "epoch": 80.25068119891009, + "grad_norm": 2.7449731826782227, + "learning_rate": 1.976845953312432e-06, + "loss": 0.0441, + "step": 29452 + }, + { + "epoch": 80.2534059945504, + "grad_norm": 3.0539281368255615, + "learning_rate": 1.9763192232251405e-06, + "loss": 0.0288, + "step": 29453 + }, + { + "epoch": 80.25613079019074, + "grad_norm": 2.833569288253784, + "learning_rate": 1.975792555626017e-06, + "loss": 0.082, + "step": 29454 + }, + { + "epoch": 80.25885558583106, + "grad_norm": 3.311829090118408, + "learning_rate": 1.975265950519163e-06, + "loss": 0.0599, + "step": 29455 + }, + { + "epoch": 80.26158038147139, + "grad_norm": 4.416215896606445, + "learning_rate": 1.9747394079086756e-06, + "loss": 0.1164, + "step": 29456 + }, + { + "epoch": 80.26430517711172, + "grad_norm": 2.7725939750671387, + "learning_rate": 1.974212927798663e-06, + "loss": 0.1197, + "step": 29457 + }, + { + "epoch": 80.26702997275204, + "grad_norm": 3.2645301818847656, + "learning_rate": 1.973686510193221e-06, + "loss": 0.1733, + "step": 29458 + }, + { + "epoch": 80.26975476839237, + "grad_norm": 1.6957669258117676, + "learning_rate": 1.973160155096452e-06, + "loss": 0.0206, + "step": 29459 + }, + { + "epoch": 80.2724795640327, + "grad_norm": 2.67549991607666, + "learning_rate": 1.9726338625124488e-06, + "loss": 0.0783, + "step": 29460 + }, + { + "epoch": 80.27520435967303, + "grad_norm": 2.7992019653320312, + "learning_rate": 1.972107632445318e-06, + "loss": 0.2081, + "step": 29461 + }, + { + "epoch": 80.27792915531334, + "grad_norm": 2.060793161392212, + "learning_rate": 1.971581464899155e-06, + "loss": 0.0415, + "step": 29462 + }, + { + "epoch": 80.28065395095368, + "grad_norm": 2.4207475185394287, + "learning_rate": 1.9710553598780534e-06, + "loss": 0.0286, + "step": 29463 + }, + { + "epoch": 80.28337874659401, + "grad_norm": 2.4379923343658447, + "learning_rate": 1.9705293173861182e-06, + "loss": 0.087, + "step": 29464 + }, + { + "epoch": 80.28610354223433, + "grad_norm": 2.448291301727295, + "learning_rate": 1.9700033374274386e-06, + "loss": 0.0326, + "step": 29465 + }, + { + "epoch": 80.28882833787466, + "grad_norm": 2.084537982940674, + "learning_rate": 1.9694774200061175e-06, + "loss": 0.0452, + "step": 29466 + }, + { + "epoch": 80.29155313351498, + "grad_norm": 3.169152021408081, + "learning_rate": 1.9689515651262482e-06, + "loss": 0.0483, + "step": 29467 + }, + { + "epoch": 80.29427792915531, + "grad_norm": 2.543179988861084, + "learning_rate": 1.9684257727919233e-06, + "loss": 0.0755, + "step": 29468 + }, + { + "epoch": 80.29700272479565, + "grad_norm": 2.1362757682800293, + "learning_rate": 1.9679000430072414e-06, + "loss": 0.0315, + "step": 29469 + }, + { + "epoch": 80.29972752043597, + "grad_norm": 1.747061014175415, + "learning_rate": 1.9673743757762963e-06, + "loss": 0.0251, + "step": 29470 + }, + { + "epoch": 80.3024523160763, + "grad_norm": 1.8823891878128052, + "learning_rate": 1.9668487711031804e-06, + "loss": 0.0182, + "step": 29471 + }, + { + "epoch": 80.30517711171662, + "grad_norm": 3.2333693504333496, + "learning_rate": 1.9663232289919854e-06, + "loss": 0.1943, + "step": 29472 + }, + { + "epoch": 80.30790190735695, + "grad_norm": 2.659660816192627, + "learning_rate": 1.9657977494468095e-06, + "loss": 0.0508, + "step": 29473 + }, + { + "epoch": 80.31062670299727, + "grad_norm": 2.9786505699157715, + "learning_rate": 1.9652723324717415e-06, + "loss": 0.0924, + "step": 29474 + }, + { + "epoch": 80.3133514986376, + "grad_norm": 2.215651273727417, + "learning_rate": 1.964746978070875e-06, + "loss": 0.0407, + "step": 29475 + }, + { + "epoch": 80.31607629427793, + "grad_norm": 2.2558863162994385, + "learning_rate": 1.964221686248298e-06, + "loss": 0.0474, + "step": 29476 + }, + { + "epoch": 80.31880108991825, + "grad_norm": 5.30399751663208, + "learning_rate": 1.9636964570081054e-06, + "loss": 0.0456, + "step": 29477 + }, + { + "epoch": 80.32152588555859, + "grad_norm": 2.3896677494049072, + "learning_rate": 1.9631712903543854e-06, + "loss": 0.0298, + "step": 29478 + }, + { + "epoch": 80.3242506811989, + "grad_norm": 2.5672144889831543, + "learning_rate": 1.9626461862912304e-06, + "loss": 0.0937, + "step": 29479 + }, + { + "epoch": 80.32697547683924, + "grad_norm": 2.6122467517852783, + "learning_rate": 1.962121144822725e-06, + "loss": 0.055, + "step": 29480 + }, + { + "epoch": 80.32970027247957, + "grad_norm": 1.9325565099716187, + "learning_rate": 1.9615961659529637e-06, + "loss": 0.067, + "step": 29481 + }, + { + "epoch": 80.33242506811989, + "grad_norm": 2.978832483291626, + "learning_rate": 1.961071249686033e-06, + "loss": 0.0476, + "step": 29482 + }, + { + "epoch": 80.33514986376022, + "grad_norm": 1.8789916038513184, + "learning_rate": 1.9605463960260186e-06, + "loss": 0.1755, + "step": 29483 + }, + { + "epoch": 80.33787465940054, + "grad_norm": 2.263629198074341, + "learning_rate": 1.960021604977009e-06, + "loss": 0.0376, + "step": 29484 + }, + { + "epoch": 80.34059945504087, + "grad_norm": 3.0086748600006104, + "learning_rate": 1.9594968765430956e-06, + "loss": 0.1481, + "step": 29485 + }, + { + "epoch": 80.34332425068119, + "grad_norm": 2.566378355026245, + "learning_rate": 1.9589722107283628e-06, + "loss": 0.0287, + "step": 29486 + }, + { + "epoch": 80.34604904632153, + "grad_norm": 2.287869930267334, + "learning_rate": 1.958447607536894e-06, + "loss": 0.0499, + "step": 29487 + }, + { + "epoch": 80.34877384196186, + "grad_norm": 2.3460464477539062, + "learning_rate": 1.9579230669727745e-06, + "loss": 0.0203, + "step": 29488 + }, + { + "epoch": 80.35149863760218, + "grad_norm": 4.031327724456787, + "learning_rate": 1.957398589040094e-06, + "loss": 0.0498, + "step": 29489 + }, + { + "epoch": 80.35422343324251, + "grad_norm": 3.1813266277313232, + "learning_rate": 1.9568741737429344e-06, + "loss": 0.0727, + "step": 29490 + }, + { + "epoch": 80.35694822888283, + "grad_norm": 9.18799114227295, + "learning_rate": 1.9563498210853792e-06, + "loss": 0.1077, + "step": 29491 + }, + { + "epoch": 80.35967302452316, + "grad_norm": 1.7899898290634155, + "learning_rate": 1.9558255310715103e-06, + "loss": 0.02, + "step": 29492 + }, + { + "epoch": 80.3623978201635, + "grad_norm": 2.570700168609619, + "learning_rate": 1.955301303705417e-06, + "loss": 0.0657, + "step": 29493 + }, + { + "epoch": 80.36512261580381, + "grad_norm": 2.8046064376831055, + "learning_rate": 1.9547771389911774e-06, + "loss": 0.0527, + "step": 29494 + }, + { + "epoch": 80.36784741144415, + "grad_norm": 2.3152570724487305, + "learning_rate": 1.9542530369328738e-06, + "loss": 0.0241, + "step": 29495 + }, + { + "epoch": 80.37057220708446, + "grad_norm": 2.5495524406433105, + "learning_rate": 1.9537289975345876e-06, + "loss": 0.0737, + "step": 29496 + }, + { + "epoch": 80.3732970027248, + "grad_norm": 2.499063014984131, + "learning_rate": 1.9532050208004014e-06, + "loss": 0.042, + "step": 29497 + }, + { + "epoch": 80.37602179836512, + "grad_norm": 2.108701467514038, + "learning_rate": 1.9526811067343977e-06, + "loss": 0.0295, + "step": 29498 + }, + { + "epoch": 80.37874659400545, + "grad_norm": 2.7002453804016113, + "learning_rate": 1.952157255340653e-06, + "loss": 0.0809, + "step": 29499 + }, + { + "epoch": 80.38147138964578, + "grad_norm": 4.181662082672119, + "learning_rate": 1.9516334666232474e-06, + "loss": 0.2036, + "step": 29500 + }, + { + "epoch": 80.3841961852861, + "grad_norm": 2.412010908126831, + "learning_rate": 1.95110974058626e-06, + "loss": 0.1952, + "step": 29501 + }, + { + "epoch": 80.38692098092643, + "grad_norm": 1.9975512027740479, + "learning_rate": 1.950586077233775e-06, + "loss": 0.0217, + "step": 29502 + }, + { + "epoch": 80.38964577656675, + "grad_norm": 3.2104544639587402, + "learning_rate": 1.950062476569865e-06, + "loss": 0.0391, + "step": 29503 + }, + { + "epoch": 80.39237057220708, + "grad_norm": 2.4745044708251953, + "learning_rate": 1.9495389385986076e-06, + "loss": 0.0281, + "step": 29504 + }, + { + "epoch": 80.39509536784742, + "grad_norm": 3.938070297241211, + "learning_rate": 1.9490154633240843e-06, + "loss": 0.0378, + "step": 29505 + }, + { + "epoch": 80.39782016348774, + "grad_norm": 3.3507866859436035, + "learning_rate": 1.948492050750369e-06, + "loss": 0.0598, + "step": 29506 + }, + { + "epoch": 80.40054495912807, + "grad_norm": 2.580538034439087, + "learning_rate": 1.9479687008815396e-06, + "loss": 0.058, + "step": 29507 + }, + { + "epoch": 80.40326975476839, + "grad_norm": 2.0212392807006836, + "learning_rate": 1.947445413721667e-06, + "loss": 0.0596, + "step": 29508 + }, + { + "epoch": 80.40599455040872, + "grad_norm": 2.680859327316284, + "learning_rate": 1.9469221892748337e-06, + "loss": 0.1228, + "step": 29509 + }, + { + "epoch": 80.40871934604904, + "grad_norm": 2.15167498588562, + "learning_rate": 1.9463990275451107e-06, + "loss": 0.0312, + "step": 29510 + }, + { + "epoch": 80.41144414168937, + "grad_norm": 3.37306809425354, + "learning_rate": 1.9458759285365723e-06, + "loss": 0.0562, + "step": 29511 + }, + { + "epoch": 80.4141689373297, + "grad_norm": 4.165459156036377, + "learning_rate": 1.9453528922532915e-06, + "loss": 0.1646, + "step": 29512 + }, + { + "epoch": 80.41689373297002, + "grad_norm": 10.101032257080078, + "learning_rate": 1.944829918699346e-06, + "loss": 0.0368, + "step": 29513 + }, + { + "epoch": 80.41961852861036, + "grad_norm": 3.278978109359741, + "learning_rate": 1.944307007878805e-06, + "loss": 0.0734, + "step": 29514 + }, + { + "epoch": 80.42234332425068, + "grad_norm": 1.8675167560577393, + "learning_rate": 1.943784159795742e-06, + "loss": 0.0249, + "step": 29515 + }, + { + "epoch": 80.42506811989101, + "grad_norm": 2.862319231033325, + "learning_rate": 1.943261374454226e-06, + "loss": 0.0537, + "step": 29516 + }, + { + "epoch": 80.42779291553134, + "grad_norm": 3.1203036308288574, + "learning_rate": 1.9427386518583313e-06, + "loss": 0.0373, + "step": 29517 + }, + { + "epoch": 80.43051771117166, + "grad_norm": 2.046741247177124, + "learning_rate": 1.942215992012131e-06, + "loss": 0.0633, + "step": 29518 + }, + { + "epoch": 80.433242506812, + "grad_norm": 2.4257113933563232, + "learning_rate": 1.9416933949196926e-06, + "loss": 0.0294, + "step": 29519 + }, + { + "epoch": 80.43596730245231, + "grad_norm": 2.9155521392822266, + "learning_rate": 1.9411708605850875e-06, + "loss": 0.0995, + "step": 29520 + }, + { + "epoch": 80.43869209809264, + "grad_norm": 3.372971534729004, + "learning_rate": 1.9406483890123817e-06, + "loss": 0.0745, + "step": 29521 + }, + { + "epoch": 80.44141689373296, + "grad_norm": 3.321413278579712, + "learning_rate": 1.9401259802056495e-06, + "loss": 0.0567, + "step": 29522 + }, + { + "epoch": 80.4441416893733, + "grad_norm": 2.972351551055908, + "learning_rate": 1.939603634168957e-06, + "loss": 0.0472, + "step": 29523 + }, + { + "epoch": 80.44686648501363, + "grad_norm": 2.0562520027160645, + "learning_rate": 1.939081350906369e-06, + "loss": 0.0208, + "step": 29524 + }, + { + "epoch": 80.44959128065395, + "grad_norm": 2.546272039413452, + "learning_rate": 1.9385591304219585e-06, + "loss": 0.0519, + "step": 29525 + }, + { + "epoch": 80.45231607629428, + "grad_norm": 2.502002239227295, + "learning_rate": 1.93803697271979e-06, + "loss": 0.0257, + "step": 29526 + }, + { + "epoch": 80.4550408719346, + "grad_norm": 1.9413026571273804, + "learning_rate": 1.937514877803931e-06, + "loss": 0.0201, + "step": 29527 + }, + { + "epoch": 80.45776566757493, + "grad_norm": 2.404670000076294, + "learning_rate": 1.9369928456784425e-06, + "loss": 0.0417, + "step": 29528 + }, + { + "epoch": 80.46049046321527, + "grad_norm": 1.6891522407531738, + "learning_rate": 1.936470876347398e-06, + "loss": 0.1206, + "step": 29529 + }, + { + "epoch": 80.46321525885558, + "grad_norm": 2.2138748168945312, + "learning_rate": 1.935948969814858e-06, + "loss": 0.0304, + "step": 29530 + }, + { + "epoch": 80.46594005449592, + "grad_norm": 3.2485358715057373, + "learning_rate": 1.935427126084889e-06, + "loss": 0.1371, + "step": 29531 + }, + { + "epoch": 80.46866485013624, + "grad_norm": 2.471385955810547, + "learning_rate": 1.934905345161551e-06, + "loss": 0.0367, + "step": 29532 + }, + { + "epoch": 80.47138964577657, + "grad_norm": 4.403931140899658, + "learning_rate": 1.9343836270489124e-06, + "loss": 0.0605, + "step": 29533 + }, + { + "epoch": 80.47411444141689, + "grad_norm": 3.497035026550293, + "learning_rate": 1.933861971751032e-06, + "loss": 0.106, + "step": 29534 + }, + { + "epoch": 80.47683923705722, + "grad_norm": 3.98860502243042, + "learning_rate": 1.9333403792719783e-06, + "loss": 0.0593, + "step": 29535 + }, + { + "epoch": 80.47956403269755, + "grad_norm": 1.806820273399353, + "learning_rate": 1.9328188496158095e-06, + "loss": 0.0182, + "step": 29536 + }, + { + "epoch": 80.48228882833787, + "grad_norm": 2.6612436771392822, + "learning_rate": 1.9322973827865854e-06, + "loss": 0.0582, + "step": 29537 + }, + { + "epoch": 80.4850136239782, + "grad_norm": 2.6918468475341797, + "learning_rate": 1.9317759787883727e-06, + "loss": 0.0577, + "step": 29538 + }, + { + "epoch": 80.48773841961852, + "grad_norm": 2.69391131401062, + "learning_rate": 1.931254637625228e-06, + "loss": 0.0372, + "step": 29539 + }, + { + "epoch": 80.49046321525886, + "grad_norm": 3.332688093185425, + "learning_rate": 1.9307333593012134e-06, + "loss": 0.0772, + "step": 29540 + }, + { + "epoch": 80.49318801089919, + "grad_norm": 4.455597400665283, + "learning_rate": 1.9302121438203847e-06, + "loss": 0.2296, + "step": 29541 + }, + { + "epoch": 80.49591280653951, + "grad_norm": 2.459177017211914, + "learning_rate": 1.929690991186808e-06, + "loss": 0.0352, + "step": 29542 + }, + { + "epoch": 80.49863760217984, + "grad_norm": 4.751394748687744, + "learning_rate": 1.9291699014045362e-06, + "loss": 0.1556, + "step": 29543 + }, + { + "epoch": 80.50136239782016, + "grad_norm": 2.685845136642456, + "learning_rate": 1.92864887447763e-06, + "loss": 0.0608, + "step": 29544 + }, + { + "epoch": 80.50408719346049, + "grad_norm": 2.879746675491333, + "learning_rate": 1.928127910410145e-06, + "loss": 0.1232, + "step": 29545 + }, + { + "epoch": 80.50681198910081, + "grad_norm": 2.6398751735687256, + "learning_rate": 1.9276070092061414e-06, + "loss": 0.0738, + "step": 29546 + }, + { + "epoch": 80.50953678474114, + "grad_norm": 2.0282692909240723, + "learning_rate": 1.927086170869675e-06, + "loss": 0.049, + "step": 29547 + }, + { + "epoch": 80.51226158038148, + "grad_norm": 3.3353421688079834, + "learning_rate": 1.926565395404799e-06, + "loss": 0.0535, + "step": 29548 + }, + { + "epoch": 80.5149863760218, + "grad_norm": 7.86765718460083, + "learning_rate": 1.9260446828155745e-06, + "loss": 0.2399, + "step": 29549 + }, + { + "epoch": 80.51771117166213, + "grad_norm": 2.7736849784851074, + "learning_rate": 1.9255240331060543e-06, + "loss": 0.0579, + "step": 29550 + }, + { + "epoch": 80.52043596730245, + "grad_norm": 3.1279215812683105, + "learning_rate": 1.92500344628029e-06, + "loss": 0.0769, + "step": 29551 + }, + { + "epoch": 80.52316076294278, + "grad_norm": 2.62282395362854, + "learning_rate": 1.9244829223423424e-06, + "loss": 0.0527, + "step": 29552 + }, + { + "epoch": 80.52588555858311, + "grad_norm": 2.7637453079223633, + "learning_rate": 1.9239624612962593e-06, + "loss": 0.3223, + "step": 29553 + }, + { + "epoch": 80.52861035422343, + "grad_norm": 2.9348785877227783, + "learning_rate": 1.9234420631460982e-06, + "loss": 0.0361, + "step": 29554 + }, + { + "epoch": 80.53133514986376, + "grad_norm": 2.3062024116516113, + "learning_rate": 1.922921727895911e-06, + "loss": 0.0804, + "step": 29555 + }, + { + "epoch": 80.53405994550408, + "grad_norm": 2.510293960571289, + "learning_rate": 1.9224014555497493e-06, + "loss": 0.035, + "step": 29556 + }, + { + "epoch": 80.53678474114442, + "grad_norm": 3.1365272998809814, + "learning_rate": 1.921881246111662e-06, + "loss": 0.071, + "step": 29557 + }, + { + "epoch": 80.53950953678473, + "grad_norm": 1.9490344524383545, + "learning_rate": 1.9213610995857067e-06, + "loss": 0.0237, + "step": 29558 + }, + { + "epoch": 80.54223433242507, + "grad_norm": 2.332551956176758, + "learning_rate": 1.9208410159759316e-06, + "loss": 0.0429, + "step": 29559 + }, + { + "epoch": 80.5449591280654, + "grad_norm": 2.3657114505767822, + "learning_rate": 1.9203209952863866e-06, + "loss": 0.0288, + "step": 29560 + }, + { + "epoch": 80.54768392370572, + "grad_norm": 2.3163259029388428, + "learning_rate": 1.9198010375211185e-06, + "loss": 0.0274, + "step": 29561 + }, + { + "epoch": 80.55040871934605, + "grad_norm": 2.813373327255249, + "learning_rate": 1.919281142684183e-06, + "loss": 0.0843, + "step": 29562 + }, + { + "epoch": 80.55313351498637, + "grad_norm": 2.549604654312134, + "learning_rate": 1.918761310779624e-06, + "loss": 0.0838, + "step": 29563 + }, + { + "epoch": 80.5558583106267, + "grad_norm": 1.7128933668136597, + "learning_rate": 1.9182415418114943e-06, + "loss": 0.1445, + "step": 29564 + }, + { + "epoch": 80.55858310626704, + "grad_norm": 2.762568473815918, + "learning_rate": 1.917721835783836e-06, + "loss": 0.1624, + "step": 29565 + }, + { + "epoch": 80.56130790190736, + "grad_norm": 2.697061777114868, + "learning_rate": 1.9172021927007024e-06, + "loss": 0.0706, + "step": 29566 + }, + { + "epoch": 80.56403269754769, + "grad_norm": 2.739628791809082, + "learning_rate": 1.9166826125661376e-06, + "loss": 0.1294, + "step": 29567 + }, + { + "epoch": 80.566757493188, + "grad_norm": 2.1490402221679688, + "learning_rate": 1.916163095384188e-06, + "loss": 0.0579, + "step": 29568 + }, + { + "epoch": 80.56948228882834, + "grad_norm": 2.475924015045166, + "learning_rate": 1.9156436411588963e-06, + "loss": 0.1306, + "step": 29569 + }, + { + "epoch": 80.57220708446866, + "grad_norm": 3.805649518966675, + "learning_rate": 1.9151242498943155e-06, + "loss": 0.127, + "step": 29570 + }, + { + "epoch": 80.57493188010899, + "grad_norm": 2.7910525798797607, + "learning_rate": 1.9146049215944886e-06, + "loss": 0.0492, + "step": 29571 + }, + { + "epoch": 80.57765667574932, + "grad_norm": 3.0342190265655518, + "learning_rate": 1.914085656263457e-06, + "loss": 0.0756, + "step": 29572 + }, + { + "epoch": 80.58038147138964, + "grad_norm": 3.363170623779297, + "learning_rate": 1.9135664539052634e-06, + "loss": 0.1101, + "step": 29573 + }, + { + "epoch": 80.58310626702998, + "grad_norm": 2.4629461765289307, + "learning_rate": 1.913047314523957e-06, + "loss": 0.0563, + "step": 29574 + }, + { + "epoch": 80.5858310626703, + "grad_norm": 1.9890810251235962, + "learning_rate": 1.9125282381235775e-06, + "loss": 0.0379, + "step": 29575 + }, + { + "epoch": 80.58855585831063, + "grad_norm": 1.9922795295715332, + "learning_rate": 1.912009224708168e-06, + "loss": 0.0497, + "step": 29576 + }, + { + "epoch": 80.59128065395096, + "grad_norm": 1.87977933883667, + "learning_rate": 1.9114902742817675e-06, + "loss": 0.0368, + "step": 29577 + }, + { + "epoch": 80.59400544959128, + "grad_norm": 3.2104647159576416, + "learning_rate": 1.9109713868484235e-06, + "loss": 0.0456, + "step": 29578 + }, + { + "epoch": 80.59673024523161, + "grad_norm": 1.9903428554534912, + "learning_rate": 1.910452562412174e-06, + "loss": 0.0478, + "step": 29579 + }, + { + "epoch": 80.59945504087193, + "grad_norm": 2.8873534202575684, + "learning_rate": 1.9099338009770596e-06, + "loss": 0.14, + "step": 29580 + }, + { + "epoch": 80.60217983651226, + "grad_norm": 2.1759111881256104, + "learning_rate": 1.9094151025471175e-06, + "loss": 0.04, + "step": 29581 + }, + { + "epoch": 80.60490463215258, + "grad_norm": 3.4681735038757324, + "learning_rate": 1.908896467126392e-06, + "loss": 0.0684, + "step": 29582 + }, + { + "epoch": 80.60762942779292, + "grad_norm": 2.570377826690674, + "learning_rate": 1.908377894718921e-06, + "loss": 0.0733, + "step": 29583 + }, + { + "epoch": 80.61035422343325, + "grad_norm": 3.0153040885925293, + "learning_rate": 1.907859385328743e-06, + "loss": 0.1376, + "step": 29584 + }, + { + "epoch": 80.61307901907357, + "grad_norm": 4.000795841217041, + "learning_rate": 1.9073409389598929e-06, + "loss": 0.0762, + "step": 29585 + }, + { + "epoch": 80.6158038147139, + "grad_norm": 2.1445767879486084, + "learning_rate": 1.9068225556164112e-06, + "loss": 0.0305, + "step": 29586 + }, + { + "epoch": 80.61852861035422, + "grad_norm": 1.8627997636795044, + "learning_rate": 1.9063042353023375e-06, + "loss": 0.116, + "step": 29587 + }, + { + "epoch": 80.62125340599455, + "grad_norm": 2.578044891357422, + "learning_rate": 1.9057859780217058e-06, + "loss": 0.0274, + "step": 29588 + }, + { + "epoch": 80.62397820163488, + "grad_norm": 1.7357089519500732, + "learning_rate": 1.9052677837785505e-06, + "loss": 0.068, + "step": 29589 + }, + { + "epoch": 80.6267029972752, + "grad_norm": 2.2578418254852295, + "learning_rate": 1.9047496525769104e-06, + "loss": 0.0427, + "step": 29590 + }, + { + "epoch": 80.62942779291554, + "grad_norm": 2.87907338142395, + "learning_rate": 1.9042315844208203e-06, + "loss": 0.0822, + "step": 29591 + }, + { + "epoch": 80.63215258855585, + "grad_norm": 3.326517105102539, + "learning_rate": 1.9037135793143135e-06, + "loss": 0.0258, + "step": 29592 + }, + { + "epoch": 80.63487738419619, + "grad_norm": 2.6102454662323, + "learning_rate": 1.9031956372614236e-06, + "loss": 0.0653, + "step": 29593 + }, + { + "epoch": 80.6376021798365, + "grad_norm": 2.579186201095581, + "learning_rate": 1.902677758266186e-06, + "loss": 0.1855, + "step": 29594 + }, + { + "epoch": 80.64032697547684, + "grad_norm": 1.9239168167114258, + "learning_rate": 1.9021599423326353e-06, + "loss": 0.0207, + "step": 29595 + }, + { + "epoch": 80.64305177111717, + "grad_norm": 2.068316698074341, + "learning_rate": 1.9016421894648006e-06, + "loss": 0.0191, + "step": 29596 + }, + { + "epoch": 80.64577656675749, + "grad_norm": 2.4410226345062256, + "learning_rate": 1.9011244996667144e-06, + "loss": 0.1417, + "step": 29597 + }, + { + "epoch": 80.64850136239782, + "grad_norm": 2.3196847438812256, + "learning_rate": 1.900606872942413e-06, + "loss": 0.0582, + "step": 29598 + }, + { + "epoch": 80.65122615803814, + "grad_norm": 2.043778896331787, + "learning_rate": 1.9000893092959238e-06, + "loss": 0.0334, + "step": 29599 + }, + { + "epoch": 80.65395095367847, + "grad_norm": 3.3655807971954346, + "learning_rate": 1.8995718087312787e-06, + "loss": 0.1447, + "step": 29600 + }, + { + "epoch": 80.65667574931881, + "grad_norm": 2.0184550285339355, + "learning_rate": 1.8990543712525045e-06, + "loss": 0.0302, + "step": 29601 + }, + { + "epoch": 80.65940054495913, + "grad_norm": 3.035971164703369, + "learning_rate": 1.898536996863637e-06, + "loss": 0.0293, + "step": 29602 + }, + { + "epoch": 80.66212534059946, + "grad_norm": 2.2015907764434814, + "learning_rate": 1.8980196855687005e-06, + "loss": 0.0292, + "step": 29603 + }, + { + "epoch": 80.66485013623978, + "grad_norm": 3.003671884536743, + "learning_rate": 1.8975024373717277e-06, + "loss": 0.165, + "step": 29604 + }, + { + "epoch": 80.66757493188011, + "grad_norm": 2.6577353477478027, + "learning_rate": 1.8969852522767452e-06, + "loss": 0.0577, + "step": 29605 + }, + { + "epoch": 80.67029972752043, + "grad_norm": 3.1609206199645996, + "learning_rate": 1.8964681302877786e-06, + "loss": 0.0766, + "step": 29606 + }, + { + "epoch": 80.67302452316076, + "grad_norm": 2.8355610370635986, + "learning_rate": 1.8959510714088603e-06, + "loss": 0.0501, + "step": 29607 + }, + { + "epoch": 80.6757493188011, + "grad_norm": 4.325540065765381, + "learning_rate": 1.8954340756440137e-06, + "loss": 0.0815, + "step": 29608 + }, + { + "epoch": 80.67847411444141, + "grad_norm": 3.164767026901245, + "learning_rate": 1.8949171429972657e-06, + "loss": 0.0952, + "step": 29609 + }, + { + "epoch": 80.68119891008175, + "grad_norm": 3.5869052410125732, + "learning_rate": 1.8944002734726396e-06, + "loss": 0.0416, + "step": 29610 + }, + { + "epoch": 80.68392370572207, + "grad_norm": 1.9556015729904175, + "learning_rate": 1.8938834670741656e-06, + "loss": 0.026, + "step": 29611 + }, + { + "epoch": 80.6866485013624, + "grad_norm": 3.7239344120025635, + "learning_rate": 1.8933667238058672e-06, + "loss": 0.0569, + "step": 29612 + }, + { + "epoch": 80.68937329700273, + "grad_norm": 2.3650319576263428, + "learning_rate": 1.8928500436717645e-06, + "loss": 0.036, + "step": 29613 + }, + { + "epoch": 80.69209809264305, + "grad_norm": 2.493445634841919, + "learning_rate": 1.8923334266758874e-06, + "loss": 0.0907, + "step": 29614 + }, + { + "epoch": 80.69482288828338, + "grad_norm": 2.0561065673828125, + "learning_rate": 1.8918168728222564e-06, + "loss": 0.0496, + "step": 29615 + }, + { + "epoch": 80.6975476839237, + "grad_norm": 2.926267385482788, + "learning_rate": 1.8913003821148957e-06, + "loss": 0.0413, + "step": 29616 + }, + { + "epoch": 80.70027247956403, + "grad_norm": 4.192161560058594, + "learning_rate": 1.8907839545578233e-06, + "loss": 0.0425, + "step": 29617 + }, + { + "epoch": 80.70299727520435, + "grad_norm": 2.738772392272949, + "learning_rate": 1.890267590155066e-06, + "loss": 0.0775, + "step": 29618 + }, + { + "epoch": 80.70572207084469, + "grad_norm": 4.501349925994873, + "learning_rate": 1.8897512889106451e-06, + "loss": 0.1273, + "step": 29619 + }, + { + "epoch": 80.70844686648502, + "grad_norm": 3.0270581245422363, + "learning_rate": 1.8892350508285773e-06, + "loss": 0.0584, + "step": 29620 + }, + { + "epoch": 80.71117166212534, + "grad_norm": 3.082486629486084, + "learning_rate": 1.8887188759128883e-06, + "loss": 0.0452, + "step": 29621 + }, + { + "epoch": 80.71389645776567, + "grad_norm": 1.7954591512680054, + "learning_rate": 1.8882027641675927e-06, + "loss": 0.0294, + "step": 29622 + }, + { + "epoch": 80.71662125340599, + "grad_norm": 3.0222692489624023, + "learning_rate": 1.887686715596716e-06, + "loss": 0.0832, + "step": 29623 + }, + { + "epoch": 80.71934604904632, + "grad_norm": 2.030682325363159, + "learning_rate": 1.887170730204274e-06, + "loss": 0.0511, + "step": 29624 + }, + { + "epoch": 80.72207084468666, + "grad_norm": 1.996232271194458, + "learning_rate": 1.886654807994286e-06, + "loss": 0.0907, + "step": 29625 + }, + { + "epoch": 80.72479564032697, + "grad_norm": 5.397789001464844, + "learning_rate": 1.8861389489707648e-06, + "loss": 0.1492, + "step": 29626 + }, + { + "epoch": 80.7275204359673, + "grad_norm": 4.474803447723389, + "learning_rate": 1.8856231531377367e-06, + "loss": 0.041, + "step": 29627 + }, + { + "epoch": 80.73024523160763, + "grad_norm": 2.154280185699463, + "learning_rate": 1.8851074204992137e-06, + "loss": 0.0496, + "step": 29628 + }, + { + "epoch": 80.73297002724796, + "grad_norm": 2.165541887283325, + "learning_rate": 1.8845917510592126e-06, + "loss": 0.0884, + "step": 29629 + }, + { + "epoch": 80.73569482288828, + "grad_norm": 1.7544691562652588, + "learning_rate": 1.884076144821747e-06, + "loss": 0.0949, + "step": 29630 + }, + { + "epoch": 80.73841961852861, + "grad_norm": 1.7653148174285889, + "learning_rate": 1.8835606017908382e-06, + "loss": 0.0242, + "step": 29631 + }, + { + "epoch": 80.74114441416894, + "grad_norm": 2.971686363220215, + "learning_rate": 1.883045121970498e-06, + "loss": 0.0607, + "step": 29632 + }, + { + "epoch": 80.74386920980926, + "grad_norm": 2.4125564098358154, + "learning_rate": 1.8825297053647418e-06, + "loss": 0.0361, + "step": 29633 + }, + { + "epoch": 80.7465940054496, + "grad_norm": 2.2299764156341553, + "learning_rate": 1.8820143519775792e-06, + "loss": 0.0652, + "step": 29634 + }, + { + "epoch": 80.74931880108991, + "grad_norm": 3.280430555343628, + "learning_rate": 1.8814990618130313e-06, + "loss": 0.1178, + "step": 29635 + }, + { + "epoch": 80.75204359673025, + "grad_norm": 2.1842055320739746, + "learning_rate": 1.8809838348751065e-06, + "loss": 0.0427, + "step": 29636 + }, + { + "epoch": 80.75476839237058, + "grad_norm": 2.3917200565338135, + "learning_rate": 1.8804686711678167e-06, + "loss": 0.0917, + "step": 29637 + }, + { + "epoch": 80.7574931880109, + "grad_norm": 2.8943660259246826, + "learning_rate": 1.8799535706951743e-06, + "loss": 0.0653, + "step": 29638 + }, + { + "epoch": 80.76021798365123, + "grad_norm": 4.0513081550598145, + "learning_rate": 1.8794385334611953e-06, + "loss": 0.0316, + "step": 29639 + }, + { + "epoch": 80.76294277929155, + "grad_norm": 5.677994251251221, + "learning_rate": 1.8789235594698885e-06, + "loss": 0.034, + "step": 29640 + }, + { + "epoch": 80.76566757493188, + "grad_norm": 2.3507676124572754, + "learning_rate": 1.8784086487252628e-06, + "loss": 0.1498, + "step": 29641 + }, + { + "epoch": 80.7683923705722, + "grad_norm": 2.821159839630127, + "learning_rate": 1.8778938012313263e-06, + "loss": 0.1113, + "step": 29642 + }, + { + "epoch": 80.77111716621253, + "grad_norm": 2.3692619800567627, + "learning_rate": 1.8773790169920947e-06, + "loss": 0.0594, + "step": 29643 + }, + { + "epoch": 80.77384196185287, + "grad_norm": 2.7331764698028564, + "learning_rate": 1.8768642960115735e-06, + "loss": 0.0585, + "step": 29644 + }, + { + "epoch": 80.77656675749319, + "grad_norm": 3.1903886795043945, + "learning_rate": 1.8763496382937718e-06, + "loss": 0.0552, + "step": 29645 + }, + { + "epoch": 80.77929155313352, + "grad_norm": 8.227446556091309, + "learning_rate": 1.8758350438426954e-06, + "loss": 0.0899, + "step": 29646 + }, + { + "epoch": 80.78201634877384, + "grad_norm": 2.9153196811676025, + "learning_rate": 1.8753205126623564e-06, + "loss": 0.1175, + "step": 29647 + }, + { + "epoch": 80.78474114441417, + "grad_norm": 3.3126773834228516, + "learning_rate": 1.8748060447567595e-06, + "loss": 0.1439, + "step": 29648 + }, + { + "epoch": 80.7874659400545, + "grad_norm": 1.6990525722503662, + "learning_rate": 1.8742916401299128e-06, + "loss": 0.0241, + "step": 29649 + }, + { + "epoch": 80.79019073569482, + "grad_norm": 3.0038223266601562, + "learning_rate": 1.8737772987858172e-06, + "loss": 0.0768, + "step": 29650 + }, + { + "epoch": 80.79291553133515, + "grad_norm": 3.690922498703003, + "learning_rate": 1.8732630207284863e-06, + "loss": 0.0282, + "step": 29651 + }, + { + "epoch": 80.79564032697547, + "grad_norm": 2.6866910457611084, + "learning_rate": 1.8727488059619203e-06, + "loss": 0.0992, + "step": 29652 + }, + { + "epoch": 80.7983651226158, + "grad_norm": 2.986560106277466, + "learning_rate": 1.872234654490126e-06, + "loss": 0.1254, + "step": 29653 + }, + { + "epoch": 80.80108991825612, + "grad_norm": 1.9595917463302612, + "learning_rate": 1.8717205663171034e-06, + "loss": 0.0236, + "step": 29654 + }, + { + "epoch": 80.80381471389646, + "grad_norm": 2.430351734161377, + "learning_rate": 1.8712065414468595e-06, + "loss": 0.0429, + "step": 29655 + }, + { + "epoch": 80.80653950953679, + "grad_norm": 2.9290590286254883, + "learning_rate": 1.8706925798833997e-06, + "loss": 0.0515, + "step": 29656 + }, + { + "epoch": 80.80926430517711, + "grad_norm": 3.7299163341522217, + "learning_rate": 1.8701786816307255e-06, + "loss": 0.0623, + "step": 29657 + }, + { + "epoch": 80.81198910081744, + "grad_norm": 2.51239275932312, + "learning_rate": 1.8696648466928347e-06, + "loss": 0.1859, + "step": 29658 + }, + { + "epoch": 80.81471389645776, + "grad_norm": 2.1915643215179443, + "learning_rate": 1.8691510750737352e-06, + "loss": 0.0233, + "step": 29659 + }, + { + "epoch": 80.8174386920981, + "grad_norm": 2.2097456455230713, + "learning_rate": 1.8686373667774248e-06, + "loss": 0.0321, + "step": 29660 + }, + { + "epoch": 80.82016348773843, + "grad_norm": 2.278515577316284, + "learning_rate": 1.8681237218079063e-06, + "loss": 0.0328, + "step": 29661 + }, + { + "epoch": 80.82288828337875, + "grad_norm": 4.386941432952881, + "learning_rate": 1.8676101401691748e-06, + "loss": 0.103, + "step": 29662 + }, + { + "epoch": 80.82561307901908, + "grad_norm": 3.178586483001709, + "learning_rate": 1.8670966218652365e-06, + "loss": 0.114, + "step": 29663 + }, + { + "epoch": 80.8283378746594, + "grad_norm": 2.8836803436279297, + "learning_rate": 1.866583166900089e-06, + "loss": 0.0487, + "step": 29664 + }, + { + "epoch": 80.83106267029973, + "grad_norm": 2.9946720600128174, + "learning_rate": 1.866069775277729e-06, + "loss": 0.0349, + "step": 29665 + }, + { + "epoch": 80.83378746594005, + "grad_norm": 2.5141279697418213, + "learning_rate": 1.8655564470021526e-06, + "loss": 0.0285, + "step": 29666 + }, + { + "epoch": 80.83651226158038, + "grad_norm": 2.748910427093506, + "learning_rate": 1.8650431820773651e-06, + "loss": 0.0798, + "step": 29667 + }, + { + "epoch": 80.83923705722071, + "grad_norm": 2.2487642765045166, + "learning_rate": 1.864529980507358e-06, + "loss": 0.0364, + "step": 29668 + }, + { + "epoch": 80.84196185286103, + "grad_norm": 1.5930827856063843, + "learning_rate": 1.8640168422961303e-06, + "loss": 0.0229, + "step": 29669 + }, + { + "epoch": 80.84468664850137, + "grad_norm": 4.5194292068481445, + "learning_rate": 1.8635037674476752e-06, + "loss": 0.1947, + "step": 29670 + }, + { + "epoch": 80.84741144414168, + "grad_norm": 3.067448139190674, + "learning_rate": 1.8629907559659922e-06, + "loss": 0.0555, + "step": 29671 + }, + { + "epoch": 80.85013623978202, + "grad_norm": 2.2344095706939697, + "learning_rate": 1.8624778078550743e-06, + "loss": 0.0264, + "step": 29672 + }, + { + "epoch": 80.85286103542235, + "grad_norm": 2.330422878265381, + "learning_rate": 1.8619649231189186e-06, + "loss": 0.0391, + "step": 29673 + }, + { + "epoch": 80.85558583106267, + "grad_norm": 2.7653892040252686, + "learning_rate": 1.8614521017615196e-06, + "loss": 0.0508, + "step": 29674 + }, + { + "epoch": 80.858310626703, + "grad_norm": 2.0616846084594727, + "learning_rate": 1.8609393437868662e-06, + "loss": 0.1164, + "step": 29675 + }, + { + "epoch": 80.86103542234332, + "grad_norm": 2.1021788120269775, + "learning_rate": 1.8604266491989575e-06, + "loss": 0.0286, + "step": 29676 + }, + { + "epoch": 80.86376021798365, + "grad_norm": 2.714175224304199, + "learning_rate": 1.859914018001785e-06, + "loss": 0.0982, + "step": 29677 + }, + { + "epoch": 80.86648501362397, + "grad_norm": 1.7867244482040405, + "learning_rate": 1.8594014501993362e-06, + "loss": 0.0801, + "step": 29678 + }, + { + "epoch": 80.8692098092643, + "grad_norm": 2.017289876937866, + "learning_rate": 1.8588889457956106e-06, + "loss": 0.0291, + "step": 29679 + }, + { + "epoch": 80.87193460490464, + "grad_norm": 1.6092020273208618, + "learning_rate": 1.8583765047945956e-06, + "loss": 0.0186, + "step": 29680 + }, + { + "epoch": 80.87465940054496, + "grad_norm": 3.8612475395202637, + "learning_rate": 1.8578641272002818e-06, + "loss": 0.1904, + "step": 29681 + }, + { + "epoch": 80.87738419618529, + "grad_norm": 3.600154399871826, + "learning_rate": 1.857351813016659e-06, + "loss": 0.0456, + "step": 29682 + }, + { + "epoch": 80.88010899182561, + "grad_norm": 2.4364824295043945, + "learning_rate": 1.8568395622477198e-06, + "loss": 0.025, + "step": 29683 + }, + { + "epoch": 80.88283378746594, + "grad_norm": 4.23787260055542, + "learning_rate": 1.856327374897452e-06, + "loss": 0.1376, + "step": 29684 + }, + { + "epoch": 80.88555858310627, + "grad_norm": 2.548859119415283, + "learning_rate": 1.8558152509698446e-06, + "loss": 0.038, + "step": 29685 + }, + { + "epoch": 80.88828337874659, + "grad_norm": 1.9448168277740479, + "learning_rate": 1.8553031904688833e-06, + "loss": 0.0614, + "step": 29686 + }, + { + "epoch": 80.89100817438693, + "grad_norm": 3.829408884048462, + "learning_rate": 1.8547911933985607e-06, + "loss": 0.2498, + "step": 29687 + }, + { + "epoch": 80.89373297002724, + "grad_norm": 2.3729562759399414, + "learning_rate": 1.8542792597628622e-06, + "loss": 0.0553, + "step": 29688 + }, + { + "epoch": 80.89645776566758, + "grad_norm": 2.532068967819214, + "learning_rate": 1.8537673895657726e-06, + "loss": 0.0325, + "step": 29689 + }, + { + "epoch": 80.8991825613079, + "grad_norm": 2.1381380558013916, + "learning_rate": 1.853255582811283e-06, + "loss": 0.0198, + "step": 29690 + }, + { + "epoch": 80.90190735694823, + "grad_norm": 2.2383947372436523, + "learning_rate": 1.8527438395033747e-06, + "loss": 0.0384, + "step": 29691 + }, + { + "epoch": 80.90463215258856, + "grad_norm": 3.122887372970581, + "learning_rate": 1.8522321596460368e-06, + "loss": 0.0869, + "step": 29692 + }, + { + "epoch": 80.90735694822888, + "grad_norm": 3.0096633434295654, + "learning_rate": 1.8517205432432527e-06, + "loss": 0.0855, + "step": 29693 + }, + { + "epoch": 80.91008174386921, + "grad_norm": 3.814385175704956, + "learning_rate": 1.851208990299007e-06, + "loss": 0.0641, + "step": 29694 + }, + { + "epoch": 80.91280653950953, + "grad_norm": 3.931626319885254, + "learning_rate": 1.850697500817281e-06, + "loss": 0.075, + "step": 29695 + }, + { + "epoch": 80.91553133514986, + "grad_norm": 2.4536795616149902, + "learning_rate": 1.8501860748020629e-06, + "loss": 0.0468, + "step": 29696 + }, + { + "epoch": 80.9182561307902, + "grad_norm": 10.569121360778809, + "learning_rate": 1.8496747122573333e-06, + "loss": 0.0817, + "step": 29697 + }, + { + "epoch": 80.92098092643052, + "grad_norm": 2.4495747089385986, + "learning_rate": 1.8491634131870716e-06, + "loss": 0.1734, + "step": 29698 + }, + { + "epoch": 80.92370572207085, + "grad_norm": 2.783935785293579, + "learning_rate": 1.848652177595267e-06, + "loss": 0.0599, + "step": 29699 + }, + { + "epoch": 80.92643051771117, + "grad_norm": 1.924935221672058, + "learning_rate": 1.848141005485895e-06, + "loss": 0.0269, + "step": 29700 + }, + { + "epoch": 80.9291553133515, + "grad_norm": 5.172467231750488, + "learning_rate": 1.8476298968629401e-06, + "loss": 0.0405, + "step": 29701 + }, + { + "epoch": 80.93188010899182, + "grad_norm": 2.371753215789795, + "learning_rate": 1.8471188517303774e-06, + "loss": 0.0359, + "step": 29702 + }, + { + "epoch": 80.93460490463215, + "grad_norm": 2.5195109844207764, + "learning_rate": 1.846607870092194e-06, + "loss": 0.0991, + "step": 29703 + }, + { + "epoch": 80.93732970027249, + "grad_norm": 2.765890598297119, + "learning_rate": 1.8460969519523664e-06, + "loss": 0.0414, + "step": 29704 + }, + { + "epoch": 80.9400544959128, + "grad_norm": 3.039405584335327, + "learning_rate": 1.845586097314872e-06, + "loss": 0.047, + "step": 29705 + }, + { + "epoch": 80.94277929155314, + "grad_norm": 3.6830575466156006, + "learning_rate": 1.845075306183689e-06, + "loss": 0.0483, + "step": 29706 + }, + { + "epoch": 80.94550408719346, + "grad_norm": 2.1750757694244385, + "learning_rate": 1.8445645785627974e-06, + "loss": 0.1033, + "step": 29707 + }, + { + "epoch": 80.94822888283379, + "grad_norm": 3.339379072189331, + "learning_rate": 1.8440539144561763e-06, + "loss": 0.0714, + "step": 29708 + }, + { + "epoch": 80.95095367847412, + "grad_norm": 2.8890480995178223, + "learning_rate": 1.8435433138678017e-06, + "loss": 0.1083, + "step": 29709 + }, + { + "epoch": 80.95367847411444, + "grad_norm": 2.765408992767334, + "learning_rate": 1.8430327768016475e-06, + "loss": 0.0389, + "step": 29710 + }, + { + "epoch": 80.95640326975477, + "grad_norm": 2.0470902919769287, + "learning_rate": 1.84252230326169e-06, + "loss": 0.0867, + "step": 29711 + }, + { + "epoch": 80.95912806539509, + "grad_norm": 2.717745780944824, + "learning_rate": 1.8420118932519092e-06, + "loss": 0.0569, + "step": 29712 + }, + { + "epoch": 80.96185286103542, + "grad_norm": 3.666560411453247, + "learning_rate": 1.8415015467762764e-06, + "loss": 0.0859, + "step": 29713 + }, + { + "epoch": 80.96457765667574, + "grad_norm": 3.9778239727020264, + "learning_rate": 1.8409912638387684e-06, + "loss": 0.0852, + "step": 29714 + }, + { + "epoch": 80.96730245231608, + "grad_norm": 3.1109132766723633, + "learning_rate": 1.840481044443354e-06, + "loss": 0.0373, + "step": 29715 + }, + { + "epoch": 80.97002724795641, + "grad_norm": 2.45131778717041, + "learning_rate": 1.8399708885940136e-06, + "loss": 0.0559, + "step": 29716 + }, + { + "epoch": 80.97275204359673, + "grad_norm": 3.836390495300293, + "learning_rate": 1.8394607962947164e-06, + "loss": 0.0799, + "step": 29717 + }, + { + "epoch": 80.97547683923706, + "grad_norm": 2.3351268768310547, + "learning_rate": 1.8389507675494367e-06, + "loss": 0.025, + "step": 29718 + }, + { + "epoch": 80.97820163487738, + "grad_norm": 2.296884775161743, + "learning_rate": 1.8384408023621437e-06, + "loss": 0.1174, + "step": 29719 + }, + { + "epoch": 80.98092643051771, + "grad_norm": 1.9378864765167236, + "learning_rate": 1.8379309007368129e-06, + "loss": 0.1176, + "step": 29720 + }, + { + "epoch": 80.98365122615803, + "grad_norm": 2.872282028198242, + "learning_rate": 1.8374210626774137e-06, + "loss": 0.0511, + "step": 29721 + }, + { + "epoch": 80.98637602179836, + "grad_norm": 1.8208796977996826, + "learning_rate": 1.8369112881879136e-06, + "loss": 0.0693, + "step": 29722 + }, + { + "epoch": 80.9891008174387, + "grad_norm": 2.248429298400879, + "learning_rate": 1.8364015772722887e-06, + "loss": 0.0229, + "step": 29723 + }, + { + "epoch": 80.99182561307902, + "grad_norm": 4.804901123046875, + "learning_rate": 1.8358919299345024e-06, + "loss": 0.0479, + "step": 29724 + }, + { + "epoch": 80.99455040871935, + "grad_norm": 2.6181886196136475, + "learning_rate": 1.8353823461785304e-06, + "loss": 0.0536, + "step": 29725 + }, + { + "epoch": 80.99727520435967, + "grad_norm": 2.9905195236206055, + "learning_rate": 1.834872826008338e-06, + "loss": 0.0317, + "step": 29726 + }, + { + "epoch": 81.0, + "grad_norm": 2.4764912128448486, + "learning_rate": 1.8343633694278895e-06, + "loss": 0.0516, + "step": 29727 + }, + { + "epoch": 81.00272479564033, + "grad_norm": 2.7293291091918945, + "learning_rate": 1.83385397644116e-06, + "loss": 0.0323, + "step": 29728 + }, + { + "epoch": 81.00544959128065, + "grad_norm": 2.3819448947906494, + "learning_rate": 1.8333446470521122e-06, + "loss": 0.064, + "step": 29729 + }, + { + "epoch": 81.00817438692098, + "grad_norm": 3.2576510906219482, + "learning_rate": 1.8328353812647136e-06, + "loss": 0.0536, + "step": 29730 + }, + { + "epoch": 81.0108991825613, + "grad_norm": 2.521439552307129, + "learning_rate": 1.8323261790829283e-06, + "loss": 0.1308, + "step": 29731 + }, + { + "epoch": 81.01362397820164, + "grad_norm": 2.4987714290618896, + "learning_rate": 1.831817040510726e-06, + "loss": 0.0503, + "step": 29732 + }, + { + "epoch": 81.01634877384195, + "grad_norm": 2.5798354148864746, + "learning_rate": 1.8313079655520693e-06, + "loss": 0.0357, + "step": 29733 + }, + { + "epoch": 81.01907356948229, + "grad_norm": 2.3716537952423096, + "learning_rate": 1.8307989542109238e-06, + "loss": 0.1051, + "step": 29734 + }, + { + "epoch": 81.02179836512262, + "grad_norm": 2.076399564743042, + "learning_rate": 1.83029000649125e-06, + "loss": 0.0361, + "step": 29735 + }, + { + "epoch": 81.02452316076294, + "grad_norm": 1.5192015171051025, + "learning_rate": 1.8297811223970174e-06, + "loss": 0.0232, + "step": 29736 + }, + { + "epoch": 81.02724795640327, + "grad_norm": 1.9292784929275513, + "learning_rate": 1.8292723019321867e-06, + "loss": 0.0476, + "step": 29737 + }, + { + "epoch": 81.02997275204359, + "grad_norm": 2.645071268081665, + "learning_rate": 1.8287635451007202e-06, + "loss": 0.0393, + "step": 29738 + }, + { + "epoch": 81.03269754768392, + "grad_norm": 4.546024799346924, + "learning_rate": 1.8282548519065778e-06, + "loss": 0.2184, + "step": 29739 + }, + { + "epoch": 81.03542234332426, + "grad_norm": 2.8581202030181885, + "learning_rate": 1.8277462223537257e-06, + "loss": 0.0244, + "step": 29740 + }, + { + "epoch": 81.03814713896458, + "grad_norm": 1.6781800985336304, + "learning_rate": 1.8272376564461203e-06, + "loss": 0.0252, + "step": 29741 + }, + { + "epoch": 81.04087193460491, + "grad_norm": 2.3823750019073486, + "learning_rate": 1.8267291541877287e-06, + "loss": 0.0301, + "step": 29742 + }, + { + "epoch": 81.04359673024523, + "grad_norm": 2.648144483566284, + "learning_rate": 1.826220715582504e-06, + "loss": 0.148, + "step": 29743 + }, + { + "epoch": 81.04632152588556, + "grad_norm": 2.7481918334960938, + "learning_rate": 1.8257123406344125e-06, + "loss": 0.0814, + "step": 29744 + }, + { + "epoch": 81.04904632152588, + "grad_norm": 2.714812994003296, + "learning_rate": 1.8252040293474093e-06, + "loss": 0.0236, + "step": 29745 + }, + { + "epoch": 81.05177111716621, + "grad_norm": 2.4104068279266357, + "learning_rate": 1.824695781725454e-06, + "loss": 0.0238, + "step": 29746 + }, + { + "epoch": 81.05449591280654, + "grad_norm": 2.3135838508605957, + "learning_rate": 1.8241875977725032e-06, + "loss": 0.0279, + "step": 29747 + }, + { + "epoch": 81.05722070844686, + "grad_norm": 2.8281619548797607, + "learning_rate": 1.823679477492518e-06, + "loss": 0.0625, + "step": 29748 + }, + { + "epoch": 81.0599455040872, + "grad_norm": 2.4785587787628174, + "learning_rate": 1.8231714208894547e-06, + "loss": 0.2692, + "step": 29749 + }, + { + "epoch": 81.06267029972751, + "grad_norm": 2.241762161254883, + "learning_rate": 1.8226634279672684e-06, + "loss": 0.0283, + "step": 29750 + }, + { + "epoch": 81.06539509536785, + "grad_norm": 1.611305832862854, + "learning_rate": 1.822155498729914e-06, + "loss": 0.0215, + "step": 29751 + }, + { + "epoch": 81.06811989100818, + "grad_norm": 4.047661781311035, + "learning_rate": 1.8216476331813516e-06, + "loss": 0.18, + "step": 29752 + }, + { + "epoch": 81.0708446866485, + "grad_norm": 2.6989967823028564, + "learning_rate": 1.8211398313255347e-06, + "loss": 0.0994, + "step": 29753 + }, + { + "epoch": 81.07356948228883, + "grad_norm": 2.2276933193206787, + "learning_rate": 1.8206320931664168e-06, + "loss": 0.058, + "step": 29754 + }, + { + "epoch": 81.07629427792915, + "grad_norm": 2.4780147075653076, + "learning_rate": 1.8201244187079514e-06, + "loss": 0.0956, + "step": 29755 + }, + { + "epoch": 81.07901907356948, + "grad_norm": 2.6041982173919678, + "learning_rate": 1.8196168079540954e-06, + "loss": 0.1367, + "step": 29756 + }, + { + "epoch": 81.0817438692098, + "grad_norm": 2.5354366302490234, + "learning_rate": 1.8191092609088e-06, + "loss": 0.0642, + "step": 29757 + }, + { + "epoch": 81.08446866485014, + "grad_norm": 3.1977767944335938, + "learning_rate": 1.8186017775760167e-06, + "loss": 0.063, + "step": 29758 + }, + { + "epoch": 81.08719346049047, + "grad_norm": 2.9032578468322754, + "learning_rate": 1.818094357959702e-06, + "loss": 0.0409, + "step": 29759 + }, + { + "epoch": 81.08991825613079, + "grad_norm": 3.4103946685791016, + "learning_rate": 1.8175870020638032e-06, + "loss": 0.0905, + "step": 29760 + }, + { + "epoch": 81.09264305177112, + "grad_norm": 2.9289729595184326, + "learning_rate": 1.8170797098922744e-06, + "loss": 0.0762, + "step": 29761 + }, + { + "epoch": 81.09536784741144, + "grad_norm": 4.693163871765137, + "learning_rate": 1.8165724814490671e-06, + "loss": 0.0816, + "step": 29762 + }, + { + "epoch": 81.09809264305177, + "grad_norm": 2.403782844543457, + "learning_rate": 1.816065316738126e-06, + "loss": 0.0336, + "step": 29763 + }, + { + "epoch": 81.1008174386921, + "grad_norm": 2.709383964538574, + "learning_rate": 1.8155582157634077e-06, + "loss": 0.0806, + "step": 29764 + }, + { + "epoch": 81.10354223433242, + "grad_norm": 2.2318778038024902, + "learning_rate": 1.8150511785288593e-06, + "loss": 0.0926, + "step": 29765 + }, + { + "epoch": 81.10626702997276, + "grad_norm": 2.6320977210998535, + "learning_rate": 1.8145442050384287e-06, + "loss": 0.0997, + "step": 29766 + }, + { + "epoch": 81.10899182561307, + "grad_norm": 2.7063615322113037, + "learning_rate": 1.8140372952960617e-06, + "loss": 0.0531, + "step": 29767 + }, + { + "epoch": 81.11171662125341, + "grad_norm": 2.643054485321045, + "learning_rate": 1.8135304493057104e-06, + "loss": 0.1194, + "step": 29768 + }, + { + "epoch": 81.11444141689373, + "grad_norm": 1.9962857961654663, + "learning_rate": 1.813023667071322e-06, + "loss": 0.0352, + "step": 29769 + }, + { + "epoch": 81.11716621253406, + "grad_norm": 2.9487380981445312, + "learning_rate": 1.8125169485968409e-06, + "loss": 0.0857, + "step": 29770 + }, + { + "epoch": 81.11989100817439, + "grad_norm": 3.3684611320495605, + "learning_rate": 1.8120102938862115e-06, + "loss": 0.0842, + "step": 29771 + }, + { + "epoch": 81.12261580381471, + "grad_norm": 2.9693615436553955, + "learning_rate": 1.8115037029433857e-06, + "loss": 0.0575, + "step": 29772 + }, + { + "epoch": 81.12534059945504, + "grad_norm": 2.80663800239563, + "learning_rate": 1.8109971757723055e-06, + "loss": 0.0278, + "step": 29773 + }, + { + "epoch": 81.12806539509536, + "grad_norm": 16.64714241027832, + "learning_rate": 1.8104907123769155e-06, + "loss": 0.0515, + "step": 29774 + }, + { + "epoch": 81.1307901907357, + "grad_norm": 2.446871042251587, + "learning_rate": 1.8099843127611572e-06, + "loss": 0.1008, + "step": 29775 + }, + { + "epoch": 81.13351498637603, + "grad_norm": 2.202486753463745, + "learning_rate": 1.8094779769289782e-06, + "loss": 0.0224, + "step": 29776 + }, + { + "epoch": 81.13623978201635, + "grad_norm": 2.504746913909912, + "learning_rate": 1.8089717048843236e-06, + "loss": 0.1461, + "step": 29777 + }, + { + "epoch": 81.13896457765668, + "grad_norm": 4.355173587799072, + "learning_rate": 1.8084654966311333e-06, + "loss": 0.0335, + "step": 29778 + }, + { + "epoch": 81.141689373297, + "grad_norm": 3.3645434379577637, + "learning_rate": 1.8079593521733496e-06, + "loss": 0.0375, + "step": 29779 + }, + { + "epoch": 81.14441416893733, + "grad_norm": 2.8605713844299316, + "learning_rate": 1.8074532715149129e-06, + "loss": 0.0259, + "step": 29780 + }, + { + "epoch": 81.14713896457765, + "grad_norm": 5.118342876434326, + "learning_rate": 1.806947254659769e-06, + "loss": 0.0438, + "step": 29781 + }, + { + "epoch": 81.14986376021798, + "grad_norm": 2.464529275894165, + "learning_rate": 1.8064413016118566e-06, + "loss": 0.0957, + "step": 29782 + }, + { + "epoch": 81.15258855585832, + "grad_norm": 3.3721847534179688, + "learning_rate": 1.805935412375115e-06, + "loss": 0.0667, + "step": 29783 + }, + { + "epoch": 81.15531335149863, + "grad_norm": 2.146632671356201, + "learning_rate": 1.8054295869534822e-06, + "loss": 0.0327, + "step": 29784 + }, + { + "epoch": 81.15803814713897, + "grad_norm": 2.9291207790374756, + "learning_rate": 1.8049238253509027e-06, + "loss": 0.0807, + "step": 29785 + }, + { + "epoch": 81.16076294277929, + "grad_norm": 3.279160976409912, + "learning_rate": 1.8044181275713136e-06, + "loss": 0.0594, + "step": 29786 + }, + { + "epoch": 81.16348773841962, + "grad_norm": 2.5780253410339355, + "learning_rate": 1.803912493618648e-06, + "loss": 0.197, + "step": 29787 + }, + { + "epoch": 81.16621253405995, + "grad_norm": 3.292588710784912, + "learning_rate": 1.8034069234968521e-06, + "loss": 0.0959, + "step": 29788 + }, + { + "epoch": 81.16893732970027, + "grad_norm": 2.65609073638916, + "learning_rate": 1.802901417209859e-06, + "loss": 0.0677, + "step": 29789 + }, + { + "epoch": 81.1716621253406, + "grad_norm": 3.3790442943573, + "learning_rate": 1.802395974761605e-06, + "loss": 0.0349, + "step": 29790 + }, + { + "epoch": 81.17438692098092, + "grad_norm": 3.52130126953125, + "learning_rate": 1.8018905961560252e-06, + "loss": 0.2011, + "step": 29791 + }, + { + "epoch": 81.17711171662125, + "grad_norm": 2.5949528217315674, + "learning_rate": 1.8013852813970578e-06, + "loss": 0.0688, + "step": 29792 + }, + { + "epoch": 81.17983651226157, + "grad_norm": 2.531221628189087, + "learning_rate": 1.800880030488641e-06, + "loss": 0.0314, + "step": 29793 + }, + { + "epoch": 81.1825613079019, + "grad_norm": 2.031641721725464, + "learning_rate": 1.8003748434347056e-06, + "loss": 0.0306, + "step": 29794 + }, + { + "epoch": 81.18528610354224, + "grad_norm": 2.294825553894043, + "learning_rate": 1.7998697202391879e-06, + "loss": 0.0275, + "step": 29795 + }, + { + "epoch": 81.18801089918256, + "grad_norm": 2.5791168212890625, + "learning_rate": 1.7993646609060178e-06, + "loss": 0.1291, + "step": 29796 + }, + { + "epoch": 81.19073569482289, + "grad_norm": 2.418940782546997, + "learning_rate": 1.7988596654391344e-06, + "loss": 0.0325, + "step": 29797 + }, + { + "epoch": 81.19346049046321, + "grad_norm": 2.2982542514801025, + "learning_rate": 1.7983547338424679e-06, + "loss": 0.0644, + "step": 29798 + }, + { + "epoch": 81.19618528610354, + "grad_norm": 2.1509060859680176, + "learning_rate": 1.7978498661199517e-06, + "loss": 0.0413, + "step": 29799 + }, + { + "epoch": 81.19891008174388, + "grad_norm": 2.949258327484131, + "learning_rate": 1.7973450622755128e-06, + "loss": 0.0663, + "step": 29800 + }, + { + "epoch": 81.2016348773842, + "grad_norm": 3.26342511177063, + "learning_rate": 1.7968403223130903e-06, + "loss": 0.0394, + "step": 29801 + }, + { + "epoch": 81.20435967302453, + "grad_norm": 1.684457778930664, + "learning_rate": 1.79633564623661e-06, + "loss": 0.0191, + "step": 29802 + }, + { + "epoch": 81.20708446866485, + "grad_norm": 2.2108731269836426, + "learning_rate": 1.7958310340500052e-06, + "loss": 0.0283, + "step": 29803 + }, + { + "epoch": 81.20980926430518, + "grad_norm": 1.8673276901245117, + "learning_rate": 1.7953264857572007e-06, + "loss": 0.03, + "step": 29804 + }, + { + "epoch": 81.2125340599455, + "grad_norm": 2.0287740230560303, + "learning_rate": 1.794822001362132e-06, + "loss": 0.0336, + "step": 29805 + }, + { + "epoch": 81.21525885558583, + "grad_norm": 3.3488810062408447, + "learning_rate": 1.7943175808687263e-06, + "loss": 0.0333, + "step": 29806 + }, + { + "epoch": 81.21798365122616, + "grad_norm": 4.035453796386719, + "learning_rate": 1.793813224280908e-06, + "loss": 0.1081, + "step": 29807 + }, + { + "epoch": 81.22070844686648, + "grad_norm": 1.9230246543884277, + "learning_rate": 1.793308931602611e-06, + "loss": 0.0775, + "step": 29808 + }, + { + "epoch": 81.22343324250681, + "grad_norm": 2.6343846321105957, + "learning_rate": 1.7928047028377593e-06, + "loss": 0.0838, + "step": 29809 + }, + { + "epoch": 81.22615803814713, + "grad_norm": 2.7012295722961426, + "learning_rate": 1.792300537990278e-06, + "loss": 0.0493, + "step": 29810 + }, + { + "epoch": 81.22888283378747, + "grad_norm": 7.361477851867676, + "learning_rate": 1.7917964370640995e-06, + "loss": 0.0706, + "step": 29811 + }, + { + "epoch": 81.2316076294278, + "grad_norm": 3.7112202644348145, + "learning_rate": 1.7912924000631426e-06, + "loss": 0.0466, + "step": 29812 + }, + { + "epoch": 81.23433242506812, + "grad_norm": 3.7624340057373047, + "learning_rate": 1.790788426991339e-06, + "loss": 0.0584, + "step": 29813 + }, + { + "epoch": 81.23705722070845, + "grad_norm": 2.4636874198913574, + "learning_rate": 1.7902845178526108e-06, + "loss": 0.0584, + "step": 29814 + }, + { + "epoch": 81.23978201634877, + "grad_norm": 2.357530117034912, + "learning_rate": 1.7897806726508825e-06, + "loss": 0.0387, + "step": 29815 + }, + { + "epoch": 81.2425068119891, + "grad_norm": 2.0760278701782227, + "learning_rate": 1.789276891390076e-06, + "loss": 0.0282, + "step": 29816 + }, + { + "epoch": 81.24523160762942, + "grad_norm": 2.263711452484131, + "learning_rate": 1.7887731740741199e-06, + "loss": 0.115, + "step": 29817 + }, + { + "epoch": 81.24795640326975, + "grad_norm": 3.8498334884643555, + "learning_rate": 1.7882695207069333e-06, + "loss": 0.0714, + "step": 29818 + }, + { + "epoch": 81.25068119891009, + "grad_norm": 2.1670942306518555, + "learning_rate": 1.787765931292439e-06, + "loss": 0.0296, + "step": 29819 + }, + { + "epoch": 81.2534059945504, + "grad_norm": 4.979239463806152, + "learning_rate": 1.7872624058345578e-06, + "loss": 0.2006, + "step": 29820 + }, + { + "epoch": 81.25613079019074, + "grad_norm": 2.578134775161743, + "learning_rate": 1.7867589443372145e-06, + "loss": 0.1225, + "step": 29821 + }, + { + "epoch": 81.25885558583106, + "grad_norm": 2.23673939704895, + "learning_rate": 1.7862555468043286e-06, + "loss": 0.1429, + "step": 29822 + }, + { + "epoch": 81.26158038147139, + "grad_norm": 2.3067750930786133, + "learning_rate": 1.7857522132398197e-06, + "loss": 0.0632, + "step": 29823 + }, + { + "epoch": 81.26430517711172, + "grad_norm": 3.627553939819336, + "learning_rate": 1.785248943647605e-06, + "loss": 0.065, + "step": 29824 + }, + { + "epoch": 81.26702997275204, + "grad_norm": 1.98140287399292, + "learning_rate": 1.7847457380316114e-06, + "loss": 0.023, + "step": 29825 + }, + { + "epoch": 81.26975476839237, + "grad_norm": 3.2189109325408936, + "learning_rate": 1.7842425963957522e-06, + "loss": 0.168, + "step": 29826 + }, + { + "epoch": 81.2724795640327, + "grad_norm": 2.831796169281006, + "learning_rate": 1.7837395187439454e-06, + "loss": 0.0354, + "step": 29827 + }, + { + "epoch": 81.27520435967303, + "grad_norm": 2.3508572578430176, + "learning_rate": 1.7832365050801104e-06, + "loss": 0.0255, + "step": 29828 + }, + { + "epoch": 81.27792915531334, + "grad_norm": 1.9571527242660522, + "learning_rate": 1.7827335554081671e-06, + "loss": 0.1761, + "step": 29829 + }, + { + "epoch": 81.28065395095368, + "grad_norm": 3.471651792526245, + "learning_rate": 1.7822306697320313e-06, + "loss": 0.0968, + "step": 29830 + }, + { + "epoch": 81.28337874659401, + "grad_norm": 2.7563226222991943, + "learning_rate": 1.7817278480556188e-06, + "loss": 0.0277, + "step": 29831 + }, + { + "epoch": 81.28610354223433, + "grad_norm": 6.3749680519104, + "learning_rate": 1.7812250903828421e-06, + "loss": 0.0312, + "step": 29832 + }, + { + "epoch": 81.28882833787466, + "grad_norm": 2.8318443298339844, + "learning_rate": 1.7807223967176223e-06, + "loss": 0.0378, + "step": 29833 + }, + { + "epoch": 81.29155313351498, + "grad_norm": 2.431612968444824, + "learning_rate": 1.7802197670638722e-06, + "loss": 0.0307, + "step": 29834 + }, + { + "epoch": 81.29427792915531, + "grad_norm": 5.3716349601745605, + "learning_rate": 1.779717201425506e-06, + "loss": 0.0495, + "step": 29835 + }, + { + "epoch": 81.29700272479565, + "grad_norm": 2.0733096599578857, + "learning_rate": 1.7792146998064352e-06, + "loss": 0.0274, + "step": 29836 + }, + { + "epoch": 81.29972752043597, + "grad_norm": 2.359156370162964, + "learning_rate": 1.778712262210578e-06, + "loss": 0.166, + "step": 29837 + }, + { + "epoch": 81.3024523160763, + "grad_norm": 3.301111936569214, + "learning_rate": 1.7782098886418452e-06, + "loss": 0.0467, + "step": 29838 + }, + { + "epoch": 81.30517711171662, + "grad_norm": 2.5791015625, + "learning_rate": 1.77770757910415e-06, + "loss": 0.0334, + "step": 29839 + }, + { + "epoch": 81.30790190735695, + "grad_norm": 2.3258755207061768, + "learning_rate": 1.7772053336013994e-06, + "loss": 0.1319, + "step": 29840 + }, + { + "epoch": 81.31062670299727, + "grad_norm": 2.801180601119995, + "learning_rate": 1.7767031521375133e-06, + "loss": 0.0821, + "step": 29841 + }, + { + "epoch": 81.3133514986376, + "grad_norm": 3.4304990768432617, + "learning_rate": 1.7762010347163971e-06, + "loss": 0.047, + "step": 29842 + }, + { + "epoch": 81.31607629427793, + "grad_norm": 2.7437901496887207, + "learning_rate": 1.7756989813419633e-06, + "loss": 0.0402, + "step": 29843 + }, + { + "epoch": 81.31880108991825, + "grad_norm": 3.671950578689575, + "learning_rate": 1.7751969920181179e-06, + "loss": 0.0481, + "step": 29844 + }, + { + "epoch": 81.32152588555859, + "grad_norm": 3.3324074745178223, + "learning_rate": 1.774695066748774e-06, + "loss": 0.0638, + "step": 29845 + }, + { + "epoch": 81.3242506811989, + "grad_norm": 3.460700511932373, + "learning_rate": 1.774193205537843e-06, + "loss": 0.0431, + "step": 29846 + }, + { + "epoch": 81.32697547683924, + "grad_norm": 4.062001705169678, + "learning_rate": 1.7736914083892299e-06, + "loss": 0.0891, + "step": 29847 + }, + { + "epoch": 81.32970027247957, + "grad_norm": 2.143021583557129, + "learning_rate": 1.7731896753068444e-06, + "loss": 0.0907, + "step": 29848 + }, + { + "epoch": 81.33242506811989, + "grad_norm": 2.740246295928955, + "learning_rate": 1.7726880062945895e-06, + "loss": 0.038, + "step": 29849 + }, + { + "epoch": 81.33514986376022, + "grad_norm": 2.9971389770507812, + "learning_rate": 1.7721864013563784e-06, + "loss": 0.1202, + "step": 29850 + }, + { + "epoch": 81.33787465940054, + "grad_norm": 2.616865634918213, + "learning_rate": 1.7716848604961144e-06, + "loss": 0.0839, + "step": 29851 + }, + { + "epoch": 81.34059945504087, + "grad_norm": 1.8004435300827026, + "learning_rate": 1.7711833837177017e-06, + "loss": 0.0193, + "step": 29852 + }, + { + "epoch": 81.34332425068119, + "grad_norm": 2.3700060844421387, + "learning_rate": 1.7706819710250512e-06, + "loss": 0.0437, + "step": 29853 + }, + { + "epoch": 81.34604904632153, + "grad_norm": 2.3682754039764404, + "learning_rate": 1.770180622422063e-06, + "loss": 0.0686, + "step": 29854 + }, + { + "epoch": 81.34877384196186, + "grad_norm": 3.4635727405548096, + "learning_rate": 1.7696793379126442e-06, + "loss": 0.1762, + "step": 29855 + }, + { + "epoch": 81.35149863760218, + "grad_norm": 3.5942399501800537, + "learning_rate": 1.769178117500696e-06, + "loss": 0.1508, + "step": 29856 + }, + { + "epoch": 81.35422343324251, + "grad_norm": 3.25348162651062, + "learning_rate": 1.7686769611901255e-06, + "loss": 0.0376, + "step": 29857 + }, + { + "epoch": 81.35694822888283, + "grad_norm": 3.1193687915802, + "learning_rate": 1.7681758689848338e-06, + "loss": 0.0826, + "step": 29858 + }, + { + "epoch": 81.35967302452316, + "grad_norm": 2.747248888015747, + "learning_rate": 1.7676748408887235e-06, + "loss": 0.0591, + "step": 29859 + }, + { + "epoch": 81.3623978201635, + "grad_norm": 2.7811264991760254, + "learning_rate": 1.7671738769056945e-06, + "loss": 0.133, + "step": 29860 + }, + { + "epoch": 81.36512261580381, + "grad_norm": 3.5850346088409424, + "learning_rate": 1.7666729770396495e-06, + "loss": 0.0386, + "step": 29861 + }, + { + "epoch": 81.36784741144415, + "grad_norm": 1.7230792045593262, + "learning_rate": 1.7661721412944943e-06, + "loss": 0.0554, + "step": 29862 + }, + { + "epoch": 81.37057220708446, + "grad_norm": 3.7165582180023193, + "learning_rate": 1.7656713696741246e-06, + "loss": 0.0675, + "step": 29863 + }, + { + "epoch": 81.3732970027248, + "grad_norm": 2.740318536758423, + "learning_rate": 1.7651706621824405e-06, + "loss": 0.0725, + "step": 29864 + }, + { + "epoch": 81.37602179836512, + "grad_norm": 2.3790948390960693, + "learning_rate": 1.7646700188233411e-06, + "loss": 0.0211, + "step": 29865 + }, + { + "epoch": 81.37874659400545, + "grad_norm": 1.86640202999115, + "learning_rate": 1.764169439600728e-06, + "loss": 0.1383, + "step": 29866 + }, + { + "epoch": 81.38147138964578, + "grad_norm": 3.29257869720459, + "learning_rate": 1.763668924518499e-06, + "loss": 0.047, + "step": 29867 + }, + { + "epoch": 81.3841961852861, + "grad_norm": 2.2106664180755615, + "learning_rate": 1.763168473580551e-06, + "loss": 0.0818, + "step": 29868 + }, + { + "epoch": 81.38692098092643, + "grad_norm": 2.619067668914795, + "learning_rate": 1.7626680867907787e-06, + "loss": 0.0582, + "step": 29869 + }, + { + "epoch": 81.38964577656675, + "grad_norm": 3.078220844268799, + "learning_rate": 1.7621677641530855e-06, + "loss": 0.257, + "step": 29870 + }, + { + "epoch": 81.39237057220708, + "grad_norm": 3.548492670059204, + "learning_rate": 1.761667505671365e-06, + "loss": 0.0604, + "step": 29871 + }, + { + "epoch": 81.39509536784742, + "grad_norm": 2.28106427192688, + "learning_rate": 1.7611673113495098e-06, + "loss": 0.0374, + "step": 29872 + }, + { + "epoch": 81.39782016348774, + "grad_norm": 2.0537807941436768, + "learning_rate": 1.7606671811914212e-06, + "loss": 0.0179, + "step": 29873 + }, + { + "epoch": 81.40054495912807, + "grad_norm": 2.14174747467041, + "learning_rate": 1.7601671152009903e-06, + "loss": 0.0263, + "step": 29874 + }, + { + "epoch": 81.40326975476839, + "grad_norm": 3.556363582611084, + "learning_rate": 1.7596671133821142e-06, + "loss": 0.0538, + "step": 29875 + }, + { + "epoch": 81.40599455040872, + "grad_norm": 2.0083611011505127, + "learning_rate": 1.7591671757386818e-06, + "loss": 0.0298, + "step": 29876 + }, + { + "epoch": 81.40871934604904, + "grad_norm": 2.6074280738830566, + "learning_rate": 1.7586673022745936e-06, + "loss": 0.1115, + "step": 29877 + }, + { + "epoch": 81.41144414168937, + "grad_norm": 3.154125213623047, + "learning_rate": 1.7581674929937354e-06, + "loss": 0.0352, + "step": 29878 + }, + { + "epoch": 81.4141689373297, + "grad_norm": 1.8756235837936401, + "learning_rate": 1.7576677479000072e-06, + "loss": 0.0249, + "step": 29879 + }, + { + "epoch": 81.41689373297002, + "grad_norm": 2.6808886528015137, + "learning_rate": 1.7571680669972969e-06, + "loss": 0.1049, + "step": 29880 + }, + { + "epoch": 81.41961852861036, + "grad_norm": 2.7920801639556885, + "learning_rate": 1.7566684502894938e-06, + "loss": 0.0524, + "step": 29881 + }, + { + "epoch": 81.42234332425068, + "grad_norm": 2.620394706726074, + "learning_rate": 1.7561688977804946e-06, + "loss": 0.0293, + "step": 29882 + }, + { + "epoch": 81.42506811989101, + "grad_norm": 2.0136470794677734, + "learning_rate": 1.7556694094741867e-06, + "loss": 0.0302, + "step": 29883 + }, + { + "epoch": 81.42779291553134, + "grad_norm": 2.3976151943206787, + "learning_rate": 1.7551699853744587e-06, + "loss": 0.0619, + "step": 29884 + }, + { + "epoch": 81.43051771117166, + "grad_norm": 10.679306983947754, + "learning_rate": 1.7546706254852008e-06, + "loss": 0.0429, + "step": 29885 + }, + { + "epoch": 81.433242506812, + "grad_norm": 2.1830060482025146, + "learning_rate": 1.7541713298103036e-06, + "loss": 0.0413, + "step": 29886 + }, + { + "epoch": 81.43596730245231, + "grad_norm": 2.6556344032287598, + "learning_rate": 1.753672098353656e-06, + "loss": 0.064, + "step": 29887 + }, + { + "epoch": 81.43869209809264, + "grad_norm": 2.9608054161071777, + "learning_rate": 1.7531729311191436e-06, + "loss": 0.0666, + "step": 29888 + }, + { + "epoch": 81.44141689373296, + "grad_norm": 3.7339558601379395, + "learning_rate": 1.7526738281106537e-06, + "loss": 0.0741, + "step": 29889 + }, + { + "epoch": 81.4441416893733, + "grad_norm": 5.09855318069458, + "learning_rate": 1.7521747893320762e-06, + "loss": 0.0683, + "step": 29890 + }, + { + "epoch": 81.44686648501363, + "grad_norm": 2.303555965423584, + "learning_rate": 1.7516758147872958e-06, + "loss": 0.0665, + "step": 29891 + }, + { + "epoch": 81.44959128065395, + "grad_norm": 2.3130557537078857, + "learning_rate": 1.7511769044801996e-06, + "loss": 0.0345, + "step": 29892 + }, + { + "epoch": 81.45231607629428, + "grad_norm": 2.083970069885254, + "learning_rate": 1.7506780584146688e-06, + "loss": 0.0852, + "step": 29893 + }, + { + "epoch": 81.4550408719346, + "grad_norm": 3.7353780269622803, + "learning_rate": 1.7501792765945947e-06, + "loss": 0.1158, + "step": 29894 + }, + { + "epoch": 81.45776566757493, + "grad_norm": 2.5525665283203125, + "learning_rate": 1.7496805590238586e-06, + "loss": 0.0521, + "step": 29895 + }, + { + "epoch": 81.46049046321527, + "grad_norm": 3.040743589401245, + "learning_rate": 1.7491819057063419e-06, + "loss": 0.0464, + "step": 29896 + }, + { + "epoch": 81.46321525885558, + "grad_norm": 3.0327980518341064, + "learning_rate": 1.7486833166459316e-06, + "loss": 0.0427, + "step": 29897 + }, + { + "epoch": 81.46594005449592, + "grad_norm": 1.9803370237350464, + "learning_rate": 1.7481847918465133e-06, + "loss": 0.0217, + "step": 29898 + }, + { + "epoch": 81.46866485013624, + "grad_norm": 2.665926456451416, + "learning_rate": 1.7476863313119653e-06, + "loss": 0.0726, + "step": 29899 + }, + { + "epoch": 81.47138964577657, + "grad_norm": 2.0836374759674072, + "learning_rate": 1.7471879350461706e-06, + "loss": 0.0342, + "step": 29900 + }, + { + "epoch": 81.47411444141689, + "grad_norm": 2.743572950363159, + "learning_rate": 1.7466896030530078e-06, + "loss": 0.0377, + "step": 29901 + }, + { + "epoch": 81.47683923705722, + "grad_norm": 2.8299994468688965, + "learning_rate": 1.7461913353363635e-06, + "loss": 0.0573, + "step": 29902 + }, + { + "epoch": 81.47956403269755, + "grad_norm": 3.7928919792175293, + "learning_rate": 1.745693131900116e-06, + "loss": 0.0939, + "step": 29903 + }, + { + "epoch": 81.48228882833787, + "grad_norm": 2.3251705169677734, + "learning_rate": 1.745194992748145e-06, + "loss": 0.0331, + "step": 29904 + }, + { + "epoch": 81.4850136239782, + "grad_norm": 1.957998275756836, + "learning_rate": 1.7446969178843265e-06, + "loss": 0.026, + "step": 29905 + }, + { + "epoch": 81.48773841961852, + "grad_norm": 2.587820529937744, + "learning_rate": 1.7441989073125453e-06, + "loss": 0.0477, + "step": 29906 + }, + { + "epoch": 81.49046321525886, + "grad_norm": 2.38033390045166, + "learning_rate": 1.7437009610366773e-06, + "loss": 0.0337, + "step": 29907 + }, + { + "epoch": 81.49318801089919, + "grad_norm": 2.0060131549835205, + "learning_rate": 1.7432030790606003e-06, + "loss": 0.0511, + "step": 29908 + }, + { + "epoch": 81.49591280653951, + "grad_norm": 2.593278646469116, + "learning_rate": 1.742705261388189e-06, + "loss": 0.0331, + "step": 29909 + }, + { + "epoch": 81.49863760217984, + "grad_norm": 2.8909037113189697, + "learning_rate": 1.742207508023327e-06, + "loss": 0.0859, + "step": 29910 + }, + { + "epoch": 81.50136239782016, + "grad_norm": 3.4047446250915527, + "learning_rate": 1.7417098189698866e-06, + "loss": 0.0426, + "step": 29911 + }, + { + "epoch": 81.50408719346049, + "grad_norm": 3.3756182193756104, + "learning_rate": 1.741212194231744e-06, + "loss": 0.1363, + "step": 29912 + }, + { + "epoch": 81.50681198910081, + "grad_norm": 2.3397152423858643, + "learning_rate": 1.7407146338127713e-06, + "loss": 0.0369, + "step": 29913 + }, + { + "epoch": 81.50953678474114, + "grad_norm": 2.27807879447937, + "learning_rate": 1.7402171377168509e-06, + "loss": 0.0342, + "step": 29914 + }, + { + "epoch": 81.51226158038148, + "grad_norm": 1.9141989946365356, + "learning_rate": 1.7397197059478543e-06, + "loss": 0.0731, + "step": 29915 + }, + { + "epoch": 81.5149863760218, + "grad_norm": 3.7800650596618652, + "learning_rate": 1.7392223385096542e-06, + "loss": 0.059, + "step": 29916 + }, + { + "epoch": 81.51771117166213, + "grad_norm": 2.881908416748047, + "learning_rate": 1.7387250354061225e-06, + "loss": 0.035, + "step": 29917 + }, + { + "epoch": 81.52043596730245, + "grad_norm": 3.036841869354248, + "learning_rate": 1.7382277966411366e-06, + "loss": 0.0469, + "step": 29918 + }, + { + "epoch": 81.52316076294278, + "grad_norm": 2.2260324954986572, + "learning_rate": 1.7377306222185663e-06, + "loss": 0.045, + "step": 29919 + }, + { + "epoch": 81.52588555858311, + "grad_norm": 2.8261077404022217, + "learning_rate": 1.7372335121422857e-06, + "loss": 0.043, + "step": 29920 + }, + { + "epoch": 81.52861035422343, + "grad_norm": 4.075632572174072, + "learning_rate": 1.7367364664161602e-06, + "loss": 0.0724, + "step": 29921 + }, + { + "epoch": 81.53133514986376, + "grad_norm": 3.843763828277588, + "learning_rate": 1.736239485044069e-06, + "loss": 0.0865, + "step": 29922 + }, + { + "epoch": 81.53405994550408, + "grad_norm": 5.14616584777832, + "learning_rate": 1.7357425680298778e-06, + "loss": 0.0412, + "step": 29923 + }, + { + "epoch": 81.53678474114442, + "grad_norm": 2.7485291957855225, + "learning_rate": 1.7352457153774583e-06, + "loss": 0.1001, + "step": 29924 + }, + { + "epoch": 81.53950953678473, + "grad_norm": 3.3290557861328125, + "learning_rate": 1.734748927090676e-06, + "loss": 0.0421, + "step": 29925 + }, + { + "epoch": 81.54223433242507, + "grad_norm": 3.092393636703491, + "learning_rate": 1.7342522031734054e-06, + "loss": 0.0351, + "step": 29926 + }, + { + "epoch": 81.5449591280654, + "grad_norm": 2.5042364597320557, + "learning_rate": 1.7337555436295128e-06, + "loss": 0.0471, + "step": 29927 + }, + { + "epoch": 81.54768392370572, + "grad_norm": 2.964219808578491, + "learning_rate": 1.733258948462866e-06, + "loss": 0.0653, + "step": 29928 + }, + { + "epoch": 81.55040871934605, + "grad_norm": 2.377936601638794, + "learning_rate": 1.7327624176773306e-06, + "loss": 0.0304, + "step": 29929 + }, + { + "epoch": 81.55313351498637, + "grad_norm": 6.652313232421875, + "learning_rate": 1.7322659512767748e-06, + "loss": 0.1374, + "step": 29930 + }, + { + "epoch": 81.5558583106267, + "grad_norm": 3.4335744380950928, + "learning_rate": 1.7317695492650676e-06, + "loss": 0.0881, + "step": 29931 + }, + { + "epoch": 81.55858310626704, + "grad_norm": 1.9838346242904663, + "learning_rate": 1.731273211646074e-06, + "loss": 0.0295, + "step": 29932 + }, + { + "epoch": 81.56130790190736, + "grad_norm": 1.8397482633590698, + "learning_rate": 1.7307769384236584e-06, + "loss": 0.0735, + "step": 29933 + }, + { + "epoch": 81.56403269754769, + "grad_norm": 3.7043726444244385, + "learning_rate": 1.7302807296016833e-06, + "loss": 0.0695, + "step": 29934 + }, + { + "epoch": 81.566757493188, + "grad_norm": 2.511993169784546, + "learning_rate": 1.7297845851840177e-06, + "loss": 0.0996, + "step": 29935 + }, + { + "epoch": 81.56948228882834, + "grad_norm": 3.044713020324707, + "learning_rate": 1.7292885051745246e-06, + "loss": 0.1011, + "step": 29936 + }, + { + "epoch": 81.57220708446866, + "grad_norm": 1.742403268814087, + "learning_rate": 1.7287924895770624e-06, + "loss": 0.0359, + "step": 29937 + }, + { + "epoch": 81.57493188010899, + "grad_norm": 2.31221079826355, + "learning_rate": 1.7282965383955019e-06, + "loss": 0.0305, + "step": 29938 + }, + { + "epoch": 81.57765667574932, + "grad_norm": 1.7335597276687622, + "learning_rate": 1.7278006516337008e-06, + "loss": 0.0253, + "step": 29939 + }, + { + "epoch": 81.58038147138964, + "grad_norm": 2.5325331687927246, + "learning_rate": 1.727304829295523e-06, + "loss": 0.132, + "step": 29940 + }, + { + "epoch": 81.58310626702998, + "grad_norm": 3.9940176010131836, + "learning_rate": 1.7268090713848262e-06, + "loss": 0.0905, + "step": 29941 + }, + { + "epoch": 81.5858310626703, + "grad_norm": 3.1452503204345703, + "learning_rate": 1.7263133779054763e-06, + "loss": 0.0342, + "step": 29942 + }, + { + "epoch": 81.58855585831063, + "grad_norm": 3.458385705947876, + "learning_rate": 1.7258177488613316e-06, + "loss": 0.0243, + "step": 29943 + }, + { + "epoch": 81.59128065395096, + "grad_norm": 2.0628957748413086, + "learning_rate": 1.7253221842562518e-06, + "loss": 0.0232, + "step": 29944 + }, + { + "epoch": 81.59400544959128, + "grad_norm": 2.961764097213745, + "learning_rate": 1.7248266840940941e-06, + "loss": 0.0457, + "step": 29945 + }, + { + "epoch": 81.59673024523161, + "grad_norm": 2.7390084266662598, + "learning_rate": 1.7243312483787222e-06, + "loss": 0.044, + "step": 29946 + }, + { + "epoch": 81.59945504087193, + "grad_norm": 1.9267858266830444, + "learning_rate": 1.7238358771139896e-06, + "loss": 0.0211, + "step": 29947 + }, + { + "epoch": 81.60217983651226, + "grad_norm": 1.6273704767227173, + "learning_rate": 1.7233405703037599e-06, + "loss": 0.0186, + "step": 29948 + }, + { + "epoch": 81.60490463215258, + "grad_norm": 2.7950947284698486, + "learning_rate": 1.7228453279518863e-06, + "loss": 0.085, + "step": 29949 + }, + { + "epoch": 81.60762942779292, + "grad_norm": 3.9736552238464355, + "learning_rate": 1.7223501500622252e-06, + "loss": 0.1084, + "step": 29950 + }, + { + "epoch": 81.61035422343325, + "grad_norm": 3.1905932426452637, + "learning_rate": 1.7218550366386378e-06, + "loss": 0.0843, + "step": 29951 + }, + { + "epoch": 81.61307901907357, + "grad_norm": 2.498032569885254, + "learning_rate": 1.7213599876849762e-06, + "loss": 0.045, + "step": 29952 + }, + { + "epoch": 81.6158038147139, + "grad_norm": 3.981534242630005, + "learning_rate": 1.7208650032050966e-06, + "loss": 0.0526, + "step": 29953 + }, + { + "epoch": 81.61852861035422, + "grad_norm": 2.571485996246338, + "learning_rate": 1.7203700832028513e-06, + "loss": 0.0667, + "step": 29954 + }, + { + "epoch": 81.62125340599455, + "grad_norm": 3.0207929611206055, + "learning_rate": 1.7198752276821007e-06, + "loss": 0.0285, + "step": 29955 + }, + { + "epoch": 81.62397820163488, + "grad_norm": 5.051114082336426, + "learning_rate": 1.7193804366466948e-06, + "loss": 0.1077, + "step": 29956 + }, + { + "epoch": 81.6267029972752, + "grad_norm": 2.274768352508545, + "learning_rate": 1.7188857101004873e-06, + "loss": 0.0813, + "step": 29957 + }, + { + "epoch": 81.62942779291554, + "grad_norm": 2.348160982131958, + "learning_rate": 1.7183910480473287e-06, + "loss": 0.1317, + "step": 29958 + }, + { + "epoch": 81.63215258855585, + "grad_norm": 1.8370074033737183, + "learning_rate": 1.7178964504910766e-06, + "loss": 0.0225, + "step": 29959 + }, + { + "epoch": 81.63487738419619, + "grad_norm": 2.805293560028076, + "learning_rate": 1.7174019174355805e-06, + "loss": 0.0744, + "step": 29960 + }, + { + "epoch": 81.6376021798365, + "grad_norm": 2.7617228031158447, + "learning_rate": 1.7169074488846905e-06, + "loss": 0.0433, + "step": 29961 + }, + { + "epoch": 81.64032697547684, + "grad_norm": 2.7769405841827393, + "learning_rate": 1.716413044842259e-06, + "loss": 0.0554, + "step": 29962 + }, + { + "epoch": 81.64305177111717, + "grad_norm": 3.071134328842163, + "learning_rate": 1.7159187053121373e-06, + "loss": 0.0972, + "step": 29963 + }, + { + "epoch": 81.64577656675749, + "grad_norm": 2.6598658561706543, + "learning_rate": 1.7154244302981715e-06, + "loss": 0.081, + "step": 29964 + }, + { + "epoch": 81.64850136239782, + "grad_norm": 3.348020315170288, + "learning_rate": 1.7149302198042162e-06, + "loss": 0.0742, + "step": 29965 + }, + { + "epoch": 81.65122615803814, + "grad_norm": 2.5943949222564697, + "learning_rate": 1.7144360738341148e-06, + "loss": 0.1429, + "step": 29966 + }, + { + "epoch": 81.65395095367847, + "grad_norm": 3.244645118713379, + "learning_rate": 1.713941992391721e-06, + "loss": 0.0366, + "step": 29967 + }, + { + "epoch": 81.65667574931881, + "grad_norm": 3.5837454795837402, + "learning_rate": 1.7134479754808808e-06, + "loss": 0.0822, + "step": 29968 + }, + { + "epoch": 81.65940054495913, + "grad_norm": 2.711371421813965, + "learning_rate": 1.712954023105441e-06, + "loss": 0.0778, + "step": 29969 + }, + { + "epoch": 81.66212534059946, + "grad_norm": 3.1979498863220215, + "learning_rate": 1.712460135269246e-06, + "loss": 0.0403, + "step": 29970 + }, + { + "epoch": 81.66485013623978, + "grad_norm": 2.8670384883880615, + "learning_rate": 1.7119663119761476e-06, + "loss": 0.0244, + "step": 29971 + }, + { + "epoch": 81.66757493188011, + "grad_norm": 2.829710006713867, + "learning_rate": 1.711472553229988e-06, + "loss": 0.0542, + "step": 29972 + }, + { + "epoch": 81.67029972752043, + "grad_norm": 2.1916730403900146, + "learning_rate": 1.7109788590346132e-06, + "loss": 0.0261, + "step": 29973 + }, + { + "epoch": 81.67302452316076, + "grad_norm": 3.1586687564849854, + "learning_rate": 1.7104852293938668e-06, + "loss": 0.0513, + "step": 29974 + }, + { + "epoch": 81.6757493188011, + "grad_norm": 2.4942362308502197, + "learning_rate": 1.7099916643115965e-06, + "loss": 0.1349, + "step": 29975 + }, + { + "epoch": 81.67847411444141, + "grad_norm": 2.431182622909546, + "learning_rate": 1.709498163791644e-06, + "loss": 0.0737, + "step": 29976 + }, + { + "epoch": 81.68119891008175, + "grad_norm": 2.157503843307495, + "learning_rate": 1.709004727837854e-06, + "loss": 0.0685, + "step": 29977 + }, + { + "epoch": 81.68392370572207, + "grad_norm": 3.029843330383301, + "learning_rate": 1.7085113564540657e-06, + "loss": 0.2559, + "step": 29978 + }, + { + "epoch": 81.6866485013624, + "grad_norm": 3.3971712589263916, + "learning_rate": 1.7080180496441257e-06, + "loss": 0.027, + "step": 29979 + }, + { + "epoch": 81.68937329700273, + "grad_norm": 3.483119487762451, + "learning_rate": 1.7075248074118745e-06, + "loss": 0.0348, + "step": 29980 + }, + { + "epoch": 81.69209809264305, + "grad_norm": 3.3105521202087402, + "learning_rate": 1.7070316297611512e-06, + "loss": 0.0393, + "step": 29981 + }, + { + "epoch": 81.69482288828338, + "grad_norm": 2.3459017276763916, + "learning_rate": 1.7065385166957982e-06, + "loss": 0.0441, + "step": 29982 + }, + { + "epoch": 81.6975476839237, + "grad_norm": 2.717716693878174, + "learning_rate": 1.7060454682196592e-06, + "loss": 0.0672, + "step": 29983 + }, + { + "epoch": 81.70027247956403, + "grad_norm": 3.3285694122314453, + "learning_rate": 1.7055524843365711e-06, + "loss": 0.0441, + "step": 29984 + }, + { + "epoch": 81.70299727520435, + "grad_norm": 2.250732183456421, + "learning_rate": 1.7050595650503732e-06, + "loss": 0.15, + "step": 29985 + }, + { + "epoch": 81.70572207084469, + "grad_norm": 4.812022686004639, + "learning_rate": 1.7045667103649021e-06, + "loss": 0.053, + "step": 29986 + }, + { + "epoch": 81.70844686648502, + "grad_norm": 3.1134819984436035, + "learning_rate": 1.7040739202840006e-06, + "loss": 0.2067, + "step": 29987 + }, + { + "epoch": 81.71117166212534, + "grad_norm": 2.6714956760406494, + "learning_rate": 1.7035811948115044e-06, + "loss": 0.0581, + "step": 29988 + }, + { + "epoch": 81.71389645776567, + "grad_norm": 2.735435962677002, + "learning_rate": 1.7030885339512505e-06, + "loss": 0.0703, + "step": 29989 + }, + { + "epoch": 81.71662125340599, + "grad_norm": 3.5400795936584473, + "learning_rate": 1.7025959377070745e-06, + "loss": 0.0434, + "step": 29990 + }, + { + "epoch": 81.71934604904632, + "grad_norm": 3.131110906600952, + "learning_rate": 1.7021034060828157e-06, + "loss": 0.0251, + "step": 29991 + }, + { + "epoch": 81.72207084468666, + "grad_norm": 2.1790151596069336, + "learning_rate": 1.70161093908231e-06, + "loss": 0.1077, + "step": 29992 + }, + { + "epoch": 81.72479564032697, + "grad_norm": 2.450204849243164, + "learning_rate": 1.7011185367093897e-06, + "loss": 0.087, + "step": 29993 + }, + { + "epoch": 81.7275204359673, + "grad_norm": 4.017487049102783, + "learning_rate": 1.7006261989678895e-06, + "loss": 0.062, + "step": 29994 + }, + { + "epoch": 81.73024523160763, + "grad_norm": 2.6964058876037598, + "learning_rate": 1.7001339258616478e-06, + "loss": 0.0718, + "step": 29995 + }, + { + "epoch": 81.73297002724796, + "grad_norm": 2.3090856075286865, + "learning_rate": 1.6996417173944957e-06, + "loss": 0.0529, + "step": 29996 + }, + { + "epoch": 81.73569482288828, + "grad_norm": 2.345402956008911, + "learning_rate": 1.6991495735702667e-06, + "loss": 0.1334, + "step": 29997 + }, + { + "epoch": 81.73841961852861, + "grad_norm": 2.830742835998535, + "learning_rate": 1.6986574943927913e-06, + "loss": 0.0771, + "step": 29998 + }, + { + "epoch": 81.74114441416894, + "grad_norm": 1.844018578529358, + "learning_rate": 1.6981654798659041e-06, + "loss": 0.0328, + "step": 29999 + }, + { + "epoch": 81.74386920980926, + "grad_norm": 4.724454402923584, + "learning_rate": 1.69767352999344e-06, + "loss": 0.0495, + "step": 30000 + }, + { + "epoch": 81.7465940054496, + "grad_norm": 3.6605615615844727, + "learning_rate": 1.6971816447792266e-06, + "loss": 0.1277, + "step": 30001 + }, + { + "epoch": 81.74931880108991, + "grad_norm": 2.996783494949341, + "learning_rate": 1.6966898242270935e-06, + "loss": 0.0268, + "step": 30002 + }, + { + "epoch": 81.75204359673025, + "grad_norm": 2.80468487739563, + "learning_rate": 1.6961980683408742e-06, + "loss": 0.0672, + "step": 30003 + }, + { + "epoch": 81.75476839237058, + "grad_norm": 2.24398136138916, + "learning_rate": 1.6957063771243977e-06, + "loss": 0.0511, + "step": 30004 + }, + { + "epoch": 81.7574931880109, + "grad_norm": 2.3950204849243164, + "learning_rate": 1.695214750581493e-06, + "loss": 0.032, + "step": 30005 + }, + { + "epoch": 81.76021798365123, + "grad_norm": 2.247523307800293, + "learning_rate": 1.6947231887159854e-06, + "loss": 0.0359, + "step": 30006 + }, + { + "epoch": 81.76294277929155, + "grad_norm": 2.835435628890991, + "learning_rate": 1.6942316915317091e-06, + "loss": 0.1541, + "step": 30007 + }, + { + "epoch": 81.76566757493188, + "grad_norm": 2.9872546195983887, + "learning_rate": 1.6937402590324892e-06, + "loss": 0.0295, + "step": 30008 + }, + { + "epoch": 81.7683923705722, + "grad_norm": 3.174426317214966, + "learning_rate": 1.6932488912221523e-06, + "loss": 0.0427, + "step": 30009 + }, + { + "epoch": 81.77111716621253, + "grad_norm": 3.640789747238159, + "learning_rate": 1.6927575881045243e-06, + "loss": 0.0435, + "step": 30010 + }, + { + "epoch": 81.77384196185287, + "grad_norm": 3.952859401702881, + "learning_rate": 1.6922663496834346e-06, + "loss": 0.1197, + "step": 30011 + }, + { + "epoch": 81.77656675749319, + "grad_norm": 2.8318142890930176, + "learning_rate": 1.6917751759627066e-06, + "loss": 0.1828, + "step": 30012 + }, + { + "epoch": 81.77929155313352, + "grad_norm": 2.7179439067840576, + "learning_rate": 1.6912840669461672e-06, + "loss": 0.0764, + "step": 30013 + }, + { + "epoch": 81.78201634877384, + "grad_norm": 3.1840264797210693, + "learning_rate": 1.6907930226376367e-06, + "loss": 0.1202, + "step": 30014 + }, + { + "epoch": 81.78474114441417, + "grad_norm": 2.3267662525177, + "learning_rate": 1.6903020430409456e-06, + "loss": 0.0383, + "step": 30015 + }, + { + "epoch": 81.7874659400545, + "grad_norm": 4.1154561042785645, + "learning_rate": 1.6898111281599129e-06, + "loss": 0.0715, + "step": 30016 + }, + { + "epoch": 81.79019073569482, + "grad_norm": 3.4539682865142822, + "learning_rate": 1.6893202779983654e-06, + "loss": 0.0504, + "step": 30017 + }, + { + "epoch": 81.79291553133515, + "grad_norm": 3.567556619644165, + "learning_rate": 1.6888294925601235e-06, + "loss": 0.0273, + "step": 30018 + }, + { + "epoch": 81.79564032697547, + "grad_norm": 3.3005082607269287, + "learning_rate": 1.6883387718490086e-06, + "loss": 0.2091, + "step": 30019 + }, + { + "epoch": 81.7983651226158, + "grad_norm": 2.836658000946045, + "learning_rate": 1.6878481158688454e-06, + "loss": 0.1856, + "step": 30020 + }, + { + "epoch": 81.80108991825612, + "grad_norm": 1.7724984884262085, + "learning_rate": 1.6873575246234542e-06, + "loss": 0.038, + "step": 30021 + }, + { + "epoch": 81.80381471389646, + "grad_norm": 2.244910717010498, + "learning_rate": 1.6868669981166553e-06, + "loss": 0.1502, + "step": 30022 + }, + { + "epoch": 81.80653950953679, + "grad_norm": 2.91497540473938, + "learning_rate": 1.6863765363522654e-06, + "loss": 0.0359, + "step": 30023 + }, + { + "epoch": 81.80926430517711, + "grad_norm": 2.6984496116638184, + "learning_rate": 1.685886139334111e-06, + "loss": 0.0374, + "step": 30024 + }, + { + "epoch": 81.81198910081744, + "grad_norm": 1.5971429347991943, + "learning_rate": 1.685395807066007e-06, + "loss": 0.0205, + "step": 30025 + }, + { + "epoch": 81.81471389645776, + "grad_norm": 2.5110671520233154, + "learning_rate": 1.68490553955177e-06, + "loss": 0.1074, + "step": 30026 + }, + { + "epoch": 81.8174386920981, + "grad_norm": 2.5040781497955322, + "learning_rate": 1.6844153367952242e-06, + "loss": 0.0366, + "step": 30027 + }, + { + "epoch": 81.82016348773843, + "grad_norm": 2.7937262058258057, + "learning_rate": 1.6839251988001838e-06, + "loss": 0.0691, + "step": 30028 + }, + { + "epoch": 81.82288828337875, + "grad_norm": 2.183349370956421, + "learning_rate": 1.6834351255704673e-06, + "loss": 0.0204, + "step": 30029 + }, + { + "epoch": 81.82561307901908, + "grad_norm": 5.8651299476623535, + "learning_rate": 1.6829451171098865e-06, + "loss": 0.1189, + "step": 30030 + }, + { + "epoch": 81.8283378746594, + "grad_norm": 2.891397476196289, + "learning_rate": 1.6824551734222649e-06, + "loss": 0.1082, + "step": 30031 + }, + { + "epoch": 81.83106267029973, + "grad_norm": 2.7424800395965576, + "learning_rate": 1.681965294511414e-06, + "loss": 0.0313, + "step": 30032 + }, + { + "epoch": 81.83378746594005, + "grad_norm": 2.4093427658081055, + "learning_rate": 1.6814754803811474e-06, + "loss": 0.1106, + "step": 30033 + }, + { + "epoch": 81.83651226158038, + "grad_norm": 2.4709415435791016, + "learning_rate": 1.6809857310352852e-06, + "loss": 0.025, + "step": 30034 + }, + { + "epoch": 81.83923705722071, + "grad_norm": 1.8941694498062134, + "learning_rate": 1.6804960464776344e-06, + "loss": 0.0174, + "step": 30035 + }, + { + "epoch": 81.84196185286103, + "grad_norm": 2.468430280685425, + "learning_rate": 1.6800064267120163e-06, + "loss": 0.091, + "step": 30036 + }, + { + "epoch": 81.84468664850137, + "grad_norm": 1.7741538286209106, + "learning_rate": 1.6795168717422404e-06, + "loss": 0.0239, + "step": 30037 + }, + { + "epoch": 81.84741144414168, + "grad_norm": 1.6462080478668213, + "learning_rate": 1.6790273815721191e-06, + "loss": 0.0177, + "step": 30038 + }, + { + "epoch": 81.85013623978202, + "grad_norm": 2.0248351097106934, + "learning_rate": 1.6785379562054615e-06, + "loss": 0.052, + "step": 30039 + }, + { + "epoch": 81.85286103542235, + "grad_norm": 4.469536781311035, + "learning_rate": 1.6780485956460857e-06, + "loss": 0.0991, + "step": 30040 + }, + { + "epoch": 81.85558583106267, + "grad_norm": 3.5721821784973145, + "learning_rate": 1.6775592998977995e-06, + "loss": 0.1362, + "step": 30041 + }, + { + "epoch": 81.858310626703, + "grad_norm": 2.6830410957336426, + "learning_rate": 1.6770700689644138e-06, + "loss": 0.1015, + "step": 30042 + }, + { + "epoch": 81.86103542234332, + "grad_norm": 2.327113389968872, + "learning_rate": 1.676580902849736e-06, + "loss": 0.0263, + "step": 30043 + }, + { + "epoch": 81.86376021798365, + "grad_norm": 2.0420827865600586, + "learning_rate": 1.67609180155758e-06, + "loss": 0.1379, + "step": 30044 + }, + { + "epoch": 81.86648501362397, + "grad_norm": 3.5153493881225586, + "learning_rate": 1.6756027650917539e-06, + "loss": 0.0818, + "step": 30045 + }, + { + "epoch": 81.8692098092643, + "grad_norm": 2.7035679817199707, + "learning_rate": 1.6751137934560635e-06, + "loss": 0.0357, + "step": 30046 + }, + { + "epoch": 81.87193460490464, + "grad_norm": 3.255575180053711, + "learning_rate": 1.6746248866543201e-06, + "loss": 0.0938, + "step": 30047 + }, + { + "epoch": 81.87465940054496, + "grad_norm": 2.4730582237243652, + "learning_rate": 1.6741360446903309e-06, + "loss": 0.1371, + "step": 30048 + }, + { + "epoch": 81.87738419618529, + "grad_norm": 2.590402841567993, + "learning_rate": 1.6736472675679028e-06, + "loss": 0.1255, + "step": 30049 + }, + { + "epoch": 81.88010899182561, + "grad_norm": 2.0248920917510986, + "learning_rate": 1.6731585552908381e-06, + "loss": 0.0314, + "step": 30050 + }, + { + "epoch": 81.88283378746594, + "grad_norm": 2.2059524059295654, + "learning_rate": 1.672669907862947e-06, + "loss": 0.039, + "step": 30051 + }, + { + "epoch": 81.88555858310627, + "grad_norm": 2.7759554386138916, + "learning_rate": 1.672181325288037e-06, + "loss": 0.0268, + "step": 30052 + }, + { + "epoch": 81.88828337874659, + "grad_norm": 2.258518934249878, + "learning_rate": 1.6716928075699112e-06, + "loss": 0.0287, + "step": 30053 + }, + { + "epoch": 81.89100817438693, + "grad_norm": 4.108890533447266, + "learning_rate": 1.6712043547123735e-06, + "loss": 0.1903, + "step": 30054 + }, + { + "epoch": 81.89373297002724, + "grad_norm": 2.274536609649658, + "learning_rate": 1.6707159667192263e-06, + "loss": 0.0939, + "step": 30055 + }, + { + "epoch": 81.89645776566758, + "grad_norm": 2.4938838481903076, + "learning_rate": 1.6702276435942776e-06, + "loss": 0.0664, + "step": 30056 + }, + { + "epoch": 81.8991825613079, + "grad_norm": 4.16168737411499, + "learning_rate": 1.6697393853413269e-06, + "loss": 0.0636, + "step": 30057 + }, + { + "epoch": 81.90190735694823, + "grad_norm": 2.1645264625549316, + "learning_rate": 1.6692511919641786e-06, + "loss": 0.0273, + "step": 30058 + }, + { + "epoch": 81.90463215258856, + "grad_norm": 2.435659885406494, + "learning_rate": 1.6687630634666308e-06, + "loss": 0.028, + "step": 30059 + }, + { + "epoch": 81.90735694822888, + "grad_norm": 2.16802978515625, + "learning_rate": 1.6682749998524917e-06, + "loss": 0.0704, + "step": 30060 + }, + { + "epoch": 81.91008174386921, + "grad_norm": 3.9329493045806885, + "learning_rate": 1.667787001125557e-06, + "loss": 0.0345, + "step": 30061 + }, + { + "epoch": 81.91280653950953, + "grad_norm": 2.289764642715454, + "learning_rate": 1.6672990672896304e-06, + "loss": 0.0725, + "step": 30062 + }, + { + "epoch": 81.91553133514986, + "grad_norm": 2.794121265411377, + "learning_rate": 1.666811198348508e-06, + "loss": 0.1162, + "step": 30063 + }, + { + "epoch": 81.9182561307902, + "grad_norm": 2.8760757446289062, + "learning_rate": 1.6663233943059932e-06, + "loss": 0.0466, + "step": 30064 + }, + { + "epoch": 81.92098092643052, + "grad_norm": 2.378352403640747, + "learning_rate": 1.6658356551658838e-06, + "loss": 0.0318, + "step": 30065 + }, + { + "epoch": 81.92370572207085, + "grad_norm": 1.9247372150421143, + "learning_rate": 1.6653479809319795e-06, + "loss": 0.0197, + "step": 30066 + }, + { + "epoch": 81.92643051771117, + "grad_norm": 2.9816741943359375, + "learning_rate": 1.6648603716080725e-06, + "loss": 0.0324, + "step": 30067 + }, + { + "epoch": 81.9291553133515, + "grad_norm": 3.170616626739502, + "learning_rate": 1.6643728271979665e-06, + "loss": 0.0464, + "step": 30068 + }, + { + "epoch": 81.93188010899182, + "grad_norm": 2.9416186809539795, + "learning_rate": 1.6638853477054573e-06, + "loss": 0.0441, + "step": 30069 + }, + { + "epoch": 81.93460490463215, + "grad_norm": 2.3222405910491943, + "learning_rate": 1.663397933134342e-06, + "loss": 0.1783, + "step": 30070 + }, + { + "epoch": 81.93732970027249, + "grad_norm": 2.681143283843994, + "learning_rate": 1.6629105834884119e-06, + "loss": 0.0392, + "step": 30071 + }, + { + "epoch": 81.9400544959128, + "grad_norm": 3.0393142700195312, + "learning_rate": 1.6624232987714695e-06, + "loss": 0.0428, + "step": 30072 + }, + { + "epoch": 81.94277929155314, + "grad_norm": 2.3829312324523926, + "learning_rate": 1.6619360789873051e-06, + "loss": 0.1214, + "step": 30073 + }, + { + "epoch": 81.94550408719346, + "grad_norm": 1.8362236022949219, + "learning_rate": 1.6614489241397148e-06, + "loss": 0.0311, + "step": 30074 + }, + { + "epoch": 81.94822888283379, + "grad_norm": 2.6642162799835205, + "learning_rate": 1.6609618342324884e-06, + "loss": 0.0326, + "step": 30075 + }, + { + "epoch": 81.95095367847412, + "grad_norm": 2.634880542755127, + "learning_rate": 1.6604748092694268e-06, + "loss": 0.1138, + "step": 30076 + }, + { + "epoch": 81.95367847411444, + "grad_norm": 2.1546363830566406, + "learning_rate": 1.6599878492543175e-06, + "loss": 0.0406, + "step": 30077 + }, + { + "epoch": 81.95640326975477, + "grad_norm": 1.9578328132629395, + "learning_rate": 1.6595009541909558e-06, + "loss": 0.0404, + "step": 30078 + }, + { + "epoch": 81.95912806539509, + "grad_norm": 1.6919559240341187, + "learning_rate": 1.6590141240831281e-06, + "loss": 0.0204, + "step": 30079 + }, + { + "epoch": 81.96185286103542, + "grad_norm": 3.3523151874542236, + "learning_rate": 1.658527358934634e-06, + "loss": 0.0442, + "step": 30080 + }, + { + "epoch": 81.96457765667574, + "grad_norm": 2.374912738800049, + "learning_rate": 1.6580406587492592e-06, + "loss": 0.0308, + "step": 30081 + }, + { + "epoch": 81.96730245231608, + "grad_norm": 2.683181047439575, + "learning_rate": 1.6575540235307964e-06, + "loss": 0.0939, + "step": 30082 + }, + { + "epoch": 81.97002724795641, + "grad_norm": 2.0993354320526123, + "learning_rate": 1.6570674532830312e-06, + "loss": 0.118, + "step": 30083 + }, + { + "epoch": 81.97275204359673, + "grad_norm": 2.8864526748657227, + "learning_rate": 1.6565809480097583e-06, + "loss": 0.2046, + "step": 30084 + }, + { + "epoch": 81.97547683923706, + "grad_norm": 3.024050712585449, + "learning_rate": 1.6560945077147628e-06, + "loss": 0.0806, + "step": 30085 + }, + { + "epoch": 81.97820163487738, + "grad_norm": 1.5702760219573975, + "learning_rate": 1.655608132401837e-06, + "loss": 0.028, + "step": 30086 + }, + { + "epoch": 81.98092643051771, + "grad_norm": 3.0154566764831543, + "learning_rate": 1.6551218220747634e-06, + "loss": 0.0572, + "step": 30087 + }, + { + "epoch": 81.98365122615803, + "grad_norm": 1.8100252151489258, + "learning_rate": 1.6546355767373357e-06, + "loss": 0.0587, + "step": 30088 + }, + { + "epoch": 81.98637602179836, + "grad_norm": 2.5257043838500977, + "learning_rate": 1.6541493963933375e-06, + "loss": 0.0676, + "step": 30089 + }, + { + "epoch": 81.9891008174387, + "grad_norm": 2.980360984802246, + "learning_rate": 1.6536632810465547e-06, + "loss": 0.0469, + "step": 30090 + }, + { + "epoch": 81.99182561307902, + "grad_norm": 2.4827728271484375, + "learning_rate": 1.653177230700771e-06, + "loss": 0.0408, + "step": 30091 + }, + { + "epoch": 81.99455040871935, + "grad_norm": 2.323294162750244, + "learning_rate": 1.6526912453597776e-06, + "loss": 0.1011, + "step": 30092 + }, + { + "epoch": 81.99727520435967, + "grad_norm": 2.739640951156616, + "learning_rate": 1.6522053250273551e-06, + "loss": 0.0432, + "step": 30093 + }, + { + "epoch": 82.0, + "grad_norm": 3.3195836544036865, + "learning_rate": 1.6517194697072903e-06, + "loss": 0.0561, + "step": 30094 + }, + { + "epoch": 82.00272479564033, + "grad_norm": 2.452608823776245, + "learning_rate": 1.6512336794033622e-06, + "loss": 0.0643, + "step": 30095 + }, + { + "epoch": 82.00544959128065, + "grad_norm": 4.400585651397705, + "learning_rate": 1.6507479541193595e-06, + "loss": 0.0629, + "step": 30096 + }, + { + "epoch": 82.00817438692098, + "grad_norm": 2.563040256500244, + "learning_rate": 1.650262293859064e-06, + "loss": 0.1783, + "step": 30097 + }, + { + "epoch": 82.0108991825613, + "grad_norm": 2.6949498653411865, + "learning_rate": 1.6497766986262564e-06, + "loss": 0.0358, + "step": 30098 + }, + { + "epoch": 82.01362397820164, + "grad_norm": 5.2082695960998535, + "learning_rate": 1.6492911684247171e-06, + "loss": 0.2074, + "step": 30099 + }, + { + "epoch": 82.01634877384195, + "grad_norm": 2.20147705078125, + "learning_rate": 1.6488057032582316e-06, + "loss": 0.0349, + "step": 30100 + }, + { + "epoch": 82.01907356948229, + "grad_norm": 2.8832318782806396, + "learning_rate": 1.6483203031305784e-06, + "loss": 0.0414, + "step": 30101 + }, + { + "epoch": 82.02179836512262, + "grad_norm": 2.864335060119629, + "learning_rate": 1.6478349680455351e-06, + "loss": 0.0621, + "step": 30102 + }, + { + "epoch": 82.02452316076294, + "grad_norm": 2.6042680740356445, + "learning_rate": 1.6473496980068882e-06, + "loss": 0.0221, + "step": 30103 + }, + { + "epoch": 82.02724795640327, + "grad_norm": 2.670797348022461, + "learning_rate": 1.6468644930184097e-06, + "loss": 0.0546, + "step": 30104 + }, + { + "epoch": 82.02997275204359, + "grad_norm": 2.3810532093048096, + "learning_rate": 1.6463793530838834e-06, + "loss": 0.0671, + "step": 30105 + }, + { + "epoch": 82.03269754768392, + "grad_norm": 2.194476842880249, + "learning_rate": 1.6458942782070864e-06, + "loss": 0.025, + "step": 30106 + }, + { + "epoch": 82.03542234332426, + "grad_norm": 2.59818434715271, + "learning_rate": 1.6454092683917954e-06, + "loss": 0.0617, + "step": 30107 + }, + { + "epoch": 82.03814713896458, + "grad_norm": 3.1329987049102783, + "learning_rate": 1.6449243236417866e-06, + "loss": 0.126, + "step": 30108 + }, + { + "epoch": 82.04087193460491, + "grad_norm": 2.04888653755188, + "learning_rate": 1.6444394439608402e-06, + "loss": 0.0331, + "step": 30109 + }, + { + "epoch": 82.04359673024523, + "grad_norm": 2.1385014057159424, + "learning_rate": 1.6439546293527309e-06, + "loss": 0.049, + "step": 30110 + }, + { + "epoch": 82.04632152588556, + "grad_norm": 2.791651487350464, + "learning_rate": 1.6434698798212312e-06, + "loss": 0.141, + "step": 30111 + }, + { + "epoch": 82.04904632152588, + "grad_norm": 3.0007333755493164, + "learning_rate": 1.6429851953701214e-06, + "loss": 0.0712, + "step": 30112 + }, + { + "epoch": 82.05177111716621, + "grad_norm": 2.4517953395843506, + "learning_rate": 1.6425005760031742e-06, + "loss": 0.0281, + "step": 30113 + }, + { + "epoch": 82.05449591280654, + "grad_norm": 2.233431577682495, + "learning_rate": 1.642016021724163e-06, + "loss": 0.046, + "step": 30114 + }, + { + "epoch": 82.05722070844686, + "grad_norm": 2.6009597778320312, + "learning_rate": 1.6415315325368608e-06, + "loss": 0.059, + "step": 30115 + }, + { + "epoch": 82.0599455040872, + "grad_norm": 3.337405204772949, + "learning_rate": 1.641047108445044e-06, + "loss": 0.1318, + "step": 30116 + }, + { + "epoch": 82.06267029972751, + "grad_norm": 4.06247091293335, + "learning_rate": 1.6405627494524823e-06, + "loss": 0.2333, + "step": 30117 + }, + { + "epoch": 82.06539509536785, + "grad_norm": 1.3780720233917236, + "learning_rate": 1.64007845556295e-06, + "loss": 0.0476, + "step": 30118 + }, + { + "epoch": 82.06811989100818, + "grad_norm": 2.218391180038452, + "learning_rate": 1.6395942267802145e-06, + "loss": 0.0264, + "step": 30119 + }, + { + "epoch": 82.0708446866485, + "grad_norm": 2.4761962890625, + "learning_rate": 1.6391100631080504e-06, + "loss": 0.0741, + "step": 30120 + }, + { + "epoch": 82.07356948228883, + "grad_norm": 2.4118857383728027, + "learning_rate": 1.63862596455023e-06, + "loss": 0.0349, + "step": 30121 + }, + { + "epoch": 82.07629427792915, + "grad_norm": 2.839411973953247, + "learning_rate": 1.6381419311105217e-06, + "loss": 0.0471, + "step": 30122 + }, + { + "epoch": 82.07901907356948, + "grad_norm": 2.217923879623413, + "learning_rate": 1.6376579627926958e-06, + "loss": 0.0646, + "step": 30123 + }, + { + "epoch": 82.0817438692098, + "grad_norm": 2.5746586322784424, + "learning_rate": 1.637174059600517e-06, + "loss": 0.0703, + "step": 30124 + }, + { + "epoch": 82.08446866485014, + "grad_norm": 3.2880475521087646, + "learning_rate": 1.6366902215377612e-06, + "loss": 0.0555, + "step": 30125 + }, + { + "epoch": 82.08719346049047, + "grad_norm": 2.633786916732788, + "learning_rate": 1.6362064486081908e-06, + "loss": 0.022, + "step": 30126 + }, + { + "epoch": 82.08991825613079, + "grad_norm": 2.3178820610046387, + "learning_rate": 1.6357227408155773e-06, + "loss": 0.0597, + "step": 30127 + }, + { + "epoch": 82.09264305177112, + "grad_norm": 2.050793170928955, + "learning_rate": 1.6352390981636823e-06, + "loss": 0.0733, + "step": 30128 + }, + { + "epoch": 82.09536784741144, + "grad_norm": 1.5514721870422363, + "learning_rate": 1.6347555206562792e-06, + "loss": 0.0161, + "step": 30129 + }, + { + "epoch": 82.09809264305177, + "grad_norm": 2.0822415351867676, + "learning_rate": 1.6342720082971297e-06, + "loss": 0.0417, + "step": 30130 + }, + { + "epoch": 82.1008174386921, + "grad_norm": 2.493922233581543, + "learning_rate": 1.6337885610900017e-06, + "loss": 0.115, + "step": 30131 + }, + { + "epoch": 82.10354223433242, + "grad_norm": 2.7690391540527344, + "learning_rate": 1.6333051790386556e-06, + "loss": 0.0793, + "step": 30132 + }, + { + "epoch": 82.10626702997276, + "grad_norm": 2.0981123447418213, + "learning_rate": 1.6328218621468628e-06, + "loss": 0.0507, + "step": 30133 + }, + { + "epoch": 82.10899182561307, + "grad_norm": 3.4307641983032227, + "learning_rate": 1.6323386104183836e-06, + "loss": 0.039, + "step": 30134 + }, + { + "epoch": 82.11171662125341, + "grad_norm": 2.3298115730285645, + "learning_rate": 1.6318554238569807e-06, + "loss": 0.0244, + "step": 30135 + }, + { + "epoch": 82.11444141689373, + "grad_norm": 2.2847211360931396, + "learning_rate": 1.6313723024664175e-06, + "loss": 0.034, + "step": 30136 + }, + { + "epoch": 82.11716621253406, + "grad_norm": 2.782477855682373, + "learning_rate": 1.6308892462504599e-06, + "loss": 0.0363, + "step": 30137 + }, + { + "epoch": 82.11989100817439, + "grad_norm": 2.7747435569763184, + "learning_rate": 1.6304062552128674e-06, + "loss": 0.0752, + "step": 30138 + }, + { + "epoch": 82.12261580381471, + "grad_norm": 2.447909116744995, + "learning_rate": 1.6299233293574012e-06, + "loss": 0.0733, + "step": 30139 + }, + { + "epoch": 82.12534059945504, + "grad_norm": 2.572230100631714, + "learning_rate": 1.6294404686878207e-06, + "loss": 0.0378, + "step": 30140 + }, + { + "epoch": 82.12806539509536, + "grad_norm": 2.5960028171539307, + "learning_rate": 1.6289576732078916e-06, + "loss": 0.0273, + "step": 30141 + }, + { + "epoch": 82.1307901907357, + "grad_norm": 1.7044440507888794, + "learning_rate": 1.6284749429213697e-06, + "loss": 0.0255, + "step": 30142 + }, + { + "epoch": 82.13351498637603, + "grad_norm": 3.533142328262329, + "learning_rate": 1.6279922778320156e-06, + "loss": 0.1516, + "step": 30143 + }, + { + "epoch": 82.13623978201635, + "grad_norm": 3.6024680137634277, + "learning_rate": 1.6275096779435862e-06, + "loss": 0.0331, + "step": 30144 + }, + { + "epoch": 82.13896457765668, + "grad_norm": 3.0792603492736816, + "learning_rate": 1.6270271432598438e-06, + "loss": 0.0983, + "step": 30145 + }, + { + "epoch": 82.141689373297, + "grad_norm": 1.7023431062698364, + "learning_rate": 1.6265446737845458e-06, + "loss": 0.024, + "step": 30146 + }, + { + "epoch": 82.14441416893733, + "grad_norm": 2.2191717624664307, + "learning_rate": 1.626062269521448e-06, + "loss": 0.0654, + "step": 30147 + }, + { + "epoch": 82.14713896457765, + "grad_norm": 3.3200104236602783, + "learning_rate": 1.6255799304743048e-06, + "loss": 0.0301, + "step": 30148 + }, + { + "epoch": 82.14986376021798, + "grad_norm": 2.1497583389282227, + "learning_rate": 1.6250976566468779e-06, + "loss": 0.0361, + "step": 30149 + }, + { + "epoch": 82.15258855585832, + "grad_norm": 2.7354648113250732, + "learning_rate": 1.624615448042921e-06, + "loss": 0.0253, + "step": 30150 + }, + { + "epoch": 82.15531335149863, + "grad_norm": 3.8269991874694824, + "learning_rate": 1.6241333046661888e-06, + "loss": 0.1245, + "step": 30151 + }, + { + "epoch": 82.15803814713897, + "grad_norm": 3.1344497203826904, + "learning_rate": 1.6236512265204352e-06, + "loss": 0.0348, + "step": 30152 + }, + { + "epoch": 82.16076294277929, + "grad_norm": 2.80470609664917, + "learning_rate": 1.623169213609419e-06, + "loss": 0.0376, + "step": 30153 + }, + { + "epoch": 82.16348773841962, + "grad_norm": 3.6900198459625244, + "learning_rate": 1.6226872659368885e-06, + "loss": 0.0383, + "step": 30154 + }, + { + "epoch": 82.16621253405995, + "grad_norm": 3.068413257598877, + "learning_rate": 1.622205383506602e-06, + "loss": 0.0623, + "step": 30155 + }, + { + "epoch": 82.16893732970027, + "grad_norm": 2.7594008445739746, + "learning_rate": 1.6217235663223085e-06, + "loss": 0.1019, + "step": 30156 + }, + { + "epoch": 82.1716621253406, + "grad_norm": 3.374462604522705, + "learning_rate": 1.621241814387764e-06, + "loss": 0.0805, + "step": 30157 + }, + { + "epoch": 82.17438692098092, + "grad_norm": 2.7398502826690674, + "learning_rate": 1.6207601277067197e-06, + "loss": 0.0295, + "step": 30158 + }, + { + "epoch": 82.17711171662125, + "grad_norm": 2.4901440143585205, + "learning_rate": 1.6202785062829252e-06, + "loss": 0.0471, + "step": 30159 + }, + { + "epoch": 82.17983651226157, + "grad_norm": 2.8590476512908936, + "learning_rate": 1.6197969501201295e-06, + "loss": 0.0231, + "step": 30160 + }, + { + "epoch": 82.1825613079019, + "grad_norm": 10.413185119628906, + "learning_rate": 1.6193154592220871e-06, + "loss": 0.115, + "step": 30161 + }, + { + "epoch": 82.18528610354224, + "grad_norm": 2.662334680557251, + "learning_rate": 1.6188340335925478e-06, + "loss": 0.0684, + "step": 30162 + }, + { + "epoch": 82.18801089918256, + "grad_norm": 2.848132848739624, + "learning_rate": 1.6183526732352583e-06, + "loss": 0.042, + "step": 30163 + }, + { + "epoch": 82.19073569482289, + "grad_norm": 2.152181386947632, + "learning_rate": 1.6178713781539658e-06, + "loss": 0.0454, + "step": 30164 + }, + { + "epoch": 82.19346049046321, + "grad_norm": 2.8709352016448975, + "learning_rate": 1.6173901483524246e-06, + "loss": 0.1143, + "step": 30165 + }, + { + "epoch": 82.19618528610354, + "grad_norm": 2.3323049545288086, + "learning_rate": 1.6169089838343776e-06, + "loss": 0.0748, + "step": 30166 + }, + { + "epoch": 82.19891008174388, + "grad_norm": 2.783975839614868, + "learning_rate": 1.6164278846035752e-06, + "loss": 0.0835, + "step": 30167 + }, + { + "epoch": 82.2016348773842, + "grad_norm": 3.9515433311462402, + "learning_rate": 1.61594685066376e-06, + "loss": 0.032, + "step": 30168 + }, + { + "epoch": 82.20435967302453, + "grad_norm": 2.7064707279205322, + "learning_rate": 1.6154658820186819e-06, + "loss": 0.1027, + "step": 30169 + }, + { + "epoch": 82.20708446866485, + "grad_norm": 2.2218239307403564, + "learning_rate": 1.6149849786720873e-06, + "loss": 0.1038, + "step": 30170 + }, + { + "epoch": 82.20980926430518, + "grad_norm": 2.2611162662506104, + "learning_rate": 1.6145041406277162e-06, + "loss": 0.0419, + "step": 30171 + }, + { + "epoch": 82.2125340599455, + "grad_norm": 2.452496290206909, + "learning_rate": 1.6140233678893203e-06, + "loss": 0.0332, + "step": 30172 + }, + { + "epoch": 82.21525885558583, + "grad_norm": 2.9502222537994385, + "learning_rate": 1.6135426604606375e-06, + "loss": 0.0842, + "step": 30173 + }, + { + "epoch": 82.21798365122616, + "grad_norm": 3.4729695320129395, + "learning_rate": 1.613062018345417e-06, + "loss": 0.1134, + "step": 30174 + }, + { + "epoch": 82.22070844686648, + "grad_norm": 2.6018288135528564, + "learning_rate": 1.6125814415473994e-06, + "loss": 0.0486, + "step": 30175 + }, + { + "epoch": 82.22343324250681, + "grad_norm": 3.1216282844543457, + "learning_rate": 1.6121009300703262e-06, + "loss": 0.0929, + "step": 30176 + }, + { + "epoch": 82.22615803814713, + "grad_norm": 4.083061218261719, + "learning_rate": 1.6116204839179428e-06, + "loss": 0.0389, + "step": 30177 + }, + { + "epoch": 82.22888283378747, + "grad_norm": 3.2521812915802, + "learning_rate": 1.611140103093989e-06, + "loss": 0.0638, + "step": 30178 + }, + { + "epoch": 82.2316076294278, + "grad_norm": 1.6322013139724731, + "learning_rate": 1.6106597876022057e-06, + "loss": 0.0196, + "step": 30179 + }, + { + "epoch": 82.23433242506812, + "grad_norm": 2.0123422145843506, + "learning_rate": 1.6101795374463314e-06, + "loss": 0.0249, + "step": 30180 + }, + { + "epoch": 82.23705722070845, + "grad_norm": 1.8605958223342896, + "learning_rate": 1.6096993526301118e-06, + "loss": 0.09, + "step": 30181 + }, + { + "epoch": 82.23978201634877, + "grad_norm": 2.4019317626953125, + "learning_rate": 1.6092192331572843e-06, + "loss": 0.0282, + "step": 30182 + }, + { + "epoch": 82.2425068119891, + "grad_norm": 2.736300468444824, + "learning_rate": 1.6087391790315866e-06, + "loss": 0.0564, + "step": 30183 + }, + { + "epoch": 82.24523160762942, + "grad_norm": 3.2253520488739014, + "learning_rate": 1.6082591902567557e-06, + "loss": 0.1209, + "step": 30184 + }, + { + "epoch": 82.24795640326975, + "grad_norm": 3.003744125366211, + "learning_rate": 1.6077792668365344e-06, + "loss": 0.1923, + "step": 30185 + }, + { + "epoch": 82.25068119891009, + "grad_norm": 1.6995396614074707, + "learning_rate": 1.6072994087746585e-06, + "loss": 0.0435, + "step": 30186 + }, + { + "epoch": 82.2534059945504, + "grad_norm": 2.5432207584381104, + "learning_rate": 1.606819616074864e-06, + "loss": 0.0893, + "step": 30187 + }, + { + "epoch": 82.25613079019074, + "grad_norm": 2.037693500518799, + "learning_rate": 1.6063398887408866e-06, + "loss": 0.0284, + "step": 30188 + }, + { + "epoch": 82.25885558583106, + "grad_norm": 1.7175441980361938, + "learning_rate": 1.6058602267764633e-06, + "loss": 0.0694, + "step": 30189 + }, + { + "epoch": 82.26158038147139, + "grad_norm": 2.559647798538208, + "learning_rate": 1.6053806301853337e-06, + "loss": 0.0397, + "step": 30190 + }, + { + "epoch": 82.26430517711172, + "grad_norm": 4.633242130279541, + "learning_rate": 1.6049010989712288e-06, + "loss": 0.2483, + "step": 30191 + }, + { + "epoch": 82.26702997275204, + "grad_norm": 1.9954807758331299, + "learning_rate": 1.6044216331378837e-06, + "loss": 0.1054, + "step": 30192 + }, + { + "epoch": 82.26975476839237, + "grad_norm": 2.322779893875122, + "learning_rate": 1.603942232689031e-06, + "loss": 0.038, + "step": 30193 + }, + { + "epoch": 82.2724795640327, + "grad_norm": 2.8108303546905518, + "learning_rate": 1.6034628976284084e-06, + "loss": 0.0412, + "step": 30194 + }, + { + "epoch": 82.27520435967303, + "grad_norm": 2.5841689109802246, + "learning_rate": 1.6029836279597455e-06, + "loss": 0.044, + "step": 30195 + }, + { + "epoch": 82.27792915531334, + "grad_norm": 3.463477611541748, + "learning_rate": 1.602504423686775e-06, + "loss": 0.0629, + "step": 30196 + }, + { + "epoch": 82.28065395095368, + "grad_norm": 2.757986545562744, + "learning_rate": 1.6020252848132311e-06, + "loss": 0.0304, + "step": 30197 + }, + { + "epoch": 82.28337874659401, + "grad_norm": 3.4663634300231934, + "learning_rate": 1.6015462113428436e-06, + "loss": 0.0537, + "step": 30198 + }, + { + "epoch": 82.28610354223433, + "grad_norm": 2.922712564468384, + "learning_rate": 1.601067203279345e-06, + "loss": 0.0741, + "step": 30199 + }, + { + "epoch": 82.28882833787466, + "grad_norm": 2.993884325027466, + "learning_rate": 1.6005882606264621e-06, + "loss": 0.0383, + "step": 30200 + }, + { + "epoch": 82.29155313351498, + "grad_norm": 3.265608072280884, + "learning_rate": 1.6001093833879288e-06, + "loss": 0.1017, + "step": 30201 + }, + { + "epoch": 82.29427792915531, + "grad_norm": 3.439603805541992, + "learning_rate": 1.5996305715674743e-06, + "loss": 0.0472, + "step": 30202 + }, + { + "epoch": 82.29700272479565, + "grad_norm": 1.7652721405029297, + "learning_rate": 1.5991518251688265e-06, + "loss": 0.0213, + "step": 30203 + }, + { + "epoch": 82.29972752043597, + "grad_norm": 2.2727067470550537, + "learning_rate": 1.5986731441957114e-06, + "loss": 0.0291, + "step": 30204 + }, + { + "epoch": 82.3024523160763, + "grad_norm": 2.3539865016937256, + "learning_rate": 1.5981945286518597e-06, + "loss": 0.076, + "step": 30205 + }, + { + "epoch": 82.30517711171662, + "grad_norm": 3.262967824935913, + "learning_rate": 1.597715978541e-06, + "loss": 0.083, + "step": 30206 + }, + { + "epoch": 82.30790190735695, + "grad_norm": 3.4969043731689453, + "learning_rate": 1.597237493866859e-06, + "loss": 0.0956, + "step": 30207 + }, + { + "epoch": 82.31062670299727, + "grad_norm": 2.654318332672119, + "learning_rate": 1.5967590746331619e-06, + "loss": 0.0367, + "step": 30208 + }, + { + "epoch": 82.3133514986376, + "grad_norm": 2.8982152938842773, + "learning_rate": 1.5962807208436315e-06, + "loss": 0.0437, + "step": 30209 + }, + { + "epoch": 82.31607629427793, + "grad_norm": 5.074118614196777, + "learning_rate": 1.5958024325019993e-06, + "loss": 0.0481, + "step": 30210 + }, + { + "epoch": 82.31880108991825, + "grad_norm": 1.6220102310180664, + "learning_rate": 1.595324209611987e-06, + "loss": 0.0343, + "step": 30211 + }, + { + "epoch": 82.32152588555859, + "grad_norm": 3.144766092300415, + "learning_rate": 1.594846052177319e-06, + "loss": 0.2532, + "step": 30212 + }, + { + "epoch": 82.3242506811989, + "grad_norm": 2.7922792434692383, + "learning_rate": 1.594367960201718e-06, + "loss": 0.0801, + "step": 30213 + }, + { + "epoch": 82.32697547683924, + "grad_norm": 3.7109549045562744, + "learning_rate": 1.5938899336889102e-06, + "loss": 0.1202, + "step": 30214 + }, + { + "epoch": 82.32970027247957, + "grad_norm": 3.6727981567382812, + "learning_rate": 1.5934119726426177e-06, + "loss": 0.0345, + "step": 30215 + }, + { + "epoch": 82.33242506811989, + "grad_norm": 5.282775402069092, + "learning_rate": 1.5929340770665614e-06, + "loss": 0.1466, + "step": 30216 + }, + { + "epoch": 82.33514986376022, + "grad_norm": 2.2777795791625977, + "learning_rate": 1.5924562469644623e-06, + "loss": 0.0508, + "step": 30217 + }, + { + "epoch": 82.33787465940054, + "grad_norm": 2.966745615005493, + "learning_rate": 1.5919784823400452e-06, + "loss": 0.1701, + "step": 30218 + }, + { + "epoch": 82.34059945504087, + "grad_norm": 1.6942039728164673, + "learning_rate": 1.5915007831970297e-06, + "loss": 0.026, + "step": 30219 + }, + { + "epoch": 82.34332425068119, + "grad_norm": 2.008901357650757, + "learning_rate": 1.5910231495391326e-06, + "loss": 0.1946, + "step": 30220 + }, + { + "epoch": 82.34604904632153, + "grad_norm": 3.4828262329101562, + "learning_rate": 1.5905455813700788e-06, + "loss": 0.062, + "step": 30221 + }, + { + "epoch": 82.34877384196186, + "grad_norm": 2.490074872970581, + "learning_rate": 1.590068078693584e-06, + "loss": 0.1156, + "step": 30222 + }, + { + "epoch": 82.35149863760218, + "grad_norm": 2.6140756607055664, + "learning_rate": 1.58959064151337e-06, + "loss": 0.0433, + "step": 30223 + }, + { + "epoch": 82.35422343324251, + "grad_norm": 2.654006242752075, + "learning_rate": 1.5891132698331536e-06, + "loss": 0.0487, + "step": 30224 + }, + { + "epoch": 82.35694822888283, + "grad_norm": 1.9457130432128906, + "learning_rate": 1.5886359636566494e-06, + "loss": 0.025, + "step": 30225 + }, + { + "epoch": 82.35967302452316, + "grad_norm": 3.361292600631714, + "learning_rate": 1.5881587229875806e-06, + "loss": 0.0654, + "step": 30226 + }, + { + "epoch": 82.3623978201635, + "grad_norm": 2.7696139812469482, + "learning_rate": 1.5876815478296602e-06, + "loss": 0.1032, + "step": 30227 + }, + { + "epoch": 82.36512261580381, + "grad_norm": 1.7006996870040894, + "learning_rate": 1.5872044381866058e-06, + "loss": 0.024, + "step": 30228 + }, + { + "epoch": 82.36784741144415, + "grad_norm": 2.56009840965271, + "learning_rate": 1.5867273940621297e-06, + "loss": 0.0395, + "step": 30229 + }, + { + "epoch": 82.37057220708446, + "grad_norm": 1.888870120048523, + "learning_rate": 1.5862504154599522e-06, + "loss": 0.0238, + "step": 30230 + }, + { + "epoch": 82.3732970027248, + "grad_norm": 2.4918346405029297, + "learning_rate": 1.5857735023837861e-06, + "loss": 0.0254, + "step": 30231 + }, + { + "epoch": 82.37602179836512, + "grad_norm": 2.846223831176758, + "learning_rate": 1.585296654837345e-06, + "loss": 0.0959, + "step": 30232 + }, + { + "epoch": 82.37874659400545, + "grad_norm": 2.0135998725891113, + "learning_rate": 1.5848198728243402e-06, + "loss": 0.0236, + "step": 30233 + }, + { + "epoch": 82.38147138964578, + "grad_norm": 2.7633562088012695, + "learning_rate": 1.5843431563484902e-06, + "loss": 0.0304, + "step": 30234 + }, + { + "epoch": 82.3841961852861, + "grad_norm": 1.961612582206726, + "learning_rate": 1.583866505413505e-06, + "loss": 0.0755, + "step": 30235 + }, + { + "epoch": 82.38692098092643, + "grad_norm": 2.5416512489318848, + "learning_rate": 1.5833899200230963e-06, + "loss": 0.0487, + "step": 30236 + }, + { + "epoch": 82.38964577656675, + "grad_norm": 2.978325128555298, + "learning_rate": 1.582913400180973e-06, + "loss": 0.1387, + "step": 30237 + }, + { + "epoch": 82.39237057220708, + "grad_norm": 2.6418581008911133, + "learning_rate": 1.5824369458908518e-06, + "loss": 0.1327, + "step": 30238 + }, + { + "epoch": 82.39509536784742, + "grad_norm": 2.6299800872802734, + "learning_rate": 1.581960557156441e-06, + "loss": 0.055, + "step": 30239 + }, + { + "epoch": 82.39782016348774, + "grad_norm": 4.451153755187988, + "learning_rate": 1.5814842339814485e-06, + "loss": 0.1029, + "step": 30240 + }, + { + "epoch": 82.40054495912807, + "grad_norm": 5.714231967926025, + "learning_rate": 1.5810079763695852e-06, + "loss": 0.0235, + "step": 30241 + }, + { + "epoch": 82.40326975476839, + "grad_norm": 1.663466215133667, + "learning_rate": 1.5805317843245638e-06, + "loss": 0.0168, + "step": 30242 + }, + { + "epoch": 82.40599455040872, + "grad_norm": 2.099660873413086, + "learning_rate": 1.5800556578500891e-06, + "loss": 0.0273, + "step": 30243 + }, + { + "epoch": 82.40871934604904, + "grad_norm": 3.4054901599884033, + "learning_rate": 1.5795795969498706e-06, + "loss": 0.08, + "step": 30244 + }, + { + "epoch": 82.41144414168937, + "grad_norm": 4.001406669616699, + "learning_rate": 1.579103601627613e-06, + "loss": 0.1298, + "step": 30245 + }, + { + "epoch": 82.4141689373297, + "grad_norm": 3.6959145069122314, + "learning_rate": 1.5786276718870274e-06, + "loss": 0.0782, + "step": 30246 + }, + { + "epoch": 82.41689373297002, + "grad_norm": 2.4311442375183105, + "learning_rate": 1.578151807731818e-06, + "loss": 0.0359, + "step": 30247 + }, + { + "epoch": 82.41961852861036, + "grad_norm": 2.4477179050445557, + "learning_rate": 1.5776760091656918e-06, + "loss": 0.0998, + "step": 30248 + }, + { + "epoch": 82.42234332425068, + "grad_norm": 2.8573293685913086, + "learning_rate": 1.577200276192351e-06, + "loss": 0.0335, + "step": 30249 + }, + { + "epoch": 82.42506811989101, + "grad_norm": 3.3418049812316895, + "learning_rate": 1.5767246088155064e-06, + "loss": 0.1005, + "step": 30250 + }, + { + "epoch": 82.42779291553134, + "grad_norm": 2.3806207180023193, + "learning_rate": 1.5762490070388592e-06, + "loss": 0.0373, + "step": 30251 + }, + { + "epoch": 82.43051771117166, + "grad_norm": 2.034852981567383, + "learning_rate": 1.5757734708661144e-06, + "loss": 0.0329, + "step": 30252 + }, + { + "epoch": 82.433242506812, + "grad_norm": 2.5034232139587402, + "learning_rate": 1.575298000300971e-06, + "loss": 0.0387, + "step": 30253 + }, + { + "epoch": 82.43596730245231, + "grad_norm": 2.270033359527588, + "learning_rate": 1.5748225953471385e-06, + "loss": 0.0799, + "step": 30254 + }, + { + "epoch": 82.43869209809264, + "grad_norm": 2.658634901046753, + "learning_rate": 1.5743472560083162e-06, + "loss": 0.1347, + "step": 30255 + }, + { + "epoch": 82.44141689373296, + "grad_norm": 5.519894123077393, + "learning_rate": 1.5738719822882064e-06, + "loss": 0.0948, + "step": 30256 + }, + { + "epoch": 82.4441416893733, + "grad_norm": 2.8614137172698975, + "learning_rate": 1.5733967741905087e-06, + "loss": 0.1078, + "step": 30257 + }, + { + "epoch": 82.44686648501363, + "grad_norm": 2.6079354286193848, + "learning_rate": 1.5729216317189245e-06, + "loss": 0.0734, + "step": 30258 + }, + { + "epoch": 82.44959128065395, + "grad_norm": 2.9450924396514893, + "learning_rate": 1.5724465548771584e-06, + "loss": 0.0694, + "step": 30259 + }, + { + "epoch": 82.45231607629428, + "grad_norm": 2.2583277225494385, + "learning_rate": 1.5719715436689076e-06, + "loss": 0.0238, + "step": 30260 + }, + { + "epoch": 82.4550408719346, + "grad_norm": 3.2999963760375977, + "learning_rate": 1.5714965980978692e-06, + "loss": 0.11, + "step": 30261 + }, + { + "epoch": 82.45776566757493, + "grad_norm": 1.9584386348724365, + "learning_rate": 1.5710217181677456e-06, + "loss": 0.0169, + "step": 30262 + }, + { + "epoch": 82.46049046321527, + "grad_norm": 2.5350840091705322, + "learning_rate": 1.570546903882233e-06, + "loss": 0.0436, + "step": 30263 + }, + { + "epoch": 82.46321525885558, + "grad_norm": 3.3207385540008545, + "learning_rate": 1.5700721552450315e-06, + "loss": 0.0593, + "step": 30264 + }, + { + "epoch": 82.46594005449592, + "grad_norm": 2.6607284545898438, + "learning_rate": 1.5695974722598328e-06, + "loss": 0.0351, + "step": 30265 + }, + { + "epoch": 82.46866485013624, + "grad_norm": 1.9403024911880493, + "learning_rate": 1.5691228549303406e-06, + "loss": 0.0352, + "step": 30266 + }, + { + "epoch": 82.47138964577657, + "grad_norm": 2.3460240364074707, + "learning_rate": 1.5686483032602484e-06, + "loss": 0.029, + "step": 30267 + }, + { + "epoch": 82.47411444141689, + "grad_norm": 2.857072591781616, + "learning_rate": 1.5681738172532513e-06, + "loss": 0.0429, + "step": 30268 + }, + { + "epoch": 82.47683923705722, + "grad_norm": 2.1656620502471924, + "learning_rate": 1.5676993969130439e-06, + "loss": 0.0262, + "step": 30269 + }, + { + "epoch": 82.47956403269755, + "grad_norm": 3.6469504833221436, + "learning_rate": 1.5672250422433233e-06, + "loss": 0.0514, + "step": 30270 + }, + { + "epoch": 82.48228882833787, + "grad_norm": 1.6631399393081665, + "learning_rate": 1.5667507532477833e-06, + "loss": 0.0191, + "step": 30271 + }, + { + "epoch": 82.4850136239782, + "grad_norm": 2.5740177631378174, + "learning_rate": 1.5662765299301174e-06, + "loss": 0.0697, + "step": 30272 + }, + { + "epoch": 82.48773841961852, + "grad_norm": 2.5435543060302734, + "learning_rate": 1.5658023722940151e-06, + "loss": 0.1915, + "step": 30273 + }, + { + "epoch": 82.49046321525886, + "grad_norm": 3.1907248497009277, + "learning_rate": 1.5653282803431734e-06, + "loss": 0.0545, + "step": 30274 + }, + { + "epoch": 82.49318801089919, + "grad_norm": 4.00557804107666, + "learning_rate": 1.564854254081285e-06, + "loss": 0.0563, + "step": 30275 + }, + { + "epoch": 82.49591280653951, + "grad_norm": 2.2429308891296387, + "learning_rate": 1.5643802935120411e-06, + "loss": 0.035, + "step": 30276 + }, + { + "epoch": 82.49863760217984, + "grad_norm": 3.5843381881713867, + "learning_rate": 1.5639063986391322e-06, + "loss": 0.1553, + "step": 30277 + }, + { + "epoch": 82.50136239782016, + "grad_norm": 1.9688689708709717, + "learning_rate": 1.5634325694662455e-06, + "loss": 0.0358, + "step": 30278 + }, + { + "epoch": 82.50408719346049, + "grad_norm": 2.6274609565734863, + "learning_rate": 1.5629588059970769e-06, + "loss": 0.031, + "step": 30279 + }, + { + "epoch": 82.50681198910081, + "grad_norm": 2.148953676223755, + "learning_rate": 1.5624851082353143e-06, + "loss": 0.1204, + "step": 30280 + }, + { + "epoch": 82.50953678474114, + "grad_norm": 2.4428417682647705, + "learning_rate": 1.562011476184645e-06, + "loss": 0.034, + "step": 30281 + }, + { + "epoch": 82.51226158038148, + "grad_norm": 2.7503209114074707, + "learning_rate": 1.561537909848757e-06, + "loss": 0.0346, + "step": 30282 + }, + { + "epoch": 82.5149863760218, + "grad_norm": 2.4017913341522217, + "learning_rate": 1.561064409231342e-06, + "loss": 0.0484, + "step": 30283 + }, + { + "epoch": 82.51771117166213, + "grad_norm": 2.8435680866241455, + "learning_rate": 1.560590974336087e-06, + "loss": 0.0574, + "step": 30284 + }, + { + "epoch": 82.52043596730245, + "grad_norm": 1.748368740081787, + "learning_rate": 1.5601176051666744e-06, + "loss": 0.035, + "step": 30285 + }, + { + "epoch": 82.52316076294278, + "grad_norm": 3.2250211238861084, + "learning_rate": 1.559644301726797e-06, + "loss": 0.0543, + "step": 30286 + }, + { + "epoch": 82.52588555858311, + "grad_norm": 1.9527214765548706, + "learning_rate": 1.5591710640201385e-06, + "loss": 0.0245, + "step": 30287 + }, + { + "epoch": 82.52861035422343, + "grad_norm": 2.7119812965393066, + "learning_rate": 1.5586978920503836e-06, + "loss": 0.0351, + "step": 30288 + }, + { + "epoch": 82.53133514986376, + "grad_norm": 1.9051939249038696, + "learning_rate": 1.5582247858212152e-06, + "loss": 0.033, + "step": 30289 + }, + { + "epoch": 82.53405994550408, + "grad_norm": 2.1461281776428223, + "learning_rate": 1.5577517453363234e-06, + "loss": 0.0296, + "step": 30290 + }, + { + "epoch": 82.53678474114442, + "grad_norm": 3.381720542907715, + "learning_rate": 1.5572787705993863e-06, + "loss": 0.0357, + "step": 30291 + }, + { + "epoch": 82.53950953678473, + "grad_norm": 2.9295082092285156, + "learning_rate": 1.5568058616140934e-06, + "loss": 0.0379, + "step": 30292 + }, + { + "epoch": 82.54223433242507, + "grad_norm": 3.9110260009765625, + "learning_rate": 1.5563330183841252e-06, + "loss": 0.0748, + "step": 30293 + }, + { + "epoch": 82.5449591280654, + "grad_norm": 2.8895926475524902, + "learning_rate": 1.5558602409131606e-06, + "loss": 0.054, + "step": 30294 + }, + { + "epoch": 82.54768392370572, + "grad_norm": 4.43402624130249, + "learning_rate": 1.555387529204887e-06, + "loss": 0.0612, + "step": 30295 + }, + { + "epoch": 82.55040871934605, + "grad_norm": 2.748997449874878, + "learning_rate": 1.5549148832629834e-06, + "loss": 0.1353, + "step": 30296 + }, + { + "epoch": 82.55313351498637, + "grad_norm": 2.1949260234832764, + "learning_rate": 1.5544423030911316e-06, + "loss": 0.0277, + "step": 30297 + }, + { + "epoch": 82.5558583106267, + "grad_norm": 2.609607696533203, + "learning_rate": 1.5539697886930082e-06, + "loss": 0.056, + "step": 30298 + }, + { + "epoch": 82.55858310626704, + "grad_norm": 2.2071664333343506, + "learning_rate": 1.5534973400722986e-06, + "loss": 0.0159, + "step": 30299 + }, + { + "epoch": 82.56130790190736, + "grad_norm": 2.790907621383667, + "learning_rate": 1.5530249572326806e-06, + "loss": 0.0301, + "step": 30300 + }, + { + "epoch": 82.56403269754769, + "grad_norm": 2.826721668243408, + "learning_rate": 1.5525526401778313e-06, + "loss": 0.0798, + "step": 30301 + }, + { + "epoch": 82.566757493188, + "grad_norm": 3.125518560409546, + "learning_rate": 1.5520803889114288e-06, + "loss": 0.2181, + "step": 30302 + }, + { + "epoch": 82.56948228882834, + "grad_norm": 2.3341801166534424, + "learning_rate": 1.5516082034371538e-06, + "loss": 0.1092, + "step": 30303 + }, + { + "epoch": 82.57220708446866, + "grad_norm": 3.8021793365478516, + "learning_rate": 1.5511360837586832e-06, + "loss": 0.2114, + "step": 30304 + }, + { + "epoch": 82.57493188010899, + "grad_norm": 3.2330422401428223, + "learning_rate": 1.5506640298796927e-06, + "loss": 0.0796, + "step": 30305 + }, + { + "epoch": 82.57765667574932, + "grad_norm": 2.2091379165649414, + "learning_rate": 1.5501920418038553e-06, + "loss": 0.0378, + "step": 30306 + }, + { + "epoch": 82.58038147138964, + "grad_norm": 2.6230266094207764, + "learning_rate": 1.5497201195348532e-06, + "loss": 0.0766, + "step": 30307 + }, + { + "epoch": 82.58310626702998, + "grad_norm": 3.9569058418273926, + "learning_rate": 1.5492482630763594e-06, + "loss": 0.0507, + "step": 30308 + }, + { + "epoch": 82.5858310626703, + "grad_norm": 2.079242706298828, + "learning_rate": 1.5487764724320453e-06, + "loss": 0.0662, + "step": 30309 + }, + { + "epoch": 82.58855585831063, + "grad_norm": 2.6884078979492188, + "learning_rate": 1.548304747605589e-06, + "loss": 0.0497, + "step": 30310 + }, + { + "epoch": 82.59128065395096, + "grad_norm": 1.6678122282028198, + "learning_rate": 1.5478330886006643e-06, + "loss": 0.0262, + "step": 30311 + }, + { + "epoch": 82.59400544959128, + "grad_norm": 2.8677210807800293, + "learning_rate": 1.5473614954209449e-06, + "loss": 0.0311, + "step": 30312 + }, + { + "epoch": 82.59673024523161, + "grad_norm": 3.624225378036499, + "learning_rate": 1.546889968070101e-06, + "loss": 0.128, + "step": 30313 + }, + { + "epoch": 82.59945504087193, + "grad_norm": 2.751782178878784, + "learning_rate": 1.5464185065518034e-06, + "loss": 0.0441, + "step": 30314 + }, + { + "epoch": 82.60217983651226, + "grad_norm": 3.056368112564087, + "learning_rate": 1.54594711086973e-06, + "loss": 0.0949, + "step": 30315 + }, + { + "epoch": 82.60490463215258, + "grad_norm": 1.8355586528778076, + "learning_rate": 1.5454757810275468e-06, + "loss": 0.0197, + "step": 30316 + }, + { + "epoch": 82.60762942779292, + "grad_norm": 2.217400074005127, + "learning_rate": 1.5450045170289275e-06, + "loss": 0.103, + "step": 30317 + }, + { + "epoch": 82.61035422343325, + "grad_norm": 2.9036612510681152, + "learning_rate": 1.544533318877538e-06, + "loss": 0.1514, + "step": 30318 + }, + { + "epoch": 82.61307901907357, + "grad_norm": 3.0461792945861816, + "learning_rate": 1.5440621865770533e-06, + "loss": 0.0303, + "step": 30319 + }, + { + "epoch": 82.6158038147139, + "grad_norm": 2.601266860961914, + "learning_rate": 1.5435911201311405e-06, + "loss": 0.051, + "step": 30320 + }, + { + "epoch": 82.61852861035422, + "grad_norm": 2.228388786315918, + "learning_rate": 1.5431201195434664e-06, + "loss": 0.0476, + "step": 30321 + }, + { + "epoch": 82.62125340599455, + "grad_norm": 2.456087350845337, + "learning_rate": 1.5426491848176995e-06, + "loss": 0.1547, + "step": 30322 + }, + { + "epoch": 82.62397820163488, + "grad_norm": 4.665582180023193, + "learning_rate": 1.542178315957511e-06, + "loss": 0.0913, + "step": 30323 + }, + { + "epoch": 82.6267029972752, + "grad_norm": 1.9684175252914429, + "learning_rate": 1.541707512966566e-06, + "loss": 0.0295, + "step": 30324 + }, + { + "epoch": 82.62942779291554, + "grad_norm": 3.1616861820220947, + "learning_rate": 1.541236775848529e-06, + "loss": 0.1428, + "step": 30325 + }, + { + "epoch": 82.63215258855585, + "grad_norm": 5.245412826538086, + "learning_rate": 1.5407661046070643e-06, + "loss": 0.0353, + "step": 30326 + }, + { + "epoch": 82.63487738419619, + "grad_norm": 2.222473382949829, + "learning_rate": 1.5402954992458451e-06, + "loss": 0.0297, + "step": 30327 + }, + { + "epoch": 82.6376021798365, + "grad_norm": 2.7224769592285156, + "learning_rate": 1.5398249597685334e-06, + "loss": 0.2564, + "step": 30328 + }, + { + "epoch": 82.64032697547684, + "grad_norm": 4.054591178894043, + "learning_rate": 1.5393544861787912e-06, + "loss": 0.0649, + "step": 30329 + }, + { + "epoch": 82.64305177111717, + "grad_norm": 2.383607864379883, + "learning_rate": 1.5388840784802817e-06, + "loss": 0.0678, + "step": 30330 + }, + { + "epoch": 82.64577656675749, + "grad_norm": 2.370311975479126, + "learning_rate": 1.5384137366766739e-06, + "loss": 0.0459, + "step": 30331 + }, + { + "epoch": 82.64850136239782, + "grad_norm": 2.658867835998535, + "learning_rate": 1.5379434607716271e-06, + "loss": 0.0666, + "step": 30332 + }, + { + "epoch": 82.65122615803814, + "grad_norm": 2.7283833026885986, + "learning_rate": 1.537473250768804e-06, + "loss": 0.0381, + "step": 30333 + }, + { + "epoch": 82.65395095367847, + "grad_norm": 1.801334261894226, + "learning_rate": 1.537003106671865e-06, + "loss": 0.0211, + "step": 30334 + }, + { + "epoch": 82.65667574931881, + "grad_norm": 2.466092586517334, + "learning_rate": 1.536533028484476e-06, + "loss": 0.0835, + "step": 30335 + }, + { + "epoch": 82.65940054495913, + "grad_norm": 2.314575672149658, + "learning_rate": 1.5360630162102953e-06, + "loss": 0.0376, + "step": 30336 + }, + { + "epoch": 82.66212534059946, + "grad_norm": 2.093158006668091, + "learning_rate": 1.535593069852983e-06, + "loss": 0.0272, + "step": 30337 + }, + { + "epoch": 82.66485013623978, + "grad_norm": 3.99423885345459, + "learning_rate": 1.5351231894161967e-06, + "loss": 0.0568, + "step": 30338 + }, + { + "epoch": 82.66757493188011, + "grad_norm": 3.385798692703247, + "learning_rate": 1.534653374903602e-06, + "loss": 0.1196, + "step": 30339 + }, + { + "epoch": 82.67029972752043, + "grad_norm": 3.752199411392212, + "learning_rate": 1.5341836263188537e-06, + "loss": 0.0334, + "step": 30340 + }, + { + "epoch": 82.67302452316076, + "grad_norm": 2.3044042587280273, + "learning_rate": 1.53371394366561e-06, + "loss": 0.0671, + "step": 30341 + }, + { + "epoch": 82.6757493188011, + "grad_norm": 2.897268772125244, + "learning_rate": 1.5332443269475284e-06, + "loss": 0.1777, + "step": 30342 + }, + { + "epoch": 82.67847411444141, + "grad_norm": 2.632194757461548, + "learning_rate": 1.5327747761682677e-06, + "loss": 0.1456, + "step": 30343 + }, + { + "epoch": 82.68119891008175, + "grad_norm": 2.468472719192505, + "learning_rate": 1.5323052913314863e-06, + "loss": 0.0263, + "step": 30344 + }, + { + "epoch": 82.68392370572207, + "grad_norm": 2.753012180328369, + "learning_rate": 1.531835872440839e-06, + "loss": 0.0849, + "step": 30345 + }, + { + "epoch": 82.6866485013624, + "grad_norm": 2.3302366733551025, + "learning_rate": 1.5313665194999816e-06, + "loss": 0.0476, + "step": 30346 + }, + { + "epoch": 82.68937329700273, + "grad_norm": 3.279644012451172, + "learning_rate": 1.530897232512566e-06, + "loss": 0.037, + "step": 30347 + }, + { + "epoch": 82.69209809264305, + "grad_norm": 3.16890549659729, + "learning_rate": 1.5304280114822534e-06, + "loss": 0.0423, + "step": 30348 + }, + { + "epoch": 82.69482288828338, + "grad_norm": 1.5937548875808716, + "learning_rate": 1.5299588564126944e-06, + "loss": 0.0194, + "step": 30349 + }, + { + "epoch": 82.6975476839237, + "grad_norm": 2.417611598968506, + "learning_rate": 1.5294897673075405e-06, + "loss": 0.0385, + "step": 30350 + }, + { + "epoch": 82.70027247956403, + "grad_norm": 2.9801692962646484, + "learning_rate": 1.5290207441704507e-06, + "loss": 0.0501, + "step": 30351 + }, + { + "epoch": 82.70299727520435, + "grad_norm": 2.648916482925415, + "learning_rate": 1.5285517870050748e-06, + "loss": 0.1549, + "step": 30352 + }, + { + "epoch": 82.70572207084469, + "grad_norm": 2.461791515350342, + "learning_rate": 1.528082895815065e-06, + "loss": 0.1026, + "step": 30353 + }, + { + "epoch": 82.70844686648502, + "grad_norm": 2.5765380859375, + "learning_rate": 1.5276140706040698e-06, + "loss": 0.0536, + "step": 30354 + }, + { + "epoch": 82.71117166212534, + "grad_norm": 2.104875326156616, + "learning_rate": 1.5271453113757462e-06, + "loss": 0.0284, + "step": 30355 + }, + { + "epoch": 82.71389645776567, + "grad_norm": 3.0429880619049072, + "learning_rate": 1.5266766181337423e-06, + "loss": 0.0596, + "step": 30356 + }, + { + "epoch": 82.71662125340599, + "grad_norm": 2.4085068702697754, + "learning_rate": 1.5262079908817084e-06, + "loss": 0.0319, + "step": 30357 + }, + { + "epoch": 82.71934604904632, + "grad_norm": 3.892064332962036, + "learning_rate": 1.5257394296232907e-06, + "loss": 0.096, + "step": 30358 + }, + { + "epoch": 82.72207084468666, + "grad_norm": 1.9599765539169312, + "learning_rate": 1.5252709343621452e-06, + "loss": 0.0277, + "step": 30359 + }, + { + "epoch": 82.72479564032697, + "grad_norm": 2.7941465377807617, + "learning_rate": 1.5248025051019145e-06, + "loss": 0.0881, + "step": 30360 + }, + { + "epoch": 82.7275204359673, + "grad_norm": 3.0377144813537598, + "learning_rate": 1.524334141846251e-06, + "loss": 0.0847, + "step": 30361 + }, + { + "epoch": 82.73024523160763, + "grad_norm": 2.1820876598358154, + "learning_rate": 1.5238658445987997e-06, + "loss": 0.0345, + "step": 30362 + }, + { + "epoch": 82.73297002724796, + "grad_norm": 4.174436569213867, + "learning_rate": 1.5233976133632067e-06, + "loss": 0.0917, + "step": 30363 + }, + { + "epoch": 82.73569482288828, + "grad_norm": 3.4797418117523193, + "learning_rate": 1.5229294481431233e-06, + "loss": 0.1001, + "step": 30364 + }, + { + "epoch": 82.73841961852861, + "grad_norm": 2.293530225753784, + "learning_rate": 1.5224613489421914e-06, + "loss": 0.0307, + "step": 30365 + }, + { + "epoch": 82.74114441416894, + "grad_norm": 2.3010637760162354, + "learning_rate": 1.5219933157640576e-06, + "loss": 0.0726, + "step": 30366 + }, + { + "epoch": 82.74386920980926, + "grad_norm": 2.6362626552581787, + "learning_rate": 1.521525348612366e-06, + "loss": 0.1183, + "step": 30367 + }, + { + "epoch": 82.7465940054496, + "grad_norm": 3.284475564956665, + "learning_rate": 1.5210574474907635e-06, + "loss": 0.0678, + "step": 30368 + }, + { + "epoch": 82.74931880108991, + "grad_norm": 1.8884029388427734, + "learning_rate": 1.520589612402893e-06, + "loss": 0.0197, + "step": 30369 + }, + { + "epoch": 82.75204359673025, + "grad_norm": 2.4459478855133057, + "learning_rate": 1.5201218433523945e-06, + "loss": 0.0264, + "step": 30370 + }, + { + "epoch": 82.75476839237058, + "grad_norm": 1.9934412240982056, + "learning_rate": 1.5196541403429176e-06, + "loss": 0.0404, + "step": 30371 + }, + { + "epoch": 82.7574931880109, + "grad_norm": 4.480851650238037, + "learning_rate": 1.5191865033781005e-06, + "loss": 0.0641, + "step": 30372 + }, + { + "epoch": 82.76021798365123, + "grad_norm": 3.1816046237945557, + "learning_rate": 1.518718932461587e-06, + "loss": 0.0825, + "step": 30373 + }, + { + "epoch": 82.76294277929155, + "grad_norm": 3.600402593612671, + "learning_rate": 1.518251427597014e-06, + "loss": 0.1267, + "step": 30374 + }, + { + "epoch": 82.76566757493188, + "grad_norm": 2.135265827178955, + "learning_rate": 1.5177839887880287e-06, + "loss": 0.0391, + "step": 30375 + }, + { + "epoch": 82.7683923705722, + "grad_norm": 1.769209384918213, + "learning_rate": 1.5173166160382692e-06, + "loss": 0.0286, + "step": 30376 + }, + { + "epoch": 82.77111716621253, + "grad_norm": 2.300689697265625, + "learning_rate": 1.5168493093513714e-06, + "loss": 0.0462, + "step": 30377 + }, + { + "epoch": 82.77384196185287, + "grad_norm": 5.4529948234558105, + "learning_rate": 1.5163820687309816e-06, + "loss": 0.0331, + "step": 30378 + }, + { + "epoch": 82.77656675749319, + "grad_norm": 3.395545244216919, + "learning_rate": 1.5159148941807323e-06, + "loss": 0.0498, + "step": 30379 + }, + { + "epoch": 82.77929155313352, + "grad_norm": 3.3990988731384277, + "learning_rate": 1.5154477857042672e-06, + "loss": 0.0288, + "step": 30380 + }, + { + "epoch": 82.78201634877384, + "grad_norm": 2.8645358085632324, + "learning_rate": 1.5149807433052222e-06, + "loss": 0.1668, + "step": 30381 + }, + { + "epoch": 82.78474114441417, + "grad_norm": 1.9748790264129639, + "learning_rate": 1.5145137669872334e-06, + "loss": 0.0238, + "step": 30382 + }, + { + "epoch": 82.7874659400545, + "grad_norm": 2.9800281524658203, + "learning_rate": 1.5140468567539357e-06, + "loss": 0.095, + "step": 30383 + }, + { + "epoch": 82.79019073569482, + "grad_norm": 2.9694268703460693, + "learning_rate": 1.5135800126089707e-06, + "loss": 0.0295, + "step": 30384 + }, + { + "epoch": 82.79291553133515, + "grad_norm": 2.362278699874878, + "learning_rate": 1.5131132345559718e-06, + "loss": 0.0309, + "step": 30385 + }, + { + "epoch": 82.79564032697547, + "grad_norm": 2.7103750705718994, + "learning_rate": 1.5126465225985731e-06, + "loss": 0.0697, + "step": 30386 + }, + { + "epoch": 82.7983651226158, + "grad_norm": 2.0758557319641113, + "learning_rate": 1.5121798767404084e-06, + "loss": 0.0233, + "step": 30387 + }, + { + "epoch": 82.80108991825612, + "grad_norm": 2.3000056743621826, + "learning_rate": 1.5117132969851156e-06, + "loss": 0.047, + "step": 30388 + }, + { + "epoch": 82.80381471389646, + "grad_norm": 3.21502423286438, + "learning_rate": 1.5112467833363265e-06, + "loss": 0.0957, + "step": 30389 + }, + { + "epoch": 82.80653950953679, + "grad_norm": 2.4644534587860107, + "learning_rate": 1.5107803357976748e-06, + "loss": 0.0904, + "step": 30390 + }, + { + "epoch": 82.80926430517711, + "grad_norm": 2.0804672241210938, + "learning_rate": 1.5103139543727895e-06, + "loss": 0.0291, + "step": 30391 + }, + { + "epoch": 82.81198910081744, + "grad_norm": 2.8503310680389404, + "learning_rate": 1.5098476390653082e-06, + "loss": 0.1207, + "step": 30392 + }, + { + "epoch": 82.81471389645776, + "grad_norm": 2.9527807235717773, + "learning_rate": 1.509381389878861e-06, + "loss": 0.0517, + "step": 30393 + }, + { + "epoch": 82.8174386920981, + "grad_norm": 3.389192581176758, + "learning_rate": 1.5089152068170755e-06, + "loss": 0.0401, + "step": 30394 + }, + { + "epoch": 82.82016348773843, + "grad_norm": 3.221360921859741, + "learning_rate": 1.5084490898835857e-06, + "loss": 0.0496, + "step": 30395 + }, + { + "epoch": 82.82288828337875, + "grad_norm": 2.4442756175994873, + "learning_rate": 1.5079830390820226e-06, + "loss": 0.0295, + "step": 30396 + }, + { + "epoch": 82.82561307901908, + "grad_norm": 3.3505232334136963, + "learning_rate": 1.5075170544160145e-06, + "loss": 0.0624, + "step": 30397 + }, + { + "epoch": 82.8283378746594, + "grad_norm": 1.7819381952285767, + "learning_rate": 1.5070511358891904e-06, + "loss": 0.0206, + "step": 30398 + }, + { + "epoch": 82.83106267029973, + "grad_norm": 2.8520798683166504, + "learning_rate": 1.5065852835051764e-06, + "loss": 0.031, + "step": 30399 + }, + { + "epoch": 82.83378746594005, + "grad_norm": 2.9648475646972656, + "learning_rate": 1.5061194972676041e-06, + "loss": 0.0932, + "step": 30400 + }, + { + "epoch": 82.83651226158038, + "grad_norm": 2.1956398487091064, + "learning_rate": 1.5056537771801016e-06, + "loss": 0.042, + "step": 30401 + }, + { + "epoch": 82.83923705722071, + "grad_norm": 3.113151788711548, + "learning_rate": 1.5051881232462928e-06, + "loss": 0.0357, + "step": 30402 + }, + { + "epoch": 82.84196185286103, + "grad_norm": 3.4155240058898926, + "learning_rate": 1.5047225354698037e-06, + "loss": 0.0434, + "step": 30403 + }, + { + "epoch": 82.84468664850137, + "grad_norm": 3.0014431476593018, + "learning_rate": 1.5042570138542645e-06, + "loss": 0.0336, + "step": 30404 + }, + { + "epoch": 82.84741144414168, + "grad_norm": 2.3759243488311768, + "learning_rate": 1.503791558403298e-06, + "loss": 0.0439, + "step": 30405 + }, + { + "epoch": 82.85013623978202, + "grad_norm": 3.328617572784424, + "learning_rate": 1.5033261691205292e-06, + "loss": 0.2054, + "step": 30406 + }, + { + "epoch": 82.85286103542235, + "grad_norm": 3.585984230041504, + "learning_rate": 1.5028608460095807e-06, + "loss": 0.0538, + "step": 30407 + }, + { + "epoch": 82.85558583106267, + "grad_norm": 2.3514294624328613, + "learning_rate": 1.5023955890740804e-06, + "loss": 0.0342, + "step": 30408 + }, + { + "epoch": 82.858310626703, + "grad_norm": 3.1947872638702393, + "learning_rate": 1.5019303983176504e-06, + "loss": 0.0362, + "step": 30409 + }, + { + "epoch": 82.86103542234332, + "grad_norm": 2.9419167041778564, + "learning_rate": 1.501465273743913e-06, + "loss": 0.0327, + "step": 30410 + }, + { + "epoch": 82.86376021798365, + "grad_norm": 3.953352212905884, + "learning_rate": 1.5010002153564873e-06, + "loss": 0.106, + "step": 30411 + }, + { + "epoch": 82.86648501362397, + "grad_norm": 2.5346102714538574, + "learning_rate": 1.5005352231589987e-06, + "loss": 0.0364, + "step": 30412 + }, + { + "epoch": 82.8692098092643, + "grad_norm": 1.6460795402526855, + "learning_rate": 1.5000702971550707e-06, + "loss": 0.0216, + "step": 30413 + }, + { + "epoch": 82.87193460490464, + "grad_norm": 3.1867313385009766, + "learning_rate": 1.4996054373483215e-06, + "loss": 0.1681, + "step": 30414 + }, + { + "epoch": 82.87465940054496, + "grad_norm": 2.953021764755249, + "learning_rate": 1.4991406437423694e-06, + "loss": 0.1105, + "step": 30415 + }, + { + "epoch": 82.87738419618529, + "grad_norm": 2.1132028102874756, + "learning_rate": 1.4986759163408393e-06, + "loss": 0.0472, + "step": 30416 + }, + { + "epoch": 82.88010899182561, + "grad_norm": 2.8401522636413574, + "learning_rate": 1.498211255147347e-06, + "loss": 0.1408, + "step": 30417 + }, + { + "epoch": 82.88283378746594, + "grad_norm": 2.509892702102661, + "learning_rate": 1.497746660165511e-06, + "loss": 0.0973, + "step": 30418 + }, + { + "epoch": 82.88555858310627, + "grad_norm": 2.653618097305298, + "learning_rate": 1.4972821313989495e-06, + "loss": 0.0714, + "step": 30419 + }, + { + "epoch": 82.88828337874659, + "grad_norm": 2.429211378097534, + "learning_rate": 1.4968176688512824e-06, + "loss": 0.0202, + "step": 30420 + }, + { + "epoch": 82.89100817438693, + "grad_norm": 2.8095321655273438, + "learning_rate": 1.4963532725261266e-06, + "loss": 0.0642, + "step": 30421 + }, + { + "epoch": 82.89373297002724, + "grad_norm": 3.2260658740997314, + "learning_rate": 1.495888942427096e-06, + "loss": 0.0577, + "step": 30422 + }, + { + "epoch": 82.89645776566758, + "grad_norm": 1.9967072010040283, + "learning_rate": 1.4954246785578085e-06, + "loss": 0.0706, + "step": 30423 + }, + { + "epoch": 82.8991825613079, + "grad_norm": 1.501876950263977, + "learning_rate": 1.4949604809218809e-06, + "loss": 0.0172, + "step": 30424 + }, + { + "epoch": 82.90190735694823, + "grad_norm": 6.5108819007873535, + "learning_rate": 1.4944963495229281e-06, + "loss": 0.0757, + "step": 30425 + }, + { + "epoch": 82.90463215258856, + "grad_norm": 2.5461976528167725, + "learning_rate": 1.4940322843645628e-06, + "loss": 0.0275, + "step": 30426 + }, + { + "epoch": 82.90735694822888, + "grad_norm": 2.8796920776367188, + "learning_rate": 1.4935682854503986e-06, + "loss": 0.0397, + "step": 30427 + }, + { + "epoch": 82.91008174386921, + "grad_norm": 3.414139986038208, + "learning_rate": 1.4931043527840538e-06, + "loss": 0.1772, + "step": 30428 + }, + { + "epoch": 82.91280653950953, + "grad_norm": 3.3438730239868164, + "learning_rate": 1.4926404863691357e-06, + "loss": 0.0849, + "step": 30429 + }, + { + "epoch": 82.91553133514986, + "grad_norm": 2.3764259815216064, + "learning_rate": 1.4921766862092612e-06, + "loss": 0.0252, + "step": 30430 + }, + { + "epoch": 82.9182561307902, + "grad_norm": 3.374160051345825, + "learning_rate": 1.491712952308042e-06, + "loss": 0.0494, + "step": 30431 + }, + { + "epoch": 82.92098092643052, + "grad_norm": 5.138745307922363, + "learning_rate": 1.4912492846690862e-06, + "loss": 0.0846, + "step": 30432 + }, + { + "epoch": 82.92370572207085, + "grad_norm": 2.571094512939453, + "learning_rate": 1.4907856832960088e-06, + "loss": 0.0702, + "step": 30433 + }, + { + "epoch": 82.92643051771117, + "grad_norm": 3.858018636703491, + "learning_rate": 1.490322148192419e-06, + "loss": 0.1358, + "step": 30434 + }, + { + "epoch": 82.9291553133515, + "grad_norm": 2.0177221298217773, + "learning_rate": 1.489858679361923e-06, + "loss": 0.0293, + "step": 30435 + }, + { + "epoch": 82.93188010899182, + "grad_norm": 1.7879647016525269, + "learning_rate": 1.4893952768081377e-06, + "loss": 0.0308, + "step": 30436 + }, + { + "epoch": 82.93460490463215, + "grad_norm": 2.2398107051849365, + "learning_rate": 1.488931940534667e-06, + "loss": 0.1906, + "step": 30437 + }, + { + "epoch": 82.93732970027249, + "grad_norm": 2.5204010009765625, + "learning_rate": 1.4884686705451213e-06, + "loss": 0.1873, + "step": 30438 + }, + { + "epoch": 82.9400544959128, + "grad_norm": 2.8309268951416016, + "learning_rate": 1.4880054668431043e-06, + "loss": 0.0631, + "step": 30439 + }, + { + "epoch": 82.94277929155314, + "grad_norm": 1.8874447345733643, + "learning_rate": 1.48754232943223e-06, + "loss": 0.025, + "step": 30440 + }, + { + "epoch": 82.94550408719346, + "grad_norm": 2.8392603397369385, + "learning_rate": 1.487079258316101e-06, + "loss": 0.1589, + "step": 30441 + }, + { + "epoch": 82.94822888283379, + "grad_norm": 4.089603900909424, + "learning_rate": 1.4866162534983252e-06, + "loss": 0.0425, + "step": 30442 + }, + { + "epoch": 82.95095367847412, + "grad_norm": 4.412265777587891, + "learning_rate": 1.4861533149825058e-06, + "loss": 0.0697, + "step": 30443 + }, + { + "epoch": 82.95367847411444, + "grad_norm": 2.268439292907715, + "learning_rate": 1.485690442772253e-06, + "loss": 0.0246, + "step": 30444 + }, + { + "epoch": 82.95640326975477, + "grad_norm": 2.5823121070861816, + "learning_rate": 1.4852276368711694e-06, + "loss": 0.0963, + "step": 30445 + }, + { + "epoch": 82.95912806539509, + "grad_norm": 3.604337692260742, + "learning_rate": 1.4847648972828554e-06, + "loss": 0.0265, + "step": 30446 + }, + { + "epoch": 82.96185286103542, + "grad_norm": 2.5100910663604736, + "learning_rate": 1.4843022240109218e-06, + "loss": 0.0226, + "step": 30447 + }, + { + "epoch": 82.96457765667574, + "grad_norm": 2.983286142349243, + "learning_rate": 1.4838396170589653e-06, + "loss": 0.0363, + "step": 30448 + }, + { + "epoch": 82.96730245231608, + "grad_norm": 2.635679244995117, + "learning_rate": 1.4833770764305944e-06, + "loss": 0.0891, + "step": 30449 + }, + { + "epoch": 82.97002724795641, + "grad_norm": 2.105109691619873, + "learning_rate": 1.4829146021294083e-06, + "loss": 0.0314, + "step": 30450 + }, + { + "epoch": 82.97275204359673, + "grad_norm": 3.193880558013916, + "learning_rate": 1.4824521941590097e-06, + "loss": 0.0221, + "step": 30451 + }, + { + "epoch": 82.97547683923706, + "grad_norm": 3.5505714416503906, + "learning_rate": 1.4819898525229958e-06, + "loss": 0.0597, + "step": 30452 + }, + { + "epoch": 82.97820163487738, + "grad_norm": 4.77075719833374, + "learning_rate": 1.4815275772249748e-06, + "loss": 0.0641, + "step": 30453 + }, + { + "epoch": 82.98092643051771, + "grad_norm": 3.000122308731079, + "learning_rate": 1.4810653682685417e-06, + "loss": 0.1045, + "step": 30454 + }, + { + "epoch": 82.98365122615803, + "grad_norm": 2.824181079864502, + "learning_rate": 1.4806032256572978e-06, + "loss": 0.1285, + "step": 30455 + }, + { + "epoch": 82.98637602179836, + "grad_norm": 2.2954354286193848, + "learning_rate": 1.4801411493948392e-06, + "loss": 0.1122, + "step": 30456 + }, + { + "epoch": 82.9891008174387, + "grad_norm": 2.3021657466888428, + "learning_rate": 1.47967913948477e-06, + "loss": 0.0271, + "step": 30457 + }, + { + "epoch": 82.99182561307902, + "grad_norm": 2.3377256393432617, + "learning_rate": 1.4792171959306844e-06, + "loss": 0.0824, + "step": 30458 + }, + { + "epoch": 82.99455040871935, + "grad_norm": 2.6584062576293945, + "learning_rate": 1.4787553187361793e-06, + "loss": 0.0325, + "step": 30459 + }, + { + "epoch": 82.99727520435967, + "grad_norm": 4.0611371994018555, + "learning_rate": 1.4782935079048567e-06, + "loss": 0.0837, + "step": 30460 + }, + { + "epoch": 83.0, + "grad_norm": 3.178171396255493, + "learning_rate": 1.4778317634403082e-06, + "loss": 0.0384, + "step": 30461 + }, + { + "epoch": 83.00272479564033, + "grad_norm": 2.2527153491973877, + "learning_rate": 1.4773700853461337e-06, + "loss": 0.0552, + "step": 30462 + }, + { + "epoch": 83.00544959128065, + "grad_norm": 2.4300429821014404, + "learning_rate": 1.4769084736259232e-06, + "loss": 0.0335, + "step": 30463 + }, + { + "epoch": 83.00817438692098, + "grad_norm": 2.9316818714141846, + "learning_rate": 1.4764469282832749e-06, + "loss": 0.0597, + "step": 30464 + }, + { + "epoch": 83.0108991825613, + "grad_norm": 2.5857608318328857, + "learning_rate": 1.4759854493217863e-06, + "loss": 0.0337, + "step": 30465 + }, + { + "epoch": 83.01362397820164, + "grad_norm": 3.271679639816284, + "learning_rate": 1.4755240367450485e-06, + "loss": 0.0271, + "step": 30466 + }, + { + "epoch": 83.01634877384195, + "grad_norm": 1.6700094938278198, + "learning_rate": 1.4750626905566557e-06, + "loss": 0.0189, + "step": 30467 + }, + { + "epoch": 83.01907356948229, + "grad_norm": 2.1981701850891113, + "learning_rate": 1.4746014107601969e-06, + "loss": 0.0901, + "step": 30468 + }, + { + "epoch": 83.02179836512262, + "grad_norm": 2.88409686088562, + "learning_rate": 1.4741401973592718e-06, + "loss": 0.0715, + "step": 30469 + }, + { + "epoch": 83.02452316076294, + "grad_norm": 3.3284995555877686, + "learning_rate": 1.4736790503574672e-06, + "loss": 0.019, + "step": 30470 + }, + { + "epoch": 83.02724795640327, + "grad_norm": 3.269502878189087, + "learning_rate": 1.473217969758376e-06, + "loss": 0.0818, + "step": 30471 + }, + { + "epoch": 83.02997275204359, + "grad_norm": 2.178234577178955, + "learning_rate": 1.4727569555655863e-06, + "loss": 0.0653, + "step": 30472 + }, + { + "epoch": 83.03269754768392, + "grad_norm": 2.9592747688293457, + "learning_rate": 1.4722960077826941e-06, + "loss": 0.1468, + "step": 30473 + }, + { + "epoch": 83.03542234332426, + "grad_norm": 3.2190043926239014, + "learning_rate": 1.4718351264132858e-06, + "loss": 0.0342, + "step": 30474 + }, + { + "epoch": 83.03814713896458, + "grad_norm": 2.257591485977173, + "learning_rate": 1.4713743114609501e-06, + "loss": 0.0391, + "step": 30475 + }, + { + "epoch": 83.04087193460491, + "grad_norm": 4.885451793670654, + "learning_rate": 1.4709135629292759e-06, + "loss": 0.0525, + "step": 30476 + }, + { + "epoch": 83.04359673024523, + "grad_norm": 2.8167476654052734, + "learning_rate": 1.4704528808218544e-06, + "loss": 0.1154, + "step": 30477 + }, + { + "epoch": 83.04632152588556, + "grad_norm": 2.9282259941101074, + "learning_rate": 1.4699922651422705e-06, + "loss": 0.2091, + "step": 30478 + }, + { + "epoch": 83.04904632152588, + "grad_norm": 3.9317188262939453, + "learning_rate": 1.4695317158941126e-06, + "loss": 0.0426, + "step": 30479 + }, + { + "epoch": 83.05177111716621, + "grad_norm": 2.7909698486328125, + "learning_rate": 1.4690712330809653e-06, + "loss": 0.0469, + "step": 30480 + }, + { + "epoch": 83.05449591280654, + "grad_norm": 2.0851080417633057, + "learning_rate": 1.4686108167064162e-06, + "loss": 0.1813, + "step": 30481 + }, + { + "epoch": 83.05722070844686, + "grad_norm": 2.5919992923736572, + "learning_rate": 1.4681504667740544e-06, + "loss": 0.0915, + "step": 30482 + }, + { + "epoch": 83.0599455040872, + "grad_norm": 2.0471487045288086, + "learning_rate": 1.4676901832874612e-06, + "loss": 0.0525, + "step": 30483 + }, + { + "epoch": 83.06267029972751, + "grad_norm": 2.909069776535034, + "learning_rate": 1.467229966250221e-06, + "loss": 0.0646, + "step": 30484 + }, + { + "epoch": 83.06539509536785, + "grad_norm": 3.2137203216552734, + "learning_rate": 1.4667698156659205e-06, + "loss": 0.0466, + "step": 30485 + }, + { + "epoch": 83.06811989100818, + "grad_norm": 3.1511332988739014, + "learning_rate": 1.4663097315381426e-06, + "loss": 0.1227, + "step": 30486 + }, + { + "epoch": 83.0708446866485, + "grad_norm": 3.3379552364349365, + "learning_rate": 1.4658497138704697e-06, + "loss": 0.0275, + "step": 30487 + }, + { + "epoch": 83.07356948228883, + "grad_norm": 1.6353423595428467, + "learning_rate": 1.4653897626664825e-06, + "loss": 0.111, + "step": 30488 + }, + { + "epoch": 83.07629427792915, + "grad_norm": 2.2430222034454346, + "learning_rate": 1.4649298779297671e-06, + "loss": 0.0451, + "step": 30489 + }, + { + "epoch": 83.07901907356948, + "grad_norm": 2.024216651916504, + "learning_rate": 1.4644700596639028e-06, + "loss": 0.0292, + "step": 30490 + }, + { + "epoch": 83.0817438692098, + "grad_norm": 2.4999301433563232, + "learning_rate": 1.4640103078724722e-06, + "loss": 0.1379, + "step": 30491 + }, + { + "epoch": 83.08446866485014, + "grad_norm": 2.5175302028656006, + "learning_rate": 1.4635506225590511e-06, + "loss": 0.0499, + "step": 30492 + }, + { + "epoch": 83.08719346049047, + "grad_norm": 1.646105408668518, + "learning_rate": 1.4630910037272262e-06, + "loss": 0.0364, + "step": 30493 + }, + { + "epoch": 83.08991825613079, + "grad_norm": 2.1817586421966553, + "learning_rate": 1.4626314513805728e-06, + "loss": 0.0451, + "step": 30494 + }, + { + "epoch": 83.09264305177112, + "grad_norm": 2.398751974105835, + "learning_rate": 1.4621719655226718e-06, + "loss": 0.0199, + "step": 30495 + }, + { + "epoch": 83.09536784741144, + "grad_norm": 2.215655565261841, + "learning_rate": 1.461712546157098e-06, + "loss": 0.0998, + "step": 30496 + }, + { + "epoch": 83.09809264305177, + "grad_norm": 3.4925975799560547, + "learning_rate": 1.461253193287434e-06, + "loss": 0.0876, + "step": 30497 + }, + { + "epoch": 83.1008174386921, + "grad_norm": 2.289992332458496, + "learning_rate": 1.4607939069172539e-06, + "loss": 0.0528, + "step": 30498 + }, + { + "epoch": 83.10354223433242, + "grad_norm": 3.3366615772247314, + "learning_rate": 1.4603346870501377e-06, + "loss": 0.0846, + "step": 30499 + }, + { + "epoch": 83.10626702997276, + "grad_norm": 2.611370325088501, + "learning_rate": 1.4598755336896575e-06, + "loss": 0.0329, + "step": 30500 + }, + { + "epoch": 83.10899182561307, + "grad_norm": 2.5329489707946777, + "learning_rate": 1.4594164468393945e-06, + "loss": 0.0361, + "step": 30501 + }, + { + "epoch": 83.11171662125341, + "grad_norm": 3.375791549682617, + "learning_rate": 1.4589574265029216e-06, + "loss": 0.0822, + "step": 30502 + }, + { + "epoch": 83.11444141689373, + "grad_norm": 2.672603130340576, + "learning_rate": 1.4584984726838136e-06, + "loss": 0.0269, + "step": 30503 + }, + { + "epoch": 83.11716621253406, + "grad_norm": 1.6498534679412842, + "learning_rate": 1.4580395853856412e-06, + "loss": 0.029, + "step": 30504 + }, + { + "epoch": 83.11989100817439, + "grad_norm": 3.100522994995117, + "learning_rate": 1.4575807646119844e-06, + "loss": 0.1374, + "step": 30505 + }, + { + "epoch": 83.12261580381471, + "grad_norm": 3.5831732749938965, + "learning_rate": 1.4571220103664142e-06, + "loss": 0.1449, + "step": 30506 + }, + { + "epoch": 83.12534059945504, + "grad_norm": 3.589817762374878, + "learning_rate": 1.4566633226525028e-06, + "loss": 0.1358, + "step": 30507 + }, + { + "epoch": 83.12806539509536, + "grad_norm": 3.455409526824951, + "learning_rate": 1.456204701473819e-06, + "loss": 0.0396, + "step": 30508 + }, + { + "epoch": 83.1307901907357, + "grad_norm": 2.8189685344696045, + "learning_rate": 1.4557461468339418e-06, + "loss": 0.0313, + "step": 30509 + }, + { + "epoch": 83.13351498637603, + "grad_norm": 3.691716432571411, + "learning_rate": 1.4552876587364373e-06, + "loss": 0.0425, + "step": 30510 + }, + { + "epoch": 83.13623978201635, + "grad_norm": 3.000974655151367, + "learning_rate": 1.4548292371848782e-06, + "loss": 0.0935, + "step": 30511 + }, + { + "epoch": 83.13896457765668, + "grad_norm": 1.9675675630569458, + "learning_rate": 1.4543708821828317e-06, + "loss": 0.0187, + "step": 30512 + }, + { + "epoch": 83.141689373297, + "grad_norm": 2.303309917449951, + "learning_rate": 1.4539125937338727e-06, + "loss": 0.0364, + "step": 30513 + }, + { + "epoch": 83.14441416893733, + "grad_norm": 3.037252902984619, + "learning_rate": 1.453454371841566e-06, + "loss": 0.1173, + "step": 30514 + }, + { + "epoch": 83.14713896457765, + "grad_norm": 1.996396541595459, + "learning_rate": 1.4529962165094803e-06, + "loss": 0.0722, + "step": 30515 + }, + { + "epoch": 83.14986376021798, + "grad_norm": 2.8723056316375732, + "learning_rate": 1.4525381277411864e-06, + "loss": 0.0352, + "step": 30516 + }, + { + "epoch": 83.15258855585832, + "grad_norm": 2.116116762161255, + "learning_rate": 1.452080105540249e-06, + "loss": 0.0233, + "step": 30517 + }, + { + "epoch": 83.15531335149863, + "grad_norm": 3.4875447750091553, + "learning_rate": 1.451622149910239e-06, + "loss": 0.0553, + "step": 30518 + }, + { + "epoch": 83.15803814713897, + "grad_norm": 3.095039129257202, + "learning_rate": 1.4511642608547195e-06, + "loss": 0.1883, + "step": 30519 + }, + { + "epoch": 83.16076294277929, + "grad_norm": 5.829368591308594, + "learning_rate": 1.4507064383772585e-06, + "loss": 0.1004, + "step": 30520 + }, + { + "epoch": 83.16348773841962, + "grad_norm": 2.4921467304229736, + "learning_rate": 1.4502486824814176e-06, + "loss": 0.1027, + "step": 30521 + }, + { + "epoch": 83.16621253405995, + "grad_norm": 3.3920462131500244, + "learning_rate": 1.4497909931707677e-06, + "loss": 0.0785, + "step": 30522 + }, + { + "epoch": 83.16893732970027, + "grad_norm": 1.6282061338424683, + "learning_rate": 1.4493333704488698e-06, + "loss": 0.0198, + "step": 30523 + }, + { + "epoch": 83.1716621253406, + "grad_norm": 1.7396368980407715, + "learning_rate": 1.4488758143192871e-06, + "loss": 0.0244, + "step": 30524 + }, + { + "epoch": 83.17438692098092, + "grad_norm": 2.3437485694885254, + "learning_rate": 1.4484183247855853e-06, + "loss": 0.1113, + "step": 30525 + }, + { + "epoch": 83.17711171662125, + "grad_norm": 2.6190948486328125, + "learning_rate": 1.4479609018513275e-06, + "loss": 0.0672, + "step": 30526 + }, + { + "epoch": 83.17983651226157, + "grad_norm": 2.357954502105713, + "learning_rate": 1.4475035455200748e-06, + "loss": 0.0504, + "step": 30527 + }, + { + "epoch": 83.1825613079019, + "grad_norm": 5.0774922370910645, + "learning_rate": 1.4470462557953869e-06, + "loss": 0.0404, + "step": 30528 + }, + { + "epoch": 83.18528610354224, + "grad_norm": 2.440586805343628, + "learning_rate": 1.4465890326808297e-06, + "loss": 0.0441, + "step": 30529 + }, + { + "epoch": 83.18801089918256, + "grad_norm": 1.9190253019332886, + "learning_rate": 1.4461318761799615e-06, + "loss": 0.0274, + "step": 30530 + }, + { + "epoch": 83.19073569482289, + "grad_norm": 3.7399632930755615, + "learning_rate": 1.4456747862963427e-06, + "loss": 0.0589, + "step": 30531 + }, + { + "epoch": 83.19346049046321, + "grad_norm": 2.8228495121002197, + "learning_rate": 1.4452177630335318e-06, + "loss": 0.0787, + "step": 30532 + }, + { + "epoch": 83.19618528610354, + "grad_norm": 4.243612766265869, + "learning_rate": 1.444760806395089e-06, + "loss": 0.0576, + "step": 30533 + }, + { + "epoch": 83.19891008174388, + "grad_norm": 2.3741116523742676, + "learning_rate": 1.4443039163845761e-06, + "loss": 0.0338, + "step": 30534 + }, + { + "epoch": 83.2016348773842, + "grad_norm": 2.946852684020996, + "learning_rate": 1.4438470930055492e-06, + "loss": 0.0667, + "step": 30535 + }, + { + "epoch": 83.20435967302453, + "grad_norm": 2.58840274810791, + "learning_rate": 1.4433903362615654e-06, + "loss": 0.0751, + "step": 30536 + }, + { + "epoch": 83.20708446866485, + "grad_norm": 2.3835275173187256, + "learning_rate": 1.4429336461561804e-06, + "loss": 0.1215, + "step": 30537 + }, + { + "epoch": 83.20980926430518, + "grad_norm": 1.418433666229248, + "learning_rate": 1.4424770226929551e-06, + "loss": 0.029, + "step": 30538 + }, + { + "epoch": 83.2125340599455, + "grad_norm": 3.596494436264038, + "learning_rate": 1.4420204658754432e-06, + "loss": 0.0902, + "step": 30539 + }, + { + "epoch": 83.21525885558583, + "grad_norm": 2.294933795928955, + "learning_rate": 1.4415639757071998e-06, + "loss": 0.1384, + "step": 30540 + }, + { + "epoch": 83.21798365122616, + "grad_norm": 2.1866657733917236, + "learning_rate": 1.4411075521917794e-06, + "loss": 0.0433, + "step": 30541 + }, + { + "epoch": 83.22070844686648, + "grad_norm": 1.8189126253128052, + "learning_rate": 1.4406511953327397e-06, + "loss": 0.0631, + "step": 30542 + }, + { + "epoch": 83.22343324250681, + "grad_norm": 2.6391940116882324, + "learning_rate": 1.4401949051336328e-06, + "loss": 0.1192, + "step": 30543 + }, + { + "epoch": 83.22615803814713, + "grad_norm": 4.100677967071533, + "learning_rate": 1.4397386815980107e-06, + "loss": 0.1347, + "step": 30544 + }, + { + "epoch": 83.22888283378747, + "grad_norm": 2.553624391555786, + "learning_rate": 1.4392825247294307e-06, + "loss": 0.0775, + "step": 30545 + }, + { + "epoch": 83.2316076294278, + "grad_norm": 2.033749580383301, + "learning_rate": 1.4388264345314419e-06, + "loss": 0.0284, + "step": 30546 + }, + { + "epoch": 83.23433242506812, + "grad_norm": 2.9180612564086914, + "learning_rate": 1.438370411007598e-06, + "loss": 0.0624, + "step": 30547 + }, + { + "epoch": 83.23705722070845, + "grad_norm": 1.4826465845108032, + "learning_rate": 1.4379144541614476e-06, + "loss": 0.0225, + "step": 30548 + }, + { + "epoch": 83.23978201634877, + "grad_norm": 4.95634126663208, + "learning_rate": 1.4374585639965433e-06, + "loss": 0.065, + "step": 30549 + }, + { + "epoch": 83.2425068119891, + "grad_norm": 2.916814088821411, + "learning_rate": 1.437002740516439e-06, + "loss": 0.0676, + "step": 30550 + }, + { + "epoch": 83.24523160762942, + "grad_norm": 3.431065559387207, + "learning_rate": 1.4365469837246816e-06, + "loss": 0.0545, + "step": 30551 + }, + { + "epoch": 83.24795640326975, + "grad_norm": 1.5764778852462769, + "learning_rate": 1.4360912936248206e-06, + "loss": 0.023, + "step": 30552 + }, + { + "epoch": 83.25068119891009, + "grad_norm": 2.429016590118408, + "learning_rate": 1.4356356702204033e-06, + "loss": 0.0626, + "step": 30553 + }, + { + "epoch": 83.2534059945504, + "grad_norm": 2.5421488285064697, + "learning_rate": 1.4351801135149812e-06, + "loss": 0.0632, + "step": 30554 + }, + { + "epoch": 83.25613079019074, + "grad_norm": 1.6964192390441895, + "learning_rate": 1.4347246235121003e-06, + "loss": 0.0745, + "step": 30555 + }, + { + "epoch": 83.25885558583106, + "grad_norm": 2.7233622074127197, + "learning_rate": 1.434269200215309e-06, + "loss": 0.2518, + "step": 30556 + }, + { + "epoch": 83.26158038147139, + "grad_norm": 2.3182289600372314, + "learning_rate": 1.4338138436281512e-06, + "loss": 0.0272, + "step": 30557 + }, + { + "epoch": 83.26430517711172, + "grad_norm": 2.4392614364624023, + "learning_rate": 1.4333585537541782e-06, + "loss": 0.026, + "step": 30558 + }, + { + "epoch": 83.26702997275204, + "grad_norm": 2.2778537273406982, + "learning_rate": 1.432903330596933e-06, + "loss": 0.0846, + "step": 30559 + }, + { + "epoch": 83.26975476839237, + "grad_norm": 2.0409388542175293, + "learning_rate": 1.4324481741599606e-06, + "loss": 0.0413, + "step": 30560 + }, + { + "epoch": 83.2724795640327, + "grad_norm": 2.103501081466675, + "learning_rate": 1.4319930844468032e-06, + "loss": 0.0439, + "step": 30561 + }, + { + "epoch": 83.27520435967303, + "grad_norm": 2.7763302326202393, + "learning_rate": 1.4315380614610109e-06, + "loss": 0.1452, + "step": 30562 + }, + { + "epoch": 83.27792915531334, + "grad_norm": 2.781834125518799, + "learning_rate": 1.4310831052061248e-06, + "loss": 0.0546, + "step": 30563 + }, + { + "epoch": 83.28065395095368, + "grad_norm": 2.491203784942627, + "learning_rate": 1.4306282156856866e-06, + "loss": 0.0893, + "step": 30564 + }, + { + "epoch": 83.28337874659401, + "grad_norm": 2.416351318359375, + "learning_rate": 1.430173392903238e-06, + "loss": 0.0614, + "step": 30565 + }, + { + "epoch": 83.28610354223433, + "grad_norm": 2.570690393447876, + "learning_rate": 1.4297186368623262e-06, + "loss": 0.0201, + "step": 30566 + }, + { + "epoch": 83.28882833787466, + "grad_norm": 2.3026962280273438, + "learning_rate": 1.4292639475664872e-06, + "loss": 0.089, + "step": 30567 + }, + { + "epoch": 83.29155313351498, + "grad_norm": 3.0163443088531494, + "learning_rate": 1.4288093250192669e-06, + "loss": 0.1858, + "step": 30568 + }, + { + "epoch": 83.29427792915531, + "grad_norm": 2.9206223487854004, + "learning_rate": 1.4283547692242017e-06, + "loss": 0.0482, + "step": 30569 + }, + { + "epoch": 83.29700272479565, + "grad_norm": 3.8568670749664307, + "learning_rate": 1.4279002801848352e-06, + "loss": 0.0684, + "step": 30570 + }, + { + "epoch": 83.29972752043597, + "grad_norm": 2.722461462020874, + "learning_rate": 1.4274458579047056e-06, + "loss": 0.0273, + "step": 30571 + }, + { + "epoch": 83.3024523160763, + "grad_norm": 4.237865447998047, + "learning_rate": 1.4269915023873526e-06, + "loss": 0.0704, + "step": 30572 + }, + { + "epoch": 83.30517711171662, + "grad_norm": 2.010971784591675, + "learning_rate": 1.4265372136363109e-06, + "loss": 0.0262, + "step": 30573 + }, + { + "epoch": 83.30790190735695, + "grad_norm": 1.8063124418258667, + "learning_rate": 1.4260829916551245e-06, + "loss": 0.022, + "step": 30574 + }, + { + "epoch": 83.31062670299727, + "grad_norm": 2.8567333221435547, + "learning_rate": 1.425628836447327e-06, + "loss": 0.0369, + "step": 30575 + }, + { + "epoch": 83.3133514986376, + "grad_norm": 2.1532137393951416, + "learning_rate": 1.4251747480164557e-06, + "loss": 0.0679, + "step": 30576 + }, + { + "epoch": 83.31607629427793, + "grad_norm": 4.473711967468262, + "learning_rate": 1.4247207263660467e-06, + "loss": 0.1316, + "step": 30577 + }, + { + "epoch": 83.31880108991825, + "grad_norm": 3.0395073890686035, + "learning_rate": 1.4242667714996371e-06, + "loss": 0.0936, + "step": 30578 + }, + { + "epoch": 83.32152588555859, + "grad_norm": 2.379467725753784, + "learning_rate": 1.4238128834207633e-06, + "loss": 0.046, + "step": 30579 + }, + { + "epoch": 83.3242506811989, + "grad_norm": 3.5517351627349854, + "learning_rate": 1.4233590621329585e-06, + "loss": 0.0663, + "step": 30580 + }, + { + "epoch": 83.32697547683924, + "grad_norm": 3.2514889240264893, + "learning_rate": 1.4229053076397547e-06, + "loss": 0.1059, + "step": 30581 + }, + { + "epoch": 83.32970027247957, + "grad_norm": 3.2749216556549072, + "learning_rate": 1.4224516199446915e-06, + "loss": 0.1151, + "step": 30582 + }, + { + "epoch": 83.33242506811989, + "grad_norm": 1.983525037765503, + "learning_rate": 1.4219979990512977e-06, + "loss": 0.0227, + "step": 30583 + }, + { + "epoch": 83.33514986376022, + "grad_norm": 2.9139275550842285, + "learning_rate": 1.4215444449631054e-06, + "loss": 0.0809, + "step": 30584 + }, + { + "epoch": 83.33787465940054, + "grad_norm": 2.6436755657196045, + "learning_rate": 1.4210909576836496e-06, + "loss": 0.054, + "step": 30585 + }, + { + "epoch": 83.34059945504087, + "grad_norm": 2.570117235183716, + "learning_rate": 1.4206375372164628e-06, + "loss": 0.0635, + "step": 30586 + }, + { + "epoch": 83.34332425068119, + "grad_norm": 2.180441379547119, + "learning_rate": 1.4201841835650755e-06, + "loss": 0.1727, + "step": 30587 + }, + { + "epoch": 83.34604904632153, + "grad_norm": 1.9770933389663696, + "learning_rate": 1.419730896733017e-06, + "loss": 0.0207, + "step": 30588 + }, + { + "epoch": 83.34877384196186, + "grad_norm": 2.7037570476531982, + "learning_rate": 1.419277676723816e-06, + "loss": 0.0652, + "step": 30589 + }, + { + "epoch": 83.35149863760218, + "grad_norm": 2.091167688369751, + "learning_rate": 1.418824523541007e-06, + "loss": 0.0382, + "step": 30590 + }, + { + "epoch": 83.35422343324251, + "grad_norm": 4.447286128997803, + "learning_rate": 1.4183714371881164e-06, + "loss": 0.095, + "step": 30591 + }, + { + "epoch": 83.35694822888283, + "grad_norm": 3.060070753097534, + "learning_rate": 1.4179184176686722e-06, + "loss": 0.1467, + "step": 30592 + }, + { + "epoch": 83.35967302452316, + "grad_norm": 2.0797278881073, + "learning_rate": 1.4174654649862007e-06, + "loss": 0.0241, + "step": 30593 + }, + { + "epoch": 83.3623978201635, + "grad_norm": 2.980470895767212, + "learning_rate": 1.4170125791442346e-06, + "loss": 0.0349, + "step": 30594 + }, + { + "epoch": 83.36512261580381, + "grad_norm": 2.5694875717163086, + "learning_rate": 1.4165597601462987e-06, + "loss": 0.0486, + "step": 30595 + }, + { + "epoch": 83.36784741144415, + "grad_norm": 5.260220050811768, + "learning_rate": 1.4161070079959193e-06, + "loss": 0.0368, + "step": 30596 + }, + { + "epoch": 83.37057220708446, + "grad_norm": 2.054333209991455, + "learning_rate": 1.4156543226966191e-06, + "loss": 0.0455, + "step": 30597 + }, + { + "epoch": 83.3732970027248, + "grad_norm": 2.686857223510742, + "learning_rate": 1.4152017042519295e-06, + "loss": 0.0733, + "step": 30598 + }, + { + "epoch": 83.37602179836512, + "grad_norm": 2.216090202331543, + "learning_rate": 1.4147491526653723e-06, + "loss": 0.0734, + "step": 30599 + }, + { + "epoch": 83.37874659400545, + "grad_norm": 1.8555707931518555, + "learning_rate": 1.4142966679404724e-06, + "loss": 0.0211, + "step": 30600 + }, + { + "epoch": 83.38147138964578, + "grad_norm": 3.099801778793335, + "learning_rate": 1.4138442500807524e-06, + "loss": 0.0465, + "step": 30601 + }, + { + "epoch": 83.3841961852861, + "grad_norm": 2.2599716186523438, + "learning_rate": 1.4133918990897366e-06, + "loss": 0.021, + "step": 30602 + }, + { + "epoch": 83.38692098092643, + "grad_norm": 3.633221387863159, + "learning_rate": 1.4129396149709496e-06, + "loss": 0.0861, + "step": 30603 + }, + { + "epoch": 83.38964577656675, + "grad_norm": 2.193885087966919, + "learning_rate": 1.412487397727914e-06, + "loss": 0.0466, + "step": 30604 + }, + { + "epoch": 83.39237057220708, + "grad_norm": 2.2453367710113525, + "learning_rate": 1.4120352473641497e-06, + "loss": 0.0618, + "step": 30605 + }, + { + "epoch": 83.39509536784742, + "grad_norm": 3.7001543045043945, + "learning_rate": 1.4115831638831756e-06, + "loss": 0.0586, + "step": 30606 + }, + { + "epoch": 83.39782016348774, + "grad_norm": 3.756469249725342, + "learning_rate": 1.411131147288518e-06, + "loss": 0.1001, + "step": 30607 + }, + { + "epoch": 83.40054495912807, + "grad_norm": 2.7054014205932617, + "learning_rate": 1.4106791975836941e-06, + "loss": 0.0302, + "step": 30608 + }, + { + "epoch": 83.40326975476839, + "grad_norm": 1.775532603263855, + "learning_rate": 1.4102273147722235e-06, + "loss": 0.02, + "step": 30609 + }, + { + "epoch": 83.40599455040872, + "grad_norm": 3.216789960861206, + "learning_rate": 1.4097754988576273e-06, + "loss": 0.029, + "step": 30610 + }, + { + "epoch": 83.40871934604904, + "grad_norm": 1.575819492340088, + "learning_rate": 1.4093237498434232e-06, + "loss": 0.0206, + "step": 30611 + }, + { + "epoch": 83.41144414168937, + "grad_norm": 1.5731652975082397, + "learning_rate": 1.408872067733128e-06, + "loss": 0.0312, + "step": 30612 + }, + { + "epoch": 83.4141689373297, + "grad_norm": 2.619858741760254, + "learning_rate": 1.4084204525302602e-06, + "loss": 0.0825, + "step": 30613 + }, + { + "epoch": 83.41689373297002, + "grad_norm": 2.8369081020355225, + "learning_rate": 1.4079689042383394e-06, + "loss": 0.0654, + "step": 30614 + }, + { + "epoch": 83.41961852861036, + "grad_norm": 2.1706619262695312, + "learning_rate": 1.407517422860879e-06, + "loss": 0.0266, + "step": 30615 + }, + { + "epoch": 83.42234332425068, + "grad_norm": 3.0266902446746826, + "learning_rate": 1.4070660084013977e-06, + "loss": 0.0541, + "step": 30616 + }, + { + "epoch": 83.42506811989101, + "grad_norm": 6.6772356033325195, + "learning_rate": 1.4066146608634068e-06, + "loss": 0.0365, + "step": 30617 + }, + { + "epoch": 83.42779291553134, + "grad_norm": 1.6007728576660156, + "learning_rate": 1.4061633802504237e-06, + "loss": 0.0336, + "step": 30618 + }, + { + "epoch": 83.43051771117166, + "grad_norm": 4.361444473266602, + "learning_rate": 1.4057121665659667e-06, + "loss": 0.0641, + "step": 30619 + }, + { + "epoch": 83.433242506812, + "grad_norm": 2.419548273086548, + "learning_rate": 1.4052610198135475e-06, + "loss": 0.0233, + "step": 30620 + }, + { + "epoch": 83.43596730245231, + "grad_norm": 3.443169593811035, + "learning_rate": 1.4048099399966774e-06, + "loss": 0.0995, + "step": 30621 + }, + { + "epoch": 83.43869209809264, + "grad_norm": 3.115429639816284, + "learning_rate": 1.4043589271188695e-06, + "loss": 0.0538, + "step": 30622 + }, + { + "epoch": 83.44141689373296, + "grad_norm": 3.2137451171875, + "learning_rate": 1.4039079811836398e-06, + "loss": 0.0373, + "step": 30623 + }, + { + "epoch": 83.4441416893733, + "grad_norm": 2.704097270965576, + "learning_rate": 1.4034571021944976e-06, + "loss": 0.1261, + "step": 30624 + }, + { + "epoch": 83.44686648501363, + "grad_norm": 3.3638358116149902, + "learning_rate": 1.4030062901549557e-06, + "loss": 0.0397, + "step": 30625 + }, + { + "epoch": 83.44959128065395, + "grad_norm": 1.66252863407135, + "learning_rate": 1.4025555450685213e-06, + "loss": 0.0215, + "step": 30626 + }, + { + "epoch": 83.45231607629428, + "grad_norm": 1.5898563861846924, + "learning_rate": 1.4021048669387094e-06, + "loss": 0.0215, + "step": 30627 + }, + { + "epoch": 83.4550408719346, + "grad_norm": 1.9060828685760498, + "learning_rate": 1.4016542557690282e-06, + "loss": 0.0272, + "step": 30628 + }, + { + "epoch": 83.45776566757493, + "grad_norm": 2.683668613433838, + "learning_rate": 1.4012037115629873e-06, + "loss": 0.0589, + "step": 30629 + }, + { + "epoch": 83.46049046321527, + "grad_norm": 3.511038303375244, + "learning_rate": 1.4007532343240936e-06, + "loss": 0.0573, + "step": 30630 + }, + { + "epoch": 83.46321525885558, + "grad_norm": 2.3716983795166016, + "learning_rate": 1.400302824055858e-06, + "loss": 0.0301, + "step": 30631 + }, + { + "epoch": 83.46594005449592, + "grad_norm": 2.2675628662109375, + "learning_rate": 1.3998524807617875e-06, + "loss": 0.0228, + "step": 30632 + }, + { + "epoch": 83.46866485013624, + "grad_norm": 2.15134596824646, + "learning_rate": 1.399402204445387e-06, + "loss": 0.0221, + "step": 30633 + }, + { + "epoch": 83.47138964577657, + "grad_norm": 2.639045476913452, + "learning_rate": 1.3989519951101682e-06, + "loss": 0.0328, + "step": 30634 + }, + { + "epoch": 83.47411444141689, + "grad_norm": 2.77884578704834, + "learning_rate": 1.3985018527596316e-06, + "loss": 0.0475, + "step": 30635 + }, + { + "epoch": 83.47683923705722, + "grad_norm": 1.6611262559890747, + "learning_rate": 1.398051777397288e-06, + "loss": 0.0355, + "step": 30636 + }, + { + "epoch": 83.47956403269755, + "grad_norm": 2.4296114444732666, + "learning_rate": 1.3976017690266397e-06, + "loss": 0.0592, + "step": 30637 + }, + { + "epoch": 83.48228882833787, + "grad_norm": 3.121490478515625, + "learning_rate": 1.3971518276511909e-06, + "loss": 0.0489, + "step": 30638 + }, + { + "epoch": 83.4850136239782, + "grad_norm": 3.141040325164795, + "learning_rate": 1.3967019532744475e-06, + "loss": 0.0381, + "step": 30639 + }, + { + "epoch": 83.48773841961852, + "grad_norm": 4.265635013580322, + "learning_rate": 1.3962521458999135e-06, + "loss": 0.0633, + "step": 30640 + }, + { + "epoch": 83.49046321525886, + "grad_norm": 2.9381966590881348, + "learning_rate": 1.3958024055310903e-06, + "loss": 0.0284, + "step": 30641 + }, + { + "epoch": 83.49318801089919, + "grad_norm": 4.230826377868652, + "learning_rate": 1.39535273217148e-06, + "loss": 0.1055, + "step": 30642 + }, + { + "epoch": 83.49591280653951, + "grad_norm": 2.1036412715911865, + "learning_rate": 1.3949031258245872e-06, + "loss": 0.0441, + "step": 30643 + }, + { + "epoch": 83.49863760217984, + "grad_norm": 2.635373115539551, + "learning_rate": 1.3944535864939112e-06, + "loss": 0.0543, + "step": 30644 + }, + { + "epoch": 83.50136239782016, + "grad_norm": 3.0548596382141113, + "learning_rate": 1.394004114182954e-06, + "loss": 0.1288, + "step": 30645 + }, + { + "epoch": 83.50408719346049, + "grad_norm": 3.0379130840301514, + "learning_rate": 1.393554708895214e-06, + "loss": 0.0715, + "step": 30646 + }, + { + "epoch": 83.50681198910081, + "grad_norm": 2.745727062225342, + "learning_rate": 1.3931053706341946e-06, + "loss": 0.0361, + "step": 30647 + }, + { + "epoch": 83.50953678474114, + "grad_norm": 3.432950019836426, + "learning_rate": 1.3926560994033945e-06, + "loss": 0.03, + "step": 30648 + }, + { + "epoch": 83.51226158038148, + "grad_norm": 1.986212134361267, + "learning_rate": 1.3922068952063107e-06, + "loss": 0.04, + "step": 30649 + }, + { + "epoch": 83.5149863760218, + "grad_norm": 2.554323673248291, + "learning_rate": 1.3917577580464414e-06, + "loss": 0.0786, + "step": 30650 + }, + { + "epoch": 83.51771117166213, + "grad_norm": 2.3508431911468506, + "learning_rate": 1.3913086879272874e-06, + "loss": 0.1057, + "step": 30651 + }, + { + "epoch": 83.52043596730245, + "grad_norm": 2.4980311393737793, + "learning_rate": 1.3908596848523436e-06, + "loss": 0.042, + "step": 30652 + }, + { + "epoch": 83.52316076294278, + "grad_norm": 2.53886342048645, + "learning_rate": 1.390410748825106e-06, + "loss": 0.0601, + "step": 30653 + }, + { + "epoch": 83.52588555858311, + "grad_norm": 1.843441367149353, + "learning_rate": 1.389961879849072e-06, + "loss": 0.0921, + "step": 30654 + }, + { + "epoch": 83.52861035422343, + "grad_norm": 2.445556640625, + "learning_rate": 1.3895130779277398e-06, + "loss": 0.0538, + "step": 30655 + }, + { + "epoch": 83.53133514986376, + "grad_norm": 3.4484446048736572, + "learning_rate": 1.3890643430646033e-06, + "loss": 0.0788, + "step": 30656 + }, + { + "epoch": 83.53405994550408, + "grad_norm": 1.5983630418777466, + "learning_rate": 1.3886156752631563e-06, + "loss": 0.1406, + "step": 30657 + }, + { + "epoch": 83.53678474114442, + "grad_norm": 3.125032901763916, + "learning_rate": 1.3881670745268904e-06, + "loss": 0.0841, + "step": 30658 + }, + { + "epoch": 83.53950953678473, + "grad_norm": 2.777785539627075, + "learning_rate": 1.3877185408593052e-06, + "loss": 0.035, + "step": 30659 + }, + { + "epoch": 83.54223433242507, + "grad_norm": 3.1854898929595947, + "learning_rate": 1.38727007426389e-06, + "loss": 0.0733, + "step": 30660 + }, + { + "epoch": 83.5449591280654, + "grad_norm": 3.2417075634002686, + "learning_rate": 1.3868216747441388e-06, + "loss": 0.0559, + "step": 30661 + }, + { + "epoch": 83.54768392370572, + "grad_norm": 2.797309160232544, + "learning_rate": 1.386373342303542e-06, + "loss": 0.0914, + "step": 30662 + }, + { + "epoch": 83.55040871934605, + "grad_norm": 2.2952725887298584, + "learning_rate": 1.3859250769455933e-06, + "loss": 0.043, + "step": 30663 + }, + { + "epoch": 83.55313351498637, + "grad_norm": 2.7266359329223633, + "learning_rate": 1.3854768786737826e-06, + "loss": 0.0312, + "step": 30664 + }, + { + "epoch": 83.5558583106267, + "grad_norm": 3.4587957859039307, + "learning_rate": 1.3850287474916013e-06, + "loss": 0.0401, + "step": 30665 + }, + { + "epoch": 83.55858310626704, + "grad_norm": 4.483211994171143, + "learning_rate": 1.3845806834025365e-06, + "loss": 0.0289, + "step": 30666 + }, + { + "epoch": 83.56130790190736, + "grad_norm": 2.459195852279663, + "learning_rate": 1.3841326864100823e-06, + "loss": 0.0427, + "step": 30667 + }, + { + "epoch": 83.56403269754769, + "grad_norm": 5.380830764770508, + "learning_rate": 1.3836847565177258e-06, + "loss": 0.0282, + "step": 30668 + }, + { + "epoch": 83.566757493188, + "grad_norm": 2.1368446350097656, + "learning_rate": 1.3832368937289543e-06, + "loss": 0.0287, + "step": 30669 + }, + { + "epoch": 83.56948228882834, + "grad_norm": 3.613755941390991, + "learning_rate": 1.3827890980472547e-06, + "loss": 0.0407, + "step": 30670 + }, + { + "epoch": 83.57220708446866, + "grad_norm": 3.5539443492889404, + "learning_rate": 1.3823413694761167e-06, + "loss": 0.0673, + "step": 30671 + }, + { + "epoch": 83.57493188010899, + "grad_norm": 2.5715603828430176, + "learning_rate": 1.3818937080190287e-06, + "loss": 0.0749, + "step": 30672 + }, + { + "epoch": 83.57765667574932, + "grad_norm": 2.368882894515991, + "learning_rate": 1.3814461136794755e-06, + "loss": 0.0874, + "step": 30673 + }, + { + "epoch": 83.58038147138964, + "grad_norm": 3.156682014465332, + "learning_rate": 1.3809985864609398e-06, + "loss": 0.0434, + "step": 30674 + }, + { + "epoch": 83.58310626702998, + "grad_norm": 3.6735572814941406, + "learning_rate": 1.3805511263669113e-06, + "loss": 0.1656, + "step": 30675 + }, + { + "epoch": 83.5858310626703, + "grad_norm": 2.4326329231262207, + "learning_rate": 1.3801037334008738e-06, + "loss": 0.0489, + "step": 30676 + }, + { + "epoch": 83.58855585831063, + "grad_norm": 2.5024240016937256, + "learning_rate": 1.379656407566311e-06, + "loss": 0.1442, + "step": 30677 + }, + { + "epoch": 83.59128065395096, + "grad_norm": 3.217705011367798, + "learning_rate": 1.3792091488667047e-06, + "loss": 0.038, + "step": 30678 + }, + { + "epoch": 83.59400544959128, + "grad_norm": 3.0005221366882324, + "learning_rate": 1.3787619573055421e-06, + "loss": 0.0558, + "step": 30679 + }, + { + "epoch": 83.59673024523161, + "grad_norm": 2.5085296630859375, + "learning_rate": 1.378314832886305e-06, + "loss": 0.039, + "step": 30680 + }, + { + "epoch": 83.59945504087193, + "grad_norm": 2.812469005584717, + "learning_rate": 1.3778677756124724e-06, + "loss": 0.0897, + "step": 30681 + }, + { + "epoch": 83.60217983651226, + "grad_norm": 2.7174370288848877, + "learning_rate": 1.3774207854875277e-06, + "loss": 0.1178, + "step": 30682 + }, + { + "epoch": 83.60490463215258, + "grad_norm": 2.182560682296753, + "learning_rate": 1.3769738625149532e-06, + "loss": 0.1622, + "step": 30683 + }, + { + "epoch": 83.60762942779292, + "grad_norm": 2.84898042678833, + "learning_rate": 1.3765270066982294e-06, + "loss": 0.0395, + "step": 30684 + }, + { + "epoch": 83.61035422343325, + "grad_norm": 2.567331075668335, + "learning_rate": 1.3760802180408362e-06, + "loss": 0.0294, + "step": 30685 + }, + { + "epoch": 83.61307901907357, + "grad_norm": 3.532907485961914, + "learning_rate": 1.3756334965462502e-06, + "loss": 0.0791, + "step": 30686 + }, + { + "epoch": 83.6158038147139, + "grad_norm": 3.5884735584259033, + "learning_rate": 1.3751868422179527e-06, + "loss": 0.048, + "step": 30687 + }, + { + "epoch": 83.61852861035422, + "grad_norm": 2.8066675662994385, + "learning_rate": 1.3747402550594246e-06, + "loss": 0.105, + "step": 30688 + }, + { + "epoch": 83.62125340599455, + "grad_norm": 4.59223747253418, + "learning_rate": 1.3742937350741414e-06, + "loss": 0.0326, + "step": 30689 + }, + { + "epoch": 83.62397820163488, + "grad_norm": 2.3158602714538574, + "learning_rate": 1.3738472822655824e-06, + "loss": 0.0263, + "step": 30690 + }, + { + "epoch": 83.6267029972752, + "grad_norm": 2.349701404571533, + "learning_rate": 1.3734008966372192e-06, + "loss": 0.0312, + "step": 30691 + }, + { + "epoch": 83.62942779291554, + "grad_norm": 2.4214534759521484, + "learning_rate": 1.3729545781925357e-06, + "loss": 0.0301, + "step": 30692 + }, + { + "epoch": 83.63215258855585, + "grad_norm": 2.4475653171539307, + "learning_rate": 1.3725083269350038e-06, + "loss": 0.0569, + "step": 30693 + }, + { + "epoch": 83.63487738419619, + "grad_norm": 4.429915904998779, + "learning_rate": 1.3720621428680991e-06, + "loss": 0.029, + "step": 30694 + }, + { + "epoch": 83.6376021798365, + "grad_norm": 3.721404552459717, + "learning_rate": 1.3716160259952948e-06, + "loss": 0.1161, + "step": 30695 + }, + { + "epoch": 83.64032697547684, + "grad_norm": 1.9863237142562866, + "learning_rate": 1.3711699763200692e-06, + "loss": 0.0211, + "step": 30696 + }, + { + "epoch": 83.64305177111717, + "grad_norm": 3.1300644874572754, + "learning_rate": 1.370723993845895e-06, + "loss": 0.2092, + "step": 30697 + }, + { + "epoch": 83.64577656675749, + "grad_norm": 5.223509311676025, + "learning_rate": 1.3702780785762415e-06, + "loss": 0.0372, + "step": 30698 + }, + { + "epoch": 83.64850136239782, + "grad_norm": 3.500175714492798, + "learning_rate": 1.3698322305145871e-06, + "loss": 0.0512, + "step": 30699 + }, + { + "epoch": 83.65122615803814, + "grad_norm": 2.1549646854400635, + "learning_rate": 1.3693864496644017e-06, + "loss": 0.0806, + "step": 30700 + }, + { + "epoch": 83.65395095367847, + "grad_norm": 2.5164310932159424, + "learning_rate": 1.3689407360291562e-06, + "loss": 0.0874, + "step": 30701 + }, + { + "epoch": 83.65667574931881, + "grad_norm": 2.9584224224090576, + "learning_rate": 1.3684950896123205e-06, + "loss": 0.223, + "step": 30702 + }, + { + "epoch": 83.65940054495913, + "grad_norm": 3.1741037368774414, + "learning_rate": 1.3680495104173697e-06, + "loss": 0.112, + "step": 30703 + }, + { + "epoch": 83.66212534059946, + "grad_norm": 3.3103814125061035, + "learning_rate": 1.3676039984477684e-06, + "loss": 0.045, + "step": 30704 + }, + { + "epoch": 83.66485013623978, + "grad_norm": 2.4003143310546875, + "learning_rate": 1.3671585537069931e-06, + "loss": 0.0453, + "step": 30705 + }, + { + "epoch": 83.66757493188011, + "grad_norm": 2.857621669769287, + "learning_rate": 1.3667131761985076e-06, + "loss": 0.0537, + "step": 30706 + }, + { + "epoch": 83.67029972752043, + "grad_norm": 2.950096845626831, + "learning_rate": 1.3662678659257811e-06, + "loss": 0.0477, + "step": 30707 + }, + { + "epoch": 83.67302452316076, + "grad_norm": 2.1988792419433594, + "learning_rate": 1.3658226228922844e-06, + "loss": 0.0796, + "step": 30708 + }, + { + "epoch": 83.6757493188011, + "grad_norm": 2.5007739067077637, + "learning_rate": 1.3653774471014825e-06, + "loss": 0.0622, + "step": 30709 + }, + { + "epoch": 83.67847411444141, + "grad_norm": 1.994951605796814, + "learning_rate": 1.3649323385568435e-06, + "loss": 0.0213, + "step": 30710 + }, + { + "epoch": 83.68119891008175, + "grad_norm": 2.182677745819092, + "learning_rate": 1.3644872972618316e-06, + "loss": 0.0238, + "step": 30711 + }, + { + "epoch": 83.68392370572207, + "grad_norm": 1.9833247661590576, + "learning_rate": 1.3640423232199174e-06, + "loss": 0.1247, + "step": 30712 + }, + { + "epoch": 83.6866485013624, + "grad_norm": 5.841768264770508, + "learning_rate": 1.3635974164345634e-06, + "loss": 0.0509, + "step": 30713 + }, + { + "epoch": 83.68937329700273, + "grad_norm": 2.157848834991455, + "learning_rate": 1.3631525769092336e-06, + "loss": 0.0432, + "step": 30714 + }, + { + "epoch": 83.69209809264305, + "grad_norm": 3.3198623657226562, + "learning_rate": 1.362707804647393e-06, + "loss": 0.1129, + "step": 30715 + }, + { + "epoch": 83.69482288828338, + "grad_norm": 7.962392330169678, + "learning_rate": 1.3622630996525067e-06, + "loss": 0.1005, + "step": 30716 + }, + { + "epoch": 83.6975476839237, + "grad_norm": 2.285831928253174, + "learning_rate": 1.3618184619280383e-06, + "loss": 0.141, + "step": 30717 + }, + { + "epoch": 83.70027247956403, + "grad_norm": 3.1766984462738037, + "learning_rate": 1.3613738914774477e-06, + "loss": 0.0723, + "step": 30718 + }, + { + "epoch": 83.70299727520435, + "grad_norm": 2.1154513359069824, + "learning_rate": 1.3609293883042007e-06, + "loss": 0.0608, + "step": 30719 + }, + { + "epoch": 83.70572207084469, + "grad_norm": 2.6665258407592773, + "learning_rate": 1.360484952411758e-06, + "loss": 0.101, + "step": 30720 + }, + { + "epoch": 83.70844686648502, + "grad_norm": 2.3414156436920166, + "learning_rate": 1.3600405838035779e-06, + "loss": 0.0314, + "step": 30721 + }, + { + "epoch": 83.71117166212534, + "grad_norm": 2.286808729171753, + "learning_rate": 1.3595962824831255e-06, + "loss": 0.0941, + "step": 30722 + }, + { + "epoch": 83.71389645776567, + "grad_norm": 1.7137775421142578, + "learning_rate": 1.3591520484538578e-06, + "loss": 0.0461, + "step": 30723 + }, + { + "epoch": 83.71662125340599, + "grad_norm": 2.542334794998169, + "learning_rate": 1.3587078817192378e-06, + "loss": 0.0527, + "step": 30724 + }, + { + "epoch": 83.71934604904632, + "grad_norm": 2.442690372467041, + "learning_rate": 1.3582637822827228e-06, + "loss": 0.0823, + "step": 30725 + }, + { + "epoch": 83.72207084468666, + "grad_norm": 1.598746657371521, + "learning_rate": 1.3578197501477708e-06, + "loss": 0.0205, + "step": 30726 + }, + { + "epoch": 83.72479564032697, + "grad_norm": 4.047211647033691, + "learning_rate": 1.3573757853178392e-06, + "loss": 0.1028, + "step": 30727 + }, + { + "epoch": 83.7275204359673, + "grad_norm": 2.4902350902557373, + "learning_rate": 1.3569318877963878e-06, + "loss": 0.1635, + "step": 30728 + }, + { + "epoch": 83.73024523160763, + "grad_norm": 2.145904541015625, + "learning_rate": 1.3564880575868734e-06, + "loss": 0.0409, + "step": 30729 + }, + { + "epoch": 83.73297002724796, + "grad_norm": 2.8706185817718506, + "learning_rate": 1.3560442946927522e-06, + "loss": 0.0326, + "step": 30730 + }, + { + "epoch": 83.73569482288828, + "grad_norm": 3.4135332107543945, + "learning_rate": 1.355600599117477e-06, + "loss": 0.0359, + "step": 30731 + }, + { + "epoch": 83.73841961852861, + "grad_norm": 3.3279924392700195, + "learning_rate": 1.3551569708645084e-06, + "loss": 0.1347, + "step": 30732 + }, + { + "epoch": 83.74114441416894, + "grad_norm": 3.154670000076294, + "learning_rate": 1.3547134099372993e-06, + "loss": 0.0558, + "step": 30733 + }, + { + "epoch": 83.74386920980926, + "grad_norm": 2.459663152694702, + "learning_rate": 1.3542699163393036e-06, + "loss": 0.0403, + "step": 30734 + }, + { + "epoch": 83.7465940054496, + "grad_norm": 2.3531036376953125, + "learning_rate": 1.353826490073974e-06, + "loss": 0.0515, + "step": 30735 + }, + { + "epoch": 83.74931880108991, + "grad_norm": 2.820645809173584, + "learning_rate": 1.3533831311447665e-06, + "loss": 0.0406, + "step": 30736 + }, + { + "epoch": 83.75204359673025, + "grad_norm": 2.0220279693603516, + "learning_rate": 1.3529398395551342e-06, + "loss": 0.0183, + "step": 30737 + }, + { + "epoch": 83.75476839237058, + "grad_norm": 3.94909930229187, + "learning_rate": 1.3524966153085272e-06, + "loss": 0.0858, + "step": 30738 + }, + { + "epoch": 83.7574931880109, + "grad_norm": 2.462339162826538, + "learning_rate": 1.3520534584083932e-06, + "loss": 0.0272, + "step": 30739 + }, + { + "epoch": 83.76021798365123, + "grad_norm": 2.521505832672119, + "learning_rate": 1.351610368858194e-06, + "loss": 0.0499, + "step": 30740 + }, + { + "epoch": 83.76294277929155, + "grad_norm": 3.2271714210510254, + "learning_rate": 1.351167346661375e-06, + "loss": 0.0789, + "step": 30741 + }, + { + "epoch": 83.76566757493188, + "grad_norm": 3.7426722049713135, + "learning_rate": 1.3507243918213864e-06, + "loss": 0.0493, + "step": 30742 + }, + { + "epoch": 83.7683923705722, + "grad_norm": 2.64389967918396, + "learning_rate": 1.3502815043416751e-06, + "loss": 0.1364, + "step": 30743 + }, + { + "epoch": 83.77111716621253, + "grad_norm": 2.8800723552703857, + "learning_rate": 1.349838684225695e-06, + "loss": 0.1093, + "step": 30744 + }, + { + "epoch": 83.77384196185287, + "grad_norm": 3.1709158420562744, + "learning_rate": 1.3493959314768934e-06, + "loss": 0.1316, + "step": 30745 + }, + { + "epoch": 83.77656675749319, + "grad_norm": 2.8967678546905518, + "learning_rate": 1.3489532460987176e-06, + "loss": 0.0496, + "step": 30746 + }, + { + "epoch": 83.77929155313352, + "grad_norm": 1.6467289924621582, + "learning_rate": 1.3485106280946137e-06, + "loss": 0.0194, + "step": 30747 + }, + { + "epoch": 83.78201634877384, + "grad_norm": 2.877261161804199, + "learning_rate": 1.348068077468032e-06, + "loss": 0.0649, + "step": 30748 + }, + { + "epoch": 83.78474114441417, + "grad_norm": 2.013784170150757, + "learning_rate": 1.3476255942224193e-06, + "loss": 0.1587, + "step": 30749 + }, + { + "epoch": 83.7874659400545, + "grad_norm": 2.0299766063690186, + "learning_rate": 1.3471831783612189e-06, + "loss": 0.0246, + "step": 30750 + }, + { + "epoch": 83.79019073569482, + "grad_norm": 1.8846317529678345, + "learning_rate": 1.3467408298878747e-06, + "loss": 0.0325, + "step": 30751 + }, + { + "epoch": 83.79291553133515, + "grad_norm": 2.4729061126708984, + "learning_rate": 1.3462985488058366e-06, + "loss": 0.115, + "step": 30752 + }, + { + "epoch": 83.79564032697547, + "grad_norm": 3.446141481399536, + "learning_rate": 1.3458563351185482e-06, + "loss": 0.0824, + "step": 30753 + }, + { + "epoch": 83.7983651226158, + "grad_norm": 3.2303617000579834, + "learning_rate": 1.3454141888294514e-06, + "loss": 0.0343, + "step": 30754 + }, + { + "epoch": 83.80108991825612, + "grad_norm": 2.0372912883758545, + "learning_rate": 1.3449721099419876e-06, + "loss": 0.026, + "step": 30755 + }, + { + "epoch": 83.80381471389646, + "grad_norm": 2.161118507385254, + "learning_rate": 1.3445300984596032e-06, + "loss": 0.0423, + "step": 30756 + }, + { + "epoch": 83.80653950953679, + "grad_norm": 4.139506816864014, + "learning_rate": 1.344088154385741e-06, + "loss": 0.0711, + "step": 30757 + }, + { + "epoch": 83.80926430517711, + "grad_norm": 2.070422649383545, + "learning_rate": 1.3436462777238424e-06, + "loss": 0.0359, + "step": 30758 + }, + { + "epoch": 83.81198910081744, + "grad_norm": 3.227454900741577, + "learning_rate": 1.343204468477346e-06, + "loss": 0.1504, + "step": 30759 + }, + { + "epoch": 83.81471389645776, + "grad_norm": 2.8671176433563232, + "learning_rate": 1.3427627266496967e-06, + "loss": 0.0839, + "step": 30760 + }, + { + "epoch": 83.8174386920981, + "grad_norm": 1.9733912944793701, + "learning_rate": 1.342321052244333e-06, + "loss": 0.029, + "step": 30761 + }, + { + "epoch": 83.82016348773843, + "grad_norm": 3.2461791038513184, + "learning_rate": 1.3418794452646932e-06, + "loss": 0.0461, + "step": 30762 + }, + { + "epoch": 83.82288828337875, + "grad_norm": 2.115133285522461, + "learning_rate": 1.3414379057142158e-06, + "loss": 0.1248, + "step": 30763 + }, + { + "epoch": 83.82561307901908, + "grad_norm": 1.7545677423477173, + "learning_rate": 1.3409964335963443e-06, + "loss": 0.0162, + "step": 30764 + }, + { + "epoch": 83.8283378746594, + "grad_norm": 2.0505893230438232, + "learning_rate": 1.3405550289145131e-06, + "loss": 0.0707, + "step": 30765 + }, + { + "epoch": 83.83106267029973, + "grad_norm": 2.327916383743286, + "learning_rate": 1.3401136916721614e-06, + "loss": 0.0438, + "step": 30766 + }, + { + "epoch": 83.83378746594005, + "grad_norm": 2.9162378311157227, + "learning_rate": 1.339672421872722e-06, + "loss": 0.0292, + "step": 30767 + }, + { + "epoch": 83.83651226158038, + "grad_norm": 2.5131583213806152, + "learning_rate": 1.339231219519639e-06, + "loss": 0.1061, + "step": 30768 + }, + { + "epoch": 83.83923705722071, + "grad_norm": 3.5404741764068604, + "learning_rate": 1.3387900846163427e-06, + "loss": 0.1621, + "step": 30769 + }, + { + "epoch": 83.84196185286103, + "grad_norm": 2.8070809841156006, + "learning_rate": 1.3383490171662717e-06, + "loss": 0.062, + "step": 30770 + }, + { + "epoch": 83.84468664850137, + "grad_norm": 2.572690486907959, + "learning_rate": 1.3379080171728575e-06, + "loss": 0.0701, + "step": 30771 + }, + { + "epoch": 83.84741144414168, + "grad_norm": 4.501012325286865, + "learning_rate": 1.3374670846395388e-06, + "loss": 0.0436, + "step": 30772 + }, + { + "epoch": 83.85013623978202, + "grad_norm": 3.021658182144165, + "learning_rate": 1.3370262195697449e-06, + "loss": 0.0804, + "step": 30773 + }, + { + "epoch": 83.85286103542235, + "grad_norm": 2.2155721187591553, + "learning_rate": 1.336585421966915e-06, + "loss": 0.028, + "step": 30774 + }, + { + "epoch": 83.85558583106267, + "grad_norm": 2.8366146087646484, + "learning_rate": 1.3361446918344789e-06, + "loss": 0.041, + "step": 30775 + }, + { + "epoch": 83.858310626703, + "grad_norm": 3.742677688598633, + "learning_rate": 1.3357040291758661e-06, + "loss": 0.0359, + "step": 30776 + }, + { + "epoch": 83.86103542234332, + "grad_norm": 3.1085548400878906, + "learning_rate": 1.3352634339945147e-06, + "loss": 0.1177, + "step": 30777 + }, + { + "epoch": 83.86376021798365, + "grad_norm": 2.6871159076690674, + "learning_rate": 1.3348229062938522e-06, + "loss": 0.029, + "step": 30778 + }, + { + "epoch": 83.86648501362397, + "grad_norm": 2.5326735973358154, + "learning_rate": 1.3343824460773103e-06, + "loss": 0.1137, + "step": 30779 + }, + { + "epoch": 83.8692098092643, + "grad_norm": 3.30340313911438, + "learning_rate": 1.3339420533483171e-06, + "loss": 0.047, + "step": 30780 + }, + { + "epoch": 83.87193460490464, + "grad_norm": 3.567577600479126, + "learning_rate": 1.3335017281103059e-06, + "loss": 0.1472, + "step": 30781 + }, + { + "epoch": 83.87465940054496, + "grad_norm": 1.5896742343902588, + "learning_rate": 1.3330614703667045e-06, + "loss": 0.0453, + "step": 30782 + }, + { + "epoch": 83.87738419618529, + "grad_norm": 2.422525644302368, + "learning_rate": 1.3326212801209392e-06, + "loss": 0.0347, + "step": 30783 + }, + { + "epoch": 83.88010899182561, + "grad_norm": 2.526461362838745, + "learning_rate": 1.332181157376442e-06, + "loss": 0.0426, + "step": 30784 + }, + { + "epoch": 83.88283378746594, + "grad_norm": 2.8503379821777344, + "learning_rate": 1.33174110213664e-06, + "loss": 0.0658, + "step": 30785 + }, + { + "epoch": 83.88555858310627, + "grad_norm": 2.456122636795044, + "learning_rate": 1.3313011144049593e-06, + "loss": 0.0412, + "step": 30786 + }, + { + "epoch": 83.88828337874659, + "grad_norm": 1.6854655742645264, + "learning_rate": 1.3308611941848237e-06, + "loss": 0.0227, + "step": 30787 + }, + { + "epoch": 83.89100817438693, + "grad_norm": 2.3722498416900635, + "learning_rate": 1.330421341479664e-06, + "loss": 0.0312, + "step": 30788 + }, + { + "epoch": 83.89373297002724, + "grad_norm": 2.219261646270752, + "learning_rate": 1.3299815562929052e-06, + "loss": 0.0359, + "step": 30789 + }, + { + "epoch": 83.89645776566758, + "grad_norm": 3.1999733448028564, + "learning_rate": 1.3295418386279679e-06, + "loss": 0.0357, + "step": 30790 + }, + { + "epoch": 83.8991825613079, + "grad_norm": 2.2349696159362793, + "learning_rate": 1.3291021884882815e-06, + "loss": 0.0189, + "step": 30791 + }, + { + "epoch": 83.90190735694823, + "grad_norm": 4.736440658569336, + "learning_rate": 1.3286626058772668e-06, + "loss": 0.0338, + "step": 30792 + }, + { + "epoch": 83.90463215258856, + "grad_norm": 2.3881900310516357, + "learning_rate": 1.3282230907983507e-06, + "loss": 0.1011, + "step": 30793 + }, + { + "epoch": 83.90735694822888, + "grad_norm": 2.436798095703125, + "learning_rate": 1.327783643254954e-06, + "loss": 0.1332, + "step": 30794 + }, + { + "epoch": 83.91008174386921, + "grad_norm": 3.1069788932800293, + "learning_rate": 1.3273442632504985e-06, + "loss": 0.0848, + "step": 30795 + }, + { + "epoch": 83.91280653950953, + "grad_norm": 2.8002724647521973, + "learning_rate": 1.3269049507884057e-06, + "loss": 0.1597, + "step": 30796 + }, + { + "epoch": 83.91553133514986, + "grad_norm": 4.678211212158203, + "learning_rate": 1.3264657058720998e-06, + "loss": 0.1286, + "step": 30797 + }, + { + "epoch": 83.9182561307902, + "grad_norm": 3.485680103302002, + "learning_rate": 1.326026528504999e-06, + "loss": 0.1663, + "step": 30798 + }, + { + "epoch": 83.92098092643052, + "grad_norm": 2.8237295150756836, + "learning_rate": 1.325587418690525e-06, + "loss": 0.124, + "step": 30799 + }, + { + "epoch": 83.92370572207085, + "grad_norm": 2.188760995864868, + "learning_rate": 1.325148376432095e-06, + "loss": 0.0598, + "step": 30800 + }, + { + "epoch": 83.92643051771117, + "grad_norm": 2.43650221824646, + "learning_rate": 1.324709401733133e-06, + "loss": 0.028, + "step": 30801 + }, + { + "epoch": 83.9291553133515, + "grad_norm": 1.6160179376602173, + "learning_rate": 1.3242704945970541e-06, + "loss": 0.0201, + "step": 30802 + }, + { + "epoch": 83.93188010899182, + "grad_norm": 3.291584014892578, + "learning_rate": 1.3238316550272767e-06, + "loss": 0.0403, + "step": 30803 + }, + { + "epoch": 83.93460490463215, + "grad_norm": 3.426374673843384, + "learning_rate": 1.323392883027218e-06, + "loss": 0.0413, + "step": 30804 + }, + { + "epoch": 83.93732970027249, + "grad_norm": 4.177335262298584, + "learning_rate": 1.3229541786002987e-06, + "loss": 0.0972, + "step": 30805 + }, + { + "epoch": 83.9400544959128, + "grad_norm": 3.023916006088257, + "learning_rate": 1.3225155417499325e-06, + "loss": 0.1318, + "step": 30806 + }, + { + "epoch": 83.94277929155314, + "grad_norm": 2.683013916015625, + "learning_rate": 1.3220769724795334e-06, + "loss": 0.0687, + "step": 30807 + }, + { + "epoch": 83.94550408719346, + "grad_norm": 3.029341697692871, + "learning_rate": 1.32163847079252e-06, + "loss": 0.1477, + "step": 30808 + }, + { + "epoch": 83.94822888283379, + "grad_norm": 2.1001205444335938, + "learning_rate": 1.3212000366923095e-06, + "loss": 0.0492, + "step": 30809 + }, + { + "epoch": 83.95095367847412, + "grad_norm": 1.5391870737075806, + "learning_rate": 1.3207616701823135e-06, + "loss": 0.0199, + "step": 30810 + }, + { + "epoch": 83.95367847411444, + "grad_norm": 2.2881364822387695, + "learning_rate": 1.3203233712659457e-06, + "loss": 0.0889, + "step": 30811 + }, + { + "epoch": 83.95640326975477, + "grad_norm": 3.243116855621338, + "learning_rate": 1.3198851399466184e-06, + "loss": 0.0865, + "step": 30812 + }, + { + "epoch": 83.95912806539509, + "grad_norm": 3.009913206100464, + "learning_rate": 1.3194469762277485e-06, + "loss": 0.0822, + "step": 30813 + }, + { + "epoch": 83.96185286103542, + "grad_norm": 4.149927616119385, + "learning_rate": 1.3190088801127454e-06, + "loss": 0.0555, + "step": 30814 + }, + { + "epoch": 83.96457765667574, + "grad_norm": 1.8183202743530273, + "learning_rate": 1.3185708516050233e-06, + "loss": 0.025, + "step": 30815 + }, + { + "epoch": 83.96730245231608, + "grad_norm": 2.282015800476074, + "learning_rate": 1.3181328907079883e-06, + "loss": 0.0359, + "step": 30816 + }, + { + "epoch": 83.97002724795641, + "grad_norm": 1.651680827140808, + "learning_rate": 1.3176949974250575e-06, + "loss": 0.0199, + "step": 30817 + }, + { + "epoch": 83.97275204359673, + "grad_norm": 3.44093656539917, + "learning_rate": 1.3172571717596393e-06, + "loss": 0.0732, + "step": 30818 + }, + { + "epoch": 83.97547683923706, + "grad_norm": 2.1605823040008545, + "learning_rate": 1.3168194137151423e-06, + "loss": 0.026, + "step": 30819 + }, + { + "epoch": 83.97820163487738, + "grad_norm": 2.1238672733306885, + "learning_rate": 1.3163817232949738e-06, + "loss": 0.0295, + "step": 30820 + }, + { + "epoch": 83.98092643051771, + "grad_norm": 2.07331919670105, + "learning_rate": 1.3159441005025475e-06, + "loss": 0.0894, + "step": 30821 + }, + { + "epoch": 83.98365122615803, + "grad_norm": 3.058595895767212, + "learning_rate": 1.3155065453412696e-06, + "loss": 0.1239, + "step": 30822 + }, + { + "epoch": 83.98637602179836, + "grad_norm": 5.056929588317871, + "learning_rate": 1.3150690578145465e-06, + "loss": 0.1538, + "step": 30823 + }, + { + "epoch": 83.9891008174387, + "grad_norm": 1.865096092224121, + "learning_rate": 1.314631637925784e-06, + "loss": 0.0318, + "step": 30824 + }, + { + "epoch": 83.99182561307902, + "grad_norm": 2.403432607650757, + "learning_rate": 1.3141942856783908e-06, + "loss": 0.052, + "step": 30825 + }, + { + "epoch": 83.99455040871935, + "grad_norm": 2.6325230598449707, + "learning_rate": 1.313757001075775e-06, + "loss": 0.1049, + "step": 30826 + }, + { + "epoch": 83.99727520435967, + "grad_norm": 1.7367075681686401, + "learning_rate": 1.3133197841213396e-06, + "loss": 0.1423, + "step": 30827 + }, + { + "epoch": 84.0, + "grad_norm": 2.738262414932251, + "learning_rate": 1.3128826348184886e-06, + "loss": 0.0675, + "step": 30828 + }, + { + "epoch": 84.00272479564033, + "grad_norm": 2.9976625442504883, + "learning_rate": 1.3124455531706304e-06, + "loss": 0.075, + "step": 30829 + }, + { + "epoch": 84.00544959128065, + "grad_norm": 11.635932922363281, + "learning_rate": 1.3120085391811666e-06, + "loss": 0.0366, + "step": 30830 + }, + { + "epoch": 84.00817438692098, + "grad_norm": 2.359337568283081, + "learning_rate": 1.3115715928535e-06, + "loss": 0.025, + "step": 30831 + }, + { + "epoch": 84.0108991825613, + "grad_norm": 1.7224256992340088, + "learning_rate": 1.3111347141910324e-06, + "loss": 0.0272, + "step": 30832 + }, + { + "epoch": 84.01362397820164, + "grad_norm": 2.0104165077209473, + "learning_rate": 1.3106979031971701e-06, + "loss": 0.0425, + "step": 30833 + }, + { + "epoch": 84.01634877384195, + "grad_norm": 3.3771467208862305, + "learning_rate": 1.3102611598753135e-06, + "loss": 0.1773, + "step": 30834 + }, + { + "epoch": 84.01907356948229, + "grad_norm": 2.174729108810425, + "learning_rate": 1.3098244842288622e-06, + "loss": 0.0293, + "step": 30835 + }, + { + "epoch": 84.02179836512262, + "grad_norm": 3.263211965560913, + "learning_rate": 1.3093878762612167e-06, + "loss": 0.0771, + "step": 30836 + }, + { + "epoch": 84.02452316076294, + "grad_norm": 2.6361441612243652, + "learning_rate": 1.308951335975781e-06, + "loss": 0.0822, + "step": 30837 + }, + { + "epoch": 84.02724795640327, + "grad_norm": 4.018730640411377, + "learning_rate": 1.3085148633759525e-06, + "loss": 0.1253, + "step": 30838 + }, + { + "epoch": 84.02997275204359, + "grad_norm": 2.339142084121704, + "learning_rate": 1.3080784584651308e-06, + "loss": 0.0258, + "step": 30839 + }, + { + "epoch": 84.03269754768392, + "grad_norm": 2.0447726249694824, + "learning_rate": 1.3076421212467117e-06, + "loss": 0.0882, + "step": 30840 + }, + { + "epoch": 84.03542234332426, + "grad_norm": 2.7352120876312256, + "learning_rate": 1.307205851724097e-06, + "loss": 0.0681, + "step": 30841 + }, + { + "epoch": 84.03814713896458, + "grad_norm": 2.458771228790283, + "learning_rate": 1.3067696499006832e-06, + "loss": 0.0378, + "step": 30842 + }, + { + "epoch": 84.04087193460491, + "grad_norm": 2.5709726810455322, + "learning_rate": 1.3063335157798685e-06, + "loss": 0.0618, + "step": 30843 + }, + { + "epoch": 84.04359673024523, + "grad_norm": 3.4718542098999023, + "learning_rate": 1.305897449365049e-06, + "loss": 0.0762, + "step": 30844 + }, + { + "epoch": 84.04632152588556, + "grad_norm": 2.1422181129455566, + "learning_rate": 1.3054614506596186e-06, + "loss": 0.0276, + "step": 30845 + }, + { + "epoch": 84.04904632152588, + "grad_norm": 1.9626917839050293, + "learning_rate": 1.305025519666976e-06, + "loss": 0.0225, + "step": 30846 + }, + { + "epoch": 84.05177111716621, + "grad_norm": 2.641353130340576, + "learning_rate": 1.3045896563905147e-06, + "loss": 0.1121, + "step": 30847 + }, + { + "epoch": 84.05449591280654, + "grad_norm": 3.349381923675537, + "learning_rate": 1.3041538608336279e-06, + "loss": 0.0983, + "step": 30848 + }, + { + "epoch": 84.05722070844686, + "grad_norm": 9.3013334274292, + "learning_rate": 1.3037181329997128e-06, + "loss": 0.1697, + "step": 30849 + }, + { + "epoch": 84.0599455040872, + "grad_norm": 2.1191818714141846, + "learning_rate": 1.3032824728921612e-06, + "loss": 0.0515, + "step": 30850 + }, + { + "epoch": 84.06267029972751, + "grad_norm": 2.3567941188812256, + "learning_rate": 1.3028468805143657e-06, + "loss": 0.075, + "step": 30851 + }, + { + "epoch": 84.06539509536785, + "grad_norm": 4.8907928466796875, + "learning_rate": 1.302411355869716e-06, + "loss": 0.0441, + "step": 30852 + }, + { + "epoch": 84.06811989100818, + "grad_norm": 4.172059059143066, + "learning_rate": 1.3019758989616094e-06, + "loss": 0.1561, + "step": 30853 + }, + { + "epoch": 84.0708446866485, + "grad_norm": 2.6362855434417725, + "learning_rate": 1.3015405097934342e-06, + "loss": 0.0486, + "step": 30854 + }, + { + "epoch": 84.07356948228883, + "grad_norm": 2.9769845008850098, + "learning_rate": 1.301105188368582e-06, + "loss": 0.0565, + "step": 30855 + }, + { + "epoch": 84.07629427792915, + "grad_norm": 3.011777639389038, + "learning_rate": 1.3006699346904406e-06, + "loss": 0.074, + "step": 30856 + }, + { + "epoch": 84.07901907356948, + "grad_norm": 3.191282272338867, + "learning_rate": 1.3002347487624035e-06, + "loss": 0.146, + "step": 30857 + }, + { + "epoch": 84.0817438692098, + "grad_norm": 2.3934123516082764, + "learning_rate": 1.299799630587858e-06, + "loss": 0.0353, + "step": 30858 + }, + { + "epoch": 84.08446866485014, + "grad_norm": 2.757439374923706, + "learning_rate": 1.2993645801701914e-06, + "loss": 0.0457, + "step": 30859 + }, + { + "epoch": 84.08719346049047, + "grad_norm": 2.566817283630371, + "learning_rate": 1.2989295975127957e-06, + "loss": 0.0434, + "step": 30860 + }, + { + "epoch": 84.08991825613079, + "grad_norm": 2.684659481048584, + "learning_rate": 1.2984946826190537e-06, + "loss": 0.0312, + "step": 30861 + }, + { + "epoch": 84.09264305177112, + "grad_norm": 2.3274450302124023, + "learning_rate": 1.2980598354923567e-06, + "loss": 0.124, + "step": 30862 + }, + { + "epoch": 84.09536784741144, + "grad_norm": 1.5184946060180664, + "learning_rate": 1.2976250561360904e-06, + "loss": 0.0163, + "step": 30863 + }, + { + "epoch": 84.09809264305177, + "grad_norm": 4.458086013793945, + "learning_rate": 1.2971903445536393e-06, + "loss": 0.0395, + "step": 30864 + }, + { + "epoch": 84.1008174386921, + "grad_norm": 3.278067111968994, + "learning_rate": 1.2967557007483888e-06, + "loss": 0.0714, + "step": 30865 + }, + { + "epoch": 84.10354223433242, + "grad_norm": 6.933575630187988, + "learning_rate": 1.296321124723726e-06, + "loss": 0.1478, + "step": 30866 + }, + { + "epoch": 84.10626702997276, + "grad_norm": 1.8300024271011353, + "learning_rate": 1.2958866164830342e-06, + "loss": 0.0407, + "step": 30867 + }, + { + "epoch": 84.10899182561307, + "grad_norm": 1.7332144975662231, + "learning_rate": 1.295452176029698e-06, + "loss": 0.026, + "step": 30868 + }, + { + "epoch": 84.11171662125341, + "grad_norm": 2.7168946266174316, + "learning_rate": 1.2950178033670969e-06, + "loss": 0.0295, + "step": 30869 + }, + { + "epoch": 84.11444141689373, + "grad_norm": 3.1485800743103027, + "learning_rate": 1.2945834984986194e-06, + "loss": 0.0709, + "step": 30870 + }, + { + "epoch": 84.11716621253406, + "grad_norm": 2.4771053791046143, + "learning_rate": 1.2941492614276463e-06, + "loss": 0.0236, + "step": 30871 + }, + { + "epoch": 84.11989100817439, + "grad_norm": 2.1699888706207275, + "learning_rate": 1.2937150921575548e-06, + "loss": 0.0328, + "step": 30872 + }, + { + "epoch": 84.12261580381471, + "grad_norm": 2.5949923992156982, + "learning_rate": 1.293280990691733e-06, + "loss": 0.0341, + "step": 30873 + }, + { + "epoch": 84.12534059945504, + "grad_norm": 4.152580261230469, + "learning_rate": 1.292846957033559e-06, + "loss": 0.0759, + "step": 30874 + }, + { + "epoch": 84.12806539509536, + "grad_norm": 1.6484575271606445, + "learning_rate": 1.2924129911864126e-06, + "loss": 0.02, + "step": 30875 + }, + { + "epoch": 84.1307901907357, + "grad_norm": 8.59929084777832, + "learning_rate": 1.2919790931536714e-06, + "loss": 0.1513, + "step": 30876 + }, + { + "epoch": 84.13351498637603, + "grad_norm": 2.347327709197998, + "learning_rate": 1.291545262938716e-06, + "loss": 0.0391, + "step": 30877 + }, + { + "epoch": 84.13623978201635, + "grad_norm": 2.467940330505371, + "learning_rate": 1.291111500544928e-06, + "loss": 0.1548, + "step": 30878 + }, + { + "epoch": 84.13896457765668, + "grad_norm": 3.4825150966644287, + "learning_rate": 1.2906778059756842e-06, + "loss": 0.107, + "step": 30879 + }, + { + "epoch": 84.141689373297, + "grad_norm": 2.71108078956604, + "learning_rate": 1.2902441792343611e-06, + "loss": 0.0523, + "step": 30880 + }, + { + "epoch": 84.14441416893733, + "grad_norm": 3.5202860832214355, + "learning_rate": 1.2898106203243343e-06, + "loss": 0.1405, + "step": 30881 + }, + { + "epoch": 84.14713896457765, + "grad_norm": 2.7637648582458496, + "learning_rate": 1.2893771292489833e-06, + "loss": 0.1779, + "step": 30882 + }, + { + "epoch": 84.14986376021798, + "grad_norm": 2.0411412715911865, + "learning_rate": 1.2889437060116827e-06, + "loss": 0.0222, + "step": 30883 + }, + { + "epoch": 84.15258855585832, + "grad_norm": 2.349391222000122, + "learning_rate": 1.2885103506158091e-06, + "loss": 0.0362, + "step": 30884 + }, + { + "epoch": 84.15531335149863, + "grad_norm": 2.401488780975342, + "learning_rate": 1.2880770630647344e-06, + "loss": 0.0329, + "step": 30885 + }, + { + "epoch": 84.15803814713897, + "grad_norm": 3.2894418239593506, + "learning_rate": 1.2876438433618365e-06, + "loss": 0.0998, + "step": 30886 + }, + { + "epoch": 84.16076294277929, + "grad_norm": 3.3366899490356445, + "learning_rate": 1.2872106915104876e-06, + "loss": 0.1908, + "step": 30887 + }, + { + "epoch": 84.16348773841962, + "grad_norm": 2.944432497024536, + "learning_rate": 1.2867776075140625e-06, + "loss": 0.0735, + "step": 30888 + }, + { + "epoch": 84.16621253405995, + "grad_norm": 4.728024482727051, + "learning_rate": 1.2863445913759299e-06, + "loss": 0.0296, + "step": 30889 + }, + { + "epoch": 84.16893732970027, + "grad_norm": 2.4820241928100586, + "learning_rate": 1.2859116430994677e-06, + "loss": 0.0621, + "step": 30890 + }, + { + "epoch": 84.1716621253406, + "grad_norm": 1.9522933959960938, + "learning_rate": 1.285478762688046e-06, + "loss": 0.0211, + "step": 30891 + }, + { + "epoch": 84.17438692098092, + "grad_norm": 2.085561513900757, + "learning_rate": 1.285045950145032e-06, + "loss": 0.0729, + "step": 30892 + }, + { + "epoch": 84.17711171662125, + "grad_norm": 3.332383394241333, + "learning_rate": 1.2846132054738026e-06, + "loss": 0.0444, + "step": 30893 + }, + { + "epoch": 84.17983651226157, + "grad_norm": 2.9827792644500732, + "learning_rate": 1.284180528677722e-06, + "loss": 0.0545, + "step": 30894 + }, + { + "epoch": 84.1825613079019, + "grad_norm": 4.191866874694824, + "learning_rate": 1.2837479197601654e-06, + "loss": 0.0446, + "step": 30895 + }, + { + "epoch": 84.18528610354224, + "grad_norm": 3.2883105278015137, + "learning_rate": 1.2833153787245e-06, + "loss": 0.0655, + "step": 30896 + }, + { + "epoch": 84.18801089918256, + "grad_norm": 4.032162666320801, + "learning_rate": 1.282882905574091e-06, + "loss": 0.0128, + "step": 30897 + }, + { + "epoch": 84.19073569482289, + "grad_norm": 3.0079433917999268, + "learning_rate": 1.2824505003123123e-06, + "loss": 0.0341, + "step": 30898 + }, + { + "epoch": 84.19346049046321, + "grad_norm": 2.4322404861450195, + "learning_rate": 1.2820181629425276e-06, + "loss": 0.0564, + "step": 30899 + }, + { + "epoch": 84.19618528610354, + "grad_norm": 4.670801162719727, + "learning_rate": 1.2815858934681059e-06, + "loss": 0.0239, + "step": 30900 + }, + { + "epoch": 84.19891008174388, + "grad_norm": 2.6506736278533936, + "learning_rate": 1.2811536918924095e-06, + "loss": 0.044, + "step": 30901 + }, + { + "epoch": 84.2016348773842, + "grad_norm": 2.5493180751800537, + "learning_rate": 1.2807215582188104e-06, + "loss": 0.1176, + "step": 30902 + }, + { + "epoch": 84.20435967302453, + "grad_norm": 2.146432638168335, + "learning_rate": 1.2802894924506703e-06, + "loss": 0.0423, + "step": 30903 + }, + { + "epoch": 84.20708446866485, + "grad_norm": 2.18966007232666, + "learning_rate": 1.2798574945913556e-06, + "loss": 0.0201, + "step": 30904 + }, + { + "epoch": 84.20980926430518, + "grad_norm": 3.3071603775024414, + "learning_rate": 1.2794255646442278e-06, + "loss": 0.0583, + "step": 30905 + }, + { + "epoch": 84.2125340599455, + "grad_norm": 3.4619028568267822, + "learning_rate": 1.2789937026126553e-06, + "loss": 0.1473, + "step": 30906 + }, + { + "epoch": 84.21525885558583, + "grad_norm": 2.6102943420410156, + "learning_rate": 1.278561908499999e-06, + "loss": 0.0339, + "step": 30907 + }, + { + "epoch": 84.21798365122616, + "grad_norm": 2.582096815109253, + "learning_rate": 1.2781301823096226e-06, + "loss": 0.066, + "step": 30908 + }, + { + "epoch": 84.22070844686648, + "grad_norm": 2.0452327728271484, + "learning_rate": 1.2776985240448847e-06, + "loss": 0.0834, + "step": 30909 + }, + { + "epoch": 84.22343324250681, + "grad_norm": 1.526092767715454, + "learning_rate": 1.2772669337091525e-06, + "loss": 0.0232, + "step": 30910 + }, + { + "epoch": 84.22615803814713, + "grad_norm": 2.2443490028381348, + "learning_rate": 1.2768354113057823e-06, + "loss": 0.1376, + "step": 30911 + }, + { + "epoch": 84.22888283378747, + "grad_norm": 3.8927268981933594, + "learning_rate": 1.2764039568381392e-06, + "loss": 0.1478, + "step": 30912 + }, + { + "epoch": 84.2316076294278, + "grad_norm": 2.086414098739624, + "learning_rate": 1.2759725703095793e-06, + "loss": 0.0336, + "step": 30913 + }, + { + "epoch": 84.23433242506812, + "grad_norm": 2.4165940284729004, + "learning_rate": 1.2755412517234667e-06, + "loss": 0.0211, + "step": 30914 + }, + { + "epoch": 84.23705722070845, + "grad_norm": 2.5106959342956543, + "learning_rate": 1.2751100010831575e-06, + "loss": 0.1234, + "step": 30915 + }, + { + "epoch": 84.23978201634877, + "grad_norm": 1.790252923965454, + "learning_rate": 1.2746788183920112e-06, + "loss": 0.0216, + "step": 30916 + }, + { + "epoch": 84.2425068119891, + "grad_norm": 2.535311222076416, + "learning_rate": 1.274247703653383e-06, + "loss": 0.0208, + "step": 30917 + }, + { + "epoch": 84.24523160762942, + "grad_norm": 1.900929570198059, + "learning_rate": 1.2738166568706345e-06, + "loss": 0.0211, + "step": 30918 + }, + { + "epoch": 84.24795640326975, + "grad_norm": 2.733259439468384, + "learning_rate": 1.273385678047122e-06, + "loss": 0.0845, + "step": 30919 + }, + { + "epoch": 84.25068119891009, + "grad_norm": 2.1603260040283203, + "learning_rate": 1.2729547671862008e-06, + "loss": 0.0251, + "step": 30920 + }, + { + "epoch": 84.2534059945504, + "grad_norm": 2.6811716556549072, + "learning_rate": 1.2725239242912246e-06, + "loss": 0.0393, + "step": 30921 + }, + { + "epoch": 84.25613079019074, + "grad_norm": 1.8573046922683716, + "learning_rate": 1.272093149365553e-06, + "loss": 0.0291, + "step": 30922 + }, + { + "epoch": 84.25885558583106, + "grad_norm": 1.8902552127838135, + "learning_rate": 1.2716624424125402e-06, + "loss": 0.0342, + "step": 30923 + }, + { + "epoch": 84.26158038147139, + "grad_norm": 3.814934492111206, + "learning_rate": 1.2712318034355387e-06, + "loss": 0.0434, + "step": 30924 + }, + { + "epoch": 84.26430517711172, + "grad_norm": 2.337177276611328, + "learning_rate": 1.2708012324379004e-06, + "loss": 0.0277, + "step": 30925 + }, + { + "epoch": 84.26702997275204, + "grad_norm": 3.1108927726745605, + "learning_rate": 1.2703707294229839e-06, + "loss": 0.1517, + "step": 30926 + }, + { + "epoch": 84.26975476839237, + "grad_norm": 2.411223888397217, + "learning_rate": 1.2699402943941386e-06, + "loss": 0.0433, + "step": 30927 + }, + { + "epoch": 84.2724795640327, + "grad_norm": 2.898160457611084, + "learning_rate": 1.2695099273547152e-06, + "loss": 0.0975, + "step": 30928 + }, + { + "epoch": 84.27520435967303, + "grad_norm": 2.993513584136963, + "learning_rate": 1.2690796283080698e-06, + "loss": 0.0949, + "step": 30929 + }, + { + "epoch": 84.27792915531334, + "grad_norm": 2.257850408554077, + "learning_rate": 1.2686493972575498e-06, + "loss": 0.0277, + "step": 30930 + }, + { + "epoch": 84.28065395095368, + "grad_norm": 2.626110315322876, + "learning_rate": 1.2682192342065093e-06, + "loss": 0.0405, + "step": 30931 + }, + { + "epoch": 84.28337874659401, + "grad_norm": 3.5695180892944336, + "learning_rate": 1.2677891391582953e-06, + "loss": 0.0306, + "step": 30932 + }, + { + "epoch": 84.28610354223433, + "grad_norm": 2.670917272567749, + "learning_rate": 1.2673591121162577e-06, + "loss": 0.0439, + "step": 30933 + }, + { + "epoch": 84.28882833787466, + "grad_norm": 3.586989641189575, + "learning_rate": 1.2669291530837469e-06, + "loss": 0.0845, + "step": 30934 + }, + { + "epoch": 84.29155313351498, + "grad_norm": 2.1815574169158936, + "learning_rate": 1.2664992620641114e-06, + "loss": 0.0437, + "step": 30935 + }, + { + "epoch": 84.29427792915531, + "grad_norm": 2.8163528442382812, + "learning_rate": 1.2660694390606986e-06, + "loss": 0.0634, + "step": 30936 + }, + { + "epoch": 84.29700272479565, + "grad_norm": 2.318514108657837, + "learning_rate": 1.2656396840768549e-06, + "loss": 0.0394, + "step": 30937 + }, + { + "epoch": 84.29972752043597, + "grad_norm": 4.409590244293213, + "learning_rate": 1.2652099971159293e-06, + "loss": 0.0283, + "step": 30938 + }, + { + "epoch": 84.3024523160763, + "grad_norm": 1.8094323873519897, + "learning_rate": 1.2647803781812673e-06, + "loss": 0.0297, + "step": 30939 + }, + { + "epoch": 84.30517711171662, + "grad_norm": 24.27855682373047, + "learning_rate": 1.264350827276214e-06, + "loss": 0.0663, + "step": 30940 + }, + { + "epoch": 84.30790190735695, + "grad_norm": 2.4616377353668213, + "learning_rate": 1.2639213444041133e-06, + "loss": 0.1532, + "step": 30941 + }, + { + "epoch": 84.31062670299727, + "grad_norm": 1.8487862348556519, + "learning_rate": 1.2634919295683145e-06, + "loss": 0.0305, + "step": 30942 + }, + { + "epoch": 84.3133514986376, + "grad_norm": 2.1329538822174072, + "learning_rate": 1.26306258277216e-06, + "loss": 0.0241, + "step": 30943 + }, + { + "epoch": 84.31607629427793, + "grad_norm": 2.2670230865478516, + "learning_rate": 1.262633304018992e-06, + "loss": 0.089, + "step": 30944 + }, + { + "epoch": 84.31880108991825, + "grad_norm": 2.1846530437469482, + "learning_rate": 1.2622040933121527e-06, + "loss": 0.0602, + "step": 30945 + }, + { + "epoch": 84.32152588555859, + "grad_norm": 2.693756341934204, + "learning_rate": 1.261774950654986e-06, + "loss": 0.0292, + "step": 30946 + }, + { + "epoch": 84.3242506811989, + "grad_norm": 3.18593168258667, + "learning_rate": 1.261345876050838e-06, + "loss": 0.0283, + "step": 30947 + }, + { + "epoch": 84.32697547683924, + "grad_norm": 2.7687511444091797, + "learning_rate": 1.2609168695030471e-06, + "loss": 0.0807, + "step": 30948 + }, + { + "epoch": 84.32970027247957, + "grad_norm": 3.2963898181915283, + "learning_rate": 1.260487931014953e-06, + "loss": 0.0496, + "step": 30949 + }, + { + "epoch": 84.33242506811989, + "grad_norm": 2.9117414951324463, + "learning_rate": 1.2600590605898966e-06, + "loss": 0.0457, + "step": 30950 + }, + { + "epoch": 84.33514986376022, + "grad_norm": 3.7882585525512695, + "learning_rate": 1.2596302582312214e-06, + "loss": 0.1302, + "step": 30951 + }, + { + "epoch": 84.33787465940054, + "grad_norm": 2.384852647781372, + "learning_rate": 1.2592015239422639e-06, + "loss": 0.04, + "step": 30952 + }, + { + "epoch": 84.34059945504087, + "grad_norm": 1.8089810609817505, + "learning_rate": 1.2587728577263636e-06, + "loss": 0.1188, + "step": 30953 + }, + { + "epoch": 84.34332425068119, + "grad_norm": 2.1156163215637207, + "learning_rate": 1.2583442595868566e-06, + "loss": 0.0431, + "step": 30954 + }, + { + "epoch": 84.34604904632153, + "grad_norm": 3.846061944961548, + "learning_rate": 1.257915729527085e-06, + "loss": 0.0419, + "step": 30955 + }, + { + "epoch": 84.34877384196186, + "grad_norm": 3.296739101409912, + "learning_rate": 1.2574872675503858e-06, + "loss": 0.082, + "step": 30956 + }, + { + "epoch": 84.35149863760218, + "grad_norm": 2.082808256149292, + "learning_rate": 1.2570588736600909e-06, + "loss": 0.0252, + "step": 30957 + }, + { + "epoch": 84.35422343324251, + "grad_norm": 5.212313652038574, + "learning_rate": 1.2566305478595431e-06, + "loss": 0.1072, + "step": 30958 + }, + { + "epoch": 84.35694822888283, + "grad_norm": 2.4390437602996826, + "learning_rate": 1.2562022901520744e-06, + "loss": 0.0641, + "step": 30959 + }, + { + "epoch": 84.35967302452316, + "grad_norm": 1.88674795627594, + "learning_rate": 1.2557741005410207e-06, + "loss": 0.0216, + "step": 30960 + }, + { + "epoch": 84.3623978201635, + "grad_norm": 2.0010910034179688, + "learning_rate": 1.255345979029715e-06, + "loss": 0.0391, + "step": 30961 + }, + { + "epoch": 84.36512261580381, + "grad_norm": 2.3853631019592285, + "learning_rate": 1.2549179256214939e-06, + "loss": 0.0546, + "step": 30962 + }, + { + "epoch": 84.36784741144415, + "grad_norm": 1.9459019899368286, + "learning_rate": 1.254489940319692e-06, + "loss": 0.0306, + "step": 30963 + }, + { + "epoch": 84.37057220708446, + "grad_norm": 1.6892529726028442, + "learning_rate": 1.2540620231276423e-06, + "loss": 0.0265, + "step": 30964 + }, + { + "epoch": 84.3732970027248, + "grad_norm": 3.0371382236480713, + "learning_rate": 1.2536341740486746e-06, + "loss": 0.2409, + "step": 30965 + }, + { + "epoch": 84.37602179836512, + "grad_norm": 2.210012912750244, + "learning_rate": 1.2532063930861205e-06, + "loss": 0.0375, + "step": 30966 + }, + { + "epoch": 84.37874659400545, + "grad_norm": 3.261143207550049, + "learning_rate": 1.2527786802433162e-06, + "loss": 0.1751, + "step": 30967 + }, + { + "epoch": 84.38147138964578, + "grad_norm": 5.779815673828125, + "learning_rate": 1.2523510355235902e-06, + "loss": 0.0497, + "step": 30968 + }, + { + "epoch": 84.3841961852861, + "grad_norm": 2.058689832687378, + "learning_rate": 1.251923458930272e-06, + "loss": 0.0815, + "step": 30969 + }, + { + "epoch": 84.38692098092643, + "grad_norm": 2.412895917892456, + "learning_rate": 1.25149595046669e-06, + "loss": 0.026, + "step": 30970 + }, + { + "epoch": 84.38964577656675, + "grad_norm": 2.345301389694214, + "learning_rate": 1.2510685101361797e-06, + "loss": 0.0925, + "step": 30971 + }, + { + "epoch": 84.39237057220708, + "grad_norm": 2.365218162536621, + "learning_rate": 1.2506411379420647e-06, + "loss": 0.0274, + "step": 30972 + }, + { + "epoch": 84.39509536784742, + "grad_norm": 4.25044059753418, + "learning_rate": 1.2502138338876757e-06, + "loss": 0.0877, + "step": 30973 + }, + { + "epoch": 84.39782016348774, + "grad_norm": 2.1025803089141846, + "learning_rate": 1.2497865979763368e-06, + "loss": 0.0357, + "step": 30974 + }, + { + "epoch": 84.40054495912807, + "grad_norm": 3.219825267791748, + "learning_rate": 1.249359430211381e-06, + "loss": 0.0613, + "step": 30975 + }, + { + "epoch": 84.40326975476839, + "grad_norm": 2.0448338985443115, + "learning_rate": 1.248932330596132e-06, + "loss": 0.026, + "step": 30976 + }, + { + "epoch": 84.40599455040872, + "grad_norm": 1.8425649404525757, + "learning_rate": 1.2485052991339174e-06, + "loss": 0.0208, + "step": 30977 + }, + { + "epoch": 84.40871934604904, + "grad_norm": 2.058178663253784, + "learning_rate": 1.248078335828059e-06, + "loss": 0.0329, + "step": 30978 + }, + { + "epoch": 84.41144414168937, + "grad_norm": 1.8262965679168701, + "learning_rate": 1.2476514406818863e-06, + "loss": 0.0309, + "step": 30979 + }, + { + "epoch": 84.4141689373297, + "grad_norm": 1.9117165803909302, + "learning_rate": 1.247224613698721e-06, + "loss": 0.0192, + "step": 30980 + }, + { + "epoch": 84.41689373297002, + "grad_norm": 2.8641581535339355, + "learning_rate": 1.2467978548818914e-06, + "loss": 0.1315, + "step": 30981 + }, + { + "epoch": 84.41961852861036, + "grad_norm": 2.1521008014678955, + "learning_rate": 1.2463711642347154e-06, + "loss": 0.1354, + "step": 30982 + }, + { + "epoch": 84.42234332425068, + "grad_norm": 2.883301258087158, + "learning_rate": 1.245944541760522e-06, + "loss": 0.0472, + "step": 30983 + }, + { + "epoch": 84.42506811989101, + "grad_norm": 2.296856641769409, + "learning_rate": 1.24551798746263e-06, + "loss": 0.0292, + "step": 30984 + }, + { + "epoch": 84.42779291553134, + "grad_norm": 2.1604671478271484, + "learning_rate": 1.245091501344362e-06, + "loss": 0.0354, + "step": 30985 + }, + { + "epoch": 84.43051771117166, + "grad_norm": 2.4055051803588867, + "learning_rate": 1.244665083409038e-06, + "loss": 0.0542, + "step": 30986 + }, + { + "epoch": 84.433242506812, + "grad_norm": 3.1053826808929443, + "learning_rate": 1.2442387336599825e-06, + "loss": 0.0252, + "step": 30987 + }, + { + "epoch": 84.43596730245231, + "grad_norm": 1.906609058380127, + "learning_rate": 1.2438124521005135e-06, + "loss": 0.0238, + "step": 30988 + }, + { + "epoch": 84.43869209809264, + "grad_norm": 2.015774965286255, + "learning_rate": 1.2433862387339524e-06, + "loss": 0.0274, + "step": 30989 + }, + { + "epoch": 84.44141689373296, + "grad_norm": 2.535973310470581, + "learning_rate": 1.2429600935636144e-06, + "loss": 0.0421, + "step": 30990 + }, + { + "epoch": 84.4441416893733, + "grad_norm": 2.4865448474884033, + "learning_rate": 1.2425340165928234e-06, + "loss": 0.0483, + "step": 30991 + }, + { + "epoch": 84.44686648501363, + "grad_norm": 1.868030071258545, + "learning_rate": 1.242108007824896e-06, + "loss": 0.0224, + "step": 30992 + }, + { + "epoch": 84.44959128065395, + "grad_norm": 3.9106252193450928, + "learning_rate": 1.2416820672631502e-06, + "loss": 0.0426, + "step": 30993 + }, + { + "epoch": 84.45231607629428, + "grad_norm": 1.4307934045791626, + "learning_rate": 1.2412561949108992e-06, + "loss": 0.123, + "step": 30994 + }, + { + "epoch": 84.4550408719346, + "grad_norm": 2.5642943382263184, + "learning_rate": 1.240830390771466e-06, + "loss": 0.0305, + "step": 30995 + }, + { + "epoch": 84.45776566757493, + "grad_norm": 1.859707236289978, + "learning_rate": 1.2404046548481641e-06, + "loss": 0.0277, + "step": 30996 + }, + { + "epoch": 84.46049046321527, + "grad_norm": 2.6319589614868164, + "learning_rate": 1.2399789871443057e-06, + "loss": 0.0896, + "step": 30997 + }, + { + "epoch": 84.46321525885558, + "grad_norm": 2.9149649143218994, + "learning_rate": 1.2395533876632094e-06, + "loss": 0.0246, + "step": 30998 + }, + { + "epoch": 84.46594005449592, + "grad_norm": 3.1326661109924316, + "learning_rate": 1.2391278564081921e-06, + "loss": 0.1539, + "step": 30999 + }, + { + "epoch": 84.46866485013624, + "grad_norm": 2.4415969848632812, + "learning_rate": 1.2387023933825637e-06, + "loss": 0.0405, + "step": 31000 + }, + { + "epoch": 84.47138964577657, + "grad_norm": 2.142533302307129, + "learning_rate": 1.2382769985896405e-06, + "loss": 0.0343, + "step": 31001 + }, + { + "epoch": 84.47411444141689, + "grad_norm": 3.939147472381592, + "learning_rate": 1.2378516720327315e-06, + "loss": 0.1234, + "step": 31002 + }, + { + "epoch": 84.47683923705722, + "grad_norm": 3.032827615737915, + "learning_rate": 1.2374264137151537e-06, + "loss": 0.0408, + "step": 31003 + }, + { + "epoch": 84.47956403269755, + "grad_norm": 2.321712017059326, + "learning_rate": 1.2370012236402162e-06, + "loss": 0.0873, + "step": 31004 + }, + { + "epoch": 84.48228882833787, + "grad_norm": 2.2680418491363525, + "learning_rate": 1.236576101811232e-06, + "loss": 0.0836, + "step": 31005 + }, + { + "epoch": 84.4850136239782, + "grad_norm": 2.3834011554718018, + "learning_rate": 1.2361510482315087e-06, + "loss": 0.2104, + "step": 31006 + }, + { + "epoch": 84.48773841961852, + "grad_norm": 2.9098286628723145, + "learning_rate": 1.235726062904361e-06, + "loss": 0.0476, + "step": 31007 + }, + { + "epoch": 84.49046321525886, + "grad_norm": 2.6561827659606934, + "learning_rate": 1.2353011458330976e-06, + "loss": 0.0657, + "step": 31008 + }, + { + "epoch": 84.49318801089919, + "grad_norm": 2.9487643241882324, + "learning_rate": 1.234876297021026e-06, + "loss": 0.0361, + "step": 31009 + }, + { + "epoch": 84.49591280653951, + "grad_norm": 2.6250460147857666, + "learning_rate": 1.2344515164714531e-06, + "loss": 0.0347, + "step": 31010 + }, + { + "epoch": 84.49863760217984, + "grad_norm": 2.3775174617767334, + "learning_rate": 1.2340268041876923e-06, + "loss": 0.0491, + "step": 31011 + }, + { + "epoch": 84.50136239782016, + "grad_norm": 1.9457837343215942, + "learning_rate": 1.2336021601730485e-06, + "loss": 0.0315, + "step": 31012 + }, + { + "epoch": 84.50408719346049, + "grad_norm": 2.286740779876709, + "learning_rate": 1.2331775844308292e-06, + "loss": 0.0429, + "step": 31013 + }, + { + "epoch": 84.50681198910081, + "grad_norm": 2.9992775917053223, + "learning_rate": 1.232753076964338e-06, + "loss": 0.0771, + "step": 31014 + }, + { + "epoch": 84.50953678474114, + "grad_norm": 2.1540305614471436, + "learning_rate": 1.2323286377768839e-06, + "loss": 0.0342, + "step": 31015 + }, + { + "epoch": 84.51226158038148, + "grad_norm": 2.3368608951568604, + "learning_rate": 1.231904266871775e-06, + "loss": 0.0284, + "step": 31016 + }, + { + "epoch": 84.5149863760218, + "grad_norm": 1.906496524810791, + "learning_rate": 1.2314799642523135e-06, + "loss": 0.0569, + "step": 31017 + }, + { + "epoch": 84.51771117166213, + "grad_norm": 4.40822696685791, + "learning_rate": 1.2310557299218029e-06, + "loss": 0.0353, + "step": 31018 + }, + { + "epoch": 84.52043596730245, + "grad_norm": 2.7115578651428223, + "learning_rate": 1.2306315638835464e-06, + "loss": 0.0661, + "step": 31019 + }, + { + "epoch": 84.52316076294278, + "grad_norm": 3.1134707927703857, + "learning_rate": 1.2302074661408502e-06, + "loss": 0.0421, + "step": 31020 + }, + { + "epoch": 84.52588555858311, + "grad_norm": 2.8423943519592285, + "learning_rate": 1.2297834366970174e-06, + "loss": 0.1245, + "step": 31021 + }, + { + "epoch": 84.52861035422343, + "grad_norm": 2.3413920402526855, + "learning_rate": 1.2293594755553462e-06, + "loss": 0.1918, + "step": 31022 + }, + { + "epoch": 84.53133514986376, + "grad_norm": 2.1077334880828857, + "learning_rate": 1.228935582719143e-06, + "loss": 0.0427, + "step": 31023 + }, + { + "epoch": 84.53405994550408, + "grad_norm": 2.3549013137817383, + "learning_rate": 1.2285117581917084e-06, + "loss": 0.098, + "step": 31024 + }, + { + "epoch": 84.53678474114442, + "grad_norm": 2.0314838886260986, + "learning_rate": 1.2280880019763407e-06, + "loss": 0.0216, + "step": 31025 + }, + { + "epoch": 84.53950953678473, + "grad_norm": 2.8202052116394043, + "learning_rate": 1.227664314076339e-06, + "loss": 0.079, + "step": 31026 + }, + { + "epoch": 84.54223433242507, + "grad_norm": 3.7878527641296387, + "learning_rate": 1.227240694495009e-06, + "loss": 0.0235, + "step": 31027 + }, + { + "epoch": 84.5449591280654, + "grad_norm": 6.113048076629639, + "learning_rate": 1.2268171432356447e-06, + "loss": 0.1633, + "step": 31028 + }, + { + "epoch": 84.54768392370572, + "grad_norm": 2.637174129486084, + "learning_rate": 1.2263936603015457e-06, + "loss": 0.06, + "step": 31029 + }, + { + "epoch": 84.55040871934605, + "grad_norm": 3.4079182147979736, + "learning_rate": 1.2259702456960099e-06, + "loss": 0.12, + "step": 31030 + }, + { + "epoch": 84.55313351498637, + "grad_norm": 2.9253225326538086, + "learning_rate": 1.2255468994223342e-06, + "loss": 0.1418, + "step": 31031 + }, + { + "epoch": 84.5558583106267, + "grad_norm": 2.9753916263580322, + "learning_rate": 1.225123621483819e-06, + "loss": 0.058, + "step": 31032 + }, + { + "epoch": 84.55858310626704, + "grad_norm": 2.4538822174072266, + "learning_rate": 1.2247004118837603e-06, + "loss": 0.1138, + "step": 31033 + }, + { + "epoch": 84.56130790190736, + "grad_norm": 2.228626251220703, + "learning_rate": 1.2242772706254502e-06, + "loss": 0.0296, + "step": 31034 + }, + { + "epoch": 84.56403269754769, + "grad_norm": 2.627859115600586, + "learning_rate": 1.2238541977121853e-06, + "loss": 0.1024, + "step": 31035 + }, + { + "epoch": 84.566757493188, + "grad_norm": 3.1097116470336914, + "learning_rate": 1.223431193147263e-06, + "loss": 0.188, + "step": 31036 + }, + { + "epoch": 84.56948228882834, + "grad_norm": 1.7681435346603394, + "learning_rate": 1.2230082569339773e-06, + "loss": 0.0208, + "step": 31037 + }, + { + "epoch": 84.57220708446866, + "grad_norm": 1.7119303941726685, + "learning_rate": 1.222585389075619e-06, + "loss": 0.0193, + "step": 31038 + }, + { + "epoch": 84.57493188010899, + "grad_norm": 2.7175660133361816, + "learning_rate": 1.222162589575483e-06, + "loss": 0.042, + "step": 31039 + }, + { + "epoch": 84.57765667574932, + "grad_norm": 2.8624460697174072, + "learning_rate": 1.2217398584368634e-06, + "loss": 0.1138, + "step": 31040 + }, + { + "epoch": 84.58038147138964, + "grad_norm": 1.645054578781128, + "learning_rate": 1.221317195663051e-06, + "loss": 0.1273, + "step": 31041 + }, + { + "epoch": 84.58310626702998, + "grad_norm": 1.6453557014465332, + "learning_rate": 1.2208946012573352e-06, + "loss": 0.0642, + "step": 31042 + }, + { + "epoch": 84.5858310626703, + "grad_norm": 6.238443374633789, + "learning_rate": 1.2204720752230126e-06, + "loss": 0.0368, + "step": 31043 + }, + { + "epoch": 84.58855585831063, + "grad_norm": 2.3180487155914307, + "learning_rate": 1.2200496175633714e-06, + "loss": 0.1693, + "step": 31044 + }, + { + "epoch": 84.59128065395096, + "grad_norm": 2.5004770755767822, + "learning_rate": 1.2196272282817e-06, + "loss": 0.0537, + "step": 31045 + }, + { + "epoch": 84.59400544959128, + "grad_norm": 3.1233437061309814, + "learning_rate": 1.2192049073812872e-06, + "loss": 0.0854, + "step": 31046 + }, + { + "epoch": 84.59673024523161, + "grad_norm": 1.4701508283615112, + "learning_rate": 1.218782654865427e-06, + "loss": 0.0183, + "step": 31047 + }, + { + "epoch": 84.59945504087193, + "grad_norm": 2.837486505508423, + "learning_rate": 1.218360470737402e-06, + "loss": 0.0482, + "step": 31048 + }, + { + "epoch": 84.60217983651226, + "grad_norm": 1.651308536529541, + "learning_rate": 1.2179383550005052e-06, + "loss": 0.0216, + "step": 31049 + }, + { + "epoch": 84.60490463215258, + "grad_norm": 2.7535626888275146, + "learning_rate": 1.2175163076580222e-06, + "loss": 0.0243, + "step": 31050 + }, + { + "epoch": 84.60762942779292, + "grad_norm": 2.362203598022461, + "learning_rate": 1.2170943287132375e-06, + "loss": 0.1221, + "step": 31051 + }, + { + "epoch": 84.61035422343325, + "grad_norm": 2.717883348464966, + "learning_rate": 1.2166724181694411e-06, + "loss": 0.0828, + "step": 31052 + }, + { + "epoch": 84.61307901907357, + "grad_norm": 1.5653126239776611, + "learning_rate": 1.2162505760299182e-06, + "loss": 0.0209, + "step": 31053 + }, + { + "epoch": 84.6158038147139, + "grad_norm": 3.5864832401275635, + "learning_rate": 1.2158288022979514e-06, + "loss": 0.0935, + "step": 31054 + }, + { + "epoch": 84.61852861035422, + "grad_norm": 4.0297160148620605, + "learning_rate": 1.215407096976826e-06, + "loss": 0.0945, + "step": 31055 + }, + { + "epoch": 84.62125340599455, + "grad_norm": 2.4685301780700684, + "learning_rate": 1.2149854600698296e-06, + "loss": 0.0526, + "step": 31056 + }, + { + "epoch": 84.62397820163488, + "grad_norm": 1.8899409770965576, + "learning_rate": 1.2145638915802438e-06, + "loss": 0.0241, + "step": 31057 + }, + { + "epoch": 84.6267029972752, + "grad_norm": 3.2765052318573, + "learning_rate": 1.2141423915113515e-06, + "loss": 0.0333, + "step": 31058 + }, + { + "epoch": 84.62942779291554, + "grad_norm": 2.8388254642486572, + "learning_rate": 1.2137209598664334e-06, + "loss": 0.0682, + "step": 31059 + }, + { + "epoch": 84.63215258855585, + "grad_norm": 2.8888697624206543, + "learning_rate": 1.213299596648776e-06, + "loss": 0.1235, + "step": 31060 + }, + { + "epoch": 84.63487738419619, + "grad_norm": 2.789600133895874, + "learning_rate": 1.2128783018616585e-06, + "loss": 0.1367, + "step": 31061 + }, + { + "epoch": 84.6376021798365, + "grad_norm": 2.938390016555786, + "learning_rate": 1.212457075508362e-06, + "loss": 0.0446, + "step": 31062 + }, + { + "epoch": 84.64032697547684, + "grad_norm": 2.4707260131835938, + "learning_rate": 1.2120359175921636e-06, + "loss": 0.2618, + "step": 31063 + }, + { + "epoch": 84.64305177111717, + "grad_norm": 2.305969715118408, + "learning_rate": 1.2116148281163497e-06, + "loss": 0.0809, + "step": 31064 + }, + { + "epoch": 84.64577656675749, + "grad_norm": 3.376065492630005, + "learning_rate": 1.2111938070841979e-06, + "loss": 0.0724, + "step": 31065 + }, + { + "epoch": 84.64850136239782, + "grad_norm": 3.548962116241455, + "learning_rate": 1.2107728544989817e-06, + "loss": 0.0347, + "step": 31066 + }, + { + "epoch": 84.65122615803814, + "grad_norm": 2.1145694255828857, + "learning_rate": 1.2103519703639844e-06, + "loss": 0.1118, + "step": 31067 + }, + { + "epoch": 84.65395095367847, + "grad_norm": 2.4844484329223633, + "learning_rate": 1.2099311546824853e-06, + "loss": 0.0376, + "step": 31068 + }, + { + "epoch": 84.65667574931881, + "grad_norm": 2.0232150554656982, + "learning_rate": 1.20951040745776e-06, + "loss": 0.0338, + "step": 31069 + }, + { + "epoch": 84.65940054495913, + "grad_norm": 5.746128082275391, + "learning_rate": 1.2090897286930837e-06, + "loss": 0.0821, + "step": 31070 + }, + { + "epoch": 84.66212534059946, + "grad_norm": 2.1323885917663574, + "learning_rate": 1.2086691183917322e-06, + "loss": 0.039, + "step": 31071 + }, + { + "epoch": 84.66485013623978, + "grad_norm": 3.363504648208618, + "learning_rate": 1.208248576556985e-06, + "loss": 0.0508, + "step": 31072 + }, + { + "epoch": 84.66757493188011, + "grad_norm": 3.2984578609466553, + "learning_rate": 1.2078281031921146e-06, + "loss": 0.1499, + "step": 31073 + }, + { + "epoch": 84.67029972752043, + "grad_norm": 2.885843276977539, + "learning_rate": 1.2074076983003956e-06, + "loss": 0.054, + "step": 31074 + }, + { + "epoch": 84.67302452316076, + "grad_norm": 2.0458831787109375, + "learning_rate": 1.2069873618851001e-06, + "loss": 0.038, + "step": 31075 + }, + { + "epoch": 84.6757493188011, + "grad_norm": 2.1821789741516113, + "learning_rate": 1.2065670939495068e-06, + "loss": 0.0532, + "step": 31076 + }, + { + "epoch": 84.67847411444141, + "grad_norm": 4.3712053298950195, + "learning_rate": 1.2061468944968857e-06, + "loss": 0.0278, + "step": 31077 + }, + { + "epoch": 84.68119891008175, + "grad_norm": 3.6181650161743164, + "learning_rate": 1.2057267635305102e-06, + "loss": 0.0635, + "step": 31078 + }, + { + "epoch": 84.68392370572207, + "grad_norm": 3.243540048599243, + "learning_rate": 1.205306701053649e-06, + "loss": 0.0646, + "step": 31079 + }, + { + "epoch": 84.6866485013624, + "grad_norm": 2.5232150554656982, + "learning_rate": 1.204886707069578e-06, + "loss": 0.0372, + "step": 31080 + }, + { + "epoch": 84.68937329700273, + "grad_norm": 3.703014373779297, + "learning_rate": 1.2044667815815668e-06, + "loss": 0.0549, + "step": 31081 + }, + { + "epoch": 84.69209809264305, + "grad_norm": 1.814774751663208, + "learning_rate": 1.2040469245928843e-06, + "loss": 0.0267, + "step": 31082 + }, + { + "epoch": 84.69482288828338, + "grad_norm": 2.440342664718628, + "learning_rate": 1.2036271361067996e-06, + "loss": 0.0547, + "step": 31083 + }, + { + "epoch": 84.6975476839237, + "grad_norm": 2.8584320545196533, + "learning_rate": 1.203207416126584e-06, + "loss": 0.0314, + "step": 31084 + }, + { + "epoch": 84.70027247956403, + "grad_norm": 4.247107028961182, + "learning_rate": 1.2027877646555087e-06, + "loss": 0.0472, + "step": 31085 + }, + { + "epoch": 84.70299727520435, + "grad_norm": 4.565586566925049, + "learning_rate": 1.202368181696838e-06, + "loss": 0.0707, + "step": 31086 + }, + { + "epoch": 84.70572207084469, + "grad_norm": 2.6981148719787598, + "learning_rate": 1.2019486672538383e-06, + "loss": 0.0278, + "step": 31087 + }, + { + "epoch": 84.70844686648502, + "grad_norm": 2.0777294635772705, + "learning_rate": 1.2015292213297824e-06, + "loss": 0.0635, + "step": 31088 + }, + { + "epoch": 84.71117166212534, + "grad_norm": 3.509965658187866, + "learning_rate": 1.2011098439279333e-06, + "loss": 0.0839, + "step": 31089 + }, + { + "epoch": 84.71389645776567, + "grad_norm": 2.077681541442871, + "learning_rate": 1.2006905350515575e-06, + "loss": 0.0781, + "step": 31090 + }, + { + "epoch": 84.71662125340599, + "grad_norm": 2.4037723541259766, + "learning_rate": 1.2002712947039185e-06, + "loss": 0.0282, + "step": 31091 + }, + { + "epoch": 84.71934604904632, + "grad_norm": 2.0101139545440674, + "learning_rate": 1.1998521228882853e-06, + "loss": 0.0259, + "step": 31092 + }, + { + "epoch": 84.72207084468666, + "grad_norm": 2.952502489089966, + "learning_rate": 1.1994330196079208e-06, + "loss": 0.0504, + "step": 31093 + }, + { + "epoch": 84.72479564032697, + "grad_norm": 2.8094520568847656, + "learning_rate": 1.1990139848660886e-06, + "loss": 0.107, + "step": 31094 + }, + { + "epoch": 84.7275204359673, + "grad_norm": 2.9072251319885254, + "learning_rate": 1.198595018666051e-06, + "loss": 0.0944, + "step": 31095 + }, + { + "epoch": 84.73024523160763, + "grad_norm": 3.1361992359161377, + "learning_rate": 1.1981761210110732e-06, + "loss": 0.0674, + "step": 31096 + }, + { + "epoch": 84.73297002724796, + "grad_norm": 2.763051986694336, + "learning_rate": 1.1977572919044166e-06, + "loss": 0.0265, + "step": 31097 + }, + { + "epoch": 84.73569482288828, + "grad_norm": 3.9850151538848877, + "learning_rate": 1.1973385313493436e-06, + "loss": 0.0349, + "step": 31098 + }, + { + "epoch": 84.73841961852861, + "grad_norm": 2.8541979789733887, + "learning_rate": 1.1969198393491123e-06, + "loss": 0.0525, + "step": 31099 + }, + { + "epoch": 84.74114441416894, + "grad_norm": 2.51537823677063, + "learning_rate": 1.1965012159069855e-06, + "loss": 0.0711, + "step": 31100 + }, + { + "epoch": 84.74386920980926, + "grad_norm": 2.9767189025878906, + "learning_rate": 1.1960826610262266e-06, + "loss": 0.0348, + "step": 31101 + }, + { + "epoch": 84.7465940054496, + "grad_norm": 2.8209567070007324, + "learning_rate": 1.1956641747100918e-06, + "loss": 0.0441, + "step": 31102 + }, + { + "epoch": 84.74931880108991, + "grad_norm": 2.726255178451538, + "learning_rate": 1.1952457569618415e-06, + "loss": 0.0213, + "step": 31103 + }, + { + "epoch": 84.75204359673025, + "grad_norm": 2.257753610610962, + "learning_rate": 1.1948274077847322e-06, + "loss": 0.0232, + "step": 31104 + }, + { + "epoch": 84.75476839237058, + "grad_norm": 8.945773124694824, + "learning_rate": 1.1944091271820258e-06, + "loss": 0.0518, + "step": 31105 + }, + { + "epoch": 84.7574931880109, + "grad_norm": 1.8746299743652344, + "learning_rate": 1.1939909151569773e-06, + "loss": 0.0314, + "step": 31106 + }, + { + "epoch": 84.76021798365123, + "grad_norm": 4.879593849182129, + "learning_rate": 1.193572771712842e-06, + "loss": 0.0649, + "step": 31107 + }, + { + "epoch": 84.76294277929155, + "grad_norm": 2.582674980163574, + "learning_rate": 1.1931546968528807e-06, + "loss": 0.0397, + "step": 31108 + }, + { + "epoch": 84.76566757493188, + "grad_norm": 4.804081439971924, + "learning_rate": 1.192736690580346e-06, + "loss": 0.0867, + "step": 31109 + }, + { + "epoch": 84.7683923705722, + "grad_norm": 18.874242782592773, + "learning_rate": 1.1923187528984958e-06, + "loss": 0.1046, + "step": 31110 + }, + { + "epoch": 84.77111716621253, + "grad_norm": 2.4071621894836426, + "learning_rate": 1.1919008838105816e-06, + "loss": 0.0323, + "step": 31111 + }, + { + "epoch": 84.77384196185287, + "grad_norm": 2.356154203414917, + "learning_rate": 1.191483083319862e-06, + "loss": 0.1667, + "step": 31112 + }, + { + "epoch": 84.77656675749319, + "grad_norm": 3.3072586059570312, + "learning_rate": 1.191065351429589e-06, + "loss": 0.118, + "step": 31113 + }, + { + "epoch": 84.77929155313352, + "grad_norm": 2.270320415496826, + "learning_rate": 1.190647688143014e-06, + "loss": 0.1204, + "step": 31114 + }, + { + "epoch": 84.78201634877384, + "grad_norm": 2.617692708969116, + "learning_rate": 1.1902300934633904e-06, + "loss": 0.0427, + "step": 31115 + }, + { + "epoch": 84.78474114441417, + "grad_norm": 3.325610876083374, + "learning_rate": 1.189812567393973e-06, + "loss": 0.046, + "step": 31116 + }, + { + "epoch": 84.7874659400545, + "grad_norm": 2.1286509037017822, + "learning_rate": 1.1893951099380097e-06, + "loss": 0.0273, + "step": 31117 + }, + { + "epoch": 84.79019073569482, + "grad_norm": 5.044488906860352, + "learning_rate": 1.1889777210987564e-06, + "loss": 0.058, + "step": 31118 + }, + { + "epoch": 84.79291553133515, + "grad_norm": 2.514359474182129, + "learning_rate": 1.1885604008794604e-06, + "loss": 0.0311, + "step": 31119 + }, + { + "epoch": 84.79564032697547, + "grad_norm": 2.4255313873291016, + "learning_rate": 1.1881431492833694e-06, + "loss": 0.0403, + "step": 31120 + }, + { + "epoch": 84.7983651226158, + "grad_norm": 4.272997856140137, + "learning_rate": 1.1877259663137398e-06, + "loss": 0.036, + "step": 31121 + }, + { + "epoch": 84.80108991825612, + "grad_norm": 2.7143914699554443, + "learning_rate": 1.1873088519738163e-06, + "loss": 0.0286, + "step": 31122 + }, + { + "epoch": 84.80381471389646, + "grad_norm": 1.854542851448059, + "learning_rate": 1.1868918062668467e-06, + "loss": 0.0225, + "step": 31123 + }, + { + "epoch": 84.80653950953679, + "grad_norm": 2.3984200954437256, + "learning_rate": 1.1864748291960793e-06, + "loss": 0.0614, + "step": 31124 + }, + { + "epoch": 84.80926430517711, + "grad_norm": 2.313521385192871, + "learning_rate": 1.1860579207647638e-06, + "loss": 0.0905, + "step": 31125 + }, + { + "epoch": 84.81198910081744, + "grad_norm": 3.3067080974578857, + "learning_rate": 1.1856410809761454e-06, + "loss": 0.0237, + "step": 31126 + }, + { + "epoch": 84.81471389645776, + "grad_norm": 1.8766144514083862, + "learning_rate": 1.1852243098334703e-06, + "loss": 0.034, + "step": 31127 + }, + { + "epoch": 84.8174386920981, + "grad_norm": 2.371131181716919, + "learning_rate": 1.1848076073399838e-06, + "loss": 0.041, + "step": 31128 + }, + { + "epoch": 84.82016348773843, + "grad_norm": 2.869938850402832, + "learning_rate": 1.1843909734989323e-06, + "loss": 0.0428, + "step": 31129 + }, + { + "epoch": 84.82288828337875, + "grad_norm": 5.338016033172607, + "learning_rate": 1.1839744083135618e-06, + "loss": 0.0854, + "step": 31130 + }, + { + "epoch": 84.82561307901908, + "grad_norm": 2.4351656436920166, + "learning_rate": 1.183557911787112e-06, + "loss": 0.1161, + "step": 31131 + }, + { + "epoch": 84.8283378746594, + "grad_norm": 2.4238884449005127, + "learning_rate": 1.1831414839228318e-06, + "loss": 0.0297, + "step": 31132 + }, + { + "epoch": 84.83106267029973, + "grad_norm": 2.19629168510437, + "learning_rate": 1.1827251247239614e-06, + "loss": 0.0621, + "step": 31133 + }, + { + "epoch": 84.83378746594005, + "grad_norm": 2.6091413497924805, + "learning_rate": 1.1823088341937416e-06, + "loss": 0.021, + "step": 31134 + }, + { + "epoch": 84.83651226158038, + "grad_norm": 2.723750114440918, + "learning_rate": 1.1818926123354201e-06, + "loss": 0.0998, + "step": 31135 + }, + { + "epoch": 84.83923705722071, + "grad_norm": 3.025283098220825, + "learning_rate": 1.181476459152232e-06, + "loss": 0.0399, + "step": 31136 + }, + { + "epoch": 84.84196185286103, + "grad_norm": 1.6982884407043457, + "learning_rate": 1.1810603746474235e-06, + "loss": 0.0213, + "step": 31137 + }, + { + "epoch": 84.84468664850137, + "grad_norm": 3.653689384460449, + "learning_rate": 1.1806443588242333e-06, + "loss": 0.1872, + "step": 31138 + }, + { + "epoch": 84.84741144414168, + "grad_norm": 2.5489659309387207, + "learning_rate": 1.1802284116859008e-06, + "loss": 0.1274, + "step": 31139 + }, + { + "epoch": 84.85013623978202, + "grad_norm": 2.3214521408081055, + "learning_rate": 1.1798125332356646e-06, + "loss": 0.0807, + "step": 31140 + }, + { + "epoch": 84.85286103542235, + "grad_norm": 2.6158955097198486, + "learning_rate": 1.1793967234767656e-06, + "loss": 0.0384, + "step": 31141 + }, + { + "epoch": 84.85558583106267, + "grad_norm": 7.601649761199951, + "learning_rate": 1.178980982412441e-06, + "loss": 0.1165, + "step": 31142 + }, + { + "epoch": 84.858310626703, + "grad_norm": 3.254023313522339, + "learning_rate": 1.1785653100459282e-06, + "loss": 0.0483, + "step": 31143 + }, + { + "epoch": 84.86103542234332, + "grad_norm": 3.435879945755005, + "learning_rate": 1.1781497063804636e-06, + "loss": 0.0952, + "step": 31144 + }, + { + "epoch": 84.86376021798365, + "grad_norm": 3.469769239425659, + "learning_rate": 1.177734171419287e-06, + "loss": 0.0854, + "step": 31145 + }, + { + "epoch": 84.86648501362397, + "grad_norm": 2.5312633514404297, + "learning_rate": 1.1773187051656332e-06, + "loss": 0.1277, + "step": 31146 + }, + { + "epoch": 84.8692098092643, + "grad_norm": 2.338857650756836, + "learning_rate": 1.1769033076227364e-06, + "loss": 0.0605, + "step": 31147 + }, + { + "epoch": 84.87193460490464, + "grad_norm": 1.533124566078186, + "learning_rate": 1.1764879787938311e-06, + "loss": 0.0217, + "step": 31148 + }, + { + "epoch": 84.87465940054496, + "grad_norm": 5.608811855316162, + "learning_rate": 1.1760727186821552e-06, + "loss": 0.0547, + "step": 31149 + }, + { + "epoch": 84.87738419618529, + "grad_norm": 3.0883374214172363, + "learning_rate": 1.175657527290941e-06, + "loss": 0.0475, + "step": 31150 + }, + { + "epoch": 84.88010899182561, + "grad_norm": 2.5763869285583496, + "learning_rate": 1.1752424046234223e-06, + "loss": 0.0509, + "step": 31151 + }, + { + "epoch": 84.88283378746594, + "grad_norm": 1.486336350440979, + "learning_rate": 1.1748273506828278e-06, + "loss": 0.0198, + "step": 31152 + }, + { + "epoch": 84.88555858310627, + "grad_norm": 2.8218631744384766, + "learning_rate": 1.174412365472397e-06, + "loss": 0.0547, + "step": 31153 + }, + { + "epoch": 84.88828337874659, + "grad_norm": 4.80703067779541, + "learning_rate": 1.1739974489953598e-06, + "loss": 0.0379, + "step": 31154 + }, + { + "epoch": 84.89100817438693, + "grad_norm": 7.6221208572387695, + "learning_rate": 1.1735826012549457e-06, + "loss": 0.0318, + "step": 31155 + }, + { + "epoch": 84.89373297002724, + "grad_norm": 1.7960706949234009, + "learning_rate": 1.1731678222543841e-06, + "loss": 0.061, + "step": 31156 + }, + { + "epoch": 84.89645776566758, + "grad_norm": 3.2422173023223877, + "learning_rate": 1.1727531119969104e-06, + "loss": 0.0469, + "step": 31157 + }, + { + "epoch": 84.8991825613079, + "grad_norm": 1.7906864881515503, + "learning_rate": 1.172338470485751e-06, + "loss": 0.0178, + "step": 31158 + }, + { + "epoch": 84.90190735694823, + "grad_norm": 3.061605930328369, + "learning_rate": 1.1719238977241343e-06, + "loss": 0.1223, + "step": 31159 + }, + { + "epoch": 84.90463215258856, + "grad_norm": 6.10139799118042, + "learning_rate": 1.1715093937152888e-06, + "loss": 0.1513, + "step": 31160 + }, + { + "epoch": 84.90735694822888, + "grad_norm": 1.8453673124313354, + "learning_rate": 1.1710949584624466e-06, + "loss": 0.0167, + "step": 31161 + }, + { + "epoch": 84.91008174386921, + "grad_norm": 2.165992259979248, + "learning_rate": 1.1706805919688323e-06, + "loss": 0.023, + "step": 31162 + }, + { + "epoch": 84.91280653950953, + "grad_norm": 3.98290753364563, + "learning_rate": 1.1702662942376742e-06, + "loss": 0.1148, + "step": 31163 + }, + { + "epoch": 84.91553133514986, + "grad_norm": 3.149789810180664, + "learning_rate": 1.1698520652721946e-06, + "loss": 0.131, + "step": 31164 + }, + { + "epoch": 84.9182561307902, + "grad_norm": 4.626081466674805, + "learning_rate": 1.1694379050756256e-06, + "loss": 0.0928, + "step": 31165 + }, + { + "epoch": 84.92098092643052, + "grad_norm": 2.892207622528076, + "learning_rate": 1.16902381365119e-06, + "loss": 0.0401, + "step": 31166 + }, + { + "epoch": 84.92370572207085, + "grad_norm": 2.274512529373169, + "learning_rate": 1.168609791002112e-06, + "loss": 0.0345, + "step": 31167 + }, + { + "epoch": 84.92643051771117, + "grad_norm": 2.4470462799072266, + "learning_rate": 1.168195837131616e-06, + "loss": 0.0663, + "step": 31168 + }, + { + "epoch": 84.9291553133515, + "grad_norm": 3.115577220916748, + "learning_rate": 1.1677819520429258e-06, + "loss": 0.1073, + "step": 31169 + }, + { + "epoch": 84.93188010899182, + "grad_norm": 2.0581114292144775, + "learning_rate": 1.1673681357392674e-06, + "loss": 0.1468, + "step": 31170 + }, + { + "epoch": 84.93460490463215, + "grad_norm": 2.517979145050049, + "learning_rate": 1.166954388223862e-06, + "loss": 0.0661, + "step": 31171 + }, + { + "epoch": 84.93732970027249, + "grad_norm": 2.2308521270751953, + "learning_rate": 1.1665407094999292e-06, + "loss": 0.0263, + "step": 31172 + }, + { + "epoch": 84.9400544959128, + "grad_norm": 2.980236768722534, + "learning_rate": 1.1661270995706953e-06, + "loss": 0.1513, + "step": 31173 + }, + { + "epoch": 84.94277929155314, + "grad_norm": 1.9563831090927124, + "learning_rate": 1.1657135584393797e-06, + "loss": 0.0236, + "step": 31174 + }, + { + "epoch": 84.94550408719346, + "grad_norm": 2.2078192234039307, + "learning_rate": 1.1653000861092012e-06, + "loss": 0.0337, + "step": 31175 + }, + { + "epoch": 84.94822888283379, + "grad_norm": 3.0110480785369873, + "learning_rate": 1.1648866825833804e-06, + "loss": 0.2238, + "step": 31176 + }, + { + "epoch": 84.95095367847412, + "grad_norm": 1.9992401599884033, + "learning_rate": 1.1644733478651394e-06, + "loss": 0.0192, + "step": 31177 + }, + { + "epoch": 84.95367847411444, + "grad_norm": 3.679093360900879, + "learning_rate": 1.1640600819576965e-06, + "loss": 0.0235, + "step": 31178 + }, + { + "epoch": 84.95640326975477, + "grad_norm": 3.946873664855957, + "learning_rate": 1.163646884864268e-06, + "loss": 0.0602, + "step": 31179 + }, + { + "epoch": 84.95912806539509, + "grad_norm": 3.0473928451538086, + "learning_rate": 1.1632337565880715e-06, + "loss": 0.025, + "step": 31180 + }, + { + "epoch": 84.96185286103542, + "grad_norm": 2.5463502407073975, + "learning_rate": 1.1628206971323287e-06, + "loss": 0.0283, + "step": 31181 + }, + { + "epoch": 84.96457765667574, + "grad_norm": 2.951878309249878, + "learning_rate": 1.1624077065002537e-06, + "loss": 0.0784, + "step": 31182 + }, + { + "epoch": 84.96730245231608, + "grad_norm": 2.6662778854370117, + "learning_rate": 1.161994784695063e-06, + "loss": 0.0309, + "step": 31183 + }, + { + "epoch": 84.97002724795641, + "grad_norm": 3.0899598598480225, + "learning_rate": 1.1615819317199696e-06, + "loss": 0.0242, + "step": 31184 + }, + { + "epoch": 84.97275204359673, + "grad_norm": 2.764861583709717, + "learning_rate": 1.161169147578195e-06, + "loss": 0.0521, + "step": 31185 + }, + { + "epoch": 84.97547683923706, + "grad_norm": 1.660042643547058, + "learning_rate": 1.160756432272947e-06, + "loss": 0.137, + "step": 31186 + }, + { + "epoch": 84.97820163487738, + "grad_norm": 2.3153398036956787, + "learning_rate": 1.1603437858074463e-06, + "loss": 0.0395, + "step": 31187 + }, + { + "epoch": 84.98092643051771, + "grad_norm": 5.803910732269287, + "learning_rate": 1.1599312081849046e-06, + "loss": 0.0934, + "step": 31188 + }, + { + "epoch": 84.98365122615803, + "grad_norm": 2.680100917816162, + "learning_rate": 1.1595186994085306e-06, + "loss": 0.0411, + "step": 31189 + }, + { + "epoch": 84.98637602179836, + "grad_norm": 4.34005069732666, + "learning_rate": 1.159106259481544e-06, + "loss": 0.1272, + "step": 31190 + }, + { + "epoch": 84.9891008174387, + "grad_norm": 2.859818458557129, + "learning_rate": 1.1586938884071519e-06, + "loss": 0.0697, + "step": 31191 + }, + { + "epoch": 84.99182561307902, + "grad_norm": 2.5982792377471924, + "learning_rate": 1.1582815861885676e-06, + "loss": 0.138, + "step": 31192 + }, + { + "epoch": 84.99455040871935, + "grad_norm": 4.581809997558594, + "learning_rate": 1.1578693528289998e-06, + "loss": 0.12, + "step": 31193 + }, + { + "epoch": 84.99727520435967, + "grad_norm": 2.7573812007904053, + "learning_rate": 1.1574571883316632e-06, + "loss": 0.127, + "step": 31194 + }, + { + "epoch": 85.0, + "grad_norm": 3.7230260372161865, + "learning_rate": 1.1570450926997657e-06, + "loss": 0.0482, + "step": 31195 + }, + { + "epoch": 85.00272479564033, + "grad_norm": 2.5617825984954834, + "learning_rate": 1.1566330659365134e-06, + "loss": 0.0917, + "step": 31196 + }, + { + "epoch": 85.00544959128065, + "grad_norm": 3.321756601333618, + "learning_rate": 1.1562211080451201e-06, + "loss": 0.0431, + "step": 31197 + }, + { + "epoch": 85.00817438692098, + "grad_norm": 2.9215753078460693, + "learning_rate": 1.155809219028794e-06, + "loss": 0.0309, + "step": 31198 + }, + { + "epoch": 85.0108991825613, + "grad_norm": 2.704392910003662, + "learning_rate": 1.1553973988907397e-06, + "loss": 0.0821, + "step": 31199 + }, + { + "epoch": 85.01362397820164, + "grad_norm": 1.7946335077285767, + "learning_rate": 1.1549856476341637e-06, + "loss": 0.0607, + "step": 31200 + }, + { + "epoch": 85.01634877384195, + "grad_norm": 2.6398544311523438, + "learning_rate": 1.1545739652622768e-06, + "loss": 0.0727, + "step": 31201 + }, + { + "epoch": 85.01907356948229, + "grad_norm": 2.370229959487915, + "learning_rate": 1.154162351778283e-06, + "loss": 0.03, + "step": 31202 + }, + { + "epoch": 85.02179836512262, + "grad_norm": 2.9440078735351562, + "learning_rate": 1.1537508071853865e-06, + "loss": 0.0268, + "step": 31203 + }, + { + "epoch": 85.02452316076294, + "grad_norm": 3.667236566543579, + "learning_rate": 1.1533393314867959e-06, + "loss": 0.1429, + "step": 31204 + }, + { + "epoch": 85.02724795640327, + "grad_norm": 2.9445602893829346, + "learning_rate": 1.1529279246857129e-06, + "loss": 0.1617, + "step": 31205 + }, + { + "epoch": 85.02997275204359, + "grad_norm": 2.893164873123169, + "learning_rate": 1.1525165867853427e-06, + "loss": 0.1164, + "step": 31206 + }, + { + "epoch": 85.03269754768392, + "grad_norm": 2.4880118370056152, + "learning_rate": 1.1521053177888897e-06, + "loss": 0.0347, + "step": 31207 + }, + { + "epoch": 85.03542234332426, + "grad_norm": 1.9457095861434937, + "learning_rate": 1.1516941176995555e-06, + "loss": 0.066, + "step": 31208 + }, + { + "epoch": 85.03814713896458, + "grad_norm": 2.136549234390259, + "learning_rate": 1.1512829865205399e-06, + "loss": 0.0394, + "step": 31209 + }, + { + "epoch": 85.04087193460491, + "grad_norm": 3.3046276569366455, + "learning_rate": 1.1508719242550504e-06, + "loss": 0.1154, + "step": 31210 + }, + { + "epoch": 85.04359673024523, + "grad_norm": 2.7356948852539062, + "learning_rate": 1.1504609309062865e-06, + "loss": 0.0315, + "step": 31211 + }, + { + "epoch": 85.04632152588556, + "grad_norm": 3.503849744796753, + "learning_rate": 1.1500500064774468e-06, + "loss": 0.077, + "step": 31212 + }, + { + "epoch": 85.04904632152588, + "grad_norm": 2.7946083545684814, + "learning_rate": 1.149639150971731e-06, + "loss": 0.0604, + "step": 31213 + }, + { + "epoch": 85.05177111716621, + "grad_norm": 2.3161447048187256, + "learning_rate": 1.149228364392343e-06, + "loss": 0.0505, + "step": 31214 + }, + { + "epoch": 85.05449591280654, + "grad_norm": 2.6644997596740723, + "learning_rate": 1.1488176467424783e-06, + "loss": 0.0559, + "step": 31215 + }, + { + "epoch": 85.05722070844686, + "grad_norm": 2.237291097640991, + "learning_rate": 1.1484069980253365e-06, + "loss": 0.0398, + "step": 31216 + }, + { + "epoch": 85.0599455040872, + "grad_norm": 2.0043485164642334, + "learning_rate": 1.1479964182441172e-06, + "loss": 0.1298, + "step": 31217 + }, + { + "epoch": 85.06267029972751, + "grad_norm": 2.936828851699829, + "learning_rate": 1.147585907402018e-06, + "loss": 0.0819, + "step": 31218 + }, + { + "epoch": 85.06539509536785, + "grad_norm": 2.717475652694702, + "learning_rate": 1.1471754655022338e-06, + "loss": 0.144, + "step": 31219 + }, + { + "epoch": 85.06811989100818, + "grad_norm": 2.3554444313049316, + "learning_rate": 1.14676509254796e-06, + "loss": 0.0378, + "step": 31220 + }, + { + "epoch": 85.0708446866485, + "grad_norm": 1.8457690477371216, + "learning_rate": 1.1463547885423953e-06, + "loss": 0.0201, + "step": 31221 + }, + { + "epoch": 85.07356948228883, + "grad_norm": 3.1834592819213867, + "learning_rate": 1.145944553488736e-06, + "loss": 0.2402, + "step": 31222 + }, + { + "epoch": 85.07629427792915, + "grad_norm": 2.8990871906280518, + "learning_rate": 1.1455343873901758e-06, + "loss": 0.1426, + "step": 31223 + }, + { + "epoch": 85.07901907356948, + "grad_norm": 2.236565113067627, + "learning_rate": 1.1451242902499093e-06, + "loss": 0.1035, + "step": 31224 + }, + { + "epoch": 85.0817438692098, + "grad_norm": 2.261110544204712, + "learning_rate": 1.1447142620711282e-06, + "loss": 0.0701, + "step": 31225 + }, + { + "epoch": 85.08446866485014, + "grad_norm": 2.307209014892578, + "learning_rate": 1.1443043028570277e-06, + "loss": 0.1181, + "step": 31226 + }, + { + "epoch": 85.08719346049047, + "grad_norm": 1.7935295104980469, + "learning_rate": 1.143894412610802e-06, + "loss": 0.0445, + "step": 31227 + }, + { + "epoch": 85.08991825613079, + "grad_norm": 2.47874116897583, + "learning_rate": 1.1434845913356407e-06, + "loss": 0.0458, + "step": 31228 + }, + { + "epoch": 85.09264305177112, + "grad_norm": 3.583185911178589, + "learning_rate": 1.1430748390347345e-06, + "loss": 0.0691, + "step": 31229 + }, + { + "epoch": 85.09536784741144, + "grad_norm": 2.242398262023926, + "learning_rate": 1.142665155711279e-06, + "loss": 0.03, + "step": 31230 + }, + { + "epoch": 85.09809264305177, + "grad_norm": 1.7714391946792603, + "learning_rate": 1.142255541368461e-06, + "loss": 0.03, + "step": 31231 + }, + { + "epoch": 85.1008174386921, + "grad_norm": 3.1620378494262695, + "learning_rate": 1.141845996009472e-06, + "loss": 0.1696, + "step": 31232 + }, + { + "epoch": 85.10354223433242, + "grad_norm": 7.280642986297607, + "learning_rate": 1.1414365196374999e-06, + "loss": 0.0847, + "step": 31233 + }, + { + "epoch": 85.10626702997276, + "grad_norm": 2.3759689331054688, + "learning_rate": 1.141027112255737e-06, + "loss": 0.026, + "step": 31234 + }, + { + "epoch": 85.10899182561307, + "grad_norm": 2.9072611331939697, + "learning_rate": 1.1406177738673697e-06, + "loss": 0.0734, + "step": 31235 + }, + { + "epoch": 85.11171662125341, + "grad_norm": 2.286513328552246, + "learning_rate": 1.1402085044755862e-06, + "loss": 0.0255, + "step": 31236 + }, + { + "epoch": 85.11444141689373, + "grad_norm": 3.010617733001709, + "learning_rate": 1.139799304083571e-06, + "loss": 0.0982, + "step": 31237 + }, + { + "epoch": 85.11716621253406, + "grad_norm": 2.5518136024475098, + "learning_rate": 1.1393901726945145e-06, + "loss": 0.0519, + "step": 31238 + }, + { + "epoch": 85.11989100817439, + "grad_norm": 2.2859580516815186, + "learning_rate": 1.1389811103116032e-06, + "loss": 0.047, + "step": 31239 + }, + { + "epoch": 85.12261580381471, + "grad_norm": 2.7176449298858643, + "learning_rate": 1.1385721169380226e-06, + "loss": 0.1465, + "step": 31240 + }, + { + "epoch": 85.12534059945504, + "grad_norm": 2.257220983505249, + "learning_rate": 1.1381631925769555e-06, + "loss": 0.0256, + "step": 31241 + }, + { + "epoch": 85.12806539509536, + "grad_norm": 2.7775049209594727, + "learning_rate": 1.1377543372315892e-06, + "loss": 0.1032, + "step": 31242 + }, + { + "epoch": 85.1307901907357, + "grad_norm": 2.5805413722991943, + "learning_rate": 1.1373455509051078e-06, + "loss": 0.0284, + "step": 31243 + }, + { + "epoch": 85.13351498637603, + "grad_norm": 2.0446224212646484, + "learning_rate": 1.1369368336006937e-06, + "loss": 0.0316, + "step": 31244 + }, + { + "epoch": 85.13623978201635, + "grad_norm": 3.1809558868408203, + "learning_rate": 1.136528185321528e-06, + "loss": 0.1657, + "step": 31245 + }, + { + "epoch": 85.13896457765668, + "grad_norm": 2.5956246852874756, + "learning_rate": 1.136119606070798e-06, + "loss": 0.0262, + "step": 31246 + }, + { + "epoch": 85.141689373297, + "grad_norm": 2.1996331214904785, + "learning_rate": 1.1357110958516826e-06, + "loss": 0.0258, + "step": 31247 + }, + { + "epoch": 85.14441416893733, + "grad_norm": 1.5208231210708618, + "learning_rate": 1.135302654667364e-06, + "loss": 0.1075, + "step": 31248 + }, + { + "epoch": 85.14713896457765, + "grad_norm": 2.095036029815674, + "learning_rate": 1.1348942825210218e-06, + "loss": 0.0305, + "step": 31249 + }, + { + "epoch": 85.14986376021798, + "grad_norm": 3.0639026165008545, + "learning_rate": 1.1344859794158391e-06, + "loss": 0.2263, + "step": 31250 + }, + { + "epoch": 85.15258855585832, + "grad_norm": 2.629934549331665, + "learning_rate": 1.1340777453549944e-06, + "loss": 0.0828, + "step": 31251 + }, + { + "epoch": 85.15531335149863, + "grad_norm": 2.574131488800049, + "learning_rate": 1.1336695803416664e-06, + "loss": 0.0454, + "step": 31252 + }, + { + "epoch": 85.15803814713897, + "grad_norm": 2.7287404537200928, + "learning_rate": 1.1332614843790325e-06, + "loss": 0.0228, + "step": 31253 + }, + { + "epoch": 85.16076294277929, + "grad_norm": 2.968825101852417, + "learning_rate": 1.1328534574702755e-06, + "loss": 0.106, + "step": 31254 + }, + { + "epoch": 85.16348773841962, + "grad_norm": 2.069678544998169, + "learning_rate": 1.1324454996185673e-06, + "loss": 0.0744, + "step": 31255 + }, + { + "epoch": 85.16621253405995, + "grad_norm": 2.4735465049743652, + "learning_rate": 1.1320376108270904e-06, + "loss": 0.0351, + "step": 31256 + }, + { + "epoch": 85.16893732970027, + "grad_norm": 6.014044761657715, + "learning_rate": 1.1316297910990203e-06, + "loss": 0.0474, + "step": 31257 + }, + { + "epoch": 85.1716621253406, + "grad_norm": 2.1581010818481445, + "learning_rate": 1.1312220404375285e-06, + "loss": 0.0285, + "step": 31258 + }, + { + "epoch": 85.17438692098092, + "grad_norm": 3.769885540008545, + "learning_rate": 1.1308143588457965e-06, + "loss": 0.1763, + "step": 31259 + }, + { + "epoch": 85.17711171662125, + "grad_norm": 3.3707964420318604, + "learning_rate": 1.1304067463269974e-06, + "loss": 0.071, + "step": 31260 + }, + { + "epoch": 85.17983651226157, + "grad_norm": 6.158848762512207, + "learning_rate": 1.129999202884302e-06, + "loss": 0.0274, + "step": 31261 + }, + { + "epoch": 85.1825613079019, + "grad_norm": 2.6891701221466064, + "learning_rate": 1.1295917285208901e-06, + "loss": 0.0343, + "step": 31262 + }, + { + "epoch": 85.18528610354224, + "grad_norm": 2.750530481338501, + "learning_rate": 1.1291843232399324e-06, + "loss": 0.0407, + "step": 31263 + }, + { + "epoch": 85.18801089918256, + "grad_norm": 2.945326328277588, + "learning_rate": 1.128776987044602e-06, + "loss": 0.0627, + "step": 31264 + }, + { + "epoch": 85.19073569482289, + "grad_norm": 78.27469635009766, + "learning_rate": 1.1283697199380683e-06, + "loss": 0.0397, + "step": 31265 + }, + { + "epoch": 85.19346049046321, + "grad_norm": 2.988227367401123, + "learning_rate": 1.1279625219235068e-06, + "loss": 0.1306, + "step": 31266 + }, + { + "epoch": 85.19618528610354, + "grad_norm": 2.2063028812408447, + "learning_rate": 1.1275553930040894e-06, + "loss": 0.0306, + "step": 31267 + }, + { + "epoch": 85.19891008174388, + "grad_norm": 3.1017582416534424, + "learning_rate": 1.1271483331829835e-06, + "loss": 0.0246, + "step": 31268 + }, + { + "epoch": 85.2016348773842, + "grad_norm": 3.0398337841033936, + "learning_rate": 1.12674134246336e-06, + "loss": 0.0315, + "step": 31269 + }, + { + "epoch": 85.20435967302453, + "grad_norm": 3.5283937454223633, + "learning_rate": 1.1263344208483906e-06, + "loss": 0.097, + "step": 31270 + }, + { + "epoch": 85.20708446866485, + "grad_norm": 2.1142489910125732, + "learning_rate": 1.125927568341244e-06, + "loss": 0.024, + "step": 31271 + }, + { + "epoch": 85.20980926430518, + "grad_norm": 2.6907687187194824, + "learning_rate": 1.1255207849450845e-06, + "loss": 0.0297, + "step": 31272 + }, + { + "epoch": 85.2125340599455, + "grad_norm": 1.589200496673584, + "learning_rate": 1.125114070663087e-06, + "loss": 0.0723, + "step": 31273 + }, + { + "epoch": 85.21525885558583, + "grad_norm": 1.5391526222229004, + "learning_rate": 1.1247074254984126e-06, + "loss": 0.0222, + "step": 31274 + }, + { + "epoch": 85.21798365122616, + "grad_norm": 2.298555374145508, + "learning_rate": 1.1243008494542328e-06, + "loss": 0.0267, + "step": 31275 + }, + { + "epoch": 85.22070844686648, + "grad_norm": 3.090374231338501, + "learning_rate": 1.1238943425337135e-06, + "loss": 0.0399, + "step": 31276 + }, + { + "epoch": 85.22343324250681, + "grad_norm": 1.9240354299545288, + "learning_rate": 1.1234879047400183e-06, + "loss": 0.1801, + "step": 31277 + }, + { + "epoch": 85.22615803814713, + "grad_norm": 2.856506586074829, + "learning_rate": 1.1230815360763126e-06, + "loss": 0.0693, + "step": 31278 + }, + { + "epoch": 85.22888283378747, + "grad_norm": 1.5447888374328613, + "learning_rate": 1.1226752365457626e-06, + "loss": 0.0196, + "step": 31279 + }, + { + "epoch": 85.2316076294278, + "grad_norm": 2.7791478633880615, + "learning_rate": 1.122269006151534e-06, + "loss": 0.064, + "step": 31280 + }, + { + "epoch": 85.23433242506812, + "grad_norm": 1.721009612083435, + "learning_rate": 1.121862844896786e-06, + "loss": 0.0385, + "step": 31281 + }, + { + "epoch": 85.23705722070845, + "grad_norm": 2.0161871910095215, + "learning_rate": 1.1214567527846854e-06, + "loss": 0.1422, + "step": 31282 + }, + { + "epoch": 85.23978201634877, + "grad_norm": 4.117589950561523, + "learning_rate": 1.1210507298183948e-06, + "loss": 0.0613, + "step": 31283 + }, + { + "epoch": 85.2425068119891, + "grad_norm": 2.8080499172210693, + "learning_rate": 1.1206447760010752e-06, + "loss": 0.1205, + "step": 31284 + }, + { + "epoch": 85.24523160762942, + "grad_norm": 2.301487445831299, + "learning_rate": 1.1202388913358863e-06, + "loss": 0.0329, + "step": 31285 + }, + { + "epoch": 85.24795640326975, + "grad_norm": 2.305171012878418, + "learning_rate": 1.1198330758259934e-06, + "loss": 0.0531, + "step": 31286 + }, + { + "epoch": 85.25068119891009, + "grad_norm": 2.888373374938965, + "learning_rate": 1.119427329474555e-06, + "loss": 0.0626, + "step": 31287 + }, + { + "epoch": 85.2534059945504, + "grad_norm": 3.4480016231536865, + "learning_rate": 1.1190216522847297e-06, + "loss": 0.072, + "step": 31288 + }, + { + "epoch": 85.25613079019074, + "grad_norm": 2.151869058609009, + "learning_rate": 1.118616044259676e-06, + "loss": 0.0673, + "step": 31289 + }, + { + "epoch": 85.25885558583106, + "grad_norm": 1.628497838973999, + "learning_rate": 1.118210505402556e-06, + "loss": 0.0487, + "step": 31290 + }, + { + "epoch": 85.26158038147139, + "grad_norm": 1.705924391746521, + "learning_rate": 1.117805035716527e-06, + "loss": 0.0278, + "step": 31291 + }, + { + "epoch": 85.26430517711172, + "grad_norm": 1.645024061203003, + "learning_rate": 1.117399635204748e-06, + "loss": 0.0268, + "step": 31292 + }, + { + "epoch": 85.26702997275204, + "grad_norm": 2.6714820861816406, + "learning_rate": 1.1169943038703734e-06, + "loss": 0.0263, + "step": 31293 + }, + { + "epoch": 85.26975476839237, + "grad_norm": 1.848447322845459, + "learning_rate": 1.1165890417165604e-06, + "loss": 0.0193, + "step": 31294 + }, + { + "epoch": 85.2724795640327, + "grad_norm": 2.722369909286499, + "learning_rate": 1.1161838487464682e-06, + "loss": 0.0359, + "step": 31295 + }, + { + "epoch": 85.27520435967303, + "grad_norm": 2.494370460510254, + "learning_rate": 1.115778724963249e-06, + "loss": 0.0701, + "step": 31296 + }, + { + "epoch": 85.27792915531334, + "grad_norm": 2.0855612754821777, + "learning_rate": 1.1153736703700602e-06, + "loss": 0.0211, + "step": 31297 + }, + { + "epoch": 85.28065395095368, + "grad_norm": 1.9474340677261353, + "learning_rate": 1.1149686849700524e-06, + "loss": 0.0343, + "step": 31298 + }, + { + "epoch": 85.28337874659401, + "grad_norm": 3.5660603046417236, + "learning_rate": 1.1145637687663856e-06, + "loss": 0.0623, + "step": 31299 + }, + { + "epoch": 85.28610354223433, + "grad_norm": 1.9984091520309448, + "learning_rate": 1.1141589217622096e-06, + "loss": 0.0208, + "step": 31300 + }, + { + "epoch": 85.28882833787466, + "grad_norm": 2.32194447517395, + "learning_rate": 1.1137541439606781e-06, + "loss": 0.1028, + "step": 31301 + }, + { + "epoch": 85.29155313351498, + "grad_norm": 2.6686768531799316, + "learning_rate": 1.113349435364941e-06, + "loss": 0.0389, + "step": 31302 + }, + { + "epoch": 85.29427792915531, + "grad_norm": 2.5307862758636475, + "learning_rate": 1.1129447959781546e-06, + "loss": 0.0249, + "step": 31303 + }, + { + "epoch": 85.29700272479565, + "grad_norm": 3.1726667881011963, + "learning_rate": 1.112540225803468e-06, + "loss": 0.0769, + "step": 31304 + }, + { + "epoch": 85.29972752043597, + "grad_norm": 2.270932197570801, + "learning_rate": 1.1121357248440301e-06, + "loss": 0.0247, + "step": 31305 + }, + { + "epoch": 85.3024523160763, + "grad_norm": 1.6723506450653076, + "learning_rate": 1.1117312931029933e-06, + "loss": 0.0177, + "step": 31306 + }, + { + "epoch": 85.30517711171662, + "grad_norm": 2.499312400817871, + "learning_rate": 1.1113269305835095e-06, + "loss": 0.1686, + "step": 31307 + }, + { + "epoch": 85.30790190735695, + "grad_norm": 1.9165818691253662, + "learning_rate": 1.110922637288725e-06, + "loss": 0.024, + "step": 31308 + }, + { + "epoch": 85.31062670299727, + "grad_norm": 3.382559299468994, + "learning_rate": 1.1105184132217894e-06, + "loss": 0.0561, + "step": 31309 + }, + { + "epoch": 85.3133514986376, + "grad_norm": 3.5681657791137695, + "learning_rate": 1.110114258385847e-06, + "loss": 0.144, + "step": 31310 + }, + { + "epoch": 85.31607629427793, + "grad_norm": 2.3098039627075195, + "learning_rate": 1.109710172784052e-06, + "loss": 0.0869, + "step": 31311 + }, + { + "epoch": 85.31880108991825, + "grad_norm": 5.275523662567139, + "learning_rate": 1.1093061564195473e-06, + "loss": 0.2314, + "step": 31312 + }, + { + "epoch": 85.32152588555859, + "grad_norm": 2.3177170753479004, + "learning_rate": 1.1089022092954804e-06, + "loss": 0.0722, + "step": 31313 + }, + { + "epoch": 85.3242506811989, + "grad_norm": 4.753061771392822, + "learning_rate": 1.1084983314149956e-06, + "loss": 0.0399, + "step": 31314 + }, + { + "epoch": 85.32697547683924, + "grad_norm": 2.071126937866211, + "learning_rate": 1.1080945227812401e-06, + "loss": 0.0317, + "step": 31315 + }, + { + "epoch": 85.32970027247957, + "grad_norm": 1.5893691778182983, + "learning_rate": 1.1076907833973594e-06, + "loss": 0.0224, + "step": 31316 + }, + { + "epoch": 85.33242506811989, + "grad_norm": 3.2053310871124268, + "learning_rate": 1.1072871132664964e-06, + "loss": 0.0321, + "step": 31317 + }, + { + "epoch": 85.33514986376022, + "grad_norm": 2.5301358699798584, + "learning_rate": 1.1068835123917932e-06, + "loss": 0.0318, + "step": 31318 + }, + { + "epoch": 85.33787465940054, + "grad_norm": 2.5551259517669678, + "learning_rate": 1.106479980776397e-06, + "loss": 0.0998, + "step": 31319 + }, + { + "epoch": 85.34059945504087, + "grad_norm": 2.8790533542633057, + "learning_rate": 1.106076518423449e-06, + "loss": 0.0703, + "step": 31320 + }, + { + "epoch": 85.34332425068119, + "grad_norm": 2.3201816082000732, + "learning_rate": 1.1056731253360896e-06, + "loss": 0.036, + "step": 31321 + }, + { + "epoch": 85.34604904632153, + "grad_norm": 2.061262845993042, + "learning_rate": 1.1052698015174601e-06, + "loss": 0.0563, + "step": 31322 + }, + { + "epoch": 85.34877384196186, + "grad_norm": 3.3432466983795166, + "learning_rate": 1.1048665469707055e-06, + "loss": 0.1288, + "step": 31323 + }, + { + "epoch": 85.35149863760218, + "grad_norm": 3.4909512996673584, + "learning_rate": 1.104463361698962e-06, + "loss": 0.0766, + "step": 31324 + }, + { + "epoch": 85.35422343324251, + "grad_norm": 2.3487298488616943, + "learning_rate": 1.1040602457053729e-06, + "loss": 0.0624, + "step": 31325 + }, + { + "epoch": 85.35694822888283, + "grad_norm": 2.2828550338745117, + "learning_rate": 1.1036571989930744e-06, + "loss": 0.0402, + "step": 31326 + }, + { + "epoch": 85.35967302452316, + "grad_norm": 3.2351059913635254, + "learning_rate": 1.1032542215652098e-06, + "loss": 0.1084, + "step": 31327 + }, + { + "epoch": 85.3623978201635, + "grad_norm": 1.4596086740493774, + "learning_rate": 1.1028513134249153e-06, + "loss": 0.0159, + "step": 31328 + }, + { + "epoch": 85.36512261580381, + "grad_norm": 1.4271363019943237, + "learning_rate": 1.1024484745753271e-06, + "loss": 0.0206, + "step": 31329 + }, + { + "epoch": 85.36784741144415, + "grad_norm": 1.773149847984314, + "learning_rate": 1.1020457050195833e-06, + "loss": 0.0202, + "step": 31330 + }, + { + "epoch": 85.37057220708446, + "grad_norm": 2.0291876792907715, + "learning_rate": 1.1016430047608218e-06, + "loss": 0.1331, + "step": 31331 + }, + { + "epoch": 85.3732970027248, + "grad_norm": 3.2120614051818848, + "learning_rate": 1.1012403738021793e-06, + "loss": 0.0467, + "step": 31332 + }, + { + "epoch": 85.37602179836512, + "grad_norm": 2.912571668624878, + "learning_rate": 1.10083781214679e-06, + "loss": 0.114, + "step": 31333 + }, + { + "epoch": 85.37874659400545, + "grad_norm": 2.736415386199951, + "learning_rate": 1.1004353197977869e-06, + "loss": 0.0289, + "step": 31334 + }, + { + "epoch": 85.38147138964578, + "grad_norm": 2.302786111831665, + "learning_rate": 1.1000328967583096e-06, + "loss": 0.0355, + "step": 31335 + }, + { + "epoch": 85.3841961852861, + "grad_norm": 3.136418104171753, + "learning_rate": 1.099630543031489e-06, + "loss": 0.1011, + "step": 31336 + }, + { + "epoch": 85.38692098092643, + "grad_norm": 2.4176077842712402, + "learning_rate": 1.0992282586204605e-06, + "loss": 0.023, + "step": 31337 + }, + { + "epoch": 85.38964577656675, + "grad_norm": 2.6242637634277344, + "learning_rate": 1.0988260435283526e-06, + "loss": 0.0296, + "step": 31338 + }, + { + "epoch": 85.39237057220708, + "grad_norm": 2.302511215209961, + "learning_rate": 1.098423897758304e-06, + "loss": 0.0217, + "step": 31339 + }, + { + "epoch": 85.39509536784742, + "grad_norm": 2.617093801498413, + "learning_rate": 1.098021821313443e-06, + "loss": 0.0621, + "step": 31340 + }, + { + "epoch": 85.39782016348774, + "grad_norm": 4.201938152313232, + "learning_rate": 1.0976198141968998e-06, + "loss": 0.0968, + "step": 31341 + }, + { + "epoch": 85.40054495912807, + "grad_norm": 2.8996481895446777, + "learning_rate": 1.097217876411808e-06, + "loss": 0.05, + "step": 31342 + }, + { + "epoch": 85.40326975476839, + "grad_norm": 5.1527557373046875, + "learning_rate": 1.0968160079612966e-06, + "loss": 0.1267, + "step": 31343 + }, + { + "epoch": 85.40599455040872, + "grad_norm": 2.3500819206237793, + "learning_rate": 1.0964142088484963e-06, + "loss": 0.0312, + "step": 31344 + }, + { + "epoch": 85.40871934604904, + "grad_norm": 2.4018545150756836, + "learning_rate": 1.0960124790765358e-06, + "loss": 0.0482, + "step": 31345 + }, + { + "epoch": 85.41144414168937, + "grad_norm": 3.214704751968384, + "learning_rate": 1.0956108186485414e-06, + "loss": 0.0484, + "step": 31346 + }, + { + "epoch": 85.4141689373297, + "grad_norm": 2.7772579193115234, + "learning_rate": 1.0952092275676461e-06, + "loss": 0.1192, + "step": 31347 + }, + { + "epoch": 85.41689373297002, + "grad_norm": 9.122698783874512, + "learning_rate": 1.0948077058369744e-06, + "loss": 0.0257, + "step": 31348 + }, + { + "epoch": 85.41961852861036, + "grad_norm": 2.5185344219207764, + "learning_rate": 1.0944062534596534e-06, + "loss": 0.0297, + "step": 31349 + }, + { + "epoch": 85.42234332425068, + "grad_norm": 2.5750045776367188, + "learning_rate": 1.0940048704388085e-06, + "loss": 0.1198, + "step": 31350 + }, + { + "epoch": 85.42506811989101, + "grad_norm": 2.800236701965332, + "learning_rate": 1.0936035567775682e-06, + "loss": 0.0509, + "step": 31351 + }, + { + "epoch": 85.42779291553134, + "grad_norm": 3.1607398986816406, + "learning_rate": 1.093202312479057e-06, + "loss": 0.0387, + "step": 31352 + }, + { + "epoch": 85.43051771117166, + "grad_norm": 3.0872299671173096, + "learning_rate": 1.0928011375464e-06, + "loss": 0.0855, + "step": 31353 + }, + { + "epoch": 85.433242506812, + "grad_norm": 4.9866766929626465, + "learning_rate": 1.0924000319827189e-06, + "loss": 0.0336, + "step": 31354 + }, + { + "epoch": 85.43596730245231, + "grad_norm": 2.2867190837860107, + "learning_rate": 1.0919989957911414e-06, + "loss": 0.093, + "step": 31355 + }, + { + "epoch": 85.43869209809264, + "grad_norm": 2.031414270401001, + "learning_rate": 1.0915980289747885e-06, + "loss": 0.1001, + "step": 31356 + }, + { + "epoch": 85.44141689373296, + "grad_norm": 3.1889355182647705, + "learning_rate": 1.0911971315367842e-06, + "loss": 0.0287, + "step": 31357 + }, + { + "epoch": 85.4441416893733, + "grad_norm": 1.4479886293411255, + "learning_rate": 1.0907963034802472e-06, + "loss": 0.0231, + "step": 31358 + }, + { + "epoch": 85.44686648501363, + "grad_norm": 2.1521711349487305, + "learning_rate": 1.0903955448083025e-06, + "loss": 0.0507, + "step": 31359 + }, + { + "epoch": 85.44959128065395, + "grad_norm": 2.2834932804107666, + "learning_rate": 1.0899948555240724e-06, + "loss": 0.0745, + "step": 31360 + }, + { + "epoch": 85.45231607629428, + "grad_norm": 3.421525239944458, + "learning_rate": 1.0895942356306754e-06, + "loss": 0.0495, + "step": 31361 + }, + { + "epoch": 85.4550408719346, + "grad_norm": 3.9137887954711914, + "learning_rate": 1.0891936851312325e-06, + "loss": 0.0602, + "step": 31362 + }, + { + "epoch": 85.45776566757493, + "grad_norm": 2.5682373046875, + "learning_rate": 1.0887932040288597e-06, + "loss": 0.0656, + "step": 31363 + }, + { + "epoch": 85.46049046321527, + "grad_norm": 2.6598455905914307, + "learning_rate": 1.0883927923266813e-06, + "loss": 0.1311, + "step": 31364 + }, + { + "epoch": 85.46321525885558, + "grad_norm": 2.747976541519165, + "learning_rate": 1.0879924500278116e-06, + "loss": 0.0326, + "step": 31365 + }, + { + "epoch": 85.46594005449592, + "grad_norm": 1.0858652591705322, + "learning_rate": 1.0875921771353714e-06, + "loss": 0.0143, + "step": 31366 + }, + { + "epoch": 85.46866485013624, + "grad_norm": 5.205644607543945, + "learning_rate": 1.0871919736524739e-06, + "loss": 0.0232, + "step": 31367 + }, + { + "epoch": 85.47138964577657, + "grad_norm": 2.80965256690979, + "learning_rate": 1.0867918395822397e-06, + "loss": 0.0311, + "step": 31368 + }, + { + "epoch": 85.47411444141689, + "grad_norm": 1.7131377458572388, + "learning_rate": 1.0863917749277852e-06, + "loss": 0.1043, + "step": 31369 + }, + { + "epoch": 85.47683923705722, + "grad_norm": 2.595020055770874, + "learning_rate": 1.0859917796922216e-06, + "loss": 0.0878, + "step": 31370 + }, + { + "epoch": 85.47956403269755, + "grad_norm": 1.2756234407424927, + "learning_rate": 1.0855918538786692e-06, + "loss": 0.0158, + "step": 31371 + }, + { + "epoch": 85.48228882833787, + "grad_norm": 2.4362616539001465, + "learning_rate": 1.0851919974902403e-06, + "loss": 0.027, + "step": 31372 + }, + { + "epoch": 85.4850136239782, + "grad_norm": 5.21702241897583, + "learning_rate": 1.0847922105300502e-06, + "loss": 0.0666, + "step": 31373 + }, + { + "epoch": 85.48773841961852, + "grad_norm": 2.4590508937835693, + "learning_rate": 1.0843924930012084e-06, + "loss": 0.1561, + "step": 31374 + }, + { + "epoch": 85.49046321525886, + "grad_norm": 2.4573071002960205, + "learning_rate": 1.0839928449068316e-06, + "loss": 0.0404, + "step": 31375 + }, + { + "epoch": 85.49318801089919, + "grad_norm": 4.320873737335205, + "learning_rate": 1.0835932662500338e-06, + "loss": 0.0459, + "step": 31376 + }, + { + "epoch": 85.49591280653951, + "grad_norm": 2.13910174369812, + "learning_rate": 1.0831937570339247e-06, + "loss": 0.0344, + "step": 31377 + }, + { + "epoch": 85.49863760217984, + "grad_norm": 2.389197826385498, + "learning_rate": 1.082794317261615e-06, + "loss": 0.0988, + "step": 31378 + }, + { + "epoch": 85.50136239782016, + "grad_norm": 2.4774317741394043, + "learning_rate": 1.0823949469362138e-06, + "loss": 0.1, + "step": 31379 + }, + { + "epoch": 85.50408719346049, + "grad_norm": 2.9944775104522705, + "learning_rate": 1.081995646060836e-06, + "loss": 0.041, + "step": 31380 + }, + { + "epoch": 85.50681198910081, + "grad_norm": 4.310959339141846, + "learning_rate": 1.0815964146385894e-06, + "loss": 0.0392, + "step": 31381 + }, + { + "epoch": 85.50953678474114, + "grad_norm": 2.6893749237060547, + "learning_rate": 1.0811972526725834e-06, + "loss": 0.0374, + "step": 31382 + }, + { + "epoch": 85.51226158038148, + "grad_norm": 2.7266385555267334, + "learning_rate": 1.0807981601659234e-06, + "loss": 0.0927, + "step": 31383 + }, + { + "epoch": 85.5149863760218, + "grad_norm": 2.57831072807312, + "learning_rate": 1.0803991371217227e-06, + "loss": 0.0374, + "step": 31384 + }, + { + "epoch": 85.51771117166213, + "grad_norm": 5.09738302230835, + "learning_rate": 1.0800001835430861e-06, + "loss": 0.0845, + "step": 31385 + }, + { + "epoch": 85.52043596730245, + "grad_norm": 2.6946308612823486, + "learning_rate": 1.0796012994331207e-06, + "loss": 0.0717, + "step": 31386 + }, + { + "epoch": 85.52316076294278, + "grad_norm": 2.0716943740844727, + "learning_rate": 1.0792024847949323e-06, + "loss": 0.0296, + "step": 31387 + }, + { + "epoch": 85.52588555858311, + "grad_norm": 2.4201676845550537, + "learning_rate": 1.0788037396316287e-06, + "loss": 0.0241, + "step": 31388 + }, + { + "epoch": 85.52861035422343, + "grad_norm": 2.9360971450805664, + "learning_rate": 1.0784050639463151e-06, + "loss": 0.0445, + "step": 31389 + }, + { + "epoch": 85.53133514986376, + "grad_norm": 2.013364791870117, + "learning_rate": 1.0780064577420935e-06, + "loss": 0.0189, + "step": 31390 + }, + { + "epoch": 85.53405994550408, + "grad_norm": 3.436640977859497, + "learning_rate": 1.0776079210220725e-06, + "loss": 0.1096, + "step": 31391 + }, + { + "epoch": 85.53678474114442, + "grad_norm": 2.0758986473083496, + "learning_rate": 1.0772094537893518e-06, + "loss": 0.0638, + "step": 31392 + }, + { + "epoch": 85.53950953678473, + "grad_norm": 4.707724094390869, + "learning_rate": 1.076811056047039e-06, + "loss": 0.0671, + "step": 31393 + }, + { + "epoch": 85.54223433242507, + "grad_norm": 2.8454244136810303, + "learning_rate": 1.076412727798234e-06, + "loss": 0.1167, + "step": 31394 + }, + { + "epoch": 85.5449591280654, + "grad_norm": 2.417797565460205, + "learning_rate": 1.0760144690460384e-06, + "loss": 0.0767, + "step": 31395 + }, + { + "epoch": 85.54768392370572, + "grad_norm": 1.9386225938796997, + "learning_rate": 1.0756162797935555e-06, + "loss": 0.1134, + "step": 31396 + }, + { + "epoch": 85.55040871934605, + "grad_norm": 2.14420485496521, + "learning_rate": 1.0752181600438872e-06, + "loss": 0.2065, + "step": 31397 + }, + { + "epoch": 85.55313351498637, + "grad_norm": 2.394150733947754, + "learning_rate": 1.0748201098001322e-06, + "loss": 0.0452, + "step": 31398 + }, + { + "epoch": 85.5558583106267, + "grad_norm": 2.4033522605895996, + "learning_rate": 1.0744221290653877e-06, + "loss": 0.1661, + "step": 31399 + }, + { + "epoch": 85.55858310626704, + "grad_norm": 2.9644079208374023, + "learning_rate": 1.0740242178427595e-06, + "loss": 0.028, + "step": 31400 + }, + { + "epoch": 85.56130790190736, + "grad_norm": 2.385225534439087, + "learning_rate": 1.0736263761353437e-06, + "loss": 0.1234, + "step": 31401 + }, + { + "epoch": 85.56403269754769, + "grad_norm": 3.1157336235046387, + "learning_rate": 1.0732286039462381e-06, + "loss": 0.1483, + "step": 31402 + }, + { + "epoch": 85.566757493188, + "grad_norm": 1.2751082181930542, + "learning_rate": 1.0728309012785386e-06, + "loss": 0.0175, + "step": 31403 + }, + { + "epoch": 85.56948228882834, + "grad_norm": 2.8085267543792725, + "learning_rate": 1.0724332681353466e-06, + "loss": 0.0617, + "step": 31404 + }, + { + "epoch": 85.57220708446866, + "grad_norm": 3.7019472122192383, + "learning_rate": 1.0720357045197572e-06, + "loss": 0.0338, + "step": 31405 + }, + { + "epoch": 85.57493188010899, + "grad_norm": 2.4826486110687256, + "learning_rate": 1.0716382104348667e-06, + "loss": 0.0442, + "step": 31406 + }, + { + "epoch": 85.57765667574932, + "grad_norm": 4.046591758728027, + "learning_rate": 1.0712407858837682e-06, + "loss": 0.0831, + "step": 31407 + }, + { + "epoch": 85.58038147138964, + "grad_norm": 5.646476745605469, + "learning_rate": 1.0708434308695604e-06, + "loss": 0.0908, + "step": 31408 + }, + { + "epoch": 85.58310626702998, + "grad_norm": 3.560476064682007, + "learning_rate": 1.0704461453953373e-06, + "loss": 0.0964, + "step": 31409 + }, + { + "epoch": 85.5858310626703, + "grad_norm": 2.3625431060791016, + "learning_rate": 1.0700489294641902e-06, + "loss": 0.0346, + "step": 31410 + }, + { + "epoch": 85.58855585831063, + "grad_norm": 2.201275587081909, + "learning_rate": 1.0696517830792141e-06, + "loss": 0.0345, + "step": 31411 + }, + { + "epoch": 85.59128065395096, + "grad_norm": 2.2521026134490967, + "learning_rate": 1.0692547062435056e-06, + "loss": 0.0264, + "step": 31412 + }, + { + "epoch": 85.59400544959128, + "grad_norm": 2.509371519088745, + "learning_rate": 1.0688576989601528e-06, + "loss": 0.058, + "step": 31413 + }, + { + "epoch": 85.59673024523161, + "grad_norm": 2.8696141242980957, + "learning_rate": 1.0684607612322495e-06, + "loss": 0.0323, + "step": 31414 + }, + { + "epoch": 85.59945504087193, + "grad_norm": 2.570969581604004, + "learning_rate": 1.068063893062884e-06, + "loss": 0.0933, + "step": 31415 + }, + { + "epoch": 85.60217983651226, + "grad_norm": 1.7264670133590698, + "learning_rate": 1.0676670944551515e-06, + "loss": 0.043, + "step": 31416 + }, + { + "epoch": 85.60490463215258, + "grad_norm": 6.297112941741943, + "learning_rate": 1.0672703654121407e-06, + "loss": 0.1358, + "step": 31417 + }, + { + "epoch": 85.60762942779292, + "grad_norm": 2.092822790145874, + "learning_rate": 1.0668737059369405e-06, + "loss": 0.0234, + "step": 31418 + }, + { + "epoch": 85.61035422343325, + "grad_norm": 3.4409234523773193, + "learning_rate": 1.0664771160326382e-06, + "loss": 0.0609, + "step": 31419 + }, + { + "epoch": 85.61307901907357, + "grad_norm": 2.049858808517456, + "learning_rate": 1.0660805957023268e-06, + "loss": 0.0202, + "step": 31420 + }, + { + "epoch": 85.6158038147139, + "grad_norm": 2.0648813247680664, + "learning_rate": 1.0656841449490918e-06, + "loss": 0.0257, + "step": 31421 + }, + { + "epoch": 85.61852861035422, + "grad_norm": 1.8562856912612915, + "learning_rate": 1.0652877637760217e-06, + "loss": 0.0251, + "step": 31422 + }, + { + "epoch": 85.62125340599455, + "grad_norm": 3.5806736946105957, + "learning_rate": 1.0648914521862008e-06, + "loss": 0.03, + "step": 31423 + }, + { + "epoch": 85.62397820163488, + "grad_norm": 3.132786273956299, + "learning_rate": 1.064495210182719e-06, + "loss": 0.0504, + "step": 31424 + }, + { + "epoch": 85.6267029972752, + "grad_norm": 2.8375136852264404, + "learning_rate": 1.0640990377686611e-06, + "loss": 0.0466, + "step": 31425 + }, + { + "epoch": 85.62942779291554, + "grad_norm": 2.8802056312561035, + "learning_rate": 1.0637029349471128e-06, + "loss": 0.0393, + "step": 31426 + }, + { + "epoch": 85.63215258855585, + "grad_norm": 2.7082021236419678, + "learning_rate": 1.0633069017211562e-06, + "loss": 0.0581, + "step": 31427 + }, + { + "epoch": 85.63487738419619, + "grad_norm": 2.3465468883514404, + "learning_rate": 1.0629109380938785e-06, + "loss": 0.0419, + "step": 31428 + }, + { + "epoch": 85.6376021798365, + "grad_norm": 3.680985927581787, + "learning_rate": 1.062515044068364e-06, + "loss": 0.0239, + "step": 31429 + }, + { + "epoch": 85.64032697547684, + "grad_norm": 4.25960636138916, + "learning_rate": 1.0621192196476949e-06, + "loss": 0.0475, + "step": 31430 + }, + { + "epoch": 85.64305177111717, + "grad_norm": 2.498424530029297, + "learning_rate": 1.0617234648349506e-06, + "loss": 0.0728, + "step": 31431 + }, + { + "epoch": 85.64577656675749, + "grad_norm": 3.0986287593841553, + "learning_rate": 1.06132777963322e-06, + "loss": 0.096, + "step": 31432 + }, + { + "epoch": 85.64850136239782, + "grad_norm": 2.214416265487671, + "learning_rate": 1.0609321640455793e-06, + "loss": 0.0566, + "step": 31433 + }, + { + "epoch": 85.65122615803814, + "grad_norm": 1.5452136993408203, + "learning_rate": 1.060536618075113e-06, + "loss": 0.0215, + "step": 31434 + }, + { + "epoch": 85.65395095367847, + "grad_norm": 4.361598014831543, + "learning_rate": 1.0601411417248964e-06, + "loss": 0.0395, + "step": 31435 + }, + { + "epoch": 85.65667574931881, + "grad_norm": 3.358471393585205, + "learning_rate": 1.0597457349980156e-06, + "loss": 0.0562, + "step": 31436 + }, + { + "epoch": 85.65940054495913, + "grad_norm": 2.2020375728607178, + "learning_rate": 1.0593503978975472e-06, + "loss": 0.0899, + "step": 31437 + }, + { + "epoch": 85.66212534059946, + "grad_norm": 3.1154308319091797, + "learning_rate": 1.05895513042657e-06, + "loss": 0.0459, + "step": 31438 + }, + { + "epoch": 85.66485013623978, + "grad_norm": 2.8388190269470215, + "learning_rate": 1.0585599325881602e-06, + "loss": 0.032, + "step": 31439 + }, + { + "epoch": 85.66757493188011, + "grad_norm": 2.577883005142212, + "learning_rate": 1.0581648043853999e-06, + "loss": 0.0281, + "step": 31440 + }, + { + "epoch": 85.67029972752043, + "grad_norm": 3.873203754425049, + "learning_rate": 1.0577697458213654e-06, + "loss": 0.0652, + "step": 31441 + }, + { + "epoch": 85.67302452316076, + "grad_norm": 4.001662731170654, + "learning_rate": 1.0573747568991311e-06, + "loss": 0.0791, + "step": 31442 + }, + { + "epoch": 85.6757493188011, + "grad_norm": 3.218181610107422, + "learning_rate": 1.0569798376217722e-06, + "loss": 0.1775, + "step": 31443 + }, + { + "epoch": 85.67847411444141, + "grad_norm": 1.7833396196365356, + "learning_rate": 1.0565849879923673e-06, + "loss": 0.0236, + "step": 31444 + }, + { + "epoch": 85.68119891008175, + "grad_norm": 3.1455492973327637, + "learning_rate": 1.056190208013993e-06, + "loss": 0.0829, + "step": 31445 + }, + { + "epoch": 85.68392370572207, + "grad_norm": 3.2898142337799072, + "learning_rate": 1.05579549768972e-06, + "loss": 0.037, + "step": 31446 + }, + { + "epoch": 85.6866485013624, + "grad_norm": 1.9134249687194824, + "learning_rate": 1.0554008570226248e-06, + "loss": 0.0781, + "step": 31447 + }, + { + "epoch": 85.68937329700273, + "grad_norm": 4.054567337036133, + "learning_rate": 1.0550062860157783e-06, + "loss": 0.0599, + "step": 31448 + }, + { + "epoch": 85.69209809264305, + "grad_norm": 2.6702451705932617, + "learning_rate": 1.054611784672256e-06, + "loss": 0.0755, + "step": 31449 + }, + { + "epoch": 85.69482288828338, + "grad_norm": 1.6346731185913086, + "learning_rate": 1.0542173529951293e-06, + "loss": 0.0677, + "step": 31450 + }, + { + "epoch": 85.6975476839237, + "grad_norm": 4.656773090362549, + "learning_rate": 1.053822990987471e-06, + "loss": 0.1542, + "step": 31451 + }, + { + "epoch": 85.70027247956403, + "grad_norm": 1.8992481231689453, + "learning_rate": 1.053428698652349e-06, + "loss": 0.0555, + "step": 31452 + }, + { + "epoch": 85.70299727520435, + "grad_norm": 2.108342409133911, + "learning_rate": 1.0530344759928369e-06, + "loss": 0.0293, + "step": 31453 + }, + { + "epoch": 85.70572207084469, + "grad_norm": 2.579798460006714, + "learning_rate": 1.0526403230120064e-06, + "loss": 0.0406, + "step": 31454 + }, + { + "epoch": 85.70844686648502, + "grad_norm": 3.2917730808258057, + "learning_rate": 1.0522462397129218e-06, + "loss": 0.0213, + "step": 31455 + }, + { + "epoch": 85.71117166212534, + "grad_norm": 2.3854780197143555, + "learning_rate": 1.0518522260986575e-06, + "loss": 0.0296, + "step": 31456 + }, + { + "epoch": 85.71389645776567, + "grad_norm": 3.2360236644744873, + "learning_rate": 1.0514582821722807e-06, + "loss": 0.1155, + "step": 31457 + }, + { + "epoch": 85.71662125340599, + "grad_norm": 2.146756172180176, + "learning_rate": 1.0510644079368582e-06, + "loss": 0.0276, + "step": 31458 + }, + { + "epoch": 85.71934604904632, + "grad_norm": 2.608949899673462, + "learning_rate": 1.0506706033954561e-06, + "loss": 0.0243, + "step": 31459 + }, + { + "epoch": 85.72207084468666, + "grad_norm": 2.1771044731140137, + "learning_rate": 1.0502768685511456e-06, + "loss": 0.049, + "step": 31460 + }, + { + "epoch": 85.72479564032697, + "grad_norm": 1.8936131000518799, + "learning_rate": 1.0498832034069884e-06, + "loss": 0.0223, + "step": 31461 + }, + { + "epoch": 85.7275204359673, + "grad_norm": 3.245781660079956, + "learning_rate": 1.0494896079660554e-06, + "loss": 0.0338, + "step": 31462 + }, + { + "epoch": 85.73024523160763, + "grad_norm": 2.8010880947113037, + "learning_rate": 1.049096082231409e-06, + "loss": 0.0592, + "step": 31463 + }, + { + "epoch": 85.73297002724796, + "grad_norm": 2.7403125762939453, + "learning_rate": 1.0487026262061117e-06, + "loss": 0.0214, + "step": 31464 + }, + { + "epoch": 85.73569482288828, + "grad_norm": 1.6857712268829346, + "learning_rate": 1.0483092398932326e-06, + "loss": 0.0805, + "step": 31465 + }, + { + "epoch": 85.73841961852861, + "grad_norm": 2.862874746322632, + "learning_rate": 1.0479159232958337e-06, + "loss": 0.1347, + "step": 31466 + }, + { + "epoch": 85.74114441416894, + "grad_norm": 1.8531434535980225, + "learning_rate": 1.0475226764169766e-06, + "loss": 0.0612, + "step": 31467 + }, + { + "epoch": 85.74386920980926, + "grad_norm": 2.6498937606811523, + "learning_rate": 1.0471294992597237e-06, + "loss": 0.0293, + "step": 31468 + }, + { + "epoch": 85.7465940054496, + "grad_norm": 1.5940945148468018, + "learning_rate": 1.046736391827139e-06, + "loss": 0.0169, + "step": 31469 + }, + { + "epoch": 85.74931880108991, + "grad_norm": 3.2719297409057617, + "learning_rate": 1.0463433541222834e-06, + "loss": 0.0893, + "step": 31470 + }, + { + "epoch": 85.75204359673025, + "grad_norm": 3.037069082260132, + "learning_rate": 1.0459503861482179e-06, + "loss": 0.036, + "step": 31471 + }, + { + "epoch": 85.75476839237058, + "grad_norm": 2.491203546524048, + "learning_rate": 1.0455574879079999e-06, + "loss": 0.05, + "step": 31472 + }, + { + "epoch": 85.7574931880109, + "grad_norm": 3.3718345165252686, + "learning_rate": 1.045164659404695e-06, + "loss": 0.1023, + "step": 31473 + }, + { + "epoch": 85.76021798365123, + "grad_norm": 2.3489160537719727, + "learning_rate": 1.0447719006413592e-06, + "loss": 0.0719, + "step": 31474 + }, + { + "epoch": 85.76294277929155, + "grad_norm": 4.1013383865356445, + "learning_rate": 1.0443792116210515e-06, + "loss": 0.0478, + "step": 31475 + }, + { + "epoch": 85.76566757493188, + "grad_norm": 2.5753602981567383, + "learning_rate": 1.0439865923468284e-06, + "loss": 0.0389, + "step": 31476 + }, + { + "epoch": 85.7683923705722, + "grad_norm": 2.968282461166382, + "learning_rate": 1.0435940428217516e-06, + "loss": 0.0492, + "step": 31477 + }, + { + "epoch": 85.77111716621253, + "grad_norm": 3.0301930904388428, + "learning_rate": 1.0432015630488756e-06, + "loss": 0.0941, + "step": 31478 + }, + { + "epoch": 85.77384196185287, + "grad_norm": 2.6919567584991455, + "learning_rate": 1.0428091530312556e-06, + "loss": 0.0448, + "step": 31479 + }, + { + "epoch": 85.77656675749319, + "grad_norm": 2.990431785583496, + "learning_rate": 1.0424168127719502e-06, + "loss": 0.2594, + "step": 31480 + }, + { + "epoch": 85.77929155313352, + "grad_norm": 3.8211493492126465, + "learning_rate": 1.042024542274016e-06, + "loss": 0.0489, + "step": 31481 + }, + { + "epoch": 85.78201634877384, + "grad_norm": 2.424978017807007, + "learning_rate": 1.0416323415405061e-06, + "loss": 0.1753, + "step": 31482 + }, + { + "epoch": 85.78474114441417, + "grad_norm": 2.314209222793579, + "learning_rate": 1.0412402105744756e-06, + "loss": 0.0315, + "step": 31483 + }, + { + "epoch": 85.7874659400545, + "grad_norm": 3.6571786403656006, + "learning_rate": 1.0408481493789758e-06, + "loss": 0.1508, + "step": 31484 + }, + { + "epoch": 85.79019073569482, + "grad_norm": 2.1805782318115234, + "learning_rate": 1.040456157957065e-06, + "loss": 0.0235, + "step": 31485 + }, + { + "epoch": 85.79291553133515, + "grad_norm": 2.3275468349456787, + "learning_rate": 1.0400642363117918e-06, + "loss": 0.0294, + "step": 31486 + }, + { + "epoch": 85.79564032697547, + "grad_norm": 2.6586239337921143, + "learning_rate": 1.039672384446211e-06, + "loss": 0.0275, + "step": 31487 + }, + { + "epoch": 85.7983651226158, + "grad_norm": 2.1028189659118652, + "learning_rate": 1.0392806023633717e-06, + "loss": 0.0388, + "step": 31488 + }, + { + "epoch": 85.80108991825612, + "grad_norm": 2.2674365043640137, + "learning_rate": 1.0388888900663274e-06, + "loss": 0.1472, + "step": 31489 + }, + { + "epoch": 85.80381471389646, + "grad_norm": 3.2275967597961426, + "learning_rate": 1.038497247558129e-06, + "loss": 0.0364, + "step": 31490 + }, + { + "epoch": 85.80653950953679, + "grad_norm": 2.492194652557373, + "learning_rate": 1.038105674841825e-06, + "loss": 0.0705, + "step": 31491 + }, + { + "epoch": 85.80926430517711, + "grad_norm": 2.9958271980285645, + "learning_rate": 1.0377141719204642e-06, + "loss": 0.2088, + "step": 31492 + }, + { + "epoch": 85.81198910081744, + "grad_norm": 2.5424046516418457, + "learning_rate": 1.0373227387970986e-06, + "loss": 0.027, + "step": 31493 + }, + { + "epoch": 85.81471389645776, + "grad_norm": 2.828305959701538, + "learning_rate": 1.0369313754747744e-06, + "loss": 0.076, + "step": 31494 + }, + { + "epoch": 85.8174386920981, + "grad_norm": 2.2557549476623535, + "learning_rate": 1.0365400819565407e-06, + "loss": 0.0321, + "step": 31495 + }, + { + "epoch": 85.82016348773843, + "grad_norm": 2.285198926925659, + "learning_rate": 1.0361488582454404e-06, + "loss": 0.069, + "step": 31496 + }, + { + "epoch": 85.82288828337875, + "grad_norm": 3.4394943714141846, + "learning_rate": 1.0357577043445287e-06, + "loss": 0.0373, + "step": 31497 + }, + { + "epoch": 85.82561307901908, + "grad_norm": 2.6939773559570312, + "learning_rate": 1.0353666202568468e-06, + "loss": 0.0318, + "step": 31498 + }, + { + "epoch": 85.8283378746594, + "grad_norm": 3.18467378616333, + "learning_rate": 1.0349756059854421e-06, + "loss": 0.1026, + "step": 31499 + }, + { + "epoch": 85.83106267029973, + "grad_norm": 2.1771793365478516, + "learning_rate": 1.0345846615333565e-06, + "loss": 0.0364, + "step": 31500 + }, + { + "epoch": 85.83378746594005, + "grad_norm": 4.8560662269592285, + "learning_rate": 1.034193786903639e-06, + "loss": 0.1635, + "step": 31501 + }, + { + "epoch": 85.83651226158038, + "grad_norm": 2.727335214614868, + "learning_rate": 1.033802982099331e-06, + "loss": 0.0716, + "step": 31502 + }, + { + "epoch": 85.83923705722071, + "grad_norm": 2.5315072536468506, + "learning_rate": 1.0334122471234775e-06, + "loss": 0.1616, + "step": 31503 + }, + { + "epoch": 85.84196185286103, + "grad_norm": 2.0643715858459473, + "learning_rate": 1.033021581979118e-06, + "loss": 0.0664, + "step": 31504 + }, + { + "epoch": 85.84468664850137, + "grad_norm": 3.0063178539276123, + "learning_rate": 1.0326309866693007e-06, + "loss": 0.2104, + "step": 31505 + }, + { + "epoch": 85.84741144414168, + "grad_norm": 3.5163540840148926, + "learning_rate": 1.032240461197065e-06, + "loss": 0.0269, + "step": 31506 + }, + { + "epoch": 85.85013623978202, + "grad_norm": 2.4701731204986572, + "learning_rate": 1.0318500055654513e-06, + "loss": 0.0315, + "step": 31507 + }, + { + "epoch": 85.85286103542235, + "grad_norm": 3.7995245456695557, + "learning_rate": 1.0314596197774985e-06, + "loss": 0.1136, + "step": 31508 + }, + { + "epoch": 85.85558583106267, + "grad_norm": 2.90480375289917, + "learning_rate": 1.0310693038362518e-06, + "loss": 0.0612, + "step": 31509 + }, + { + "epoch": 85.858310626703, + "grad_norm": 2.6373202800750732, + "learning_rate": 1.03067905774475e-06, + "loss": 0.0476, + "step": 31510 + }, + { + "epoch": 85.86103542234332, + "grad_norm": 2.086611747741699, + "learning_rate": 1.0302888815060297e-06, + "loss": 0.0798, + "step": 31511 + }, + { + "epoch": 85.86376021798365, + "grad_norm": 2.0838420391082764, + "learning_rate": 1.0298987751231293e-06, + "loss": 0.0282, + "step": 31512 + }, + { + "epoch": 85.86648501362397, + "grad_norm": 2.5717296600341797, + "learning_rate": 1.0295087385990888e-06, + "loss": 0.2165, + "step": 31513 + }, + { + "epoch": 85.8692098092643, + "grad_norm": 4.200585842132568, + "learning_rate": 1.0291187719369466e-06, + "loss": 0.0344, + "step": 31514 + }, + { + "epoch": 85.87193460490464, + "grad_norm": 2.4633283615112305, + "learning_rate": 1.0287288751397395e-06, + "loss": 0.0529, + "step": 31515 + }, + { + "epoch": 85.87465940054496, + "grad_norm": 3.0095136165618896, + "learning_rate": 1.0283390482105037e-06, + "loss": 0.0295, + "step": 31516 + }, + { + "epoch": 85.87738419618529, + "grad_norm": 2.8084800243377686, + "learning_rate": 1.0279492911522714e-06, + "loss": 0.0425, + "step": 31517 + }, + { + "epoch": 85.88010899182561, + "grad_norm": 2.4964981079101562, + "learning_rate": 1.0275596039680835e-06, + "loss": 0.0404, + "step": 31518 + }, + { + "epoch": 85.88283378746594, + "grad_norm": 2.2275397777557373, + "learning_rate": 1.027169986660973e-06, + "loss": 0.0281, + "step": 31519 + }, + { + "epoch": 85.88555858310627, + "grad_norm": 2.452439785003662, + "learning_rate": 1.026780439233972e-06, + "loss": 0.0469, + "step": 31520 + }, + { + "epoch": 85.88828337874659, + "grad_norm": 2.2140159606933594, + "learning_rate": 1.026390961690118e-06, + "loss": 0.0178, + "step": 31521 + }, + { + "epoch": 85.89100817438693, + "grad_norm": 2.875448703765869, + "learning_rate": 1.026001554032443e-06, + "loss": 0.0587, + "step": 31522 + }, + { + "epoch": 85.89373297002724, + "grad_norm": 2.641120672225952, + "learning_rate": 1.025612216263978e-06, + "loss": 0.0683, + "step": 31523 + }, + { + "epoch": 85.89645776566758, + "grad_norm": 1.6421146392822266, + "learning_rate": 1.0252229483877551e-06, + "loss": 0.0227, + "step": 31524 + }, + { + "epoch": 85.8991825613079, + "grad_norm": 2.881132125854492, + "learning_rate": 1.0248337504068085e-06, + "loss": 0.0413, + "step": 31525 + }, + { + "epoch": 85.90190735694823, + "grad_norm": 2.6686294078826904, + "learning_rate": 1.0244446223241677e-06, + "loss": 0.0603, + "step": 31526 + }, + { + "epoch": 85.90463215258856, + "grad_norm": 1.8666067123413086, + "learning_rate": 1.024055564142863e-06, + "loss": 0.0174, + "step": 31527 + }, + { + "epoch": 85.90735694822888, + "grad_norm": 2.5336527824401855, + "learning_rate": 1.0236665758659237e-06, + "loss": 0.0888, + "step": 31528 + }, + { + "epoch": 85.91008174386921, + "grad_norm": 2.7427446842193604, + "learning_rate": 1.023277657496381e-06, + "loss": 0.0374, + "step": 31529 + }, + { + "epoch": 85.91280653950953, + "grad_norm": 2.498741388320923, + "learning_rate": 1.0228888090372613e-06, + "loss": 0.0218, + "step": 31530 + }, + { + "epoch": 85.91553133514986, + "grad_norm": 2.7943947315216064, + "learning_rate": 1.0225000304915977e-06, + "loss": 0.0419, + "step": 31531 + }, + { + "epoch": 85.9182561307902, + "grad_norm": 6.141363143920898, + "learning_rate": 1.0221113218624134e-06, + "loss": 0.1079, + "step": 31532 + }, + { + "epoch": 85.92098092643052, + "grad_norm": 2.3486995697021484, + "learning_rate": 1.021722683152736e-06, + "loss": 0.046, + "step": 31533 + }, + { + "epoch": 85.92370572207085, + "grad_norm": 2.334148645401001, + "learning_rate": 1.0213341143655952e-06, + "loss": 0.0354, + "step": 31534 + }, + { + "epoch": 85.92643051771117, + "grad_norm": 2.234052896499634, + "learning_rate": 1.0209456155040166e-06, + "loss": 0.1401, + "step": 31535 + }, + { + "epoch": 85.9291553133515, + "grad_norm": 5.003220558166504, + "learning_rate": 1.020557186571023e-06, + "loss": 0.0345, + "step": 31536 + }, + { + "epoch": 85.93188010899182, + "grad_norm": 2.0255320072174072, + "learning_rate": 1.0201688275696397e-06, + "loss": 0.0686, + "step": 31537 + }, + { + "epoch": 85.93460490463215, + "grad_norm": 2.026007652282715, + "learning_rate": 1.0197805385028935e-06, + "loss": 0.0272, + "step": 31538 + }, + { + "epoch": 85.93732970027249, + "grad_norm": 2.777132749557495, + "learning_rate": 1.0193923193738087e-06, + "loss": 0.045, + "step": 31539 + }, + { + "epoch": 85.9400544959128, + "grad_norm": 2.49111008644104, + "learning_rate": 1.019004170185407e-06, + "loss": 0.0387, + "step": 31540 + }, + { + "epoch": 85.94277929155314, + "grad_norm": 2.2162814140319824, + "learning_rate": 1.0186160909407095e-06, + "loss": 0.0233, + "step": 31541 + }, + { + "epoch": 85.94550408719346, + "grad_norm": 2.7575600147247314, + "learning_rate": 1.0182280816427436e-06, + "loss": 0.1483, + "step": 31542 + }, + { + "epoch": 85.94822888283379, + "grad_norm": 3.0144386291503906, + "learning_rate": 1.0178401422945273e-06, + "loss": 0.0549, + "step": 31543 + }, + { + "epoch": 85.95095367847412, + "grad_norm": 3.633289098739624, + "learning_rate": 1.0174522728990821e-06, + "loss": 0.0442, + "step": 31544 + }, + { + "epoch": 85.95367847411444, + "grad_norm": 2.7940962314605713, + "learning_rate": 1.0170644734594304e-06, + "loss": 0.0675, + "step": 31545 + }, + { + "epoch": 85.95640326975477, + "grad_norm": 2.4861257076263428, + "learning_rate": 1.0166767439785917e-06, + "loss": 0.0333, + "step": 31546 + }, + { + "epoch": 85.95912806539509, + "grad_norm": 2.6529250144958496, + "learning_rate": 1.016289084459584e-06, + "loss": 0.0348, + "step": 31547 + }, + { + "epoch": 85.96185286103542, + "grad_norm": 3.331308364868164, + "learning_rate": 1.015901494905429e-06, + "loss": 0.0411, + "step": 31548 + }, + { + "epoch": 85.96457765667574, + "grad_norm": 2.4053611755371094, + "learning_rate": 1.0155139753191424e-06, + "loss": 0.053, + "step": 31549 + }, + { + "epoch": 85.96730245231608, + "grad_norm": 2.1256680488586426, + "learning_rate": 1.0151265257037457e-06, + "loss": 0.0401, + "step": 31550 + }, + { + "epoch": 85.97002724795641, + "grad_norm": 3.6913411617279053, + "learning_rate": 1.0147391460622547e-06, + "loss": 0.1061, + "step": 31551 + }, + { + "epoch": 85.97275204359673, + "grad_norm": 2.2901344299316406, + "learning_rate": 1.0143518363976857e-06, + "loss": 0.0257, + "step": 31552 + }, + { + "epoch": 85.97547683923706, + "grad_norm": 3.701040744781494, + "learning_rate": 1.013964596713053e-06, + "loss": 0.1472, + "step": 31553 + }, + { + "epoch": 85.97820163487738, + "grad_norm": 2.446267604827881, + "learning_rate": 1.0135774270113774e-06, + "loss": 0.0359, + "step": 31554 + }, + { + "epoch": 85.98092643051771, + "grad_norm": 7.176121234893799, + "learning_rate": 1.0131903272956722e-06, + "loss": 0.0816, + "step": 31555 + }, + { + "epoch": 85.98365122615803, + "grad_norm": 1.4883784055709839, + "learning_rate": 1.0128032975689506e-06, + "loss": 0.0185, + "step": 31556 + }, + { + "epoch": 85.98637602179836, + "grad_norm": 2.5638229846954346, + "learning_rate": 1.0124163378342255e-06, + "loss": 0.0256, + "step": 31557 + }, + { + "epoch": 85.9891008174387, + "grad_norm": 3.9347333908081055, + "learning_rate": 1.0120294480945148e-06, + "loss": 0.0617, + "step": 31558 + }, + { + "epoch": 85.99182561307902, + "grad_norm": 2.0129220485687256, + "learning_rate": 1.0116426283528301e-06, + "loss": 0.0208, + "step": 31559 + }, + { + "epoch": 85.99455040871935, + "grad_norm": 2.478191614151001, + "learning_rate": 1.0112558786121829e-06, + "loss": 0.1113, + "step": 31560 + }, + { + "epoch": 85.99727520435967, + "grad_norm": 2.614762783050537, + "learning_rate": 1.0108691988755837e-06, + "loss": 0.1372, + "step": 31561 + }, + { + "epoch": 86.0, + "grad_norm": 2.7023041248321533, + "learning_rate": 1.010482589146048e-06, + "loss": 0.0381, + "step": 31562 + }, + { + "epoch": 86.00272479564033, + "grad_norm": 3.757795572280884, + "learning_rate": 1.0100960494265843e-06, + "loss": 0.1278, + "step": 31563 + }, + { + "epoch": 86.00544959128065, + "grad_norm": 1.8841562271118164, + "learning_rate": 1.0097095797202016e-06, + "loss": 0.0246, + "step": 31564 + }, + { + "epoch": 86.00817438692098, + "grad_norm": 2.0132946968078613, + "learning_rate": 1.0093231800299109e-06, + "loss": 0.0715, + "step": 31565 + }, + { + "epoch": 86.0108991825613, + "grad_norm": 3.5072214603424072, + "learning_rate": 1.0089368503587238e-06, + "loss": 0.0303, + "step": 31566 + }, + { + "epoch": 86.01362397820164, + "grad_norm": 2.2425694465637207, + "learning_rate": 1.008550590709647e-06, + "loss": 0.0373, + "step": 31567 + }, + { + "epoch": 86.01634877384195, + "grad_norm": 2.0086355209350586, + "learning_rate": 1.0081644010856895e-06, + "loss": 0.0391, + "step": 31568 + }, + { + "epoch": 86.01907356948229, + "grad_norm": 3.336557626724243, + "learning_rate": 1.0077782814898563e-06, + "loss": 0.0402, + "step": 31569 + }, + { + "epoch": 86.02179836512262, + "grad_norm": 2.4130775928497314, + "learning_rate": 1.0073922319251584e-06, + "loss": 0.0249, + "step": 31570 + }, + { + "epoch": 86.02452316076294, + "grad_norm": 2.9354212284088135, + "learning_rate": 1.0070062523946001e-06, + "loss": 0.0931, + "step": 31571 + }, + { + "epoch": 86.02724795640327, + "grad_norm": 3.061462163925171, + "learning_rate": 1.006620342901188e-06, + "loss": 0.0888, + "step": 31572 + }, + { + "epoch": 86.02997275204359, + "grad_norm": 3.5965375900268555, + "learning_rate": 1.0062345034479236e-06, + "loss": 0.0609, + "step": 31573 + }, + { + "epoch": 86.03269754768392, + "grad_norm": 2.9291248321533203, + "learning_rate": 1.0058487340378187e-06, + "loss": 0.1035, + "step": 31574 + }, + { + "epoch": 86.03542234332426, + "grad_norm": 1.810512900352478, + "learning_rate": 1.0054630346738747e-06, + "loss": 0.0278, + "step": 31575 + }, + { + "epoch": 86.03814713896458, + "grad_norm": 2.29118275642395, + "learning_rate": 1.005077405359095e-06, + "loss": 0.0427, + "step": 31576 + }, + { + "epoch": 86.04087193460491, + "grad_norm": 1.8794190883636475, + "learning_rate": 1.0046918460964806e-06, + "loss": 0.0446, + "step": 31577 + }, + { + "epoch": 86.04359673024523, + "grad_norm": 2.5822699069976807, + "learning_rate": 1.0043063568890388e-06, + "loss": 0.0974, + "step": 31578 + }, + { + "epoch": 86.04632152588556, + "grad_norm": 7.6384663581848145, + "learning_rate": 1.0039209377397696e-06, + "loss": 0.0791, + "step": 31579 + }, + { + "epoch": 86.04904632152588, + "grad_norm": 2.6081624031066895, + "learning_rate": 1.003535588651674e-06, + "loss": 0.0252, + "step": 31580 + }, + { + "epoch": 86.05177111716621, + "grad_norm": 4.446021556854248, + "learning_rate": 1.0031503096277529e-06, + "loss": 0.0521, + "step": 31581 + }, + { + "epoch": 86.05449591280654, + "grad_norm": 3.872101068496704, + "learning_rate": 1.002765100671007e-06, + "loss": 0.0657, + "step": 31582 + }, + { + "epoch": 86.05722070844686, + "grad_norm": 3.703188896179199, + "learning_rate": 1.0023799617844387e-06, + "loss": 0.1037, + "step": 31583 + }, + { + "epoch": 86.0599455040872, + "grad_norm": 3.0919201374053955, + "learning_rate": 1.0019948929710456e-06, + "loss": 0.0465, + "step": 31584 + }, + { + "epoch": 86.06267029972751, + "grad_norm": 2.5964608192443848, + "learning_rate": 1.0016098942338249e-06, + "loss": 0.1445, + "step": 31585 + }, + { + "epoch": 86.06539509536785, + "grad_norm": 3.06375789642334, + "learning_rate": 1.0012249655757788e-06, + "loss": 0.047, + "step": 31586 + }, + { + "epoch": 86.06811989100818, + "grad_norm": 2.214186668395996, + "learning_rate": 1.000840106999903e-06, + "loss": 0.0228, + "step": 31587 + }, + { + "epoch": 86.0708446866485, + "grad_norm": 2.7507073879241943, + "learning_rate": 1.0004553185091948e-06, + "loss": 0.0348, + "step": 31588 + }, + { + "epoch": 86.07356948228883, + "grad_norm": 5.628101348876953, + "learning_rate": 1.0000706001066485e-06, + "loss": 0.2528, + "step": 31589 + }, + { + "epoch": 86.07629427792915, + "grad_norm": 1.5397335290908813, + "learning_rate": 9.996859517952652e-07, + "loss": 0.0209, + "step": 31590 + }, + { + "epoch": 86.07901907356948, + "grad_norm": 2.0383923053741455, + "learning_rate": 9.993013735780376e-07, + "loss": 0.1154, + "step": 31591 + }, + { + "epoch": 86.0817438692098, + "grad_norm": 2.6254165172576904, + "learning_rate": 9.989168654579617e-07, + "loss": 0.0374, + "step": 31592 + }, + { + "epoch": 86.08446866485014, + "grad_norm": 2.1478607654571533, + "learning_rate": 9.985324274380292e-07, + "loss": 0.0405, + "step": 31593 + }, + { + "epoch": 86.08719346049047, + "grad_norm": 5.356241703033447, + "learning_rate": 9.981480595212389e-07, + "loss": 0.1077, + "step": 31594 + }, + { + "epoch": 86.08991825613079, + "grad_norm": 2.7925865650177, + "learning_rate": 9.977637617105818e-07, + "loss": 0.0503, + "step": 31595 + }, + { + "epoch": 86.09264305177112, + "grad_norm": 2.177604913711548, + "learning_rate": 9.973795340090498e-07, + "loss": 0.2251, + "step": 31596 + }, + { + "epoch": 86.09536784741144, + "grad_norm": 2.89493989944458, + "learning_rate": 9.96995376419635e-07, + "loss": 0.0238, + "step": 31597 + }, + { + "epoch": 86.09809264305177, + "grad_norm": 2.561154842376709, + "learning_rate": 9.966112889453328e-07, + "loss": 0.0974, + "step": 31598 + }, + { + "epoch": 86.1008174386921, + "grad_norm": 2.3899598121643066, + "learning_rate": 9.962272715891296e-07, + "loss": 0.0529, + "step": 31599 + }, + { + "epoch": 86.10354223433242, + "grad_norm": 2.1979386806488037, + "learning_rate": 9.958433243540211e-07, + "loss": 0.0818, + "step": 31600 + }, + { + "epoch": 86.10626702997276, + "grad_norm": 1.9779709577560425, + "learning_rate": 9.954594472429947e-07, + "loss": 0.0222, + "step": 31601 + }, + { + "epoch": 86.10899182561307, + "grad_norm": 6.739572525024414, + "learning_rate": 9.950756402590379e-07, + "loss": 0.0601, + "step": 31602 + }, + { + "epoch": 86.11171662125341, + "grad_norm": 2.4656660556793213, + "learning_rate": 9.94691903405145e-07, + "loss": 0.0442, + "step": 31603 + }, + { + "epoch": 86.11444141689373, + "grad_norm": 1.7424670457839966, + "learning_rate": 9.943082366843005e-07, + "loss": 0.1101, + "step": 31604 + }, + { + "epoch": 86.11716621253406, + "grad_norm": 1.816726803779602, + "learning_rate": 9.939246400994929e-07, + "loss": 0.1181, + "step": 31605 + }, + { + "epoch": 86.11989100817439, + "grad_norm": 2.8455731868743896, + "learning_rate": 9.935411136537121e-07, + "loss": 0.0796, + "step": 31606 + }, + { + "epoch": 86.12261580381471, + "grad_norm": 1.9792871475219727, + "learning_rate": 9.931576573499425e-07, + "loss": 0.0303, + "step": 31607 + }, + { + "epoch": 86.12534059945504, + "grad_norm": 2.497490882873535, + "learning_rate": 9.927742711911715e-07, + "loss": 0.1184, + "step": 31608 + }, + { + "epoch": 86.12806539509536, + "grad_norm": 2.35503888130188, + "learning_rate": 9.923909551803824e-07, + "loss": 0.0634, + "step": 31609 + }, + { + "epoch": 86.1307901907357, + "grad_norm": 2.9196982383728027, + "learning_rate": 9.920077093205648e-07, + "loss": 0.0273, + "step": 31610 + }, + { + "epoch": 86.13351498637603, + "grad_norm": 3.038902521133423, + "learning_rate": 9.916245336147023e-07, + "loss": 0.0262, + "step": 31611 + }, + { + "epoch": 86.13623978201635, + "grad_norm": 2.693570852279663, + "learning_rate": 9.912414280657766e-07, + "loss": 0.0563, + "step": 31612 + }, + { + "epoch": 86.13896457765668, + "grad_norm": 2.607591390609741, + "learning_rate": 9.908583926767712e-07, + "loss": 0.1106, + "step": 31613 + }, + { + "epoch": 86.141689373297, + "grad_norm": 2.580155372619629, + "learning_rate": 9.904754274506723e-07, + "loss": 0.0608, + "step": 31614 + }, + { + "epoch": 86.14441416893733, + "grad_norm": 3.828810453414917, + "learning_rate": 9.90092532390462e-07, + "loss": 0.1573, + "step": 31615 + }, + { + "epoch": 86.14713896457765, + "grad_norm": 2.2987725734710693, + "learning_rate": 9.89709707499118e-07, + "loss": 0.0311, + "step": 31616 + }, + { + "epoch": 86.14986376021798, + "grad_norm": 2.210296630859375, + "learning_rate": 9.893269527796268e-07, + "loss": 0.0528, + "step": 31617 + }, + { + "epoch": 86.15258855585832, + "grad_norm": 4.510499954223633, + "learning_rate": 9.88944268234966e-07, + "loss": 0.1065, + "step": 31618 + }, + { + "epoch": 86.15531335149863, + "grad_norm": 2.624666452407837, + "learning_rate": 9.885616538681186e-07, + "loss": 0.0655, + "step": 31619 + }, + { + "epoch": 86.15803814713897, + "grad_norm": 3.6263275146484375, + "learning_rate": 9.881791096820625e-07, + "loss": 0.0242, + "step": 31620 + }, + { + "epoch": 86.16076294277929, + "grad_norm": 2.314969062805176, + "learning_rate": 9.877966356797785e-07, + "loss": 0.0376, + "step": 31621 + }, + { + "epoch": 86.16348773841962, + "grad_norm": 2.3886630535125732, + "learning_rate": 9.87414231864242e-07, + "loss": 0.0185, + "step": 31622 + }, + { + "epoch": 86.16621253405995, + "grad_norm": 3.664731502532959, + "learning_rate": 9.870318982384352e-07, + "loss": 0.035, + "step": 31623 + }, + { + "epoch": 86.16893732970027, + "grad_norm": 6.761654376983643, + "learning_rate": 9.866496348053334e-07, + "loss": 0.0874, + "step": 31624 + }, + { + "epoch": 86.1716621253406, + "grad_norm": 2.344679594039917, + "learning_rate": 9.862674415679152e-07, + "loss": 0.0234, + "step": 31625 + }, + { + "epoch": 86.17438692098092, + "grad_norm": 2.3501219749450684, + "learning_rate": 9.858853185291538e-07, + "loss": 0.0343, + "step": 31626 + }, + { + "epoch": 86.17711171662125, + "grad_norm": 2.972172260284424, + "learning_rate": 9.855032656920283e-07, + "loss": 0.0427, + "step": 31627 + }, + { + "epoch": 86.17983651226157, + "grad_norm": 2.6144793033599854, + "learning_rate": 9.851212830595148e-07, + "loss": 0.0368, + "step": 31628 + }, + { + "epoch": 86.1825613079019, + "grad_norm": 1.8932509422302246, + "learning_rate": 9.847393706345843e-07, + "loss": 0.023, + "step": 31629 + }, + { + "epoch": 86.18528610354224, + "grad_norm": 2.38089919090271, + "learning_rate": 9.843575284202145e-07, + "loss": 0.0579, + "step": 31630 + }, + { + "epoch": 86.18801089918256, + "grad_norm": 3.900752544403076, + "learning_rate": 9.839757564193787e-07, + "loss": 0.1188, + "step": 31631 + }, + { + "epoch": 86.19073569482289, + "grad_norm": 2.6539125442504883, + "learning_rate": 9.835940546350498e-07, + "loss": 0.0752, + "step": 31632 + }, + { + "epoch": 86.19346049046321, + "grad_norm": 2.0343661308288574, + "learning_rate": 9.832124230701979e-07, + "loss": 0.0365, + "step": 31633 + }, + { + "epoch": 86.19618528610354, + "grad_norm": 2.7909703254699707, + "learning_rate": 9.828308617277971e-07, + "loss": 0.0272, + "step": 31634 + }, + { + "epoch": 86.19891008174388, + "grad_norm": 2.19333815574646, + "learning_rate": 9.824493706108218e-07, + "loss": 0.0705, + "step": 31635 + }, + { + "epoch": 86.2016348773842, + "grad_norm": 1.797225832939148, + "learning_rate": 9.820679497222396e-07, + "loss": 0.0279, + "step": 31636 + }, + { + "epoch": 86.20435967302453, + "grad_norm": 2.0403614044189453, + "learning_rate": 9.816865990650238e-07, + "loss": 0.0642, + "step": 31637 + }, + { + "epoch": 86.20708446866485, + "grad_norm": 3.0743956565856934, + "learning_rate": 9.813053186421395e-07, + "loss": 0.028, + "step": 31638 + }, + { + "epoch": 86.20980926430518, + "grad_norm": 1.8789576292037964, + "learning_rate": 9.8092410845656e-07, + "loss": 0.1133, + "step": 31639 + }, + { + "epoch": 86.2125340599455, + "grad_norm": 2.5614380836486816, + "learning_rate": 9.805429685112555e-07, + "loss": 0.1739, + "step": 31640 + }, + { + "epoch": 86.21525885558583, + "grad_norm": 2.94986629486084, + "learning_rate": 9.80161898809191e-07, + "loss": 0.1197, + "step": 31641 + }, + { + "epoch": 86.21798365122616, + "grad_norm": 8.736162185668945, + "learning_rate": 9.79780899353333e-07, + "loss": 0.0333, + "step": 31642 + }, + { + "epoch": 86.22070844686648, + "grad_norm": 2.2208738327026367, + "learning_rate": 9.793999701466527e-07, + "loss": 0.1297, + "step": 31643 + }, + { + "epoch": 86.22343324250681, + "grad_norm": 2.76037859916687, + "learning_rate": 9.790191111921166e-07, + "loss": 0.102, + "step": 31644 + }, + { + "epoch": 86.22615803814713, + "grad_norm": 2.774686098098755, + "learning_rate": 9.786383224926877e-07, + "loss": 0.0749, + "step": 31645 + }, + { + "epoch": 86.22888283378747, + "grad_norm": 2.381895065307617, + "learning_rate": 9.782576040513325e-07, + "loss": 0.0385, + "step": 31646 + }, + { + "epoch": 86.2316076294278, + "grad_norm": 2.5969865322113037, + "learning_rate": 9.778769558710177e-07, + "loss": 0.0536, + "step": 31647 + }, + { + "epoch": 86.23433242506812, + "grad_norm": 2.099355697631836, + "learning_rate": 9.774963779547076e-07, + "loss": 0.0508, + "step": 31648 + }, + { + "epoch": 86.23705722070845, + "grad_norm": 2.1510770320892334, + "learning_rate": 9.771158703053652e-07, + "loss": 0.03, + "step": 31649 + }, + { + "epoch": 86.23978201634877, + "grad_norm": 3.3781051635742188, + "learning_rate": 9.767354329259515e-07, + "loss": 0.0821, + "step": 31650 + }, + { + "epoch": 86.2425068119891, + "grad_norm": 2.2429616451263428, + "learning_rate": 9.76355065819432e-07, + "loss": 0.035, + "step": 31651 + }, + { + "epoch": 86.24523160762942, + "grad_norm": 3.0349185466766357, + "learning_rate": 9.75974768988771e-07, + "loss": 0.1015, + "step": 31652 + }, + { + "epoch": 86.24795640326975, + "grad_norm": 2.058422565460205, + "learning_rate": 9.755945424369283e-07, + "loss": 0.0319, + "step": 31653 + }, + { + "epoch": 86.25068119891009, + "grad_norm": 2.664964199066162, + "learning_rate": 9.752143861668628e-07, + "loss": 0.0303, + "step": 31654 + }, + { + "epoch": 86.2534059945504, + "grad_norm": 2.0678510665893555, + "learning_rate": 9.748343001815385e-07, + "loss": 0.0316, + "step": 31655 + }, + { + "epoch": 86.25613079019074, + "grad_norm": 2.756922960281372, + "learning_rate": 9.744542844839145e-07, + "loss": 0.0724, + "step": 31656 + }, + { + "epoch": 86.25885558583106, + "grad_norm": 2.7466092109680176, + "learning_rate": 9.740743390769503e-07, + "loss": 0.0384, + "step": 31657 + }, + { + "epoch": 86.26158038147139, + "grad_norm": 2.183837652206421, + "learning_rate": 9.736944639636025e-07, + "loss": 0.061, + "step": 31658 + }, + { + "epoch": 86.26430517711172, + "grad_norm": 2.141596794128418, + "learning_rate": 9.733146591468334e-07, + "loss": 0.0342, + "step": 31659 + }, + { + "epoch": 86.26702997275204, + "grad_norm": 1.158841848373413, + "learning_rate": 9.729349246296005e-07, + "loss": 0.0144, + "step": 31660 + }, + { + "epoch": 86.26975476839237, + "grad_norm": 3.59151029586792, + "learning_rate": 9.72555260414858e-07, + "loss": 0.1706, + "step": 31661 + }, + { + "epoch": 86.2724795640327, + "grad_norm": 2.8652048110961914, + "learning_rate": 9.721756665055637e-07, + "loss": 0.113, + "step": 31662 + }, + { + "epoch": 86.27520435967303, + "grad_norm": 2.286719560623169, + "learning_rate": 9.717961429046773e-07, + "loss": 0.0691, + "step": 31663 + }, + { + "epoch": 86.27792915531334, + "grad_norm": 3.3621742725372314, + "learning_rate": 9.714166896151511e-07, + "loss": 0.051, + "step": 31664 + }, + { + "epoch": 86.28065395095368, + "grad_norm": 7.1724677085876465, + "learning_rate": 9.710373066399413e-07, + "loss": 0.0445, + "step": 31665 + }, + { + "epoch": 86.28337874659401, + "grad_norm": 2.8919363021850586, + "learning_rate": 9.706579939820005e-07, + "loss": 0.1347, + "step": 31666 + }, + { + "epoch": 86.28610354223433, + "grad_norm": 3.9138731956481934, + "learning_rate": 9.702787516442858e-07, + "loss": 0.0484, + "step": 31667 + }, + { + "epoch": 86.28882833787466, + "grad_norm": 2.2986462116241455, + "learning_rate": 9.698995796297483e-07, + "loss": 0.0996, + "step": 31668 + }, + { + "epoch": 86.29155313351498, + "grad_norm": 2.9334826469421387, + "learning_rate": 9.695204779413448e-07, + "loss": 0.173, + "step": 31669 + }, + { + "epoch": 86.29427792915531, + "grad_norm": 1.976965069770813, + "learning_rate": 9.691414465820226e-07, + "loss": 0.0242, + "step": 31670 + }, + { + "epoch": 86.29700272479565, + "grad_norm": 3.205742120742798, + "learning_rate": 9.687624855547372e-07, + "loss": 0.0263, + "step": 31671 + }, + { + "epoch": 86.29972752043597, + "grad_norm": 2.6435394287109375, + "learning_rate": 9.683835948624397e-07, + "loss": 0.0585, + "step": 31672 + }, + { + "epoch": 86.3024523160763, + "grad_norm": 2.673785924911499, + "learning_rate": 9.680047745080811e-07, + "loss": 0.1645, + "step": 31673 + }, + { + "epoch": 86.30517711171662, + "grad_norm": 2.2024083137512207, + "learning_rate": 9.676260244946078e-07, + "loss": 0.052, + "step": 31674 + }, + { + "epoch": 86.30790190735695, + "grad_norm": 1.9879213571548462, + "learning_rate": 9.672473448249741e-07, + "loss": 0.1141, + "step": 31675 + }, + { + "epoch": 86.31062670299727, + "grad_norm": 2.3783514499664307, + "learning_rate": 9.668687355021266e-07, + "loss": 0.0229, + "step": 31676 + }, + { + "epoch": 86.3133514986376, + "grad_norm": 2.5844457149505615, + "learning_rate": 9.664901965290163e-07, + "loss": 0.0403, + "step": 31677 + }, + { + "epoch": 86.31607629427793, + "grad_norm": 2.5226974487304688, + "learning_rate": 9.661117279085862e-07, + "loss": 0.0565, + "step": 31678 + }, + { + "epoch": 86.31880108991825, + "grad_norm": 2.8497304916381836, + "learning_rate": 9.6573332964379e-07, + "loss": 0.0582, + "step": 31679 + }, + { + "epoch": 86.32152588555859, + "grad_norm": 2.5396921634674072, + "learning_rate": 9.653550017375724e-07, + "loss": 0.0564, + "step": 31680 + }, + { + "epoch": 86.3242506811989, + "grad_norm": 2.415186643600464, + "learning_rate": 9.64976744192878e-07, + "loss": 0.0755, + "step": 31681 + }, + { + "epoch": 86.32697547683924, + "grad_norm": 2.5656049251556396, + "learning_rate": 9.645985570126526e-07, + "loss": 0.0437, + "step": 31682 + }, + { + "epoch": 86.32970027247957, + "grad_norm": 2.18369197845459, + "learning_rate": 9.642204401998446e-07, + "loss": 0.0396, + "step": 31683 + }, + { + "epoch": 86.33242506811989, + "grad_norm": 2.092224359512329, + "learning_rate": 9.63842393757397e-07, + "loss": 0.0344, + "step": 31684 + }, + { + "epoch": 86.33514986376022, + "grad_norm": 2.9330737590789795, + "learning_rate": 9.634644176882523e-07, + "loss": 0.1577, + "step": 31685 + }, + { + "epoch": 86.33787465940054, + "grad_norm": 4.163845062255859, + "learning_rate": 9.63086511995358e-07, + "loss": 0.0517, + "step": 31686 + }, + { + "epoch": 86.34059945504087, + "grad_norm": 1.6118370294570923, + "learning_rate": 9.62708676681653e-07, + "loss": 0.022, + "step": 31687 + }, + { + "epoch": 86.34332425068119, + "grad_norm": 1.8610044717788696, + "learning_rate": 9.623309117500833e-07, + "loss": 0.0326, + "step": 31688 + }, + { + "epoch": 86.34604904632153, + "grad_norm": 2.1245548725128174, + "learning_rate": 9.619532172035906e-07, + "loss": 0.1534, + "step": 31689 + }, + { + "epoch": 86.34877384196186, + "grad_norm": 3.2282018661499023, + "learning_rate": 9.615755930451144e-07, + "loss": 0.0527, + "step": 31690 + }, + { + "epoch": 86.35149863760218, + "grad_norm": 2.665231227874756, + "learning_rate": 9.611980392775956e-07, + "loss": 0.027, + "step": 31691 + }, + { + "epoch": 86.35422343324251, + "grad_norm": 1.7034244537353516, + "learning_rate": 9.608205559039763e-07, + "loss": 0.0215, + "step": 31692 + }, + { + "epoch": 86.35694822888283, + "grad_norm": 2.240299940109253, + "learning_rate": 9.604431429271965e-07, + "loss": 0.0431, + "step": 31693 + }, + { + "epoch": 86.35967302452316, + "grad_norm": 2.746917963027954, + "learning_rate": 9.600658003501928e-07, + "loss": 0.031, + "step": 31694 + }, + { + "epoch": 86.3623978201635, + "grad_norm": 3.9302194118499756, + "learning_rate": 9.596885281759071e-07, + "loss": 0.097, + "step": 31695 + }, + { + "epoch": 86.36512261580381, + "grad_norm": 2.550478458404541, + "learning_rate": 9.593113264072762e-07, + "loss": 0.0354, + "step": 31696 + }, + { + "epoch": 86.36784741144415, + "grad_norm": 2.1466379165649414, + "learning_rate": 9.589341950472374e-07, + "loss": 0.0285, + "step": 31697 + }, + { + "epoch": 86.37057220708446, + "grad_norm": 2.9122791290283203, + "learning_rate": 9.585571340987265e-07, + "loss": 0.0986, + "step": 31698 + }, + { + "epoch": 86.3732970027248, + "grad_norm": 2.4622130393981934, + "learning_rate": 9.581801435646843e-07, + "loss": 0.0646, + "step": 31699 + }, + { + "epoch": 86.37602179836512, + "grad_norm": 2.4040420055389404, + "learning_rate": 9.578032234480428e-07, + "loss": 0.0262, + "step": 31700 + }, + { + "epoch": 86.37874659400545, + "grad_norm": 2.9493465423583984, + "learning_rate": 9.574263737517398e-07, + "loss": 0.087, + "step": 31701 + }, + { + "epoch": 86.38147138964578, + "grad_norm": 3.674093008041382, + "learning_rate": 9.570495944787062e-07, + "loss": 0.0902, + "step": 31702 + }, + { + "epoch": 86.3841961852861, + "grad_norm": 1.984806776046753, + "learning_rate": 9.566728856318807e-07, + "loss": 0.0305, + "step": 31703 + }, + { + "epoch": 86.38692098092643, + "grad_norm": 1.5852702856063843, + "learning_rate": 9.562962472141967e-07, + "loss": 0.0221, + "step": 31704 + }, + { + "epoch": 86.38964577656675, + "grad_norm": 3.671549081802368, + "learning_rate": 9.559196792285864e-07, + "loss": 0.0425, + "step": 31705 + }, + { + "epoch": 86.39237057220708, + "grad_norm": 2.510288715362549, + "learning_rate": 9.555431816779836e-07, + "loss": 0.0349, + "step": 31706 + }, + { + "epoch": 86.39509536784742, + "grad_norm": 2.7061891555786133, + "learning_rate": 9.551667545653164e-07, + "loss": 0.0582, + "step": 31707 + }, + { + "epoch": 86.39782016348774, + "grad_norm": 3.321589946746826, + "learning_rate": 9.547903978935214e-07, + "loss": 0.0523, + "step": 31708 + }, + { + "epoch": 86.40054495912807, + "grad_norm": 2.741774797439575, + "learning_rate": 9.544141116655282e-07, + "loss": 0.0353, + "step": 31709 + }, + { + "epoch": 86.40326975476839, + "grad_norm": 2.553030252456665, + "learning_rate": 9.540378958842666e-07, + "loss": 0.0639, + "step": 31710 + }, + { + "epoch": 86.40599455040872, + "grad_norm": 2.1983866691589355, + "learning_rate": 9.536617505526647e-07, + "loss": 0.0264, + "step": 31711 + }, + { + "epoch": 86.40871934604904, + "grad_norm": 3.1577227115631104, + "learning_rate": 9.532856756736552e-07, + "loss": 0.0671, + "step": 31712 + }, + { + "epoch": 86.41144414168937, + "grad_norm": 2.494140625, + "learning_rate": 9.529096712501662e-07, + "loss": 0.0475, + "step": 31713 + }, + { + "epoch": 86.4141689373297, + "grad_norm": 1.940166711807251, + "learning_rate": 9.525337372851262e-07, + "loss": 0.0286, + "step": 31714 + }, + { + "epoch": 86.41689373297002, + "grad_norm": 1.5205905437469482, + "learning_rate": 9.521578737814596e-07, + "loss": 0.0274, + "step": 31715 + }, + { + "epoch": 86.41961852861036, + "grad_norm": 3.7131528854370117, + "learning_rate": 9.517820807420985e-07, + "loss": 0.1935, + "step": 31716 + }, + { + "epoch": 86.42234332425068, + "grad_norm": 3.8278331756591797, + "learning_rate": 9.514063581699673e-07, + "loss": 0.0605, + "step": 31717 + }, + { + "epoch": 86.42506811989101, + "grad_norm": 3.2751076221466064, + "learning_rate": 9.510307060679902e-07, + "loss": 0.057, + "step": 31718 + }, + { + "epoch": 86.42779291553134, + "grad_norm": 1.6732395887374878, + "learning_rate": 9.506551244390949e-07, + "loss": 0.0163, + "step": 31719 + }, + { + "epoch": 86.43051771117166, + "grad_norm": 2.4423439502716064, + "learning_rate": 9.50279613286208e-07, + "loss": 0.0477, + "step": 31720 + }, + { + "epoch": 86.433242506812, + "grad_norm": 2.7212328910827637, + "learning_rate": 9.499041726122515e-07, + "loss": 0.0534, + "step": 31721 + }, + { + "epoch": 86.43596730245231, + "grad_norm": 1.925323247909546, + "learning_rate": 9.49528802420151e-07, + "loss": 0.0355, + "step": 31722 + }, + { + "epoch": 86.43869209809264, + "grad_norm": 3.1092705726623535, + "learning_rate": 9.491535027128262e-07, + "loss": 0.0569, + "step": 31723 + }, + { + "epoch": 86.44141689373296, + "grad_norm": 3.6347572803497314, + "learning_rate": 9.487782734932049e-07, + "loss": 0.0532, + "step": 31724 + }, + { + "epoch": 86.4441416893733, + "grad_norm": 2.326617956161499, + "learning_rate": 9.48403114764207e-07, + "loss": 0.098, + "step": 31725 + }, + { + "epoch": 86.44686648501363, + "grad_norm": 2.7363393306732178, + "learning_rate": 9.480280265287545e-07, + "loss": 0.0788, + "step": 31726 + }, + { + "epoch": 86.44959128065395, + "grad_norm": 2.173239231109619, + "learning_rate": 9.476530087897673e-07, + "loss": 0.0289, + "step": 31727 + }, + { + "epoch": 86.45231607629428, + "grad_norm": 1.6472687721252441, + "learning_rate": 9.472780615501675e-07, + "loss": 0.0239, + "step": 31728 + }, + { + "epoch": 86.4550408719346, + "grad_norm": 2.5682032108306885, + "learning_rate": 9.469031848128762e-07, + "loss": 0.0379, + "step": 31729 + }, + { + "epoch": 86.45776566757493, + "grad_norm": 2.8013603687286377, + "learning_rate": 9.4652837858081e-07, + "loss": 0.1393, + "step": 31730 + }, + { + "epoch": 86.46049046321527, + "grad_norm": 7.143606662750244, + "learning_rate": 9.461536428568885e-07, + "loss": 0.0311, + "step": 31731 + }, + { + "epoch": 86.46321525885558, + "grad_norm": 2.643972396850586, + "learning_rate": 9.457789776440329e-07, + "loss": 0.044, + "step": 31732 + }, + { + "epoch": 86.46594005449592, + "grad_norm": 3.4036853313446045, + "learning_rate": 9.454043829451586e-07, + "loss": 0.2029, + "step": 31733 + }, + { + "epoch": 86.46866485013624, + "grad_norm": 2.121493101119995, + "learning_rate": 9.450298587631846e-07, + "loss": 0.0646, + "step": 31734 + }, + { + "epoch": 86.47138964577657, + "grad_norm": 2.426875591278076, + "learning_rate": 9.446554051010238e-07, + "loss": 0.0377, + "step": 31735 + }, + { + "epoch": 86.47411444141689, + "grad_norm": 2.656691312789917, + "learning_rate": 9.442810219615984e-07, + "loss": 0.0436, + "step": 31736 + }, + { + "epoch": 86.47683923705722, + "grad_norm": 2.8276569843292236, + "learning_rate": 9.439067093478171e-07, + "loss": 0.039, + "step": 31737 + }, + { + "epoch": 86.47956403269755, + "grad_norm": 2.29971981048584, + "learning_rate": 9.435324672626023e-07, + "loss": 0.0758, + "step": 31738 + }, + { + "epoch": 86.48228882833787, + "grad_norm": 2.5507752895355225, + "learning_rate": 9.431582957088625e-07, + "loss": 0.0374, + "step": 31739 + }, + { + "epoch": 86.4850136239782, + "grad_norm": 2.6894922256469727, + "learning_rate": 9.427841946895166e-07, + "loss": 0.0278, + "step": 31740 + }, + { + "epoch": 86.48773841961852, + "grad_norm": 2.1117866039276123, + "learning_rate": 9.424101642074756e-07, + "loss": 0.0237, + "step": 31741 + }, + { + "epoch": 86.49046321525886, + "grad_norm": 2.634681463241577, + "learning_rate": 9.420362042656539e-07, + "loss": 0.0397, + "step": 31742 + }, + { + "epoch": 86.49318801089919, + "grad_norm": 2.8264572620391846, + "learning_rate": 9.41662314866959e-07, + "loss": 0.0305, + "step": 31743 + }, + { + "epoch": 86.49591280653951, + "grad_norm": 2.0114846229553223, + "learning_rate": 9.412884960143099e-07, + "loss": 0.0215, + "step": 31744 + }, + { + "epoch": 86.49863760217984, + "grad_norm": 2.80314302444458, + "learning_rate": 9.409147477106139e-07, + "loss": 0.0903, + "step": 31745 + }, + { + "epoch": 86.50136239782016, + "grad_norm": 2.1577348709106445, + "learning_rate": 9.405410699587825e-07, + "loss": 0.0736, + "step": 31746 + }, + { + "epoch": 86.50408719346049, + "grad_norm": 1.879530906677246, + "learning_rate": 9.40167462761723e-07, + "loss": 0.0269, + "step": 31747 + }, + { + "epoch": 86.50681198910081, + "grad_norm": 5.320206165313721, + "learning_rate": 9.397939261223499e-07, + "loss": 0.0373, + "step": 31748 + }, + { + "epoch": 86.50953678474114, + "grad_norm": 4.1179423332214355, + "learning_rate": 9.394204600435708e-07, + "loss": 0.0325, + "step": 31749 + }, + { + "epoch": 86.51226158038148, + "grad_norm": 3.245192050933838, + "learning_rate": 9.390470645282923e-07, + "loss": 0.0913, + "step": 31750 + }, + { + "epoch": 86.5149863760218, + "grad_norm": 4.733980178833008, + "learning_rate": 9.386737395794232e-07, + "loss": 0.0546, + "step": 31751 + }, + { + "epoch": 86.51771117166213, + "grad_norm": 2.638227701187134, + "learning_rate": 9.383004851998723e-07, + "loss": 0.0668, + "step": 31752 + }, + { + "epoch": 86.52043596730245, + "grad_norm": 3.1194350719451904, + "learning_rate": 9.379273013925449e-07, + "loss": 0.1016, + "step": 31753 + }, + { + "epoch": 86.52316076294278, + "grad_norm": 2.7698941230773926, + "learning_rate": 9.375541881603479e-07, + "loss": 0.0289, + "step": 31754 + }, + { + "epoch": 86.52588555858311, + "grad_norm": 2.454678773880005, + "learning_rate": 9.371811455061874e-07, + "loss": 0.1671, + "step": 31755 + }, + { + "epoch": 86.52861035422343, + "grad_norm": 2.9940426349639893, + "learning_rate": 9.368081734329682e-07, + "loss": 0.0616, + "step": 31756 + }, + { + "epoch": 86.53133514986376, + "grad_norm": 3.0953903198242188, + "learning_rate": 9.364352719435965e-07, + "loss": 0.0616, + "step": 31757 + }, + { + "epoch": 86.53405994550408, + "grad_norm": 2.4276750087738037, + "learning_rate": 9.360624410409746e-07, + "loss": 0.0549, + "step": 31758 + }, + { + "epoch": 86.53678474114442, + "grad_norm": 3.2068097591400146, + "learning_rate": 9.356896807280047e-07, + "loss": 0.0746, + "step": 31759 + }, + { + "epoch": 86.53950953678473, + "grad_norm": 2.9232585430145264, + "learning_rate": 9.353169910075944e-07, + "loss": 0.203, + "step": 31760 + }, + { + "epoch": 86.54223433242507, + "grad_norm": 2.7625324726104736, + "learning_rate": 9.349443718826434e-07, + "loss": 0.1773, + "step": 31761 + }, + { + "epoch": 86.5449591280654, + "grad_norm": 2.888930082321167, + "learning_rate": 9.345718233560541e-07, + "loss": 0.0292, + "step": 31762 + }, + { + "epoch": 86.54768392370572, + "grad_norm": 2.8343310356140137, + "learning_rate": 9.341993454307252e-07, + "loss": 0.0463, + "step": 31763 + }, + { + "epoch": 86.55040871934605, + "grad_norm": 1.7458686828613281, + "learning_rate": 9.338269381095632e-07, + "loss": 0.0531, + "step": 31764 + }, + { + "epoch": 86.55313351498637, + "grad_norm": 1.3781216144561768, + "learning_rate": 9.334546013954637e-07, + "loss": 0.0244, + "step": 31765 + }, + { + "epoch": 86.5558583106267, + "grad_norm": 3.210026741027832, + "learning_rate": 9.330823352913287e-07, + "loss": 0.1514, + "step": 31766 + }, + { + "epoch": 86.55858310626704, + "grad_norm": 2.650787353515625, + "learning_rate": 9.327101398000548e-07, + "loss": 0.0203, + "step": 31767 + }, + { + "epoch": 86.56130790190736, + "grad_norm": 2.5487656593322754, + "learning_rate": 9.323380149245442e-07, + "loss": 0.031, + "step": 31768 + }, + { + "epoch": 86.56403269754769, + "grad_norm": 2.2274551391601562, + "learning_rate": 9.319659606676934e-07, + "loss": 0.0447, + "step": 31769 + }, + { + "epoch": 86.566757493188, + "grad_norm": 2.514932870864868, + "learning_rate": 9.315939770324e-07, + "loss": 0.0397, + "step": 31770 + }, + { + "epoch": 86.56948228882834, + "grad_norm": 2.385927438735962, + "learning_rate": 9.312220640215585e-07, + "loss": 0.0283, + "step": 31771 + }, + { + "epoch": 86.57220708446866, + "grad_norm": 3.0768346786499023, + "learning_rate": 9.308502216380677e-07, + "loss": 0.048, + "step": 31772 + }, + { + "epoch": 86.57493188010899, + "grad_norm": 3.3297297954559326, + "learning_rate": 9.304784498848263e-07, + "loss": 0.0755, + "step": 31773 + }, + { + "epoch": 86.57765667574932, + "grad_norm": 2.2790002822875977, + "learning_rate": 9.301067487647253e-07, + "loss": 0.0339, + "step": 31774 + }, + { + "epoch": 86.58038147138964, + "grad_norm": 3.9251515865325928, + "learning_rate": 9.297351182806624e-07, + "loss": 0.0542, + "step": 31775 + }, + { + "epoch": 86.58310626702998, + "grad_norm": 2.3171865940093994, + "learning_rate": 9.293635584355276e-07, + "loss": 0.0292, + "step": 31776 + }, + { + "epoch": 86.5858310626703, + "grad_norm": 2.964221239089966, + "learning_rate": 9.289920692322196e-07, + "loss": 0.147, + "step": 31777 + }, + { + "epoch": 86.58855585831063, + "grad_norm": 2.2152185440063477, + "learning_rate": 9.286206506736306e-07, + "loss": 0.0949, + "step": 31778 + }, + { + "epoch": 86.59128065395096, + "grad_norm": 1.898727297782898, + "learning_rate": 9.282493027626482e-07, + "loss": 0.0271, + "step": 31779 + }, + { + "epoch": 86.59400544959128, + "grad_norm": 3.3184823989868164, + "learning_rate": 9.278780255021713e-07, + "loss": 0.0466, + "step": 31780 + }, + { + "epoch": 86.59673024523161, + "grad_norm": 1.897197961807251, + "learning_rate": 9.275068188950887e-07, + "loss": 0.0414, + "step": 31781 + }, + { + "epoch": 86.59945504087193, + "grad_norm": 2.450909376144409, + "learning_rate": 9.271356829442902e-07, + "loss": 0.2228, + "step": 31782 + }, + { + "epoch": 86.60217983651226, + "grad_norm": 2.1270909309387207, + "learning_rate": 9.267646176526657e-07, + "loss": 0.0239, + "step": 31783 + }, + { + "epoch": 86.60490463215258, + "grad_norm": 2.101029872894287, + "learning_rate": 9.263936230231075e-07, + "loss": 0.0234, + "step": 31784 + }, + { + "epoch": 86.60762942779292, + "grad_norm": 2.107457160949707, + "learning_rate": 9.260226990585042e-07, + "loss": 0.0371, + "step": 31785 + }, + { + "epoch": 86.61035422343325, + "grad_norm": 2.3350908756256104, + "learning_rate": 9.256518457617436e-07, + "loss": 0.0318, + "step": 31786 + }, + { + "epoch": 86.61307901907357, + "grad_norm": 2.550260305404663, + "learning_rate": 9.252810631357134e-07, + "loss": 0.0377, + "step": 31787 + }, + { + "epoch": 86.6158038147139, + "grad_norm": 2.5874295234680176, + "learning_rate": 9.249103511833013e-07, + "loss": 0.1504, + "step": 31788 + }, + { + "epoch": 86.61852861035422, + "grad_norm": 2.730004072189331, + "learning_rate": 9.245397099073971e-07, + "loss": 0.0446, + "step": 31789 + }, + { + "epoch": 86.62125340599455, + "grad_norm": 7.804656028747559, + "learning_rate": 9.241691393108864e-07, + "loss": 0.044, + "step": 31790 + }, + { + "epoch": 86.62397820163488, + "grad_norm": 5.257740497589111, + "learning_rate": 9.237986393966536e-07, + "loss": 0.0382, + "step": 31791 + }, + { + "epoch": 86.6267029972752, + "grad_norm": 1.4204128980636597, + "learning_rate": 9.23428210167584e-07, + "loss": 0.0195, + "step": 31792 + }, + { + "epoch": 86.62942779291554, + "grad_norm": 1.9685324430465698, + "learning_rate": 9.230578516265642e-07, + "loss": 0.0283, + "step": 31793 + }, + { + "epoch": 86.63215258855585, + "grad_norm": 2.91001558303833, + "learning_rate": 9.226875637764788e-07, + "loss": 0.0483, + "step": 31794 + }, + { + "epoch": 86.63487738419619, + "grad_norm": 2.7391185760498047, + "learning_rate": 9.223173466202096e-07, + "loss": 0.105, + "step": 31795 + }, + { + "epoch": 86.6376021798365, + "grad_norm": 2.036832094192505, + "learning_rate": 9.219472001606389e-07, + "loss": 0.0445, + "step": 31796 + }, + { + "epoch": 86.64032697547684, + "grad_norm": 2.2425432205200195, + "learning_rate": 9.215771244006533e-07, + "loss": 0.0974, + "step": 31797 + }, + { + "epoch": 86.64305177111717, + "grad_norm": 4.180068492889404, + "learning_rate": 9.212071193431327e-07, + "loss": 0.1271, + "step": 31798 + }, + { + "epoch": 86.64577656675749, + "grad_norm": 2.0754756927490234, + "learning_rate": 9.208371849909592e-07, + "loss": 0.0266, + "step": 31799 + }, + { + "epoch": 86.64850136239782, + "grad_norm": 2.5021541118621826, + "learning_rate": 9.204673213470105e-07, + "loss": 0.0259, + "step": 31800 + }, + { + "epoch": 86.65122615803814, + "grad_norm": 2.7732303142547607, + "learning_rate": 9.200975284141733e-07, + "loss": 0.0308, + "step": 31801 + }, + { + "epoch": 86.65395095367847, + "grad_norm": 2.38616943359375, + "learning_rate": 9.197278061953241e-07, + "loss": 0.0898, + "step": 31802 + }, + { + "epoch": 86.65667574931881, + "grad_norm": 2.6551296710968018, + "learning_rate": 9.193581546933406e-07, + "loss": 0.0683, + "step": 31803 + }, + { + "epoch": 86.65940054495913, + "grad_norm": 2.102505922317505, + "learning_rate": 9.189885739111048e-07, + "loss": 0.0332, + "step": 31804 + }, + { + "epoch": 86.66212534059946, + "grad_norm": 3.7889506816864014, + "learning_rate": 9.186190638514925e-07, + "loss": 0.141, + "step": 31805 + }, + { + "epoch": 86.66485013623978, + "grad_norm": 1.921257495880127, + "learning_rate": 9.182496245173844e-07, + "loss": 0.0322, + "step": 31806 + }, + { + "epoch": 86.66757493188011, + "grad_norm": 3.020113229751587, + "learning_rate": 9.178802559116551e-07, + "loss": 0.1434, + "step": 31807 + }, + { + "epoch": 86.67029972752043, + "grad_norm": 2.542175531387329, + "learning_rate": 9.175109580371811e-07, + "loss": 0.0213, + "step": 31808 + }, + { + "epoch": 86.67302452316076, + "grad_norm": 2.8657314777374268, + "learning_rate": 9.171417308968411e-07, + "loss": 0.0614, + "step": 31809 + }, + { + "epoch": 86.6757493188011, + "grad_norm": 1.7940597534179688, + "learning_rate": 9.167725744935097e-07, + "loss": 0.0244, + "step": 31810 + }, + { + "epoch": 86.67847411444141, + "grad_norm": 2.6655895709991455, + "learning_rate": 9.1640348883006e-07, + "loss": 0.1663, + "step": 31811 + }, + { + "epoch": 86.68119891008175, + "grad_norm": 3.1102259159088135, + "learning_rate": 9.160344739093663e-07, + "loss": 0.1017, + "step": 31812 + }, + { + "epoch": 86.68392370572207, + "grad_norm": 2.133916139602661, + "learning_rate": 9.156655297343053e-07, + "loss": 0.0239, + "step": 31813 + }, + { + "epoch": 86.6866485013624, + "grad_norm": 2.9862277507781982, + "learning_rate": 9.152966563077492e-07, + "loss": 0.0505, + "step": 31814 + }, + { + "epoch": 86.68937329700273, + "grad_norm": 3.5533385276794434, + "learning_rate": 9.149278536325701e-07, + "loss": 0.0312, + "step": 31815 + }, + { + "epoch": 86.69209809264305, + "grad_norm": 2.2575623989105225, + "learning_rate": 9.145591217116378e-07, + "loss": 0.115, + "step": 31816 + }, + { + "epoch": 86.69482288828338, + "grad_norm": 2.2151005268096924, + "learning_rate": 9.141904605478291e-07, + "loss": 0.0812, + "step": 31817 + }, + { + "epoch": 86.6975476839237, + "grad_norm": 1.6522341966629028, + "learning_rate": 9.138218701440138e-07, + "loss": 0.0297, + "step": 31818 + }, + { + "epoch": 86.70027247956403, + "grad_norm": 2.0549027919769287, + "learning_rate": 9.134533505030596e-07, + "loss": 0.0254, + "step": 31819 + }, + { + "epoch": 86.70299727520435, + "grad_norm": 2.8211066722869873, + "learning_rate": 9.130849016278376e-07, + "loss": 0.1104, + "step": 31820 + }, + { + "epoch": 86.70572207084469, + "grad_norm": 11.08095932006836, + "learning_rate": 9.127165235212199e-07, + "loss": 0.0874, + "step": 31821 + }, + { + "epoch": 86.70844686648502, + "grad_norm": 2.0970847606658936, + "learning_rate": 9.12348216186072e-07, + "loss": 0.0357, + "step": 31822 + }, + { + "epoch": 86.71117166212534, + "grad_norm": 3.2193431854248047, + "learning_rate": 9.119799796252626e-07, + "loss": 0.0341, + "step": 31823 + }, + { + "epoch": 86.71389645776567, + "grad_norm": 3.7054831981658936, + "learning_rate": 9.116118138416619e-07, + "loss": 0.0803, + "step": 31824 + }, + { + "epoch": 86.71662125340599, + "grad_norm": 2.5147147178649902, + "learning_rate": 9.112437188381362e-07, + "loss": 0.0582, + "step": 31825 + }, + { + "epoch": 86.71934604904632, + "grad_norm": 2.2300379276275635, + "learning_rate": 9.108756946175523e-07, + "loss": 0.1179, + "step": 31826 + }, + { + "epoch": 86.72207084468666, + "grad_norm": 4.37146520614624, + "learning_rate": 9.105077411827757e-07, + "loss": 0.1824, + "step": 31827 + }, + { + "epoch": 86.72479564032697, + "grad_norm": 3.2096545696258545, + "learning_rate": 9.101398585366705e-07, + "loss": 0.1223, + "step": 31828 + }, + { + "epoch": 86.7275204359673, + "grad_norm": 3.0343284606933594, + "learning_rate": 9.097720466821059e-07, + "loss": 0.0778, + "step": 31829 + }, + { + "epoch": 86.73024523160763, + "grad_norm": 2.826237678527832, + "learning_rate": 9.094043056219437e-07, + "loss": 0.0406, + "step": 31830 + }, + { + "epoch": 86.73297002724796, + "grad_norm": 3.87508487701416, + "learning_rate": 9.090366353590485e-07, + "loss": 0.0679, + "step": 31831 + }, + { + "epoch": 86.73569482288828, + "grad_norm": 2.8609530925750732, + "learning_rate": 9.086690358962813e-07, + "loss": 0.0408, + "step": 31832 + }, + { + "epoch": 86.73841961852861, + "grad_norm": 3.1503353118896484, + "learning_rate": 9.083015072365087e-07, + "loss": 0.034, + "step": 31833 + }, + { + "epoch": 86.74114441416894, + "grad_norm": 2.6293821334838867, + "learning_rate": 9.079340493825916e-07, + "loss": 0.0878, + "step": 31834 + }, + { + "epoch": 86.74386920980926, + "grad_norm": 1.9450099468231201, + "learning_rate": 9.075666623373913e-07, + "loss": 0.1136, + "step": 31835 + }, + { + "epoch": 86.7465940054496, + "grad_norm": 2.772766351699829, + "learning_rate": 9.071993461037676e-07, + "loss": 0.097, + "step": 31836 + }, + { + "epoch": 86.74931880108991, + "grad_norm": 2.1210412979125977, + "learning_rate": 9.068321006845837e-07, + "loss": 0.0933, + "step": 31837 + }, + { + "epoch": 86.75204359673025, + "grad_norm": 3.3114240169525146, + "learning_rate": 9.064649260826997e-07, + "loss": 0.047, + "step": 31838 + }, + { + "epoch": 86.75476839237058, + "grad_norm": 1.7541974782943726, + "learning_rate": 9.060978223009742e-07, + "loss": 0.0447, + "step": 31839 + }, + { + "epoch": 86.7574931880109, + "grad_norm": 2.293485164642334, + "learning_rate": 9.05730789342264e-07, + "loss": 0.0547, + "step": 31840 + }, + { + "epoch": 86.76021798365123, + "grad_norm": 2.6151113510131836, + "learning_rate": 9.053638272094301e-07, + "loss": 0.0627, + "step": 31841 + }, + { + "epoch": 86.76294277929155, + "grad_norm": 3.138340473175049, + "learning_rate": 9.049969359053312e-07, + "loss": 0.0391, + "step": 31842 + }, + { + "epoch": 86.76566757493188, + "grad_norm": 2.081235647201538, + "learning_rate": 9.046301154328241e-07, + "loss": 0.1178, + "step": 31843 + }, + { + "epoch": 86.7683923705722, + "grad_norm": 2.535001516342163, + "learning_rate": 9.04263365794762e-07, + "loss": 0.0547, + "step": 31844 + }, + { + "epoch": 86.77111716621253, + "grad_norm": 3.6016337871551514, + "learning_rate": 9.038966869940069e-07, + "loss": 0.0424, + "step": 31845 + }, + { + "epoch": 86.77384196185287, + "grad_norm": 2.7954092025756836, + "learning_rate": 9.035300790334112e-07, + "loss": 0.1006, + "step": 31846 + }, + { + "epoch": 86.77656675749319, + "grad_norm": 2.7124500274658203, + "learning_rate": 9.031635419158314e-07, + "loss": 0.0766, + "step": 31847 + }, + { + "epoch": 86.77929155313352, + "grad_norm": 2.300968885421753, + "learning_rate": 9.027970756441184e-07, + "loss": 0.0377, + "step": 31848 + }, + { + "epoch": 86.78201634877384, + "grad_norm": 2.9123425483703613, + "learning_rate": 9.024306802211313e-07, + "loss": 0.0479, + "step": 31849 + }, + { + "epoch": 86.78474114441417, + "grad_norm": 2.441084861755371, + "learning_rate": 9.020643556497211e-07, + "loss": 0.0496, + "step": 31850 + }, + { + "epoch": 86.7874659400545, + "grad_norm": 3.1042938232421875, + "learning_rate": 9.016981019327397e-07, + "loss": 0.085, + "step": 31851 + }, + { + "epoch": 86.79019073569482, + "grad_norm": 2.328429698944092, + "learning_rate": 9.013319190730407e-07, + "loss": 0.0209, + "step": 31852 + }, + { + "epoch": 86.79291553133515, + "grad_norm": 4.259504318237305, + "learning_rate": 9.009658070734762e-07, + "loss": 0.1889, + "step": 31853 + }, + { + "epoch": 86.79564032697547, + "grad_norm": 2.216219902038574, + "learning_rate": 9.005997659368982e-07, + "loss": 0.0207, + "step": 31854 + }, + { + "epoch": 86.7983651226158, + "grad_norm": 2.459240674972534, + "learning_rate": 9.002337956661556e-07, + "loss": 0.0843, + "step": 31855 + }, + { + "epoch": 86.80108991825612, + "grad_norm": 2.159674882888794, + "learning_rate": 8.998678962640983e-07, + "loss": 0.0467, + "step": 31856 + }, + { + "epoch": 86.80381471389646, + "grad_norm": 2.2981133460998535, + "learning_rate": 8.995020677335764e-07, + "loss": 0.0356, + "step": 31857 + }, + { + "epoch": 86.80653950953679, + "grad_norm": 2.905636787414551, + "learning_rate": 8.99136310077442e-07, + "loss": 0.1357, + "step": 31858 + }, + { + "epoch": 86.80926430517711, + "grad_norm": 3.5976691246032715, + "learning_rate": 8.987706232985405e-07, + "loss": 0.0505, + "step": 31859 + }, + { + "epoch": 86.81198910081744, + "grad_norm": 3.997267961502075, + "learning_rate": 8.984050073997197e-07, + "loss": 0.0659, + "step": 31860 + }, + { + "epoch": 86.81471389645776, + "grad_norm": 3.3631575107574463, + "learning_rate": 8.980394623838273e-07, + "loss": 0.0684, + "step": 31861 + }, + { + "epoch": 86.8174386920981, + "grad_norm": 4.546899318695068, + "learning_rate": 8.976739882537122e-07, + "loss": 0.104, + "step": 31862 + }, + { + "epoch": 86.82016348773843, + "grad_norm": 2.5868873596191406, + "learning_rate": 8.973085850122187e-07, + "loss": 0.0408, + "step": 31863 + }, + { + "epoch": 86.82288828337875, + "grad_norm": 4.059663772583008, + "learning_rate": 8.969432526621924e-07, + "loss": 0.0644, + "step": 31864 + }, + { + "epoch": 86.82561307901908, + "grad_norm": 1.9142038822174072, + "learning_rate": 8.965779912064787e-07, + "loss": 0.0543, + "step": 31865 + }, + { + "epoch": 86.8283378746594, + "grad_norm": 2.3329153060913086, + "learning_rate": 8.962128006479232e-07, + "loss": 0.0354, + "step": 31866 + }, + { + "epoch": 86.83106267029973, + "grad_norm": 3.1029655933380127, + "learning_rate": 8.958476809893702e-07, + "loss": 0.0397, + "step": 31867 + }, + { + "epoch": 86.83378746594005, + "grad_norm": 2.926924705505371, + "learning_rate": 8.954826322336596e-07, + "loss": 0.0825, + "step": 31868 + }, + { + "epoch": 86.83651226158038, + "grad_norm": 2.328819513320923, + "learning_rate": 8.951176543836404e-07, + "loss": 0.0427, + "step": 31869 + }, + { + "epoch": 86.83923705722071, + "grad_norm": 1.3802648782730103, + "learning_rate": 8.947527474421513e-07, + "loss": 0.0187, + "step": 31870 + }, + { + "epoch": 86.84196185286103, + "grad_norm": 3.1059184074401855, + "learning_rate": 8.943879114120347e-07, + "loss": 0.0925, + "step": 31871 + }, + { + "epoch": 86.84468664850137, + "grad_norm": 3.1488611698150635, + "learning_rate": 8.940231462961302e-07, + "loss": 0.0365, + "step": 31872 + }, + { + "epoch": 86.84741144414168, + "grad_norm": 3.2357780933380127, + "learning_rate": 8.936584520972824e-07, + "loss": 0.0765, + "step": 31873 + }, + { + "epoch": 86.85013623978202, + "grad_norm": 4.385752201080322, + "learning_rate": 8.932938288183268e-07, + "loss": 0.1023, + "step": 31874 + }, + { + "epoch": 86.85286103542235, + "grad_norm": 1.538090705871582, + "learning_rate": 8.929292764621078e-07, + "loss": 0.0219, + "step": 31875 + }, + { + "epoch": 86.85558583106267, + "grad_norm": 3.7086973190307617, + "learning_rate": 8.925647950314631e-07, + "loss": 0.0296, + "step": 31876 + }, + { + "epoch": 86.858310626703, + "grad_norm": 1.9129804372787476, + "learning_rate": 8.922003845292293e-07, + "loss": 0.0354, + "step": 31877 + }, + { + "epoch": 86.86103542234332, + "grad_norm": 2.6988542079925537, + "learning_rate": 8.918360449582464e-07, + "loss": 0.0794, + "step": 31878 + }, + { + "epoch": 86.86376021798365, + "grad_norm": 2.3943700790405273, + "learning_rate": 8.914717763213521e-07, + "loss": 0.0245, + "step": 31879 + }, + { + "epoch": 86.86648501362397, + "grad_norm": 2.104721784591675, + "learning_rate": 8.911075786213819e-07, + "loss": 0.1231, + "step": 31880 + }, + { + "epoch": 86.8692098092643, + "grad_norm": 2.727410316467285, + "learning_rate": 8.907434518611713e-07, + "loss": 0.0293, + "step": 31881 + }, + { + "epoch": 86.87193460490464, + "grad_norm": 5.318673133850098, + "learning_rate": 8.903793960435592e-07, + "loss": 0.1412, + "step": 31882 + }, + { + "epoch": 86.87465940054496, + "grad_norm": 2.8119523525238037, + "learning_rate": 8.900154111713787e-07, + "loss": 0.0371, + "step": 31883 + }, + { + "epoch": 86.87738419618529, + "grad_norm": 3.3595151901245117, + "learning_rate": 8.896514972474657e-07, + "loss": 0.0228, + "step": 31884 + }, + { + "epoch": 86.88010899182561, + "grad_norm": 2.101471185684204, + "learning_rate": 8.892876542746509e-07, + "loss": 0.0845, + "step": 31885 + }, + { + "epoch": 86.88283378746594, + "grad_norm": 4.005616188049316, + "learning_rate": 8.889238822557733e-07, + "loss": 0.056, + "step": 31886 + }, + { + "epoch": 86.88555858310627, + "grad_norm": 2.5760974884033203, + "learning_rate": 8.885601811936628e-07, + "loss": 0.1622, + "step": 31887 + }, + { + "epoch": 86.88828337874659, + "grad_norm": 1.8493988513946533, + "learning_rate": 8.881965510911506e-07, + "loss": 0.0256, + "step": 31888 + }, + { + "epoch": 86.89100817438693, + "grad_norm": 4.823277950286865, + "learning_rate": 8.87832991951072e-07, + "loss": 0.0253, + "step": 31889 + }, + { + "epoch": 86.89373297002724, + "grad_norm": 2.7438676357269287, + "learning_rate": 8.874695037762571e-07, + "loss": 0.1183, + "step": 31890 + }, + { + "epoch": 86.89645776566758, + "grad_norm": 2.3376359939575195, + "learning_rate": 8.871060865695347e-07, + "loss": 0.0327, + "step": 31891 + }, + { + "epoch": 86.8991825613079, + "grad_norm": 2.2812001705169678, + "learning_rate": 8.867427403337392e-07, + "loss": 0.0224, + "step": 31892 + }, + { + "epoch": 86.90190735694823, + "grad_norm": 1.6706823110580444, + "learning_rate": 8.86379465071695e-07, + "loss": 0.0216, + "step": 31893 + }, + { + "epoch": 86.90463215258856, + "grad_norm": 5.328125, + "learning_rate": 8.860162607862366e-07, + "loss": 0.0358, + "step": 31894 + }, + { + "epoch": 86.90735694822888, + "grad_norm": 2.010127544403076, + "learning_rate": 8.856531274801904e-07, + "loss": 0.1028, + "step": 31895 + }, + { + "epoch": 86.91008174386921, + "grad_norm": 2.0606815814971924, + "learning_rate": 8.852900651563833e-07, + "loss": 0.0237, + "step": 31896 + }, + { + "epoch": 86.91280653950953, + "grad_norm": 2.7134268283843994, + "learning_rate": 8.84927073817643e-07, + "loss": 0.0866, + "step": 31897 + }, + { + "epoch": 86.91553133514986, + "grad_norm": 2.1887168884277344, + "learning_rate": 8.845641534667993e-07, + "loss": 0.0237, + "step": 31898 + }, + { + "epoch": 86.9182561307902, + "grad_norm": 2.4767327308654785, + "learning_rate": 8.842013041066754e-07, + "loss": 0.1119, + "step": 31899 + }, + { + "epoch": 86.92098092643052, + "grad_norm": 3.3079845905303955, + "learning_rate": 8.838385257400994e-07, + "loss": 0.043, + "step": 31900 + }, + { + "epoch": 86.92370572207085, + "grad_norm": 1.898982048034668, + "learning_rate": 8.834758183698933e-07, + "loss": 0.0299, + "step": 31901 + }, + { + "epoch": 86.92643051771117, + "grad_norm": 2.012143611907959, + "learning_rate": 8.831131819988859e-07, + "loss": 0.0359, + "step": 31902 + }, + { + "epoch": 86.9291553133515, + "grad_norm": 2.660198926925659, + "learning_rate": 8.827506166298994e-07, + "loss": 0.1469, + "step": 31903 + }, + { + "epoch": 86.93188010899182, + "grad_norm": 2.0650031566619873, + "learning_rate": 8.823881222657582e-07, + "loss": 0.0967, + "step": 31904 + }, + { + "epoch": 86.93460490463215, + "grad_norm": 2.527787208557129, + "learning_rate": 8.820256989092824e-07, + "loss": 0.07, + "step": 31905 + }, + { + "epoch": 86.93732970027249, + "grad_norm": 2.7898435592651367, + "learning_rate": 8.816633465632996e-07, + "loss": 0.1494, + "step": 31906 + }, + { + "epoch": 86.9400544959128, + "grad_norm": 1.7793904542922974, + "learning_rate": 8.813010652306286e-07, + "loss": 0.0227, + "step": 31907 + }, + { + "epoch": 86.94277929155314, + "grad_norm": 3.2279844284057617, + "learning_rate": 8.809388549140918e-07, + "loss": 0.0329, + "step": 31908 + }, + { + "epoch": 86.94550408719346, + "grad_norm": 1.4497243165969849, + "learning_rate": 8.805767156165057e-07, + "loss": 0.0203, + "step": 31909 + }, + { + "epoch": 86.94822888283379, + "grad_norm": 4.106661319732666, + "learning_rate": 8.802146473406991e-07, + "loss": 0.1039, + "step": 31910 + }, + { + "epoch": 86.95095367847412, + "grad_norm": 2.7305715084075928, + "learning_rate": 8.798526500894866e-07, + "loss": 0.0335, + "step": 31911 + }, + { + "epoch": 86.95367847411444, + "grad_norm": 2.0169501304626465, + "learning_rate": 8.79490723865688e-07, + "loss": 0.0247, + "step": 31912 + }, + { + "epoch": 86.95640326975477, + "grad_norm": 3.3821303844451904, + "learning_rate": 8.7912886867212e-07, + "loss": 0.0529, + "step": 31913 + }, + { + "epoch": 86.95912806539509, + "grad_norm": 4.41207218170166, + "learning_rate": 8.787670845116059e-07, + "loss": 0.1172, + "step": 31914 + }, + { + "epoch": 86.96185286103542, + "grad_norm": 2.8587772846221924, + "learning_rate": 8.784053713869589e-07, + "loss": 0.0516, + "step": 31915 + }, + { + "epoch": 86.96457765667574, + "grad_norm": 3.60770320892334, + "learning_rate": 8.78043729300998e-07, + "loss": 0.0603, + "step": 31916 + }, + { + "epoch": 86.96730245231608, + "grad_norm": 3.2521111965179443, + "learning_rate": 8.776821582565365e-07, + "loss": 0.0331, + "step": 31917 + }, + { + "epoch": 86.97002724795641, + "grad_norm": 2.495760917663574, + "learning_rate": 8.773206582563953e-07, + "loss": 0.0235, + "step": 31918 + }, + { + "epoch": 86.97275204359673, + "grad_norm": 4.632887363433838, + "learning_rate": 8.769592293033868e-07, + "loss": 0.036, + "step": 31919 + }, + { + "epoch": 86.97547683923706, + "grad_norm": 1.7221351861953735, + "learning_rate": 8.765978714003265e-07, + "loss": 0.0354, + "step": 31920 + }, + { + "epoch": 86.97820163487738, + "grad_norm": 2.451761245727539, + "learning_rate": 8.762365845500265e-07, + "loss": 0.0454, + "step": 31921 + }, + { + "epoch": 86.98092643051771, + "grad_norm": 4.969675064086914, + "learning_rate": 8.758753687553035e-07, + "loss": 0.1991, + "step": 31922 + }, + { + "epoch": 86.98365122615803, + "grad_norm": 1.9271904230117798, + "learning_rate": 8.755142240189706e-07, + "loss": 0.0205, + "step": 31923 + }, + { + "epoch": 86.98637602179836, + "grad_norm": 2.6992568969726562, + "learning_rate": 8.751531503438382e-07, + "loss": 0.041, + "step": 31924 + }, + { + "epoch": 86.9891008174387, + "grad_norm": 2.373265266418457, + "learning_rate": 8.747921477327182e-07, + "loss": 0.1707, + "step": 31925 + }, + { + "epoch": 86.99182561307902, + "grad_norm": 2.343313455581665, + "learning_rate": 8.744312161884228e-07, + "loss": 0.0607, + "step": 31926 + }, + { + "epoch": 86.99455040871935, + "grad_norm": 1.9195460081100464, + "learning_rate": 8.740703557137653e-07, + "loss": 0.0277, + "step": 31927 + }, + { + "epoch": 86.99727520435967, + "grad_norm": 1.5488792657852173, + "learning_rate": 8.737095663115547e-07, + "loss": 0.1361, + "step": 31928 + }, + { + "epoch": 87.0, + "grad_norm": 2.9402854442596436, + "learning_rate": 8.733488479845997e-07, + "loss": 0.0556, + "step": 31929 + }, + { + "epoch": 87.00272479564033, + "grad_norm": 2.30751895904541, + "learning_rate": 8.729882007357083e-07, + "loss": 0.026, + "step": 31930 + }, + { + "epoch": 87.00544959128065, + "grad_norm": 2.3755152225494385, + "learning_rate": 8.726276245676934e-07, + "loss": 0.1469, + "step": 31931 + }, + { + "epoch": 87.00817438692098, + "grad_norm": 2.6640377044677734, + "learning_rate": 8.722671194833598e-07, + "loss": 0.038, + "step": 31932 + }, + { + "epoch": 87.0108991825613, + "grad_norm": 2.6814212799072266, + "learning_rate": 8.719066854855151e-07, + "loss": 0.1313, + "step": 31933 + }, + { + "epoch": 87.01362397820164, + "grad_norm": 2.758610248565674, + "learning_rate": 8.715463225769693e-07, + "loss": 0.0336, + "step": 31934 + }, + { + "epoch": 87.01634877384195, + "grad_norm": 3.4616310596466064, + "learning_rate": 8.711860307605257e-07, + "loss": 0.1166, + "step": 31935 + }, + { + "epoch": 87.01907356948229, + "grad_norm": 1.5524550676345825, + "learning_rate": 8.708258100389933e-07, + "loss": 0.0221, + "step": 31936 + }, + { + "epoch": 87.02179836512262, + "grad_norm": 2.028284788131714, + "learning_rate": 8.704656604151729e-07, + "loss": 0.0186, + "step": 31937 + }, + { + "epoch": 87.02452316076294, + "grad_norm": 3.196913480758667, + "learning_rate": 8.701055818918736e-07, + "loss": 0.0307, + "step": 31938 + }, + { + "epoch": 87.02724795640327, + "grad_norm": 3.3685288429260254, + "learning_rate": 8.697455744718985e-07, + "loss": 0.0929, + "step": 31939 + }, + { + "epoch": 87.02997275204359, + "grad_norm": 2.4672834873199463, + "learning_rate": 8.693856381580512e-07, + "loss": 0.1396, + "step": 31940 + }, + { + "epoch": 87.03269754768392, + "grad_norm": 2.7180583477020264, + "learning_rate": 8.690257729531326e-07, + "loss": 0.0294, + "step": 31941 + }, + { + "epoch": 87.03542234332426, + "grad_norm": 1.4101189374923706, + "learning_rate": 8.686659788599494e-07, + "loss": 0.0237, + "step": 31942 + }, + { + "epoch": 87.03814713896458, + "grad_norm": 13.789135932922363, + "learning_rate": 8.683062558812994e-07, + "loss": 0.0596, + "step": 31943 + }, + { + "epoch": 87.04087193460491, + "grad_norm": 3.0247530937194824, + "learning_rate": 8.679466040199891e-07, + "loss": 0.0793, + "step": 31944 + }, + { + "epoch": 87.04359673024523, + "grad_norm": 3.7759997844696045, + "learning_rate": 8.675870232788164e-07, + "loss": 0.1435, + "step": 31945 + }, + { + "epoch": 87.04632152588556, + "grad_norm": 3.1340579986572266, + "learning_rate": 8.672275136605801e-07, + "loss": 0.1152, + "step": 31946 + }, + { + "epoch": 87.04904632152588, + "grad_norm": 2.5545504093170166, + "learning_rate": 8.668680751680836e-07, + "loss": 0.0429, + "step": 31947 + }, + { + "epoch": 87.05177111716621, + "grad_norm": 2.539555549621582, + "learning_rate": 8.665087078041245e-07, + "loss": 0.0214, + "step": 31948 + }, + { + "epoch": 87.05449591280654, + "grad_norm": 1.6589235067367554, + "learning_rate": 8.661494115715019e-07, + "loss": 0.0223, + "step": 31949 + }, + { + "epoch": 87.05722070844686, + "grad_norm": 2.8541224002838135, + "learning_rate": 8.657901864730112e-07, + "loss": 0.0499, + "step": 31950 + }, + { + "epoch": 87.0599455040872, + "grad_norm": 3.6259543895721436, + "learning_rate": 8.654310325114557e-07, + "loss": 0.0718, + "step": 31951 + }, + { + "epoch": 87.06267029972751, + "grad_norm": 6.198474407196045, + "learning_rate": 8.650719496896287e-07, + "loss": 0.0982, + "step": 31952 + }, + { + "epoch": 87.06539509536785, + "grad_norm": 2.609693765640259, + "learning_rate": 8.647129380103248e-07, + "loss": 0.0179, + "step": 31953 + }, + { + "epoch": 87.06811989100818, + "grad_norm": 2.1050493717193604, + "learning_rate": 8.643539974763449e-07, + "loss": 0.0784, + "step": 31954 + }, + { + "epoch": 87.0708446866485, + "grad_norm": 1.9728049039840698, + "learning_rate": 8.639951280904824e-07, + "loss": 0.1097, + "step": 31955 + }, + { + "epoch": 87.07356948228883, + "grad_norm": 2.081594467163086, + "learning_rate": 8.636363298555317e-07, + "loss": 0.0273, + "step": 31956 + }, + { + "epoch": 87.07629427792915, + "grad_norm": 1.9430947303771973, + "learning_rate": 8.632776027742851e-07, + "loss": 0.1135, + "step": 31957 + }, + { + "epoch": 87.07901907356948, + "grad_norm": 2.7454442977905273, + "learning_rate": 8.629189468495402e-07, + "loss": 0.0389, + "step": 31958 + }, + { + "epoch": 87.0817438692098, + "grad_norm": 5.959187984466553, + "learning_rate": 8.625603620840894e-07, + "loss": 0.0393, + "step": 31959 + }, + { + "epoch": 87.08446866485014, + "grad_norm": 1.8962658643722534, + "learning_rate": 8.622018484807215e-07, + "loss": 0.0295, + "step": 31960 + }, + { + "epoch": 87.08719346049047, + "grad_norm": 10.90555477142334, + "learning_rate": 8.618434060422331e-07, + "loss": 0.057, + "step": 31961 + }, + { + "epoch": 87.08991825613079, + "grad_norm": 2.2312071323394775, + "learning_rate": 8.614850347714132e-07, + "loss": 0.0691, + "step": 31962 + }, + { + "epoch": 87.09264305177112, + "grad_norm": 2.277768850326538, + "learning_rate": 8.61126734671055e-07, + "loss": 0.0458, + "step": 31963 + }, + { + "epoch": 87.09536784741144, + "grad_norm": 2.634031057357788, + "learning_rate": 8.607685057439486e-07, + "loss": 0.044, + "step": 31964 + }, + { + "epoch": 87.09809264305177, + "grad_norm": 1.797587275505066, + "learning_rate": 8.604103479928815e-07, + "loss": 0.0279, + "step": 31965 + }, + { + "epoch": 87.1008174386921, + "grad_norm": 3.5806045532226562, + "learning_rate": 8.600522614206442e-07, + "loss": 0.1663, + "step": 31966 + }, + { + "epoch": 87.10354223433242, + "grad_norm": 1.9146403074264526, + "learning_rate": 8.596942460300261e-07, + "loss": 0.0673, + "step": 31967 + }, + { + "epoch": 87.10626702997276, + "grad_norm": 3.6403446197509766, + "learning_rate": 8.593363018238154e-07, + "loss": 0.0812, + "step": 31968 + }, + { + "epoch": 87.10899182561307, + "grad_norm": 2.977989912033081, + "learning_rate": 8.589784288047997e-07, + "loss": 0.0325, + "step": 31969 + }, + { + "epoch": 87.11171662125341, + "grad_norm": 1.993374228477478, + "learning_rate": 8.586206269757647e-07, + "loss": 0.0668, + "step": 31970 + }, + { + "epoch": 87.11444141689373, + "grad_norm": 2.3206489086151123, + "learning_rate": 8.58262896339499e-07, + "loss": 0.0424, + "step": 31971 + }, + { + "epoch": 87.11716621253406, + "grad_norm": 3.1360924243927, + "learning_rate": 8.579052368987872e-07, + "loss": 0.0473, + "step": 31972 + }, + { + "epoch": 87.11989100817439, + "grad_norm": 2.342132329940796, + "learning_rate": 8.57547648656416e-07, + "loss": 0.1698, + "step": 31973 + }, + { + "epoch": 87.12261580381471, + "grad_norm": 2.187732458114624, + "learning_rate": 8.571901316151676e-07, + "loss": 0.0246, + "step": 31974 + }, + { + "epoch": 87.12534059945504, + "grad_norm": 1.0331571102142334, + "learning_rate": 8.568326857778297e-07, + "loss": 0.0133, + "step": 31975 + }, + { + "epoch": 87.12806539509536, + "grad_norm": 2.2067832946777344, + "learning_rate": 8.564753111471847e-07, + "loss": 0.0335, + "step": 31976 + }, + { + "epoch": 87.1307901907357, + "grad_norm": 2.947394609451294, + "learning_rate": 8.561180077260134e-07, + "loss": 0.0362, + "step": 31977 + }, + { + "epoch": 87.13351498637603, + "grad_norm": 2.036851406097412, + "learning_rate": 8.557607755171016e-07, + "loss": 0.024, + "step": 31978 + }, + { + "epoch": 87.13623978201635, + "grad_norm": 1.8236857652664185, + "learning_rate": 8.554036145232314e-07, + "loss": 0.0243, + "step": 31979 + }, + { + "epoch": 87.13896457765668, + "grad_norm": 1.9249520301818848, + "learning_rate": 8.550465247471839e-07, + "loss": 0.0346, + "step": 31980 + }, + { + "epoch": 87.141689373297, + "grad_norm": 2.917386770248413, + "learning_rate": 8.546895061917404e-07, + "loss": 0.0836, + "step": 31981 + }, + { + "epoch": 87.14441416893733, + "grad_norm": 3.850255250930786, + "learning_rate": 8.543325588596785e-07, + "loss": 0.0261, + "step": 31982 + }, + { + "epoch": 87.14713896457765, + "grad_norm": 2.069046974182129, + "learning_rate": 8.539756827537815e-07, + "loss": 0.0389, + "step": 31983 + }, + { + "epoch": 87.14986376021798, + "grad_norm": 9.028697967529297, + "learning_rate": 8.536188778768284e-07, + "loss": 0.0376, + "step": 31984 + }, + { + "epoch": 87.15258855585832, + "grad_norm": 4.243398666381836, + "learning_rate": 8.53262144231597e-07, + "loss": 0.0577, + "step": 31985 + }, + { + "epoch": 87.15531335149863, + "grad_norm": 2.879706382751465, + "learning_rate": 8.529054818208638e-07, + "loss": 0.0732, + "step": 31986 + }, + { + "epoch": 87.15803814713897, + "grad_norm": 2.511085033416748, + "learning_rate": 8.525488906474089e-07, + "loss": 0.1094, + "step": 31987 + }, + { + "epoch": 87.16076294277929, + "grad_norm": 1.7432821989059448, + "learning_rate": 8.521923707140101e-07, + "loss": 0.0207, + "step": 31988 + }, + { + "epoch": 87.16348773841962, + "grad_norm": 3.6034116744995117, + "learning_rate": 8.518359220234429e-07, + "loss": 0.0448, + "step": 31989 + }, + { + "epoch": 87.16621253405995, + "grad_norm": 1.8865264654159546, + "learning_rate": 8.514795445784807e-07, + "loss": 0.0292, + "step": 31990 + }, + { + "epoch": 87.16893732970027, + "grad_norm": 5.443391799926758, + "learning_rate": 8.511232383819024e-07, + "loss": 0.1571, + "step": 31991 + }, + { + "epoch": 87.1716621253406, + "grad_norm": 3.189753293991089, + "learning_rate": 8.507670034364834e-07, + "loss": 0.0864, + "step": 31992 + }, + { + "epoch": 87.17438692098092, + "grad_norm": 2.250596046447754, + "learning_rate": 8.504108397449962e-07, + "loss": 0.025, + "step": 31993 + }, + { + "epoch": 87.17711171662125, + "grad_norm": 2.4600954055786133, + "learning_rate": 8.500547473102116e-07, + "loss": 0.0389, + "step": 31994 + }, + { + "epoch": 87.17983651226157, + "grad_norm": 3.1625146865844727, + "learning_rate": 8.496987261349077e-07, + "loss": 0.0632, + "step": 31995 + }, + { + "epoch": 87.1825613079019, + "grad_norm": 3.342609167098999, + "learning_rate": 8.493427762218575e-07, + "loss": 0.0461, + "step": 31996 + }, + { + "epoch": 87.18528610354224, + "grad_norm": 4.623934268951416, + "learning_rate": 8.489868975738303e-07, + "loss": 0.0715, + "step": 31997 + }, + { + "epoch": 87.18801089918256, + "grad_norm": 2.85520601272583, + "learning_rate": 8.486310901935968e-07, + "loss": 0.0348, + "step": 31998 + }, + { + "epoch": 87.19073569482289, + "grad_norm": 2.3970866203308105, + "learning_rate": 8.482753540839328e-07, + "loss": 0.0296, + "step": 31999 + }, + { + "epoch": 87.19346049046321, + "grad_norm": 4.5319342613220215, + "learning_rate": 8.479196892476049e-07, + "loss": 0.0769, + "step": 32000 + }, + { + "epoch": 87.19618528610354, + "grad_norm": 3.3380751609802246, + "learning_rate": 8.475640956873843e-07, + "loss": 0.077, + "step": 32001 + }, + { + "epoch": 87.19891008174388, + "grad_norm": 2.58056640625, + "learning_rate": 8.472085734060376e-07, + "loss": 0.0666, + "step": 32002 + }, + { + "epoch": 87.2016348773842, + "grad_norm": 2.57891845703125, + "learning_rate": 8.468531224063381e-07, + "loss": 0.0326, + "step": 32003 + }, + { + "epoch": 87.20435967302453, + "grad_norm": 2.006296157836914, + "learning_rate": 8.464977426910514e-07, + "loss": 0.0281, + "step": 32004 + }, + { + "epoch": 87.20708446866485, + "grad_norm": 2.3370838165283203, + "learning_rate": 8.461424342629465e-07, + "loss": 0.0364, + "step": 32005 + }, + { + "epoch": 87.20980926430518, + "grad_norm": 2.5445826053619385, + "learning_rate": 8.457871971247877e-07, + "loss": 0.1144, + "step": 32006 + }, + { + "epoch": 87.2125340599455, + "grad_norm": 2.2657854557037354, + "learning_rate": 8.454320312793451e-07, + "loss": 0.0289, + "step": 32007 + }, + { + "epoch": 87.21525885558583, + "grad_norm": 6.7753825187683105, + "learning_rate": 8.450769367293832e-07, + "loss": 0.0304, + "step": 32008 + }, + { + "epoch": 87.21798365122616, + "grad_norm": 1.9065998792648315, + "learning_rate": 8.447219134776674e-07, + "loss": 0.0217, + "step": 32009 + }, + { + "epoch": 87.22070844686648, + "grad_norm": 2.338294744491577, + "learning_rate": 8.443669615269611e-07, + "loss": 0.1282, + "step": 32010 + }, + { + "epoch": 87.22343324250681, + "grad_norm": 2.3199870586395264, + "learning_rate": 8.440120808800323e-07, + "loss": 0.0515, + "step": 32011 + }, + { + "epoch": 87.22615803814713, + "grad_norm": 2.0141749382019043, + "learning_rate": 8.436572715396407e-07, + "loss": 0.0718, + "step": 32012 + }, + { + "epoch": 87.22888283378747, + "grad_norm": 2.863680362701416, + "learning_rate": 8.433025335085532e-07, + "loss": 0.0327, + "step": 32013 + }, + { + "epoch": 87.2316076294278, + "grad_norm": 2.172550916671753, + "learning_rate": 8.429478667895307e-07, + "loss": 0.0244, + "step": 32014 + }, + { + "epoch": 87.23433242506812, + "grad_norm": 3.00764799118042, + "learning_rate": 8.425932713853346e-07, + "loss": 0.0572, + "step": 32015 + }, + { + "epoch": 87.23705722070845, + "grad_norm": 15.083392143249512, + "learning_rate": 8.422387472987281e-07, + "loss": 0.0299, + "step": 32016 + }, + { + "epoch": 87.23978201634877, + "grad_norm": 2.5588722229003906, + "learning_rate": 8.418842945324724e-07, + "loss": 0.0271, + "step": 32017 + }, + { + "epoch": 87.2425068119891, + "grad_norm": 4.644388198852539, + "learning_rate": 8.415299130893251e-07, + "loss": 0.0737, + "step": 32018 + }, + { + "epoch": 87.24523160762942, + "grad_norm": 2.2760121822357178, + "learning_rate": 8.411756029720497e-07, + "loss": 0.0431, + "step": 32019 + }, + { + "epoch": 87.24795640326975, + "grad_norm": 2.807145118713379, + "learning_rate": 8.408213641834029e-07, + "loss": 0.0366, + "step": 32020 + }, + { + "epoch": 87.25068119891009, + "grad_norm": 1.9172195196151733, + "learning_rate": 8.404671967261457e-07, + "loss": 0.0674, + "step": 32021 + }, + { + "epoch": 87.2534059945504, + "grad_norm": 2.739680528640747, + "learning_rate": 8.401131006030327e-07, + "loss": 0.0451, + "step": 32022 + }, + { + "epoch": 87.25613079019074, + "grad_norm": 3.617414951324463, + "learning_rate": 8.397590758168272e-07, + "loss": 0.128, + "step": 32023 + }, + { + "epoch": 87.25885558583106, + "grad_norm": 2.3763816356658936, + "learning_rate": 8.394051223702815e-07, + "loss": 0.0491, + "step": 32024 + }, + { + "epoch": 87.26158038147139, + "grad_norm": 3.6216704845428467, + "learning_rate": 8.390512402661555e-07, + "loss": 0.1775, + "step": 32025 + }, + { + "epoch": 87.26430517711172, + "grad_norm": 2.240335464477539, + "learning_rate": 8.386974295072004e-07, + "loss": 0.025, + "step": 32026 + }, + { + "epoch": 87.26702997275204, + "grad_norm": 2.863473653793335, + "learning_rate": 8.383436900961772e-07, + "loss": 0.072, + "step": 32027 + }, + { + "epoch": 87.26975476839237, + "grad_norm": 3.8904831409454346, + "learning_rate": 8.379900220358384e-07, + "loss": 0.0481, + "step": 32028 + }, + { + "epoch": 87.2724795640327, + "grad_norm": 2.4198544025421143, + "learning_rate": 8.376364253289371e-07, + "loss": 0.1564, + "step": 32029 + }, + { + "epoch": 87.27520435967303, + "grad_norm": 2.7671501636505127, + "learning_rate": 8.372828999782301e-07, + "loss": 0.0377, + "step": 32030 + }, + { + "epoch": 87.27792915531334, + "grad_norm": 2.004340887069702, + "learning_rate": 8.369294459864663e-07, + "loss": 0.0227, + "step": 32031 + }, + { + "epoch": 87.28065395095368, + "grad_norm": 2.9251890182495117, + "learning_rate": 8.365760633564035e-07, + "loss": 0.0939, + "step": 32032 + }, + { + "epoch": 87.28337874659401, + "grad_norm": 4.655163764953613, + "learning_rate": 8.362227520907918e-07, + "loss": 0.0331, + "step": 32033 + }, + { + "epoch": 87.28610354223433, + "grad_norm": 3.044646978378296, + "learning_rate": 8.35869512192381e-07, + "loss": 0.035, + "step": 32034 + }, + { + "epoch": 87.28882833787466, + "grad_norm": 2.171783924102783, + "learning_rate": 8.355163436639236e-07, + "loss": 0.0323, + "step": 32035 + }, + { + "epoch": 87.29155313351498, + "grad_norm": 1.5490366220474243, + "learning_rate": 8.351632465081705e-07, + "loss": 0.2205, + "step": 32036 + }, + { + "epoch": 87.29427792915531, + "grad_norm": 2.554487466812134, + "learning_rate": 8.348102207278708e-07, + "loss": 0.1241, + "step": 32037 + }, + { + "epoch": 87.29700272479565, + "grad_norm": 1.847252607345581, + "learning_rate": 8.344572663257755e-07, + "loss": 0.0343, + "step": 32038 + }, + { + "epoch": 87.29972752043597, + "grad_norm": 2.1390950679779053, + "learning_rate": 8.341043833046292e-07, + "loss": 0.0283, + "step": 32039 + }, + { + "epoch": 87.3024523160763, + "grad_norm": 3.2583892345428467, + "learning_rate": 8.337515716671851e-07, + "loss": 0.1564, + "step": 32040 + }, + { + "epoch": 87.30517711171662, + "grad_norm": 3.5399813652038574, + "learning_rate": 8.333988314161879e-07, + "loss": 0.0613, + "step": 32041 + }, + { + "epoch": 87.30790190735695, + "grad_norm": 3.7903201580047607, + "learning_rate": 8.33046162554385e-07, + "loss": 0.0641, + "step": 32042 + }, + { + "epoch": 87.31062670299727, + "grad_norm": 5.673577308654785, + "learning_rate": 8.326935650845247e-07, + "loss": 0.0978, + "step": 32043 + }, + { + "epoch": 87.3133514986376, + "grad_norm": 2.934593915939331, + "learning_rate": 8.323410390093523e-07, + "loss": 0.0689, + "step": 32044 + }, + { + "epoch": 87.31607629427793, + "grad_norm": 3.9851810932159424, + "learning_rate": 8.319885843316123e-07, + "loss": 0.0618, + "step": 32045 + }, + { + "epoch": 87.31880108991825, + "grad_norm": 3.383972644805908, + "learning_rate": 8.316362010540479e-07, + "loss": 0.1647, + "step": 32046 + }, + { + "epoch": 87.32152588555859, + "grad_norm": 2.7322640419006348, + "learning_rate": 8.312838891794073e-07, + "loss": 0.0832, + "step": 32047 + }, + { + "epoch": 87.3242506811989, + "grad_norm": 3.392420768737793, + "learning_rate": 8.309316487104335e-07, + "loss": 0.0846, + "step": 32048 + }, + { + "epoch": 87.32697547683924, + "grad_norm": 3.0945212841033936, + "learning_rate": 8.305794796498689e-07, + "loss": 0.0451, + "step": 32049 + }, + { + "epoch": 87.32970027247957, + "grad_norm": 2.9162776470184326, + "learning_rate": 8.302273820004558e-07, + "loss": 0.1233, + "step": 32050 + }, + { + "epoch": 87.33242506811989, + "grad_norm": 3.2233474254608154, + "learning_rate": 8.298753557649353e-07, + "loss": 0.0765, + "step": 32051 + }, + { + "epoch": 87.33514986376022, + "grad_norm": 1.705782413482666, + "learning_rate": 8.295234009460529e-07, + "loss": 0.027, + "step": 32052 + }, + { + "epoch": 87.33787465940054, + "grad_norm": 2.5130674839019775, + "learning_rate": 8.291715175465453e-07, + "loss": 0.0302, + "step": 32053 + }, + { + "epoch": 87.34059945504087, + "grad_norm": 4.544942855834961, + "learning_rate": 8.288197055691561e-07, + "loss": 0.0852, + "step": 32054 + }, + { + "epoch": 87.34332425068119, + "grad_norm": 3.1552555561065674, + "learning_rate": 8.284679650166227e-07, + "loss": 0.1218, + "step": 32055 + }, + { + "epoch": 87.34604904632153, + "grad_norm": 2.733889579772949, + "learning_rate": 8.281162958916866e-07, + "loss": 0.116, + "step": 32056 + }, + { + "epoch": 87.34877384196186, + "grad_norm": 3.0717015266418457, + "learning_rate": 8.277646981970855e-07, + "loss": 0.1185, + "step": 32057 + }, + { + "epoch": 87.35149863760218, + "grad_norm": 2.7397303581237793, + "learning_rate": 8.274131719355571e-07, + "loss": 0.0383, + "step": 32058 + }, + { + "epoch": 87.35422343324251, + "grad_norm": 2.4850943088531494, + "learning_rate": 8.270617171098383e-07, + "loss": 0.0369, + "step": 32059 + }, + { + "epoch": 87.35694822888283, + "grad_norm": 5.439486503601074, + "learning_rate": 8.2671033372267e-07, + "loss": 0.0525, + "step": 32060 + }, + { + "epoch": 87.35967302452316, + "grad_norm": 2.633753538131714, + "learning_rate": 8.263590217767858e-07, + "loss": 0.1182, + "step": 32061 + }, + { + "epoch": 87.3623978201635, + "grad_norm": 3.2475616931915283, + "learning_rate": 8.260077812749212e-07, + "loss": 0.1208, + "step": 32062 + }, + { + "epoch": 87.36512261580381, + "grad_norm": 2.1586110591888428, + "learning_rate": 8.25656612219814e-07, + "loss": 0.1158, + "step": 32063 + }, + { + "epoch": 87.36784741144415, + "grad_norm": 2.7510464191436768, + "learning_rate": 8.253055146141964e-07, + "loss": 0.0754, + "step": 32064 + }, + { + "epoch": 87.37057220708446, + "grad_norm": 3.917447805404663, + "learning_rate": 8.249544884608052e-07, + "loss": 0.1799, + "step": 32065 + }, + { + "epoch": 87.3732970027248, + "grad_norm": 2.3031461238861084, + "learning_rate": 8.246035337623737e-07, + "loss": 0.0312, + "step": 32066 + }, + { + "epoch": 87.37602179836512, + "grad_norm": 10.528989791870117, + "learning_rate": 8.24252650521633e-07, + "loss": 0.031, + "step": 32067 + }, + { + "epoch": 87.37874659400545, + "grad_norm": 2.054379940032959, + "learning_rate": 8.23901838741319e-07, + "loss": 0.019, + "step": 32068 + }, + { + "epoch": 87.38147138964578, + "grad_norm": 1.4419647455215454, + "learning_rate": 8.235510984241623e-07, + "loss": 0.0164, + "step": 32069 + }, + { + "epoch": 87.3841961852861, + "grad_norm": 3.174726963043213, + "learning_rate": 8.232004295728935e-07, + "loss": 0.0544, + "step": 32070 + }, + { + "epoch": 87.38692098092643, + "grad_norm": 1.9841511249542236, + "learning_rate": 8.228498321902434e-07, + "loss": 0.1894, + "step": 32071 + }, + { + "epoch": 87.38964577656675, + "grad_norm": 3.0590014457702637, + "learning_rate": 8.224993062789443e-07, + "loss": 0.0258, + "step": 32072 + }, + { + "epoch": 87.39237057220708, + "grad_norm": 2.2886037826538086, + "learning_rate": 8.221488518417264e-07, + "loss": 0.0314, + "step": 32073 + }, + { + "epoch": 87.39509536784742, + "grad_norm": 2.3827927112579346, + "learning_rate": 8.217984688813174e-07, + "loss": 0.0601, + "step": 32074 + }, + { + "epoch": 87.39782016348774, + "grad_norm": 3.274296760559082, + "learning_rate": 8.21448157400444e-07, + "loss": 0.0284, + "step": 32075 + }, + { + "epoch": 87.40054495912807, + "grad_norm": 2.597504138946533, + "learning_rate": 8.210979174018397e-07, + "loss": 0.0489, + "step": 32076 + }, + { + "epoch": 87.40326975476839, + "grad_norm": 3.3759877681732178, + "learning_rate": 8.207477488882287e-07, + "loss": 0.0261, + "step": 32077 + }, + { + "epoch": 87.40599455040872, + "grad_norm": 2.5323102474212646, + "learning_rate": 8.203976518623402e-07, + "loss": 0.0358, + "step": 32078 + }, + { + "epoch": 87.40871934604904, + "grad_norm": 2.9436633586883545, + "learning_rate": 8.200476263268964e-07, + "loss": 0.1111, + "step": 32079 + }, + { + "epoch": 87.41144414168937, + "grad_norm": 2.8936707973480225, + "learning_rate": 8.196976722846273e-07, + "loss": 0.1125, + "step": 32080 + }, + { + "epoch": 87.4141689373297, + "grad_norm": 1.7252203226089478, + "learning_rate": 8.193477897382574e-07, + "loss": 0.0308, + "step": 32081 + }, + { + "epoch": 87.41689373297002, + "grad_norm": 2.6562628746032715, + "learning_rate": 8.189979786905111e-07, + "loss": 0.0883, + "step": 32082 + }, + { + "epoch": 87.41961852861036, + "grad_norm": 3.75610089302063, + "learning_rate": 8.186482391441131e-07, + "loss": 0.0711, + "step": 32083 + }, + { + "epoch": 87.42234332425068, + "grad_norm": 4.6357316970825195, + "learning_rate": 8.182985711017877e-07, + "loss": 0.0534, + "step": 32084 + }, + { + "epoch": 87.42506811989101, + "grad_norm": 2.3157403469085693, + "learning_rate": 8.179489745662583e-07, + "loss": 0.0459, + "step": 32085 + }, + { + "epoch": 87.42779291553134, + "grad_norm": 2.565436601638794, + "learning_rate": 8.175994495402462e-07, + "loss": 0.0541, + "step": 32086 + }, + { + "epoch": 87.43051771117166, + "grad_norm": 5.693440914154053, + "learning_rate": 8.172499960264724e-07, + "loss": 0.0571, + "step": 32087 + }, + { + "epoch": 87.433242506812, + "grad_norm": 2.6509525775909424, + "learning_rate": 8.169006140276614e-07, + "loss": 0.0276, + "step": 32088 + }, + { + "epoch": 87.43596730245231, + "grad_norm": 2.344193458557129, + "learning_rate": 8.165513035465345e-07, + "loss": 0.0299, + "step": 32089 + }, + { + "epoch": 87.43869209809264, + "grad_norm": 1.9711655378341675, + "learning_rate": 8.162020645858093e-07, + "loss": 0.0234, + "step": 32090 + }, + { + "epoch": 87.44141689373296, + "grad_norm": 2.739438056945801, + "learning_rate": 8.15852897148205e-07, + "loss": 0.0367, + "step": 32091 + }, + { + "epoch": 87.4441416893733, + "grad_norm": 3.3594422340393066, + "learning_rate": 8.155038012364447e-07, + "loss": 0.0476, + "step": 32092 + }, + { + "epoch": 87.44686648501363, + "grad_norm": 1.8658385276794434, + "learning_rate": 8.151547768532453e-07, + "loss": 0.0268, + "step": 32093 + }, + { + "epoch": 87.44959128065395, + "grad_norm": 4.355685234069824, + "learning_rate": 8.148058240013246e-07, + "loss": 0.0499, + "step": 32094 + }, + { + "epoch": 87.45231607629428, + "grad_norm": 3.1923887729644775, + "learning_rate": 8.144569426833981e-07, + "loss": 0.0757, + "step": 32095 + }, + { + "epoch": 87.4550408719346, + "grad_norm": 2.8732986450195312, + "learning_rate": 8.141081329021883e-07, + "loss": 0.0535, + "step": 32096 + }, + { + "epoch": 87.45776566757493, + "grad_norm": 2.132540702819824, + "learning_rate": 8.137593946604083e-07, + "loss": 0.0213, + "step": 32097 + }, + { + "epoch": 87.46049046321527, + "grad_norm": 1.7454577684402466, + "learning_rate": 8.134107279607728e-07, + "loss": 0.0297, + "step": 32098 + }, + { + "epoch": 87.46321525885558, + "grad_norm": 2.77207088470459, + "learning_rate": 8.130621328060006e-07, + "loss": 0.0528, + "step": 32099 + }, + { + "epoch": 87.46594005449592, + "grad_norm": 3.1678285598754883, + "learning_rate": 8.127136091988031e-07, + "loss": 0.0408, + "step": 32100 + }, + { + "epoch": 87.46866485013624, + "grad_norm": 2.4710707664489746, + "learning_rate": 8.123651571418978e-07, + "loss": 0.0288, + "step": 32101 + }, + { + "epoch": 87.47138964577657, + "grad_norm": 2.966733455657959, + "learning_rate": 8.120167766379972e-07, + "loss": 0.0286, + "step": 32102 + }, + { + "epoch": 87.47411444141689, + "grad_norm": 3.19575572013855, + "learning_rate": 8.116684676898134e-07, + "loss": 0.0757, + "step": 32103 + }, + { + "epoch": 87.47683923705722, + "grad_norm": 1.9228724241256714, + "learning_rate": 8.113202303000589e-07, + "loss": 0.0222, + "step": 32104 + }, + { + "epoch": 87.47956403269755, + "grad_norm": 1.4114537239074707, + "learning_rate": 8.109720644714492e-07, + "loss": 0.0157, + "step": 32105 + }, + { + "epoch": 87.48228882833787, + "grad_norm": 3.4534709453582764, + "learning_rate": 8.106239702066921e-07, + "loss": 0.0638, + "step": 32106 + }, + { + "epoch": 87.4850136239782, + "grad_norm": 2.5079915523529053, + "learning_rate": 8.102759475084986e-07, + "loss": 0.036, + "step": 32107 + }, + { + "epoch": 87.48773841961852, + "grad_norm": 2.964305877685547, + "learning_rate": 8.099279963795814e-07, + "loss": 0.0323, + "step": 32108 + }, + { + "epoch": 87.49046321525886, + "grad_norm": 2.582146406173706, + "learning_rate": 8.095801168226503e-07, + "loss": 0.0841, + "step": 32109 + }, + { + "epoch": 87.49318801089919, + "grad_norm": 2.275869369506836, + "learning_rate": 8.092323088404119e-07, + "loss": 0.0303, + "step": 32110 + }, + { + "epoch": 87.49591280653951, + "grad_norm": 2.0972752571105957, + "learning_rate": 8.088845724355765e-07, + "loss": 0.0321, + "step": 32111 + }, + { + "epoch": 87.49863760217984, + "grad_norm": 2.659170150756836, + "learning_rate": 8.085369076108529e-07, + "loss": 0.0449, + "step": 32112 + }, + { + "epoch": 87.50136239782016, + "grad_norm": 1.7420847415924072, + "learning_rate": 8.081893143689479e-07, + "loss": 0.0208, + "step": 32113 + }, + { + "epoch": 87.50408719346049, + "grad_norm": 3.0050289630889893, + "learning_rate": 8.078417927125692e-07, + "loss": 0.0508, + "step": 32114 + }, + { + "epoch": 87.50681198910081, + "grad_norm": 2.8802103996276855, + "learning_rate": 8.074943426444204e-07, + "loss": 0.0572, + "step": 32115 + }, + { + "epoch": 87.50953678474114, + "grad_norm": 2.531992197036743, + "learning_rate": 8.071469641672103e-07, + "loss": 0.0895, + "step": 32116 + }, + { + "epoch": 87.51226158038148, + "grad_norm": 2.5337300300598145, + "learning_rate": 8.067996572836456e-07, + "loss": 0.0654, + "step": 32117 + }, + { + "epoch": 87.5149863760218, + "grad_norm": 2.8185200691223145, + "learning_rate": 8.064524219964298e-07, + "loss": 0.0458, + "step": 32118 + }, + { + "epoch": 87.51771117166213, + "grad_norm": 1.8498786687850952, + "learning_rate": 8.061052583082652e-07, + "loss": 0.0232, + "step": 32119 + }, + { + "epoch": 87.52043596730245, + "grad_norm": 3.859872579574585, + "learning_rate": 8.057581662218561e-07, + "loss": 0.0749, + "step": 32120 + }, + { + "epoch": 87.52316076294278, + "grad_norm": 3.3445465564727783, + "learning_rate": 8.054111457399083e-07, + "loss": 0.0546, + "step": 32121 + }, + { + "epoch": 87.52588555858311, + "grad_norm": 2.920300006866455, + "learning_rate": 8.050641968651218e-07, + "loss": 0.0415, + "step": 32122 + }, + { + "epoch": 87.52861035422343, + "grad_norm": 2.1514246463775635, + "learning_rate": 8.047173196002001e-07, + "loss": 0.0347, + "step": 32123 + }, + { + "epoch": 87.53133514986376, + "grad_norm": 2.5154616832733154, + "learning_rate": 8.043705139478431e-07, + "loss": 0.0405, + "step": 32124 + }, + { + "epoch": 87.53405994550408, + "grad_norm": 2.2705025672912598, + "learning_rate": 8.040237799107531e-07, + "loss": 0.0333, + "step": 32125 + }, + { + "epoch": 87.53678474114442, + "grad_norm": 2.769376277923584, + "learning_rate": 8.036771174916302e-07, + "loss": 0.1692, + "step": 32126 + }, + { + "epoch": 87.53950953678473, + "grad_norm": 2.183717727661133, + "learning_rate": 8.033305266931712e-07, + "loss": 0.0616, + "step": 32127 + }, + { + "epoch": 87.54223433242507, + "grad_norm": 2.682685375213623, + "learning_rate": 8.029840075180817e-07, + "loss": 0.0854, + "step": 32128 + }, + { + "epoch": 87.5449591280654, + "grad_norm": 4.025137424468994, + "learning_rate": 8.026375599690551e-07, + "loss": 0.0759, + "step": 32129 + }, + { + "epoch": 87.54768392370572, + "grad_norm": 2.4038383960723877, + "learning_rate": 8.022911840487924e-07, + "loss": 0.0318, + "step": 32130 + }, + { + "epoch": 87.55040871934605, + "grad_norm": 2.478999614715576, + "learning_rate": 8.019448797599871e-07, + "loss": 0.047, + "step": 32131 + }, + { + "epoch": 87.55313351498637, + "grad_norm": 6.368683815002441, + "learning_rate": 8.015986471053394e-07, + "loss": 0.0592, + "step": 32132 + }, + { + "epoch": 87.5558583106267, + "grad_norm": 2.918562650680542, + "learning_rate": 8.012524860875481e-07, + "loss": 0.0561, + "step": 32133 + }, + { + "epoch": 87.55858310626704, + "grad_norm": 2.6399192810058594, + "learning_rate": 8.009063967093055e-07, + "loss": 0.0298, + "step": 32134 + }, + { + "epoch": 87.56130790190736, + "grad_norm": 2.8267951011657715, + "learning_rate": 8.005603789733074e-07, + "loss": 0.0333, + "step": 32135 + }, + { + "epoch": 87.56403269754769, + "grad_norm": 4.2104363441467285, + "learning_rate": 8.00214432882248e-07, + "loss": 0.1008, + "step": 32136 + }, + { + "epoch": 87.566757493188, + "grad_norm": 2.6444315910339355, + "learning_rate": 7.998685584388244e-07, + "loss": 0.0539, + "step": 32137 + }, + { + "epoch": 87.56948228882834, + "grad_norm": 3.156651020050049, + "learning_rate": 7.995227556457274e-07, + "loss": 0.1323, + "step": 32138 + }, + { + "epoch": 87.57220708446866, + "grad_norm": 2.1488776206970215, + "learning_rate": 7.991770245056519e-07, + "loss": 0.0454, + "step": 32139 + }, + { + "epoch": 87.57493188010899, + "grad_norm": 2.564025402069092, + "learning_rate": 7.988313650212876e-07, + "loss": 0.0574, + "step": 32140 + }, + { + "epoch": 87.57765667574932, + "grad_norm": 2.330198287963867, + "learning_rate": 7.984857771953303e-07, + "loss": 0.0727, + "step": 32141 + }, + { + "epoch": 87.58038147138964, + "grad_norm": 2.864098310470581, + "learning_rate": 7.981402610304689e-07, + "loss": 0.0481, + "step": 32142 + }, + { + "epoch": 87.58310626702998, + "grad_norm": 1.646061897277832, + "learning_rate": 7.977948165293959e-07, + "loss": 0.018, + "step": 32143 + }, + { + "epoch": 87.5858310626703, + "grad_norm": 5.705280780792236, + "learning_rate": 7.974494436947989e-07, + "loss": 0.1504, + "step": 32144 + }, + { + "epoch": 87.58855585831063, + "grad_norm": 2.3666508197784424, + "learning_rate": 7.971041425293713e-07, + "loss": 0.1041, + "step": 32145 + }, + { + "epoch": 87.59128065395096, + "grad_norm": 2.5445120334625244, + "learning_rate": 7.967589130358e-07, + "loss": 0.0336, + "step": 32146 + }, + { + "epoch": 87.59400544959128, + "grad_norm": 3.171571969985962, + "learning_rate": 7.964137552167739e-07, + "loss": 0.0631, + "step": 32147 + }, + { + "epoch": 87.59673024523161, + "grad_norm": 2.541062831878662, + "learning_rate": 7.960686690749797e-07, + "loss": 0.0292, + "step": 32148 + }, + { + "epoch": 87.59945504087193, + "grad_norm": 1.9698750972747803, + "learning_rate": 7.957236546131086e-07, + "loss": 0.0192, + "step": 32149 + }, + { + "epoch": 87.60217983651226, + "grad_norm": 3.2101454734802246, + "learning_rate": 7.95378711833843e-07, + "loss": 0.0677, + "step": 32150 + }, + { + "epoch": 87.60490463215258, + "grad_norm": 2.757845878601074, + "learning_rate": 7.950338407398739e-07, + "loss": 0.1025, + "step": 32151 + }, + { + "epoch": 87.60762942779292, + "grad_norm": 14.851627349853516, + "learning_rate": 7.946890413338837e-07, + "loss": 0.1651, + "step": 32152 + }, + { + "epoch": 87.61035422343325, + "grad_norm": 2.203108310699463, + "learning_rate": 7.943443136185602e-07, + "loss": 0.0231, + "step": 32153 + }, + { + "epoch": 87.61307901907357, + "grad_norm": 1.8596984148025513, + "learning_rate": 7.93999657596587e-07, + "loss": 0.0218, + "step": 32154 + }, + { + "epoch": 87.6158038147139, + "grad_norm": 2.512727975845337, + "learning_rate": 7.936550732706483e-07, + "loss": 0.1162, + "step": 32155 + }, + { + "epoch": 87.61852861035422, + "grad_norm": 2.3046913146972656, + "learning_rate": 7.933105606434255e-07, + "loss": 0.1044, + "step": 32156 + }, + { + "epoch": 87.62125340599455, + "grad_norm": 2.938237190246582, + "learning_rate": 7.929661197176052e-07, + "loss": 0.0777, + "step": 32157 + }, + { + "epoch": 87.62397820163488, + "grad_norm": 2.446826457977295, + "learning_rate": 7.926217504958688e-07, + "loss": 0.1203, + "step": 32158 + }, + { + "epoch": 87.6267029972752, + "grad_norm": 3.3570597171783447, + "learning_rate": 7.922774529808985e-07, + "loss": 0.1578, + "step": 32159 + }, + { + "epoch": 87.62942779291554, + "grad_norm": 2.6146492958068848, + "learning_rate": 7.919332271753722e-07, + "loss": 0.1479, + "step": 32160 + }, + { + "epoch": 87.63215258855585, + "grad_norm": 3.064115047454834, + "learning_rate": 7.915890730819764e-07, + "loss": 0.0384, + "step": 32161 + }, + { + "epoch": 87.63487738419619, + "grad_norm": 1.6859407424926758, + "learning_rate": 7.912449907033881e-07, + "loss": 0.031, + "step": 32162 + }, + { + "epoch": 87.6376021798365, + "grad_norm": 2.9649910926818848, + "learning_rate": 7.909009800422874e-07, + "loss": 0.0326, + "step": 32163 + }, + { + "epoch": 87.64032697547684, + "grad_norm": 2.7740511894226074, + "learning_rate": 7.905570411013519e-07, + "loss": 0.0332, + "step": 32164 + }, + { + "epoch": 87.64305177111717, + "grad_norm": 2.3737103939056396, + "learning_rate": 7.90213173883263e-07, + "loss": 0.0304, + "step": 32165 + }, + { + "epoch": 87.64577656675749, + "grad_norm": 5.280933856964111, + "learning_rate": 7.898693783906975e-07, + "loss": 0.0484, + "step": 32166 + }, + { + "epoch": 87.64850136239782, + "grad_norm": 1.931410551071167, + "learning_rate": 7.895256546263319e-07, + "loss": 0.055, + "step": 32167 + }, + { + "epoch": 87.65122615803814, + "grad_norm": 4.705388069152832, + "learning_rate": 7.891820025928432e-07, + "loss": 0.0601, + "step": 32168 + }, + { + "epoch": 87.65395095367847, + "grad_norm": 2.216409206390381, + "learning_rate": 7.888384222929101e-07, + "loss": 0.1683, + "step": 32169 + }, + { + "epoch": 87.65667574931881, + "grad_norm": 3.612227201461792, + "learning_rate": 7.884949137292075e-07, + "loss": 0.0587, + "step": 32170 + }, + { + "epoch": 87.65940054495913, + "grad_norm": 2.983952522277832, + "learning_rate": 7.881514769044107e-07, + "loss": 0.1444, + "step": 32171 + }, + { + "epoch": 87.66212534059946, + "grad_norm": 2.391012668609619, + "learning_rate": 7.878081118211911e-07, + "loss": 0.038, + "step": 32172 + }, + { + "epoch": 87.66485013623978, + "grad_norm": 3.45635724067688, + "learning_rate": 7.874648184822275e-07, + "loss": 0.0657, + "step": 32173 + }, + { + "epoch": 87.66757493188011, + "grad_norm": 1.6082489490509033, + "learning_rate": 7.871215968901913e-07, + "loss": 0.0208, + "step": 32174 + }, + { + "epoch": 87.67029972752043, + "grad_norm": 2.6080129146575928, + "learning_rate": 7.867784470477557e-07, + "loss": 0.1196, + "step": 32175 + }, + { + "epoch": 87.67302452316076, + "grad_norm": 2.555482864379883, + "learning_rate": 7.864353689575909e-07, + "loss": 0.0296, + "step": 32176 + }, + { + "epoch": 87.6757493188011, + "grad_norm": 2.4604551792144775, + "learning_rate": 7.860923626223726e-07, + "loss": 0.0606, + "step": 32177 + }, + { + "epoch": 87.67847411444141, + "grad_norm": 3.1521799564361572, + "learning_rate": 7.857494280447709e-07, + "loss": 0.1531, + "step": 32178 + }, + { + "epoch": 87.68119891008175, + "grad_norm": 4.707701683044434, + "learning_rate": 7.854065652274556e-07, + "loss": 0.0546, + "step": 32179 + }, + { + "epoch": 87.68392370572207, + "grad_norm": 1.743828535079956, + "learning_rate": 7.850637741730959e-07, + "loss": 0.087, + "step": 32180 + }, + { + "epoch": 87.6866485013624, + "grad_norm": 2.3071610927581787, + "learning_rate": 7.847210548843653e-07, + "loss": 0.05, + "step": 32181 + }, + { + "epoch": 87.68937329700273, + "grad_norm": 2.3715646266937256, + "learning_rate": 7.843784073639304e-07, + "loss": 0.0733, + "step": 32182 + }, + { + "epoch": 87.69209809264305, + "grad_norm": 7.41796875, + "learning_rate": 7.840358316144592e-07, + "loss": 0.023, + "step": 32183 + }, + { + "epoch": 87.69482288828338, + "grad_norm": 2.684610605239868, + "learning_rate": 7.836933276386183e-07, + "loss": 0.119, + "step": 32184 + }, + { + "epoch": 87.6975476839237, + "grad_norm": 2.3460471630096436, + "learning_rate": 7.833508954390778e-07, + "loss": 0.0304, + "step": 32185 + }, + { + "epoch": 87.70027247956403, + "grad_norm": 2.5405545234680176, + "learning_rate": 7.830085350185057e-07, + "loss": 0.0744, + "step": 32186 + }, + { + "epoch": 87.70299727520435, + "grad_norm": 3.223616123199463, + "learning_rate": 7.826662463795665e-07, + "loss": 0.1763, + "step": 32187 + }, + { + "epoch": 87.70572207084469, + "grad_norm": 3.933316707611084, + "learning_rate": 7.823240295249257e-07, + "loss": 0.0526, + "step": 32188 + }, + { + "epoch": 87.70844686648502, + "grad_norm": 2.4163014888763428, + "learning_rate": 7.819818844572468e-07, + "loss": 0.0845, + "step": 32189 + }, + { + "epoch": 87.71117166212534, + "grad_norm": 2.0288498401641846, + "learning_rate": 7.81639811179199e-07, + "loss": 0.0315, + "step": 32190 + }, + { + "epoch": 87.71389645776567, + "grad_norm": 2.184022903442383, + "learning_rate": 7.812978096934421e-07, + "loss": 0.109, + "step": 32191 + }, + { + "epoch": 87.71662125340599, + "grad_norm": 4.986965656280518, + "learning_rate": 7.809558800026407e-07, + "loss": 0.1037, + "step": 32192 + }, + { + "epoch": 87.71934604904632, + "grad_norm": 1.883907437324524, + "learning_rate": 7.806140221094593e-07, + "loss": 0.0278, + "step": 32193 + }, + { + "epoch": 87.72207084468666, + "grad_norm": 3.1499037742614746, + "learning_rate": 7.802722360165593e-07, + "loss": 0.0463, + "step": 32194 + }, + { + "epoch": 87.72479564032697, + "grad_norm": 1.8229411840438843, + "learning_rate": 7.799305217266018e-07, + "loss": 0.0257, + "step": 32195 + }, + { + "epoch": 87.7275204359673, + "grad_norm": 2.774632215499878, + "learning_rate": 7.795888792422479e-07, + "loss": 0.0601, + "step": 32196 + }, + { + "epoch": 87.73024523160763, + "grad_norm": 2.2164721488952637, + "learning_rate": 7.792473085661601e-07, + "loss": 0.0566, + "step": 32197 + }, + { + "epoch": 87.73297002724796, + "grad_norm": 2.9088759422302246, + "learning_rate": 7.789058097009983e-07, + "loss": 0.0343, + "step": 32198 + }, + { + "epoch": 87.73569482288828, + "grad_norm": 3.0221238136291504, + "learning_rate": 7.785643826494205e-07, + "loss": 0.0394, + "step": 32199 + }, + { + "epoch": 87.73841961852861, + "grad_norm": 3.420117139816284, + "learning_rate": 7.782230274140845e-07, + "loss": 0.0813, + "step": 32200 + }, + { + "epoch": 87.74114441416894, + "grad_norm": 2.453206777572632, + "learning_rate": 7.778817439976515e-07, + "loss": 0.0588, + "step": 32201 + }, + { + "epoch": 87.74386920980926, + "grad_norm": 2.2068138122558594, + "learning_rate": 7.775405324027807e-07, + "loss": 0.0209, + "step": 32202 + }, + { + "epoch": 87.7465940054496, + "grad_norm": 1.9418346881866455, + "learning_rate": 7.771993926321264e-07, + "loss": 0.0213, + "step": 32203 + }, + { + "epoch": 87.74931880108991, + "grad_norm": 2.20292592048645, + "learning_rate": 7.768583246883476e-07, + "loss": 0.1205, + "step": 32204 + }, + { + "epoch": 87.75204359673025, + "grad_norm": 2.0393476486206055, + "learning_rate": 7.765173285740968e-07, + "loss": 0.0307, + "step": 32205 + }, + { + "epoch": 87.75476839237058, + "grad_norm": 2.3173751831054688, + "learning_rate": 7.761764042920339e-07, + "loss": 0.0358, + "step": 32206 + }, + { + "epoch": 87.7574931880109, + "grad_norm": 2.642428159713745, + "learning_rate": 7.758355518448124e-07, + "loss": 0.0936, + "step": 32207 + }, + { + "epoch": 87.76021798365123, + "grad_norm": 1.9830187559127808, + "learning_rate": 7.754947712350869e-07, + "loss": 0.1085, + "step": 32208 + }, + { + "epoch": 87.76294277929155, + "grad_norm": 2.271312952041626, + "learning_rate": 7.751540624655085e-07, + "loss": 0.0237, + "step": 32209 + }, + { + "epoch": 87.76566757493188, + "grad_norm": 2.239161491394043, + "learning_rate": 7.748134255387363e-07, + "loss": 0.0584, + "step": 32210 + }, + { + "epoch": 87.7683923705722, + "grad_norm": 3.01596999168396, + "learning_rate": 7.744728604574203e-07, + "loss": 0.0421, + "step": 32211 + }, + { + "epoch": 87.77111716621253, + "grad_norm": 3.220775604248047, + "learning_rate": 7.741323672242118e-07, + "loss": 0.1589, + "step": 32212 + }, + { + "epoch": 87.77384196185287, + "grad_norm": 3.0501341819763184, + "learning_rate": 7.73791945841762e-07, + "loss": 0.1608, + "step": 32213 + }, + { + "epoch": 87.77656675749319, + "grad_norm": 2.0995032787323, + "learning_rate": 7.734515963127254e-07, + "loss": 0.0573, + "step": 32214 + }, + { + "epoch": 87.77929155313352, + "grad_norm": 3.8837478160858154, + "learning_rate": 7.73111318639751e-07, + "loss": 0.055, + "step": 32215 + }, + { + "epoch": 87.78201634877384, + "grad_norm": 3.704047203063965, + "learning_rate": 7.727711128254878e-07, + "loss": 0.0661, + "step": 32216 + }, + { + "epoch": 87.78474114441417, + "grad_norm": 2.4582417011260986, + "learning_rate": 7.72430978872587e-07, + "loss": 0.0637, + "step": 32217 + }, + { + "epoch": 87.7874659400545, + "grad_norm": 2.763697385787964, + "learning_rate": 7.720909167836943e-07, + "loss": 0.0205, + "step": 32218 + }, + { + "epoch": 87.79019073569482, + "grad_norm": 2.093129873275757, + "learning_rate": 7.717509265614631e-07, + "loss": 0.0347, + "step": 32219 + }, + { + "epoch": 87.79291553133515, + "grad_norm": 2.884716033935547, + "learning_rate": 7.714110082085391e-07, + "loss": 0.0815, + "step": 32220 + }, + { + "epoch": 87.79564032697547, + "grad_norm": 3.5441763401031494, + "learning_rate": 7.710711617275668e-07, + "loss": 0.0954, + "step": 32221 + }, + { + "epoch": 87.7983651226158, + "grad_norm": 2.7222464084625244, + "learning_rate": 7.707313871211974e-07, + "loss": 0.11, + "step": 32222 + }, + { + "epoch": 87.80108991825612, + "grad_norm": 1.983210563659668, + "learning_rate": 7.703916843920745e-07, + "loss": 0.0309, + "step": 32223 + }, + { + "epoch": 87.80381471389646, + "grad_norm": 1.9344252347946167, + "learning_rate": 7.700520535428435e-07, + "loss": 0.0193, + "step": 32224 + }, + { + "epoch": 87.80653950953679, + "grad_norm": 2.7835206985473633, + "learning_rate": 7.697124945761492e-07, + "loss": 0.147, + "step": 32225 + }, + { + "epoch": 87.80926430517711, + "grad_norm": 2.15885066986084, + "learning_rate": 7.693730074946393e-07, + "loss": 0.0991, + "step": 32226 + }, + { + "epoch": 87.81198910081744, + "grad_norm": 2.10834002494812, + "learning_rate": 7.690335923009539e-07, + "loss": 0.0279, + "step": 32227 + }, + { + "epoch": 87.81471389645776, + "grad_norm": 1.8662948608398438, + "learning_rate": 7.686942489977389e-07, + "loss": 0.063, + "step": 32228 + }, + { + "epoch": 87.8174386920981, + "grad_norm": 1.5790742635726929, + "learning_rate": 7.683549775876331e-07, + "loss": 0.0248, + "step": 32229 + }, + { + "epoch": 87.82016348773843, + "grad_norm": 3.244419813156128, + "learning_rate": 7.680157780732844e-07, + "loss": 0.0337, + "step": 32230 + }, + { + "epoch": 87.82288828337875, + "grad_norm": 1.9691389799118042, + "learning_rate": 7.676766504573319e-07, + "loss": 0.0315, + "step": 32231 + }, + { + "epoch": 87.82561307901908, + "grad_norm": 2.6122236251831055, + "learning_rate": 7.673375947424155e-07, + "loss": 0.0434, + "step": 32232 + }, + { + "epoch": 87.8283378746594, + "grad_norm": 2.582932710647583, + "learning_rate": 7.669986109311756e-07, + "loss": 0.1578, + "step": 32233 + }, + { + "epoch": 87.83106267029973, + "grad_norm": 1.9818381071090698, + "learning_rate": 7.666596990262542e-07, + "loss": 0.1266, + "step": 32234 + }, + { + "epoch": 87.83378746594005, + "grad_norm": 2.519568681716919, + "learning_rate": 7.663208590302907e-07, + "loss": 0.0409, + "step": 32235 + }, + { + "epoch": 87.83651226158038, + "grad_norm": 2.1832003593444824, + "learning_rate": 7.659820909459215e-07, + "loss": 0.0245, + "step": 32236 + }, + { + "epoch": 87.83923705722071, + "grad_norm": 3.458500385284424, + "learning_rate": 7.656433947757869e-07, + "loss": 0.1296, + "step": 32237 + }, + { + "epoch": 87.84196185286103, + "grad_norm": 2.5669286251068115, + "learning_rate": 7.653047705225258e-07, + "loss": 0.0553, + "step": 32238 + }, + { + "epoch": 87.84468664850137, + "grad_norm": 2.642077922821045, + "learning_rate": 7.649662181887729e-07, + "loss": 0.0323, + "step": 32239 + }, + { + "epoch": 87.84741144414168, + "grad_norm": 2.2836034297943115, + "learning_rate": 7.646277377771671e-07, + "loss": 0.0755, + "step": 32240 + }, + { + "epoch": 87.85013623978202, + "grad_norm": 1.9051963090896606, + "learning_rate": 7.642893292903408e-07, + "loss": 0.025, + "step": 32241 + }, + { + "epoch": 87.85286103542235, + "grad_norm": 3.2509732246398926, + "learning_rate": 7.639509927309341e-07, + "loss": 0.0227, + "step": 32242 + }, + { + "epoch": 87.85558583106267, + "grad_norm": 1.6330887079238892, + "learning_rate": 7.636127281015804e-07, + "loss": 0.0413, + "step": 32243 + }, + { + "epoch": 87.858310626703, + "grad_norm": 6.737751483917236, + "learning_rate": 7.63274535404912e-07, + "loss": 0.0305, + "step": 32244 + }, + { + "epoch": 87.86103542234332, + "grad_norm": 3.404038667678833, + "learning_rate": 7.629364146435636e-07, + "loss": 0.0403, + "step": 32245 + }, + { + "epoch": 87.86376021798365, + "grad_norm": 2.899501085281372, + "learning_rate": 7.625983658201708e-07, + "loss": 0.0215, + "step": 32246 + }, + { + "epoch": 87.86648501362397, + "grad_norm": 4.718465328216553, + "learning_rate": 7.622603889373648e-07, + "loss": 0.0831, + "step": 32247 + }, + { + "epoch": 87.8692098092643, + "grad_norm": 2.426079511642456, + "learning_rate": 7.619224839977767e-07, + "loss": 0.0834, + "step": 32248 + }, + { + "epoch": 87.87193460490464, + "grad_norm": 1.613516926765442, + "learning_rate": 7.615846510040381e-07, + "loss": 0.0174, + "step": 32249 + }, + { + "epoch": 87.87465940054496, + "grad_norm": 2.838158369064331, + "learning_rate": 7.612468899587822e-07, + "loss": 0.1398, + "step": 32250 + }, + { + "epoch": 87.87738419618529, + "grad_norm": 3.891223907470703, + "learning_rate": 7.609092008646379e-07, + "loss": 0.0727, + "step": 32251 + }, + { + "epoch": 87.88010899182561, + "grad_norm": 2.4520819187164307, + "learning_rate": 7.605715837242355e-07, + "loss": 0.0407, + "step": 32252 + }, + { + "epoch": 87.88283378746594, + "grad_norm": 3.366380453109741, + "learning_rate": 7.60234038540203e-07, + "loss": 0.0707, + "step": 32253 + }, + { + "epoch": 87.88555858310627, + "grad_norm": 4.714087009429932, + "learning_rate": 7.598965653151702e-07, + "loss": 0.0802, + "step": 32254 + }, + { + "epoch": 87.88828337874659, + "grad_norm": 2.2426202297210693, + "learning_rate": 7.595591640517663e-07, + "loss": 0.0403, + "step": 32255 + }, + { + "epoch": 87.89100817438693, + "grad_norm": 3.1924262046813965, + "learning_rate": 7.592218347526192e-07, + "loss": 0.0907, + "step": 32256 + }, + { + "epoch": 87.89373297002724, + "grad_norm": 2.122835636138916, + "learning_rate": 7.588845774203535e-07, + "loss": 0.0807, + "step": 32257 + }, + { + "epoch": 87.89645776566758, + "grad_norm": 2.4528744220733643, + "learning_rate": 7.585473920575992e-07, + "loss": 0.2641, + "step": 32258 + }, + { + "epoch": 87.8991825613079, + "grad_norm": 2.00410532951355, + "learning_rate": 7.582102786669798e-07, + "loss": 0.0358, + "step": 32259 + }, + { + "epoch": 87.90190735694823, + "grad_norm": 2.9289979934692383, + "learning_rate": 7.57873237251121e-07, + "loss": 0.0928, + "step": 32260 + }, + { + "epoch": 87.90463215258856, + "grad_norm": 3.34232759475708, + "learning_rate": 7.575362678126474e-07, + "loss": 0.096, + "step": 32261 + }, + { + "epoch": 87.90735694822888, + "grad_norm": 1.7234410047531128, + "learning_rate": 7.571993703541847e-07, + "loss": 0.0208, + "step": 32262 + }, + { + "epoch": 87.91008174386921, + "grad_norm": 2.5581438541412354, + "learning_rate": 7.568625448783562e-07, + "loss": 0.0578, + "step": 32263 + }, + { + "epoch": 87.91280653950953, + "grad_norm": 2.0092294216156006, + "learning_rate": 7.565257913877843e-07, + "loss": 0.0506, + "step": 32264 + }, + { + "epoch": 87.91553133514986, + "grad_norm": 1.4506932497024536, + "learning_rate": 7.561891098850904e-07, + "loss": 0.0207, + "step": 32265 + }, + { + "epoch": 87.9182561307902, + "grad_norm": 3.2845566272735596, + "learning_rate": 7.558525003729e-07, + "loss": 0.0319, + "step": 32266 + }, + { + "epoch": 87.92098092643052, + "grad_norm": 2.6187777519226074, + "learning_rate": 7.555159628538322e-07, + "loss": 0.1014, + "step": 32267 + }, + { + "epoch": 87.92370572207085, + "grad_norm": 4.789071083068848, + "learning_rate": 7.551794973305093e-07, + "loss": 0.1189, + "step": 32268 + }, + { + "epoch": 87.92643051771117, + "grad_norm": 3.519306182861328, + "learning_rate": 7.548431038055492e-07, + "loss": 0.04, + "step": 32269 + }, + { + "epoch": 87.9291553133515, + "grad_norm": 3.2069647312164307, + "learning_rate": 7.545067822815733e-07, + "loss": 0.0404, + "step": 32270 + }, + { + "epoch": 87.93188010899182, + "grad_norm": 3.5142273902893066, + "learning_rate": 7.541705327612037e-07, + "loss": 0.0307, + "step": 32271 + }, + { + "epoch": 87.93460490463215, + "grad_norm": 1.9941633939743042, + "learning_rate": 7.53834355247055e-07, + "loss": 0.0918, + "step": 32272 + }, + { + "epoch": 87.93732970027249, + "grad_norm": 2.765315055847168, + "learning_rate": 7.534982497417476e-07, + "loss": 0.0282, + "step": 32273 + }, + { + "epoch": 87.9400544959128, + "grad_norm": 2.1391522884368896, + "learning_rate": 7.531622162478957e-07, + "loss": 0.0342, + "step": 32274 + }, + { + "epoch": 87.94277929155314, + "grad_norm": 2.1447854042053223, + "learning_rate": 7.528262547681209e-07, + "loss": 0.0224, + "step": 32275 + }, + { + "epoch": 87.94550408719346, + "grad_norm": 1.431930661201477, + "learning_rate": 7.524903653050386e-07, + "loss": 0.0176, + "step": 32276 + }, + { + "epoch": 87.94822888283379, + "grad_norm": 3.4243528842926025, + "learning_rate": 7.521545478612624e-07, + "loss": 0.0597, + "step": 32277 + }, + { + "epoch": 87.95095367847412, + "grad_norm": 2.164825439453125, + "learning_rate": 7.518188024394079e-07, + "loss": 0.1031, + "step": 32278 + }, + { + "epoch": 87.95367847411444, + "grad_norm": 2.4001989364624023, + "learning_rate": 7.514831290420921e-07, + "loss": 0.0545, + "step": 32279 + }, + { + "epoch": 87.95640326975477, + "grad_norm": 2.551877975463867, + "learning_rate": 7.511475276719282e-07, + "loss": 0.0361, + "step": 32280 + }, + { + "epoch": 87.95912806539509, + "grad_norm": 3.5497496128082275, + "learning_rate": 7.508119983315288e-07, + "loss": 0.1386, + "step": 32281 + }, + { + "epoch": 87.96185286103542, + "grad_norm": 2.0387940406799316, + "learning_rate": 7.504765410235082e-07, + "loss": 0.0973, + "step": 32282 + }, + { + "epoch": 87.96457765667574, + "grad_norm": 1.8813186883926392, + "learning_rate": 7.501411557504801e-07, + "loss": 0.0243, + "step": 32283 + }, + { + "epoch": 87.96730245231608, + "grad_norm": 1.5467861890792847, + "learning_rate": 7.498058425150534e-07, + "loss": 0.015, + "step": 32284 + }, + { + "epoch": 87.97002724795641, + "grad_norm": 3.1045641899108887, + "learning_rate": 7.494706013198406e-07, + "loss": 0.0716, + "step": 32285 + }, + { + "epoch": 87.97275204359673, + "grad_norm": 2.660520553588867, + "learning_rate": 7.491354321674538e-07, + "loss": 0.0736, + "step": 32286 + }, + { + "epoch": 87.97547683923706, + "grad_norm": 2.425281524658203, + "learning_rate": 7.488003350605022e-07, + "loss": 0.0285, + "step": 32287 + }, + { + "epoch": 87.97820163487738, + "grad_norm": 1.9388577938079834, + "learning_rate": 7.48465310001596e-07, + "loss": 0.0358, + "step": 32288 + }, + { + "epoch": 87.98092643051771, + "grad_norm": 2.165494441986084, + "learning_rate": 7.481303569933452e-07, + "loss": 0.0271, + "step": 32289 + }, + { + "epoch": 87.98365122615803, + "grad_norm": 1.887526512145996, + "learning_rate": 7.477954760383554e-07, + "loss": 0.0485, + "step": 32290 + }, + { + "epoch": 87.98637602179836, + "grad_norm": 3.798539400100708, + "learning_rate": 7.474606671392381e-07, + "loss": 0.1476, + "step": 32291 + }, + { + "epoch": 87.9891008174387, + "grad_norm": 2.9195845127105713, + "learning_rate": 7.471259302986e-07, + "loss": 0.2573, + "step": 32292 + }, + { + "epoch": 87.99182561307902, + "grad_norm": 5.432840347290039, + "learning_rate": 7.467912655190468e-07, + "loss": 0.0782, + "step": 32293 + }, + { + "epoch": 87.99455040871935, + "grad_norm": 1.555138111114502, + "learning_rate": 7.46456672803183e-07, + "loss": 0.0223, + "step": 32294 + }, + { + "epoch": 87.99727520435967, + "grad_norm": 2.1178574562072754, + "learning_rate": 7.461221521536199e-07, + "loss": 0.1377, + "step": 32295 + }, + { + "epoch": 88.0, + "grad_norm": 2.321068525314331, + "learning_rate": 7.457877035729588e-07, + "loss": 0.031, + "step": 32296 + }, + { + "epoch": 88.00272479564033, + "grad_norm": 2.299448251724243, + "learning_rate": 7.454533270638054e-07, + "loss": 0.0275, + "step": 32297 + }, + { + "epoch": 88.00544959128065, + "grad_norm": 2.3229076862335205, + "learning_rate": 7.451190226287619e-07, + "loss": 0.0418, + "step": 32298 + }, + { + "epoch": 88.00817438692098, + "grad_norm": 3.0564043521881104, + "learning_rate": 7.447847902704364e-07, + "loss": 0.0577, + "step": 32299 + }, + { + "epoch": 88.0108991825613, + "grad_norm": 2.5883285999298096, + "learning_rate": 7.444506299914278e-07, + "loss": 0.125, + "step": 32300 + }, + { + "epoch": 88.01362397820164, + "grad_norm": 3.360523223876953, + "learning_rate": 7.441165417943386e-07, + "loss": 0.1188, + "step": 32301 + }, + { + "epoch": 88.01634877384195, + "grad_norm": 2.566993236541748, + "learning_rate": 7.437825256817732e-07, + "loss": 0.0786, + "step": 32302 + }, + { + "epoch": 88.01907356948229, + "grad_norm": 2.3333346843719482, + "learning_rate": 7.434485816563319e-07, + "loss": 0.0771, + "step": 32303 + }, + { + "epoch": 88.02179836512262, + "grad_norm": 2.5192739963531494, + "learning_rate": 7.431147097206126e-07, + "loss": 0.0413, + "step": 32304 + }, + { + "epoch": 88.02452316076294, + "grad_norm": 1.8936649560928345, + "learning_rate": 7.42780909877221e-07, + "loss": 0.02, + "step": 32305 + }, + { + "epoch": 88.02724795640327, + "grad_norm": 2.71415638923645, + "learning_rate": 7.424471821287516e-07, + "loss": 0.025, + "step": 32306 + }, + { + "epoch": 88.02997275204359, + "grad_norm": 1.6457340717315674, + "learning_rate": 7.421135264778067e-07, + "loss": 0.02, + "step": 32307 + }, + { + "epoch": 88.03269754768392, + "grad_norm": 1.7237062454223633, + "learning_rate": 7.417799429269835e-07, + "loss": 0.0206, + "step": 32308 + }, + { + "epoch": 88.03542234332426, + "grad_norm": 2.5964341163635254, + "learning_rate": 7.414464314788816e-07, + "loss": 0.0346, + "step": 32309 + }, + { + "epoch": 88.03814713896458, + "grad_norm": 2.292182683944702, + "learning_rate": 7.411129921360937e-07, + "loss": 0.0524, + "step": 32310 + }, + { + "epoch": 88.04087193460491, + "grad_norm": 2.4391493797302246, + "learning_rate": 7.407796249012223e-07, + "loss": 0.1095, + "step": 32311 + }, + { + "epoch": 88.04359673024523, + "grad_norm": 2.506728172302246, + "learning_rate": 7.404463297768616e-07, + "loss": 0.1574, + "step": 32312 + }, + { + "epoch": 88.04632152588556, + "grad_norm": 2.8812003135681152, + "learning_rate": 7.401131067656054e-07, + "loss": 0.1881, + "step": 32313 + }, + { + "epoch": 88.04904632152588, + "grad_norm": 2.4724903106689453, + "learning_rate": 7.397799558700502e-07, + "loss": 0.1441, + "step": 32314 + }, + { + "epoch": 88.05177111716621, + "grad_norm": 2.306126594543457, + "learning_rate": 7.394468770927909e-07, + "loss": 0.1513, + "step": 32315 + }, + { + "epoch": 88.05449591280654, + "grad_norm": 4.2841105461120605, + "learning_rate": 7.39113870436422e-07, + "loss": 0.083, + "step": 32316 + }, + { + "epoch": 88.05722070844686, + "grad_norm": 2.380880832672119, + "learning_rate": 7.387809359035369e-07, + "loss": 0.0379, + "step": 32317 + }, + { + "epoch": 88.0599455040872, + "grad_norm": 3.122007369995117, + "learning_rate": 7.384480734967248e-07, + "loss": 0.0279, + "step": 32318 + }, + { + "epoch": 88.06267029972751, + "grad_norm": 1.5502064228057861, + "learning_rate": 7.381152832185833e-07, + "loss": 0.0201, + "step": 32319 + }, + { + "epoch": 88.06539509536785, + "grad_norm": 2.653925657272339, + "learning_rate": 7.377825650717029e-07, + "loss": 0.0635, + "step": 32320 + }, + { + "epoch": 88.06811989100818, + "grad_norm": 2.0360612869262695, + "learning_rate": 7.374499190586725e-07, + "loss": 0.0219, + "step": 32321 + }, + { + "epoch": 88.0708446866485, + "grad_norm": 2.081451416015625, + "learning_rate": 7.371173451820812e-07, + "loss": 0.022, + "step": 32322 + }, + { + "epoch": 88.07356948228883, + "grad_norm": 3.6597652435302734, + "learning_rate": 7.367848434445246e-07, + "loss": 0.0615, + "step": 32323 + }, + { + "epoch": 88.07629427792915, + "grad_norm": 1.9606828689575195, + "learning_rate": 7.364524138485896e-07, + "loss": 0.0705, + "step": 32324 + }, + { + "epoch": 88.07901907356948, + "grad_norm": 3.023667335510254, + "learning_rate": 7.361200563968662e-07, + "loss": 0.0405, + "step": 32325 + }, + { + "epoch": 88.0817438692098, + "grad_norm": 1.8557109832763672, + "learning_rate": 7.357877710919392e-07, + "loss": 0.0492, + "step": 32326 + }, + { + "epoch": 88.08446866485014, + "grad_norm": 1.7654945850372314, + "learning_rate": 7.354555579363998e-07, + "loss": 0.0295, + "step": 32327 + }, + { + "epoch": 88.08719346049047, + "grad_norm": 1.9492478370666504, + "learning_rate": 7.351234169328359e-07, + "loss": 0.0215, + "step": 32328 + }, + { + "epoch": 88.08991825613079, + "grad_norm": 3.418755292892456, + "learning_rate": 7.34791348083831e-07, + "loss": 0.0381, + "step": 32329 + }, + { + "epoch": 88.09264305177112, + "grad_norm": 3.9958670139312744, + "learning_rate": 7.344593513919718e-07, + "loss": 0.038, + "step": 32330 + }, + { + "epoch": 88.09536784741144, + "grad_norm": 3.9633195400238037, + "learning_rate": 7.341274268598476e-07, + "loss": 0.2505, + "step": 32331 + }, + { + "epoch": 88.09809264305177, + "grad_norm": 2.639070510864258, + "learning_rate": 7.337955744900394e-07, + "loss": 0.036, + "step": 32332 + }, + { + "epoch": 88.1008174386921, + "grad_norm": 2.3801422119140625, + "learning_rate": 7.334637942851342e-07, + "loss": 0.0592, + "step": 32333 + }, + { + "epoch": 88.10354223433242, + "grad_norm": 2.8734068870544434, + "learning_rate": 7.331320862477121e-07, + "loss": 0.0909, + "step": 32334 + }, + { + "epoch": 88.10626702997276, + "grad_norm": 2.515087127685547, + "learning_rate": 7.328004503803609e-07, + "loss": 0.0249, + "step": 32335 + }, + { + "epoch": 88.10899182561307, + "grad_norm": 1.818914532661438, + "learning_rate": 7.324688866856621e-07, + "loss": 0.0232, + "step": 32336 + }, + { + "epoch": 88.11171662125341, + "grad_norm": 2.735673189163208, + "learning_rate": 7.321373951661969e-07, + "loss": 0.0587, + "step": 32337 + }, + { + "epoch": 88.11444141689373, + "grad_norm": 3.4093174934387207, + "learning_rate": 7.318059758245455e-07, + "loss": 0.1008, + "step": 32338 + }, + { + "epoch": 88.11716621253406, + "grad_norm": 2.8783583641052246, + "learning_rate": 7.314746286632913e-07, + "loss": 0.0341, + "step": 32339 + }, + { + "epoch": 88.11989100817439, + "grad_norm": 2.247035026550293, + "learning_rate": 7.311433536850165e-07, + "loss": 0.0234, + "step": 32340 + }, + { + "epoch": 88.12261580381471, + "grad_norm": 1.9902700185775757, + "learning_rate": 7.308121508922983e-07, + "loss": 0.0204, + "step": 32341 + }, + { + "epoch": 88.12534059945504, + "grad_norm": 2.9673802852630615, + "learning_rate": 7.304810202877144e-07, + "loss": 0.0478, + "step": 32342 + }, + { + "epoch": 88.12806539509536, + "grad_norm": 2.6950340270996094, + "learning_rate": 7.301499618738484e-07, + "loss": 0.0414, + "step": 32343 + }, + { + "epoch": 88.1307901907357, + "grad_norm": 2.5807995796203613, + "learning_rate": 7.29818975653277e-07, + "loss": 0.0248, + "step": 32344 + }, + { + "epoch": 88.13351498637603, + "grad_norm": 2.492432117462158, + "learning_rate": 7.29488061628576e-07, + "loss": 0.0307, + "step": 32345 + }, + { + "epoch": 88.13623978201635, + "grad_norm": 2.092982530593872, + "learning_rate": 7.291572198023223e-07, + "loss": 0.037, + "step": 32346 + }, + { + "epoch": 88.13896457765668, + "grad_norm": 2.8097760677337646, + "learning_rate": 7.288264501770947e-07, + "loss": 0.0783, + "step": 32347 + }, + { + "epoch": 88.141689373297, + "grad_norm": 2.8103179931640625, + "learning_rate": 7.284957527554693e-07, + "loss": 0.0889, + "step": 32348 + }, + { + "epoch": 88.14441416893733, + "grad_norm": 2.2878992557525635, + "learning_rate": 7.281651275400203e-07, + "loss": 0.0328, + "step": 32349 + }, + { + "epoch": 88.14713896457765, + "grad_norm": 2.0587637424468994, + "learning_rate": 7.278345745333204e-07, + "loss": 0.0832, + "step": 32350 + }, + { + "epoch": 88.14986376021798, + "grad_norm": 1.798496127128601, + "learning_rate": 7.275040937379485e-07, + "loss": 0.0194, + "step": 32351 + }, + { + "epoch": 88.15258855585832, + "grad_norm": 2.808852195739746, + "learning_rate": 7.27173685156477e-07, + "loss": 0.0619, + "step": 32352 + }, + { + "epoch": 88.15531335149863, + "grad_norm": 2.5652859210968018, + "learning_rate": 7.268433487914784e-07, + "loss": 0.1185, + "step": 32353 + }, + { + "epoch": 88.15803814713897, + "grad_norm": 2.514193058013916, + "learning_rate": 7.265130846455226e-07, + "loss": 0.0447, + "step": 32354 + }, + { + "epoch": 88.16076294277929, + "grad_norm": 4.0318121910095215, + "learning_rate": 7.261828927211867e-07, + "loss": 0.1139, + "step": 32355 + }, + { + "epoch": 88.16348773841962, + "grad_norm": 2.110468626022339, + "learning_rate": 7.258527730210385e-07, + "loss": 0.0774, + "step": 32356 + }, + { + "epoch": 88.16621253405995, + "grad_norm": 4.696341514587402, + "learning_rate": 7.255227255476516e-07, + "loss": 0.1724, + "step": 32357 + }, + { + "epoch": 88.16893732970027, + "grad_norm": 2.1733508110046387, + "learning_rate": 7.25192750303596e-07, + "loss": 0.0339, + "step": 32358 + }, + { + "epoch": 88.1716621253406, + "grad_norm": 1.6791229248046875, + "learning_rate": 7.248628472914388e-07, + "loss": 0.1437, + "step": 32359 + }, + { + "epoch": 88.17438692098092, + "grad_norm": 2.093832015991211, + "learning_rate": 7.245330165137521e-07, + "loss": 0.0719, + "step": 32360 + }, + { + "epoch": 88.17711171662125, + "grad_norm": 2.7660741806030273, + "learning_rate": 7.24203257973104e-07, + "loss": 0.0756, + "step": 32361 + }, + { + "epoch": 88.17983651226157, + "grad_norm": 2.537230968475342, + "learning_rate": 7.238735716720635e-07, + "loss": 0.0526, + "step": 32362 + }, + { + "epoch": 88.1825613079019, + "grad_norm": 2.3053700923919678, + "learning_rate": 7.235439576131942e-07, + "loss": 0.0202, + "step": 32363 + }, + { + "epoch": 88.18528610354224, + "grad_norm": 1.8766133785247803, + "learning_rate": 7.232144157990683e-07, + "loss": 0.0264, + "step": 32364 + }, + { + "epoch": 88.18801089918256, + "grad_norm": 2.5794596672058105, + "learning_rate": 7.228849462322496e-07, + "loss": 0.049, + "step": 32365 + }, + { + "epoch": 88.19073569482289, + "grad_norm": 2.2495250701904297, + "learning_rate": 7.225555489153024e-07, + "loss": 0.0662, + "step": 32366 + }, + { + "epoch": 88.19346049046321, + "grad_norm": 2.3065366744995117, + "learning_rate": 7.22226223850796e-07, + "loss": 0.1619, + "step": 32367 + }, + { + "epoch": 88.19618528610354, + "grad_norm": 1.8450549840927124, + "learning_rate": 7.218969710412938e-07, + "loss": 0.0533, + "step": 32368 + }, + { + "epoch": 88.19891008174388, + "grad_norm": 2.7415997982025146, + "learning_rate": 7.215677904893593e-07, + "loss": 0.1223, + "step": 32369 + }, + { + "epoch": 88.2016348773842, + "grad_norm": 2.997288465499878, + "learning_rate": 7.212386821975537e-07, + "loss": 0.0674, + "step": 32370 + }, + { + "epoch": 88.20435967302453, + "grad_norm": 3.6610023975372314, + "learning_rate": 7.209096461684451e-07, + "loss": 0.0831, + "step": 32371 + }, + { + "epoch": 88.20708446866485, + "grad_norm": 2.011756420135498, + "learning_rate": 7.205806824045924e-07, + "loss": 0.0334, + "step": 32372 + }, + { + "epoch": 88.20980926430518, + "grad_norm": 3.1290664672851562, + "learning_rate": 7.202517909085583e-07, + "loss": 0.1391, + "step": 32373 + }, + { + "epoch": 88.2125340599455, + "grad_norm": 5.271706581115723, + "learning_rate": 7.199229716829048e-07, + "loss": 0.0294, + "step": 32374 + }, + { + "epoch": 88.21525885558583, + "grad_norm": 4.0691142082214355, + "learning_rate": 7.195942247301923e-07, + "loss": 0.0679, + "step": 32375 + }, + { + "epoch": 88.21798365122616, + "grad_norm": 5.225517749786377, + "learning_rate": 7.192655500529821e-07, + "loss": 0.0513, + "step": 32376 + }, + { + "epoch": 88.22070844686648, + "grad_norm": 2.8964128494262695, + "learning_rate": 7.189369476538333e-07, + "loss": 0.0522, + "step": 32377 + }, + { + "epoch": 88.22343324250681, + "grad_norm": 2.045886754989624, + "learning_rate": 7.186084175353047e-07, + "loss": 0.0229, + "step": 32378 + }, + { + "epoch": 88.22615803814713, + "grad_norm": 2.279428243637085, + "learning_rate": 7.182799596999534e-07, + "loss": 0.0516, + "step": 32379 + }, + { + "epoch": 88.22888283378747, + "grad_norm": 1.5180741548538208, + "learning_rate": 7.179515741503418e-07, + "loss": 0.0172, + "step": 32380 + }, + { + "epoch": 88.2316076294278, + "grad_norm": 2.6171324253082275, + "learning_rate": 7.176232608890232e-07, + "loss": 0.0245, + "step": 32381 + }, + { + "epoch": 88.23433242506812, + "grad_norm": 2.1556520462036133, + "learning_rate": 7.172950199185569e-07, + "loss": 0.0244, + "step": 32382 + }, + { + "epoch": 88.23705722070845, + "grad_norm": 2.845304489135742, + "learning_rate": 7.169668512414951e-07, + "loss": 0.0274, + "step": 32383 + }, + { + "epoch": 88.23978201634877, + "grad_norm": 2.633047103881836, + "learning_rate": 7.166387548603993e-07, + "loss": 0.0269, + "step": 32384 + }, + { + "epoch": 88.2425068119891, + "grad_norm": 3.4355244636535645, + "learning_rate": 7.163107307778227e-07, + "loss": 0.1012, + "step": 32385 + }, + { + "epoch": 88.24523160762942, + "grad_norm": 1.8461685180664062, + "learning_rate": 7.159827789963181e-07, + "loss": 0.0284, + "step": 32386 + }, + { + "epoch": 88.24795640326975, + "grad_norm": 2.820727825164795, + "learning_rate": 7.156548995184398e-07, + "loss": 0.0233, + "step": 32387 + }, + { + "epoch": 88.25068119891009, + "grad_norm": 6.894948482513428, + "learning_rate": 7.153270923467437e-07, + "loss": 0.1378, + "step": 32388 + }, + { + "epoch": 88.2534059945504, + "grad_norm": 2.133219003677368, + "learning_rate": 7.149993574837822e-07, + "loss": 0.0366, + "step": 32389 + }, + { + "epoch": 88.25613079019074, + "grad_norm": 2.540095090866089, + "learning_rate": 7.146716949321042e-07, + "loss": 0.0585, + "step": 32390 + }, + { + "epoch": 88.25885558583106, + "grad_norm": 2.4622929096221924, + "learning_rate": 7.143441046942645e-07, + "loss": 0.0401, + "step": 32391 + }, + { + "epoch": 88.26158038147139, + "grad_norm": 2.0890092849731445, + "learning_rate": 7.140165867728166e-07, + "loss": 0.0298, + "step": 32392 + }, + { + "epoch": 88.26430517711172, + "grad_norm": 1.8422714471817017, + "learning_rate": 7.136891411703073e-07, + "loss": 0.0353, + "step": 32393 + }, + { + "epoch": 88.26702997275204, + "grad_norm": 3.064406394958496, + "learning_rate": 7.13361767889289e-07, + "loss": 0.0589, + "step": 32394 + }, + { + "epoch": 88.26975476839237, + "grad_norm": 2.9960241317749023, + "learning_rate": 7.130344669323086e-07, + "loss": 0.0678, + "step": 32395 + }, + { + "epoch": 88.2724795640327, + "grad_norm": 1.6039263010025024, + "learning_rate": 7.127072383019185e-07, + "loss": 0.0176, + "step": 32396 + }, + { + "epoch": 88.27520435967303, + "grad_norm": 2.260348081588745, + "learning_rate": 7.123800820006643e-07, + "loss": 0.076, + "step": 32397 + }, + { + "epoch": 88.27792915531334, + "grad_norm": 4.56273889541626, + "learning_rate": 7.120529980310964e-07, + "loss": 0.0361, + "step": 32398 + }, + { + "epoch": 88.28065395095368, + "grad_norm": 2.5440008640289307, + "learning_rate": 7.117259863957593e-07, + "loss": 0.0676, + "step": 32399 + }, + { + "epoch": 88.28337874659401, + "grad_norm": 2.3230483531951904, + "learning_rate": 7.113990470972021e-07, + "loss": 0.0304, + "step": 32400 + }, + { + "epoch": 88.28610354223433, + "grad_norm": 5.4216461181640625, + "learning_rate": 7.110721801379705e-07, + "loss": 0.0302, + "step": 32401 + }, + { + "epoch": 88.28882833787466, + "grad_norm": 1.4944161176681519, + "learning_rate": 7.107453855206103e-07, + "loss": 0.0178, + "step": 32402 + }, + { + "epoch": 88.29155313351498, + "grad_norm": 2.5314242839813232, + "learning_rate": 7.104186632476639e-07, + "loss": 0.0691, + "step": 32403 + }, + { + "epoch": 88.29427792915531, + "grad_norm": 2.4386959075927734, + "learning_rate": 7.100920133216793e-07, + "loss": 0.0376, + "step": 32404 + }, + { + "epoch": 88.29700272479565, + "grad_norm": 2.228200674057007, + "learning_rate": 7.097654357451999e-07, + "loss": 0.031, + "step": 32405 + }, + { + "epoch": 88.29972752043597, + "grad_norm": 1.8890329599380493, + "learning_rate": 7.094389305207683e-07, + "loss": 0.0435, + "step": 32406 + }, + { + "epoch": 88.3024523160763, + "grad_norm": 3.7059457302093506, + "learning_rate": 7.091124976509245e-07, + "loss": 0.0433, + "step": 32407 + }, + { + "epoch": 88.30517711171662, + "grad_norm": 3.3551275730133057, + "learning_rate": 7.087861371382143e-07, + "loss": 0.1015, + "step": 32408 + }, + { + "epoch": 88.30790190735695, + "grad_norm": 3.033982515335083, + "learning_rate": 7.084598489851813e-07, + "loss": 0.1362, + "step": 32409 + }, + { + "epoch": 88.31062670299727, + "grad_norm": 2.023897647857666, + "learning_rate": 7.081336331943623e-07, + "loss": 0.035, + "step": 32410 + }, + { + "epoch": 88.3133514986376, + "grad_norm": 3.2727036476135254, + "learning_rate": 7.078074897682985e-07, + "loss": 0.0595, + "step": 32411 + }, + { + "epoch": 88.31607629427793, + "grad_norm": 2.589975357055664, + "learning_rate": 7.074814187095324e-07, + "loss": 0.1007, + "step": 32412 + }, + { + "epoch": 88.31880108991825, + "grad_norm": 2.6098878383636475, + "learning_rate": 7.071554200206021e-07, + "loss": 0.0549, + "step": 32413 + }, + { + "epoch": 88.32152588555859, + "grad_norm": 1.8974101543426514, + "learning_rate": 7.068294937040465e-07, + "loss": 0.1426, + "step": 32414 + }, + { + "epoch": 88.3242506811989, + "grad_norm": 1.4538369178771973, + "learning_rate": 7.065036397624014e-07, + "loss": 0.015, + "step": 32415 + }, + { + "epoch": 88.32697547683924, + "grad_norm": 5.012216567993164, + "learning_rate": 7.061778581982093e-07, + "loss": 0.0572, + "step": 32416 + }, + { + "epoch": 88.32970027247957, + "grad_norm": 2.0124173164367676, + "learning_rate": 7.058521490140047e-07, + "loss": 0.0234, + "step": 32417 + }, + { + "epoch": 88.33242506811989, + "grad_norm": 2.1418280601501465, + "learning_rate": 7.055265122123245e-07, + "loss": 0.024, + "step": 32418 + }, + { + "epoch": 88.33514986376022, + "grad_norm": 1.74332857131958, + "learning_rate": 7.052009477957022e-07, + "loss": 0.0237, + "step": 32419 + }, + { + "epoch": 88.33787465940054, + "grad_norm": 2.2411975860595703, + "learning_rate": 7.048754557666781e-07, + "loss": 0.027, + "step": 32420 + }, + { + "epoch": 88.34059945504087, + "grad_norm": 2.1045470237731934, + "learning_rate": 7.045500361277846e-07, + "loss": 0.0547, + "step": 32421 + }, + { + "epoch": 88.34332425068119, + "grad_norm": 2.1541929244995117, + "learning_rate": 7.042246888815563e-07, + "loss": 0.0974, + "step": 32422 + }, + { + "epoch": 88.34604904632153, + "grad_norm": 2.5627400875091553, + "learning_rate": 7.038994140305255e-07, + "loss": 0.0273, + "step": 32423 + }, + { + "epoch": 88.34877384196186, + "grad_norm": 4.022182464599609, + "learning_rate": 7.035742115772281e-07, + "loss": 0.0455, + "step": 32424 + }, + { + "epoch": 88.35149863760218, + "grad_norm": 3.07271671295166, + "learning_rate": 7.032490815241943e-07, + "loss": 0.0936, + "step": 32425 + }, + { + "epoch": 88.35422343324251, + "grad_norm": 2.802013397216797, + "learning_rate": 7.029240238739587e-07, + "loss": 0.0806, + "step": 32426 + }, + { + "epoch": 88.35694822888283, + "grad_norm": 2.2961838245391846, + "learning_rate": 7.025990386290527e-07, + "loss": 0.1447, + "step": 32427 + }, + { + "epoch": 88.35967302452316, + "grad_norm": 2.2719388008117676, + "learning_rate": 7.022741257920029e-07, + "loss": 0.0492, + "step": 32428 + }, + { + "epoch": 88.3623978201635, + "grad_norm": 2.973801851272583, + "learning_rate": 7.019492853653454e-07, + "loss": 0.0564, + "step": 32429 + }, + { + "epoch": 88.36512261580381, + "grad_norm": 2.531278371810913, + "learning_rate": 7.016245173516079e-07, + "loss": 0.1216, + "step": 32430 + }, + { + "epoch": 88.36784741144415, + "grad_norm": 3.1131370067596436, + "learning_rate": 7.012998217533174e-07, + "loss": 0.2001, + "step": 32431 + }, + { + "epoch": 88.37057220708446, + "grad_norm": 3.001033306121826, + "learning_rate": 7.009751985730062e-07, + "loss": 0.062, + "step": 32432 + }, + { + "epoch": 88.3732970027248, + "grad_norm": 2.2466847896575928, + "learning_rate": 7.006506478132003e-07, + "loss": 0.0268, + "step": 32433 + }, + { + "epoch": 88.37602179836512, + "grad_norm": 2.386246919631958, + "learning_rate": 7.003261694764286e-07, + "loss": 0.024, + "step": 32434 + }, + { + "epoch": 88.37874659400545, + "grad_norm": 2.3541605472564697, + "learning_rate": 7.000017635652157e-07, + "loss": 0.0307, + "step": 32435 + }, + { + "epoch": 88.38147138964578, + "grad_norm": 3.0564053058624268, + "learning_rate": 6.996774300820919e-07, + "loss": 0.0902, + "step": 32436 + }, + { + "epoch": 88.3841961852861, + "grad_norm": 2.4900553226470947, + "learning_rate": 6.993531690295796e-07, + "loss": 0.0354, + "step": 32437 + }, + { + "epoch": 88.38692098092643, + "grad_norm": 3.019763469696045, + "learning_rate": 6.990289804102068e-07, + "loss": 0.245, + "step": 32438 + }, + { + "epoch": 88.38964577656675, + "grad_norm": 2.5645194053649902, + "learning_rate": 6.987048642264938e-07, + "loss": 0.0164, + "step": 32439 + }, + { + "epoch": 88.39237057220708, + "grad_norm": 2.028104305267334, + "learning_rate": 6.983808204809706e-07, + "loss": 0.0277, + "step": 32440 + }, + { + "epoch": 88.39509536784742, + "grad_norm": 3.1489453315734863, + "learning_rate": 6.980568491761586e-07, + "loss": 0.1471, + "step": 32441 + }, + { + "epoch": 88.39782016348774, + "grad_norm": 1.981988549232483, + "learning_rate": 6.97732950314578e-07, + "loss": 0.0334, + "step": 32442 + }, + { + "epoch": 88.40054495912807, + "grad_norm": 2.9888768196105957, + "learning_rate": 6.974091238987557e-07, + "loss": 0.1154, + "step": 32443 + }, + { + "epoch": 88.40326975476839, + "grad_norm": 2.751434564590454, + "learning_rate": 6.970853699312108e-07, + "loss": 0.0654, + "step": 32444 + }, + { + "epoch": 88.40599455040872, + "grad_norm": 3.876380681991577, + "learning_rate": 6.967616884144668e-07, + "loss": 0.0257, + "step": 32445 + }, + { + "epoch": 88.40871934604904, + "grad_norm": 2.447319746017456, + "learning_rate": 6.964380793510428e-07, + "loss": 0.057, + "step": 32446 + }, + { + "epoch": 88.41144414168937, + "grad_norm": 4.316874027252197, + "learning_rate": 6.961145427434601e-07, + "loss": 0.0249, + "step": 32447 + }, + { + "epoch": 88.4141689373297, + "grad_norm": 2.9538207054138184, + "learning_rate": 6.957910785942357e-07, + "loss": 0.2019, + "step": 32448 + }, + { + "epoch": 88.41689373297002, + "grad_norm": 2.0260610580444336, + "learning_rate": 6.95467686905893e-07, + "loss": 0.0491, + "step": 32449 + }, + { + "epoch": 88.41961852861036, + "grad_norm": 2.5340194702148438, + "learning_rate": 6.951443676809489e-07, + "loss": 0.0746, + "step": 32450 + }, + { + "epoch": 88.42234332425068, + "grad_norm": 2.870420455932617, + "learning_rate": 6.948211209219191e-07, + "loss": 0.0373, + "step": 32451 + }, + { + "epoch": 88.42506811989101, + "grad_norm": 2.812525749206543, + "learning_rate": 6.94497946631324e-07, + "loss": 0.0916, + "step": 32452 + }, + { + "epoch": 88.42779291553134, + "grad_norm": 2.9845118522644043, + "learning_rate": 6.941748448116803e-07, + "loss": 0.114, + "step": 32453 + }, + { + "epoch": 88.43051771117166, + "grad_norm": 2.2237348556518555, + "learning_rate": 6.938518154655027e-07, + "loss": 0.0196, + "step": 32454 + }, + { + "epoch": 88.433242506812, + "grad_norm": 1.488059401512146, + "learning_rate": 6.93528858595306e-07, + "loss": 0.025, + "step": 32455 + }, + { + "epoch": 88.43596730245231, + "grad_norm": 1.537386417388916, + "learning_rate": 6.93205974203609e-07, + "loss": 0.0183, + "step": 32456 + }, + { + "epoch": 88.43869209809264, + "grad_norm": 2.6214711666107178, + "learning_rate": 6.928831622929244e-07, + "loss": 0.0319, + "step": 32457 + }, + { + "epoch": 88.44141689373296, + "grad_norm": 1.4960311651229858, + "learning_rate": 6.925604228657657e-07, + "loss": 0.0173, + "step": 32458 + }, + { + "epoch": 88.4441416893733, + "grad_norm": 3.0551717281341553, + "learning_rate": 6.922377559246462e-07, + "loss": 0.0503, + "step": 32459 + }, + { + "epoch": 88.44686648501363, + "grad_norm": 4.646723747253418, + "learning_rate": 6.919151614720787e-07, + "loss": 0.0295, + "step": 32460 + }, + { + "epoch": 88.44959128065395, + "grad_norm": 1.8327277898788452, + "learning_rate": 6.915926395105776e-07, + "loss": 0.1291, + "step": 32461 + }, + { + "epoch": 88.45231607629428, + "grad_norm": 2.9880619049072266, + "learning_rate": 6.912701900426544e-07, + "loss": 0.0687, + "step": 32462 + }, + { + "epoch": 88.4550408719346, + "grad_norm": 3.8878345489501953, + "learning_rate": 6.909478130708192e-07, + "loss": 0.0314, + "step": 32463 + }, + { + "epoch": 88.45776566757493, + "grad_norm": 2.996694564819336, + "learning_rate": 6.906255085975799e-07, + "loss": 0.0989, + "step": 32464 + }, + { + "epoch": 88.46049046321527, + "grad_norm": 3.5452499389648438, + "learning_rate": 6.903032766254525e-07, + "loss": 0.0565, + "step": 32465 + }, + { + "epoch": 88.46321525885558, + "grad_norm": 4.170506000518799, + "learning_rate": 6.899811171569437e-07, + "loss": 0.1153, + "step": 32466 + }, + { + "epoch": 88.46594005449592, + "grad_norm": 2.7486510276794434, + "learning_rate": 6.896590301945616e-07, + "loss": 0.0625, + "step": 32467 + }, + { + "epoch": 88.46866485013624, + "grad_norm": 2.1080689430236816, + "learning_rate": 6.893370157408141e-07, + "loss": 0.0404, + "step": 32468 + }, + { + "epoch": 88.47138964577657, + "grad_norm": 2.5748252868652344, + "learning_rate": 6.890150737982115e-07, + "loss": 0.0474, + "step": 32469 + }, + { + "epoch": 88.47411444141689, + "grad_norm": 1.9797866344451904, + "learning_rate": 6.886932043692596e-07, + "loss": 0.0227, + "step": 32470 + }, + { + "epoch": 88.47683923705722, + "grad_norm": 2.369738817214966, + "learning_rate": 6.883714074564663e-07, + "loss": 0.0889, + "step": 32471 + }, + { + "epoch": 88.47956403269755, + "grad_norm": 4.690642833709717, + "learning_rate": 6.88049683062334e-07, + "loss": 0.0421, + "step": 32472 + }, + { + "epoch": 88.48228882833787, + "grad_norm": 2.9402341842651367, + "learning_rate": 6.87728031189373e-07, + "loss": 0.1101, + "step": 32473 + }, + { + "epoch": 88.4850136239782, + "grad_norm": 1.914718508720398, + "learning_rate": 6.874064518400869e-07, + "loss": 0.0365, + "step": 32474 + }, + { + "epoch": 88.48773841961852, + "grad_norm": 2.57735276222229, + "learning_rate": 6.870849450169781e-07, + "loss": 0.0219, + "step": 32475 + }, + { + "epoch": 88.49046321525886, + "grad_norm": 2.4926013946533203, + "learning_rate": 6.867635107225512e-07, + "loss": 0.0797, + "step": 32476 + }, + { + "epoch": 88.49318801089919, + "grad_norm": 3.515141010284424, + "learning_rate": 6.864421489593132e-07, + "loss": 0.0284, + "step": 32477 + }, + { + "epoch": 88.49591280653951, + "grad_norm": 3.1314024925231934, + "learning_rate": 6.861208597297631e-07, + "loss": 0.079, + "step": 32478 + }, + { + "epoch": 88.49863760217984, + "grad_norm": 2.2189550399780273, + "learning_rate": 6.857996430364045e-07, + "loss": 0.0621, + "step": 32479 + }, + { + "epoch": 88.50136239782016, + "grad_norm": 1.7627149820327759, + "learning_rate": 6.854784988817365e-07, + "loss": 0.0193, + "step": 32480 + }, + { + "epoch": 88.50408719346049, + "grad_norm": 1.8683980703353882, + "learning_rate": 6.851574272682638e-07, + "loss": 0.1362, + "step": 32481 + }, + { + "epoch": 88.50681198910081, + "grad_norm": 1.919998288154602, + "learning_rate": 6.848364281984843e-07, + "loss": 0.0213, + "step": 32482 + }, + { + "epoch": 88.50953678474114, + "grad_norm": 2.2226004600524902, + "learning_rate": 6.845155016749006e-07, + "loss": 0.0477, + "step": 32483 + }, + { + "epoch": 88.51226158038148, + "grad_norm": 2.1266064643859863, + "learning_rate": 6.841946477000072e-07, + "loss": 0.0384, + "step": 32484 + }, + { + "epoch": 88.5149863760218, + "grad_norm": 2.8746864795684814, + "learning_rate": 6.838738662763089e-07, + "loss": 0.0883, + "step": 32485 + }, + { + "epoch": 88.51771117166213, + "grad_norm": 3.0734643936157227, + "learning_rate": 6.835531574063003e-07, + "loss": 0.1, + "step": 32486 + }, + { + "epoch": 88.52043596730245, + "grad_norm": 1.7114530801773071, + "learning_rate": 6.832325210924806e-07, + "loss": 0.0313, + "step": 32487 + }, + { + "epoch": 88.52316076294278, + "grad_norm": 2.248533248901367, + "learning_rate": 6.829119573373443e-07, + "loss": 0.1137, + "step": 32488 + }, + { + "epoch": 88.52588555858311, + "grad_norm": 5.388162612915039, + "learning_rate": 6.825914661433908e-07, + "loss": 0.1057, + "step": 32489 + }, + { + "epoch": 88.52861035422343, + "grad_norm": 2.2857561111450195, + "learning_rate": 6.822710475131155e-07, + "loss": 0.0471, + "step": 32490 + }, + { + "epoch": 88.53133514986376, + "grad_norm": 3.316270112991333, + "learning_rate": 6.819507014490134e-07, + "loss": 0.0884, + "step": 32491 + }, + { + "epoch": 88.53405994550408, + "grad_norm": 2.7123632431030273, + "learning_rate": 6.81630427953578e-07, + "loss": 0.0441, + "step": 32492 + }, + { + "epoch": 88.53678474114442, + "grad_norm": 2.2796952724456787, + "learning_rate": 6.81310227029307e-07, + "loss": 0.0667, + "step": 32493 + }, + { + "epoch": 88.53950953678473, + "grad_norm": 2.4223263263702393, + "learning_rate": 6.809900986786889e-07, + "loss": 0.122, + "step": 32494 + }, + { + "epoch": 88.54223433242507, + "grad_norm": 1.859542727470398, + "learning_rate": 6.806700429042223e-07, + "loss": 0.0206, + "step": 32495 + }, + { + "epoch": 88.5449591280654, + "grad_norm": 2.8135170936584473, + "learning_rate": 6.803500597083967e-07, + "loss": 0.114, + "step": 32496 + }, + { + "epoch": 88.54768392370572, + "grad_norm": 2.5066561698913574, + "learning_rate": 6.800301490937056e-07, + "loss": 0.0545, + "step": 32497 + }, + { + "epoch": 88.55040871934605, + "grad_norm": 2.343372344970703, + "learning_rate": 6.797103110626402e-07, + "loss": 0.0327, + "step": 32498 + }, + { + "epoch": 88.55313351498637, + "grad_norm": 3.180253505706787, + "learning_rate": 6.793905456176909e-07, + "loss": 0.0798, + "step": 32499 + }, + { + "epoch": 88.5558583106267, + "grad_norm": 2.0128023624420166, + "learning_rate": 6.790708527613454e-07, + "loss": 0.086, + "step": 32500 + }, + { + "epoch": 88.55858310626704, + "grad_norm": 2.8150742053985596, + "learning_rate": 6.787512324960987e-07, + "loss": 0.0298, + "step": 32501 + }, + { + "epoch": 88.56130790190736, + "grad_norm": 2.445643424987793, + "learning_rate": 6.784316848244377e-07, + "loss": 0.0359, + "step": 32502 + }, + { + "epoch": 88.56403269754769, + "grad_norm": 1.6584358215332031, + "learning_rate": 6.781122097488501e-07, + "loss": 0.0202, + "step": 32503 + }, + { + "epoch": 88.566757493188, + "grad_norm": 2.5261402130126953, + "learning_rate": 6.777928072718232e-07, + "loss": 0.0983, + "step": 32504 + }, + { + "epoch": 88.56948228882834, + "grad_norm": 2.7514688968658447, + "learning_rate": 6.774734773958469e-07, + "loss": 0.0786, + "step": 32505 + }, + { + "epoch": 88.57220708446866, + "grad_norm": 2.7484543323516846, + "learning_rate": 6.771542201234071e-07, + "loss": 0.0911, + "step": 32506 + }, + { + "epoch": 88.57493188010899, + "grad_norm": 1.4559698104858398, + "learning_rate": 6.768350354569909e-07, + "loss": 0.0155, + "step": 32507 + }, + { + "epoch": 88.57765667574932, + "grad_norm": 5.5457658767700195, + "learning_rate": 6.765159233990814e-07, + "loss": 0.0483, + "step": 32508 + }, + { + "epoch": 88.58038147138964, + "grad_norm": 2.0925986766815186, + "learning_rate": 6.761968839521682e-07, + "loss": 0.0364, + "step": 32509 + }, + { + "epoch": 88.58310626702998, + "grad_norm": 3.045254707336426, + "learning_rate": 6.758779171187324e-07, + "loss": 0.0305, + "step": 32510 + }, + { + "epoch": 88.5858310626703, + "grad_norm": 7.752040863037109, + "learning_rate": 6.755590229012588e-07, + "loss": 0.0869, + "step": 32511 + }, + { + "epoch": 88.58855585831063, + "grad_norm": 5.426023483276367, + "learning_rate": 6.752402013022319e-07, + "loss": 0.1346, + "step": 32512 + }, + { + "epoch": 88.59128065395096, + "grad_norm": 3.487820625305176, + "learning_rate": 6.749214523241332e-07, + "loss": 0.0764, + "step": 32513 + }, + { + "epoch": 88.59400544959128, + "grad_norm": 2.4322376251220703, + "learning_rate": 6.746027759694474e-07, + "loss": 0.1689, + "step": 32514 + }, + { + "epoch": 88.59673024523161, + "grad_norm": 2.054391622543335, + "learning_rate": 6.742841722406556e-07, + "loss": 0.025, + "step": 32515 + }, + { + "epoch": 88.59945504087193, + "grad_norm": 2.9714245796203613, + "learning_rate": 6.739656411402363e-07, + "loss": 0.1152, + "step": 32516 + }, + { + "epoch": 88.60217983651226, + "grad_norm": 1.3651752471923828, + "learning_rate": 6.736471826706747e-07, + "loss": 0.0147, + "step": 32517 + }, + { + "epoch": 88.60490463215258, + "grad_norm": 2.0237410068511963, + "learning_rate": 6.733287968344482e-07, + "loss": 0.0799, + "step": 32518 + }, + { + "epoch": 88.60762942779292, + "grad_norm": 2.2222201824188232, + "learning_rate": 6.730104836340367e-07, + "loss": 0.0456, + "step": 32519 + }, + { + "epoch": 88.61035422343325, + "grad_norm": 2.871119260787964, + "learning_rate": 6.726922430719185e-07, + "loss": 0.0737, + "step": 32520 + }, + { + "epoch": 88.61307901907357, + "grad_norm": 1.9032843112945557, + "learning_rate": 6.723740751505736e-07, + "loss": 0.0749, + "step": 32521 + }, + { + "epoch": 88.6158038147139, + "grad_norm": 2.381385564804077, + "learning_rate": 6.720559798724801e-07, + "loss": 0.0239, + "step": 32522 + }, + { + "epoch": 88.61852861035422, + "grad_norm": 2.4233813285827637, + "learning_rate": 6.717379572401139e-07, + "loss": 0.043, + "step": 32523 + }, + { + "epoch": 88.62125340599455, + "grad_norm": 3.771385431289673, + "learning_rate": 6.714200072559507e-07, + "loss": 0.0514, + "step": 32524 + }, + { + "epoch": 88.62397820163488, + "grad_norm": 7.224627494812012, + "learning_rate": 6.711021299224696e-07, + "loss": 0.0377, + "step": 32525 + }, + { + "epoch": 88.6267029972752, + "grad_norm": 2.9198646545410156, + "learning_rate": 6.707843252421453e-07, + "loss": 0.1455, + "step": 32526 + }, + { + "epoch": 88.62942779291554, + "grad_norm": 4.023635387420654, + "learning_rate": 6.704665932174525e-07, + "loss": 0.1044, + "step": 32527 + }, + { + "epoch": 88.63215258855585, + "grad_norm": 2.3568904399871826, + "learning_rate": 6.701489338508638e-07, + "loss": 0.0357, + "step": 32528 + }, + { + "epoch": 88.63487738419619, + "grad_norm": 1.82301926612854, + "learning_rate": 6.698313471448547e-07, + "loss": 0.0942, + "step": 32529 + }, + { + "epoch": 88.6376021798365, + "grad_norm": 2.3839166164398193, + "learning_rate": 6.695138331019002e-07, + "loss": 0.1733, + "step": 32530 + }, + { + "epoch": 88.64032697547684, + "grad_norm": 2.619131088256836, + "learning_rate": 6.691963917244726e-07, + "loss": 0.0795, + "step": 32531 + }, + { + "epoch": 88.64305177111717, + "grad_norm": 2.787616014480591, + "learning_rate": 6.688790230150421e-07, + "loss": 0.0362, + "step": 32532 + }, + { + "epoch": 88.64577656675749, + "grad_norm": 2.427051067352295, + "learning_rate": 6.685617269760802e-07, + "loss": 0.025, + "step": 32533 + }, + { + "epoch": 88.64850136239782, + "grad_norm": 2.578310489654541, + "learning_rate": 6.682445036100616e-07, + "loss": 0.0972, + "step": 32534 + }, + { + "epoch": 88.65122615803814, + "grad_norm": 1.6142969131469727, + "learning_rate": 6.679273529194541e-07, + "loss": 0.0187, + "step": 32535 + }, + { + "epoch": 88.65395095367847, + "grad_norm": 4.000240802764893, + "learning_rate": 6.67610274906727e-07, + "loss": 0.1039, + "step": 32536 + }, + { + "epoch": 88.65667574931881, + "grad_norm": 2.3971710205078125, + "learning_rate": 6.672932695743506e-07, + "loss": 0.0202, + "step": 32537 + }, + { + "epoch": 88.65940054495913, + "grad_norm": 2.449756622314453, + "learning_rate": 6.669763369247939e-07, + "loss": 0.0776, + "step": 32538 + }, + { + "epoch": 88.66212534059946, + "grad_norm": 1.5375303030014038, + "learning_rate": 6.666594769605261e-07, + "loss": 0.0149, + "step": 32539 + }, + { + "epoch": 88.66485013623978, + "grad_norm": 3.071993827819824, + "learning_rate": 6.66342689684012e-07, + "loss": 0.047, + "step": 32540 + }, + { + "epoch": 88.66757493188011, + "grad_norm": 2.8569655418395996, + "learning_rate": 6.660259750977227e-07, + "loss": 0.0233, + "step": 32541 + }, + { + "epoch": 88.67029972752043, + "grad_norm": 2.814210891723633, + "learning_rate": 6.65709333204122e-07, + "loss": 0.0423, + "step": 32542 + }, + { + "epoch": 88.67302452316076, + "grad_norm": 2.6103148460388184, + "learning_rate": 6.653927640056779e-07, + "loss": 0.0371, + "step": 32543 + }, + { + "epoch": 88.6757493188011, + "grad_norm": 1.996567726135254, + "learning_rate": 6.650762675048516e-07, + "loss": 0.0309, + "step": 32544 + }, + { + "epoch": 88.67847411444141, + "grad_norm": 1.3965378999710083, + "learning_rate": 6.647598437041114e-07, + "loss": 0.0221, + "step": 32545 + }, + { + "epoch": 88.68119891008175, + "grad_norm": 2.909156322479248, + "learning_rate": 6.644434926059228e-07, + "loss": 0.031, + "step": 32546 + }, + { + "epoch": 88.68392370572207, + "grad_norm": 2.3875527381896973, + "learning_rate": 6.641272142127475e-07, + "loss": 0.0394, + "step": 32547 + }, + { + "epoch": 88.6866485013624, + "grad_norm": 1.9616997241973877, + "learning_rate": 6.638110085270488e-07, + "loss": 0.0276, + "step": 32548 + }, + { + "epoch": 88.68937329700273, + "grad_norm": 2.376124858856201, + "learning_rate": 6.634948755512882e-07, + "loss": 0.0341, + "step": 32549 + }, + { + "epoch": 88.69209809264305, + "grad_norm": 3.137643337249756, + "learning_rate": 6.631788152879304e-07, + "loss": 0.106, + "step": 32550 + }, + { + "epoch": 88.69482288828338, + "grad_norm": 3.1571850776672363, + "learning_rate": 6.628628277394356e-07, + "loss": 0.0565, + "step": 32551 + }, + { + "epoch": 88.6975476839237, + "grad_norm": 3.1629316806793213, + "learning_rate": 6.625469129082651e-07, + "loss": 0.137, + "step": 32552 + }, + { + "epoch": 88.70027247956403, + "grad_norm": 2.550363540649414, + "learning_rate": 6.62231070796876e-07, + "loss": 0.0909, + "step": 32553 + }, + { + "epoch": 88.70299727520435, + "grad_norm": 2.6861281394958496, + "learning_rate": 6.619153014077328e-07, + "loss": 0.0411, + "step": 32554 + }, + { + "epoch": 88.70572207084469, + "grad_norm": 1.8477747440338135, + "learning_rate": 6.615996047432937e-07, + "loss": 0.0589, + "step": 32555 + }, + { + "epoch": 88.70844686648502, + "grad_norm": 3.0497498512268066, + "learning_rate": 6.612839808060146e-07, + "loss": 0.061, + "step": 32556 + }, + { + "epoch": 88.71117166212534, + "grad_norm": 2.910400867462158, + "learning_rate": 6.609684295983553e-07, + "loss": 0.0485, + "step": 32557 + }, + { + "epoch": 88.71389645776567, + "grad_norm": 4.672149658203125, + "learning_rate": 6.606529511227743e-07, + "loss": 0.0623, + "step": 32558 + }, + { + "epoch": 88.71662125340599, + "grad_norm": 2.9744796752929688, + "learning_rate": 6.603375453817273e-07, + "loss": 0.094, + "step": 32559 + }, + { + "epoch": 88.71934604904632, + "grad_norm": 3.9777817726135254, + "learning_rate": 6.600222123776712e-07, + "loss": 0.0494, + "step": 32560 + }, + { + "epoch": 88.72207084468666, + "grad_norm": 2.20937442779541, + "learning_rate": 6.597069521130594e-07, + "loss": 0.0667, + "step": 32561 + }, + { + "epoch": 88.72479564032697, + "grad_norm": 2.979435443878174, + "learning_rate": 6.593917645903491e-07, + "loss": 0.0806, + "step": 32562 + }, + { + "epoch": 88.7275204359673, + "grad_norm": 1.8783541917800903, + "learning_rate": 6.590766498119983e-07, + "loss": 0.0202, + "step": 32563 + }, + { + "epoch": 88.73024523160763, + "grad_norm": 4.087584018707275, + "learning_rate": 6.58761607780456e-07, + "loss": 0.0829, + "step": 32564 + }, + { + "epoch": 88.73297002724796, + "grad_norm": 2.5798182487487793, + "learning_rate": 6.584466384981769e-07, + "loss": 0.0248, + "step": 32565 + }, + { + "epoch": 88.73569482288828, + "grad_norm": 3.663706064224243, + "learning_rate": 6.58131741967617e-07, + "loss": 0.1457, + "step": 32566 + }, + { + "epoch": 88.73841961852861, + "grad_norm": 3.7107369899749756, + "learning_rate": 6.578169181912252e-07, + "loss": 0.0469, + "step": 32567 + }, + { + "epoch": 88.74114441416894, + "grad_norm": 2.8559722900390625, + "learning_rate": 6.575021671714554e-07, + "loss": 0.0285, + "step": 32568 + }, + { + "epoch": 88.74386920980926, + "grad_norm": 1.462720513343811, + "learning_rate": 6.571874889107554e-07, + "loss": 0.0192, + "step": 32569 + }, + { + "epoch": 88.7465940054496, + "grad_norm": 1.8686283826828003, + "learning_rate": 6.568728834115812e-07, + "loss": 0.0382, + "step": 32570 + }, + { + "epoch": 88.74931880108991, + "grad_norm": 4.0126566886901855, + "learning_rate": 6.565583506763795e-07, + "loss": 0.0472, + "step": 32571 + }, + { + "epoch": 88.75204359673025, + "grad_norm": 2.335212230682373, + "learning_rate": 6.562438907076018e-07, + "loss": 0.0407, + "step": 32572 + }, + { + "epoch": 88.75476839237058, + "grad_norm": 2.825334310531616, + "learning_rate": 6.559295035076929e-07, + "loss": 0.0724, + "step": 32573 + }, + { + "epoch": 88.7574931880109, + "grad_norm": 2.296994924545288, + "learning_rate": 6.556151890791073e-07, + "loss": 0.0274, + "step": 32574 + }, + { + "epoch": 88.76021798365123, + "grad_norm": 3.0914974212646484, + "learning_rate": 6.553009474242888e-07, + "loss": 0.0387, + "step": 32575 + }, + { + "epoch": 88.76294277929155, + "grad_norm": 2.1979379653930664, + "learning_rate": 6.549867785456864e-07, + "loss": 0.0975, + "step": 32576 + }, + { + "epoch": 88.76566757493188, + "grad_norm": 3.263225555419922, + "learning_rate": 6.546726824457438e-07, + "loss": 0.0783, + "step": 32577 + }, + { + "epoch": 88.7683923705722, + "grad_norm": 3.954967975616455, + "learning_rate": 6.543586591269124e-07, + "loss": 0.1224, + "step": 32578 + }, + { + "epoch": 88.77111716621253, + "grad_norm": 2.4080593585968018, + "learning_rate": 6.540447085916346e-07, + "loss": 0.0678, + "step": 32579 + }, + { + "epoch": 88.77384196185287, + "grad_norm": 2.408904790878296, + "learning_rate": 6.537308308423529e-07, + "loss": 0.0414, + "step": 32580 + }, + { + "epoch": 88.77656675749319, + "grad_norm": 3.955139398574829, + "learning_rate": 6.534170258815165e-07, + "loss": 0.1601, + "step": 32581 + }, + { + "epoch": 88.77929155313352, + "grad_norm": 2.4776837825775146, + "learning_rate": 6.531032937115677e-07, + "loss": 0.0286, + "step": 32582 + }, + { + "epoch": 88.78201634877384, + "grad_norm": 2.7745254039764404, + "learning_rate": 6.527896343349505e-07, + "loss": 0.2462, + "step": 32583 + }, + { + "epoch": 88.78474114441417, + "grad_norm": 16.306833267211914, + "learning_rate": 6.52476047754107e-07, + "loss": 0.0215, + "step": 32584 + }, + { + "epoch": 88.7874659400545, + "grad_norm": 2.210672378540039, + "learning_rate": 6.521625339714765e-07, + "loss": 0.0875, + "step": 32585 + }, + { + "epoch": 88.79019073569482, + "grad_norm": 2.5565500259399414, + "learning_rate": 6.51849092989506e-07, + "loss": 0.0517, + "step": 32586 + }, + { + "epoch": 88.79291553133515, + "grad_norm": 3.453659772872925, + "learning_rate": 6.515357248106325e-07, + "loss": 0.1878, + "step": 32587 + }, + { + "epoch": 88.79564032697547, + "grad_norm": 2.9403576850891113, + "learning_rate": 6.512224294372993e-07, + "loss": 0.0333, + "step": 32588 + }, + { + "epoch": 88.7983651226158, + "grad_norm": 3.5595004558563232, + "learning_rate": 6.509092068719425e-07, + "loss": 0.0309, + "step": 32589 + }, + { + "epoch": 88.80108991825612, + "grad_norm": 2.377322196960449, + "learning_rate": 6.505960571170056e-07, + "loss": 0.0456, + "step": 32590 + }, + { + "epoch": 88.80381471389646, + "grad_norm": 2.6467015743255615, + "learning_rate": 6.502829801749266e-07, + "loss": 0.0956, + "step": 32591 + }, + { + "epoch": 88.80653950953679, + "grad_norm": 2.7683017253875732, + "learning_rate": 6.499699760481415e-07, + "loss": 0.069, + "step": 32592 + }, + { + "epoch": 88.80926430517711, + "grad_norm": 5.441568851470947, + "learning_rate": 6.496570447390893e-07, + "loss": 0.0245, + "step": 32593 + }, + { + "epoch": 88.81198910081744, + "grad_norm": 2.438164472579956, + "learning_rate": 6.49344186250207e-07, + "loss": 0.0317, + "step": 32594 + }, + { + "epoch": 88.81471389645776, + "grad_norm": 2.7427258491516113, + "learning_rate": 6.490314005839327e-07, + "loss": 0.082, + "step": 32595 + }, + { + "epoch": 88.8174386920981, + "grad_norm": 3.3365774154663086, + "learning_rate": 6.487186877426998e-07, + "loss": 0.0434, + "step": 32596 + }, + { + "epoch": 88.82016348773843, + "grad_norm": 6.6274542808532715, + "learning_rate": 6.484060477289433e-07, + "loss": 0.0313, + "step": 32597 + }, + { + "epoch": 88.82288828337875, + "grad_norm": 2.2954092025756836, + "learning_rate": 6.480934805451001e-07, + "loss": 0.0643, + "step": 32598 + }, + { + "epoch": 88.82561307901908, + "grad_norm": 2.240321636199951, + "learning_rate": 6.477809861936047e-07, + "loss": 0.0309, + "step": 32599 + }, + { + "epoch": 88.8283378746594, + "grad_norm": 3.0100510120391846, + "learning_rate": 6.474685646768908e-07, + "loss": 0.1114, + "step": 32600 + }, + { + "epoch": 88.83106267029973, + "grad_norm": 3.1723432540893555, + "learning_rate": 6.471562159973899e-07, + "loss": 0.0271, + "step": 32601 + }, + { + "epoch": 88.83378746594005, + "grad_norm": 1.8667747974395752, + "learning_rate": 6.468439401575344e-07, + "loss": 0.1159, + "step": 32602 + }, + { + "epoch": 88.83651226158038, + "grad_norm": 1.8212648630142212, + "learning_rate": 6.46531737159759e-07, + "loss": 0.0195, + "step": 32603 + }, + { + "epoch": 88.83923705722071, + "grad_norm": 1.2121655941009521, + "learning_rate": 6.46219607006493e-07, + "loss": 0.0145, + "step": 32604 + }, + { + "epoch": 88.84196185286103, + "grad_norm": 3.006887435913086, + "learning_rate": 6.459075497001655e-07, + "loss": 0.0489, + "step": 32605 + }, + { + "epoch": 88.84468664850137, + "grad_norm": 2.8322653770446777, + "learning_rate": 6.455955652432111e-07, + "loss": 0.021, + "step": 32606 + }, + { + "epoch": 88.84741144414168, + "grad_norm": 2.9975996017456055, + "learning_rate": 6.45283653638058e-07, + "loss": 0.0737, + "step": 32607 + }, + { + "epoch": 88.85013623978202, + "grad_norm": 3.215750217437744, + "learning_rate": 6.449718148871342e-07, + "loss": 0.1501, + "step": 32608 + }, + { + "epoch": 88.85286103542235, + "grad_norm": 3.315380096435547, + "learning_rate": 6.446600489928667e-07, + "loss": 0.0647, + "step": 32609 + }, + { + "epoch": 88.85558583106267, + "grad_norm": 2.2998287677764893, + "learning_rate": 6.443483559576879e-07, + "loss": 0.0519, + "step": 32610 + }, + { + "epoch": 88.858310626703, + "grad_norm": 3.173992872238159, + "learning_rate": 6.440367357840228e-07, + "loss": 0.0286, + "step": 32611 + }, + { + "epoch": 88.86103542234332, + "grad_norm": 3.3180930614471436, + "learning_rate": 6.43725188474299e-07, + "loss": 0.0357, + "step": 32612 + }, + { + "epoch": 88.86376021798365, + "grad_norm": 4.685422897338867, + "learning_rate": 6.434137140309393e-07, + "loss": 0.0883, + "step": 32613 + }, + { + "epoch": 88.86648501362397, + "grad_norm": 2.7520151138305664, + "learning_rate": 6.43102312456374e-07, + "loss": 0.0362, + "step": 32614 + }, + { + "epoch": 88.8692098092643, + "grad_norm": 2.7013070583343506, + "learning_rate": 6.427909837530278e-07, + "loss": 0.0324, + "step": 32615 + }, + { + "epoch": 88.87193460490464, + "grad_norm": 1.632001280784607, + "learning_rate": 6.424797279233242e-07, + "loss": 0.03, + "step": 32616 + }, + { + "epoch": 88.87465940054496, + "grad_norm": 2.813481092453003, + "learning_rate": 6.421685449696868e-07, + "loss": 0.0352, + "step": 32617 + }, + { + "epoch": 88.87738419618529, + "grad_norm": 2.818861246109009, + "learning_rate": 6.418574348945384e-07, + "loss": 0.0523, + "step": 32618 + }, + { + "epoch": 88.88010899182561, + "grad_norm": 2.4353575706481934, + "learning_rate": 6.415463977003045e-07, + "loss": 0.1397, + "step": 32619 + }, + { + "epoch": 88.88283378746594, + "grad_norm": 3.076411724090576, + "learning_rate": 6.412354333894067e-07, + "loss": 0.0355, + "step": 32620 + }, + { + "epoch": 88.88555858310627, + "grad_norm": 2.091139793395996, + "learning_rate": 6.409245419642663e-07, + "loss": 0.0232, + "step": 32621 + }, + { + "epoch": 88.88828337874659, + "grad_norm": 2.2614316940307617, + "learning_rate": 6.406137234273013e-07, + "loss": 0.0869, + "step": 32622 + }, + { + "epoch": 88.89100817438693, + "grad_norm": 3.105689525604248, + "learning_rate": 6.403029777809377e-07, + "loss": 0.0956, + "step": 32623 + }, + { + "epoch": 88.89373297002724, + "grad_norm": 5.176424503326416, + "learning_rate": 6.399923050275935e-07, + "loss": 0.0207, + "step": 32624 + }, + { + "epoch": 88.89645776566758, + "grad_norm": 2.1554253101348877, + "learning_rate": 6.396817051696869e-07, + "loss": 0.0654, + "step": 32625 + }, + { + "epoch": 88.8991825613079, + "grad_norm": 2.6068801879882812, + "learning_rate": 6.39371178209639e-07, + "loss": 0.0411, + "step": 32626 + }, + { + "epoch": 88.90190735694823, + "grad_norm": 3.9998323917388916, + "learning_rate": 6.39060724149867e-07, + "loss": 0.0851, + "step": 32627 + }, + { + "epoch": 88.90463215258856, + "grad_norm": 2.202383518218994, + "learning_rate": 6.387503429927888e-07, + "loss": 0.0947, + "step": 32628 + }, + { + "epoch": 88.90735694822888, + "grad_norm": 1.9589344263076782, + "learning_rate": 6.384400347408204e-07, + "loss": 0.0257, + "step": 32629 + }, + { + "epoch": 88.91008174386921, + "grad_norm": 4.329192638397217, + "learning_rate": 6.381297993963809e-07, + "loss": 0.1002, + "step": 32630 + }, + { + "epoch": 88.91280653950953, + "grad_norm": 3.230823516845703, + "learning_rate": 6.378196369618828e-07, + "loss": 0.0496, + "step": 32631 + }, + { + "epoch": 88.91553133514986, + "grad_norm": 2.3963263034820557, + "learning_rate": 6.375095474397475e-07, + "loss": 0.0968, + "step": 32632 + }, + { + "epoch": 88.9182561307902, + "grad_norm": 2.2858119010925293, + "learning_rate": 6.371995308323853e-07, + "loss": 0.0712, + "step": 32633 + }, + { + "epoch": 88.92098092643052, + "grad_norm": 5.101203918457031, + "learning_rate": 6.368895871422099e-07, + "loss": 0.0385, + "step": 32634 + }, + { + "epoch": 88.92370572207085, + "grad_norm": 2.0538389682769775, + "learning_rate": 6.365797163716392e-07, + "loss": 0.1404, + "step": 32635 + }, + { + "epoch": 88.92643051771117, + "grad_norm": 2.3281009197235107, + "learning_rate": 6.362699185230848e-07, + "loss": 0.0459, + "step": 32636 + }, + { + "epoch": 88.9291553133515, + "grad_norm": 2.309115409851074, + "learning_rate": 6.359601935989579e-07, + "loss": 0.0777, + "step": 32637 + }, + { + "epoch": 88.93188010899182, + "grad_norm": 2.052091598510742, + "learning_rate": 6.356505416016712e-07, + "loss": 0.029, + "step": 32638 + }, + { + "epoch": 88.93460490463215, + "grad_norm": 4.119014263153076, + "learning_rate": 6.353409625336371e-07, + "loss": 0.1418, + "step": 32639 + }, + { + "epoch": 88.93732970027249, + "grad_norm": 1.9511654376983643, + "learning_rate": 6.350314563972671e-07, + "loss": 0.1573, + "step": 32640 + }, + { + "epoch": 88.9400544959128, + "grad_norm": 2.795783758163452, + "learning_rate": 6.347220231949702e-07, + "loss": 0.0499, + "step": 32641 + }, + { + "epoch": 88.94277929155314, + "grad_norm": 3.338364601135254, + "learning_rate": 6.344126629291559e-07, + "loss": 0.1038, + "step": 32642 + }, + { + "epoch": 88.94550408719346, + "grad_norm": 3.1988728046417236, + "learning_rate": 6.341033756022352e-07, + "loss": 0.1616, + "step": 32643 + }, + { + "epoch": 88.94822888283379, + "grad_norm": 2.0884668827056885, + "learning_rate": 6.337941612166154e-07, + "loss": 0.0275, + "step": 32644 + }, + { + "epoch": 88.95095367847412, + "grad_norm": 2.2075607776641846, + "learning_rate": 6.334850197747066e-07, + "loss": 0.0252, + "step": 32645 + }, + { + "epoch": 88.95367847411444, + "grad_norm": 5.519400596618652, + "learning_rate": 6.331759512789126e-07, + "loss": 0.1259, + "step": 32646 + }, + { + "epoch": 88.95640326975477, + "grad_norm": 1.751410961151123, + "learning_rate": 6.328669557316447e-07, + "loss": 0.0471, + "step": 32647 + }, + { + "epoch": 88.95912806539509, + "grad_norm": 2.8046438694000244, + "learning_rate": 6.325580331353065e-07, + "loss": 0.0349, + "step": 32648 + }, + { + "epoch": 88.96185286103542, + "grad_norm": 2.2592806816101074, + "learning_rate": 6.32249183492305e-07, + "loss": 0.0233, + "step": 32649 + }, + { + "epoch": 88.96457765667574, + "grad_norm": 2.1258723735809326, + "learning_rate": 6.319404068050439e-07, + "loss": 0.0625, + "step": 32650 + }, + { + "epoch": 88.96730245231608, + "grad_norm": 3.519087076187134, + "learning_rate": 6.316317030759322e-07, + "loss": 0.067, + "step": 32651 + }, + { + "epoch": 88.97002724795641, + "grad_norm": 2.198286533355713, + "learning_rate": 6.313230723073704e-07, + "loss": 0.0326, + "step": 32652 + }, + { + "epoch": 88.97275204359673, + "grad_norm": 4.731808662414551, + "learning_rate": 6.310145145017633e-07, + "loss": 0.052, + "step": 32653 + }, + { + "epoch": 88.97547683923706, + "grad_norm": 1.3734490871429443, + "learning_rate": 6.30706029661512e-07, + "loss": 0.0265, + "step": 32654 + }, + { + "epoch": 88.97820163487738, + "grad_norm": 2.5870254039764404, + "learning_rate": 6.303976177890214e-07, + "loss": 0.0681, + "step": 32655 + }, + { + "epoch": 88.98092643051771, + "grad_norm": 2.2474260330200195, + "learning_rate": 6.300892788866942e-07, + "loss": 0.0476, + "step": 32656 + }, + { + "epoch": 88.98365122615803, + "grad_norm": 5.296260833740234, + "learning_rate": 6.297810129569282e-07, + "loss": 0.056, + "step": 32657 + }, + { + "epoch": 88.98637602179836, + "grad_norm": 2.11629056930542, + "learning_rate": 6.294728200021261e-07, + "loss": 0.0226, + "step": 32658 + }, + { + "epoch": 88.9891008174387, + "grad_norm": 2.8374900817871094, + "learning_rate": 6.291647000246892e-07, + "loss": 0.0688, + "step": 32659 + }, + { + "epoch": 88.99182561307902, + "grad_norm": 2.699063539505005, + "learning_rate": 6.288566530270157e-07, + "loss": 0.1188, + "step": 32660 + }, + { + "epoch": 88.99455040871935, + "grad_norm": 2.0384888648986816, + "learning_rate": 6.285486790115047e-07, + "loss": 0.0287, + "step": 32661 + }, + { + "epoch": 88.99727520435967, + "grad_norm": 2.511185884475708, + "learning_rate": 6.282407779805544e-07, + "loss": 0.1725, + "step": 32662 + }, + { + "epoch": 89.0, + "grad_norm": 2.5621845722198486, + "learning_rate": 6.279329499365649e-07, + "loss": 0.0365, + "step": 32663 + }, + { + "epoch": 89.00272479564033, + "grad_norm": 2.2070326805114746, + "learning_rate": 6.276251948819312e-07, + "loss": 0.1821, + "step": 32664 + }, + { + "epoch": 89.00544959128065, + "grad_norm": 9.901810646057129, + "learning_rate": 6.273175128190512e-07, + "loss": 0.0916, + "step": 32665 + }, + { + "epoch": 89.00817438692098, + "grad_norm": 2.8300845623016357, + "learning_rate": 6.270099037503185e-07, + "loss": 0.0399, + "step": 32666 + }, + { + "epoch": 89.0108991825613, + "grad_norm": 1.4365792274475098, + "learning_rate": 6.267023676781314e-07, + "loss": 0.0178, + "step": 32667 + }, + { + "epoch": 89.01362397820164, + "grad_norm": 3.269904136657715, + "learning_rate": 6.263949046048868e-07, + "loss": 0.1554, + "step": 32668 + }, + { + "epoch": 89.01634877384195, + "grad_norm": 2.946486234664917, + "learning_rate": 6.260875145329759e-07, + "loss": 0.0316, + "step": 32669 + }, + { + "epoch": 89.01907356948229, + "grad_norm": 1.9456405639648438, + "learning_rate": 6.257801974647937e-07, + "loss": 0.0381, + "step": 32670 + }, + { + "epoch": 89.02179836512262, + "grad_norm": 4.5912957191467285, + "learning_rate": 6.254729534027337e-07, + "loss": 0.1149, + "step": 32671 + }, + { + "epoch": 89.02452316076294, + "grad_norm": 2.9190385341644287, + "learning_rate": 6.251657823491897e-07, + "loss": 0.0414, + "step": 32672 + }, + { + "epoch": 89.02724795640327, + "grad_norm": 1.9378341436386108, + "learning_rate": 6.248586843065518e-07, + "loss": 0.037, + "step": 32673 + }, + { + "epoch": 89.02997275204359, + "grad_norm": 2.1198220252990723, + "learning_rate": 6.245516592772116e-07, + "loss": 0.0262, + "step": 32674 + }, + { + "epoch": 89.03269754768392, + "grad_norm": 2.846665382385254, + "learning_rate": 6.242447072635626e-07, + "loss": 0.1463, + "step": 32675 + }, + { + "epoch": 89.03542234332426, + "grad_norm": 1.989553689956665, + "learning_rate": 6.239378282679953e-07, + "loss": 0.0202, + "step": 32676 + }, + { + "epoch": 89.03814713896458, + "grad_norm": 4.744172096252441, + "learning_rate": 6.236310222928977e-07, + "loss": 0.0194, + "step": 32677 + }, + { + "epoch": 89.04087193460491, + "grad_norm": 2.6994283199310303, + "learning_rate": 6.233242893406577e-07, + "loss": 0.0284, + "step": 32678 + }, + { + "epoch": 89.04359673024523, + "grad_norm": 2.5558924674987793, + "learning_rate": 6.23017629413668e-07, + "loss": 0.0686, + "step": 32679 + }, + { + "epoch": 89.04632152588556, + "grad_norm": 2.528228521347046, + "learning_rate": 6.227110425143157e-07, + "loss": 0.0458, + "step": 32680 + }, + { + "epoch": 89.04904632152588, + "grad_norm": 2.8393657207489014, + "learning_rate": 6.224045286449887e-07, + "loss": 0.0368, + "step": 32681 + }, + { + "epoch": 89.05177111716621, + "grad_norm": 2.4981143474578857, + "learning_rate": 6.220980878080707e-07, + "loss": 0.0534, + "step": 32682 + }, + { + "epoch": 89.05449591280654, + "grad_norm": 3.4097540378570557, + "learning_rate": 6.217917200059509e-07, + "loss": 0.0827, + "step": 32683 + }, + { + "epoch": 89.05722070844686, + "grad_norm": 2.685373306274414, + "learning_rate": 6.214854252410174e-07, + "loss": 0.029, + "step": 32684 + }, + { + "epoch": 89.0599455040872, + "grad_norm": 1.9985028505325317, + "learning_rate": 6.211792035156539e-07, + "loss": 0.0213, + "step": 32685 + }, + { + "epoch": 89.06267029972751, + "grad_norm": 2.6448488235473633, + "learning_rate": 6.208730548322439e-07, + "loss": 0.0171, + "step": 32686 + }, + { + "epoch": 89.06539509536785, + "grad_norm": 2.493192195892334, + "learning_rate": 6.205669791931723e-07, + "loss": 0.0428, + "step": 32687 + }, + { + "epoch": 89.06811989100818, + "grad_norm": 2.4542465209960938, + "learning_rate": 6.202609766008239e-07, + "loss": 0.0311, + "step": 32688 + }, + { + "epoch": 89.0708446866485, + "grad_norm": 2.34928822517395, + "learning_rate": 6.199550470575821e-07, + "loss": 0.0509, + "step": 32689 + }, + { + "epoch": 89.07356948228883, + "grad_norm": 5.120890140533447, + "learning_rate": 6.196491905658264e-07, + "loss": 0.0955, + "step": 32690 + }, + { + "epoch": 89.07629427792915, + "grad_norm": 2.2139899730682373, + "learning_rate": 6.193434071279414e-07, + "loss": 0.1122, + "step": 32691 + }, + { + "epoch": 89.07901907356948, + "grad_norm": 1.9536000490188599, + "learning_rate": 6.190376967463097e-07, + "loss": 0.0192, + "step": 32692 + }, + { + "epoch": 89.0817438692098, + "grad_norm": 1.561396837234497, + "learning_rate": 6.187320594233093e-07, + "loss": 0.0187, + "step": 32693 + }, + { + "epoch": 89.08446866485014, + "grad_norm": 2.2661666870117188, + "learning_rate": 6.184264951613206e-07, + "loss": 0.1571, + "step": 32694 + }, + { + "epoch": 89.08719346049047, + "grad_norm": 4.047026634216309, + "learning_rate": 6.181210039627261e-07, + "loss": 0.1483, + "step": 32695 + }, + { + "epoch": 89.08991825613079, + "grad_norm": 3.3938167095184326, + "learning_rate": 6.178155858299029e-07, + "loss": 0.0966, + "step": 32696 + }, + { + "epoch": 89.09264305177112, + "grad_norm": 2.6834189891815186, + "learning_rate": 6.1751024076523e-07, + "loss": 0.0762, + "step": 32697 + }, + { + "epoch": 89.09536784741144, + "grad_norm": 2.593212842941284, + "learning_rate": 6.172049687710846e-07, + "loss": 0.049, + "step": 32698 + }, + { + "epoch": 89.09809264305177, + "grad_norm": 2.224918842315674, + "learning_rate": 6.168997698498458e-07, + "loss": 0.063, + "step": 32699 + }, + { + "epoch": 89.1008174386921, + "grad_norm": 3.1200671195983887, + "learning_rate": 6.165946440038883e-07, + "loss": 0.0706, + "step": 32700 + }, + { + "epoch": 89.10354223433242, + "grad_norm": 2.4436869621276855, + "learning_rate": 6.162895912355904e-07, + "loss": 0.0462, + "step": 32701 + }, + { + "epoch": 89.10626702997276, + "grad_norm": 1.949854850769043, + "learning_rate": 6.159846115473278e-07, + "loss": 0.0257, + "step": 32702 + }, + { + "epoch": 89.10899182561307, + "grad_norm": 2.124957323074341, + "learning_rate": 6.156797049414742e-07, + "loss": 0.0265, + "step": 32703 + }, + { + "epoch": 89.11171662125341, + "grad_norm": 3.6889209747314453, + "learning_rate": 6.153748714204055e-07, + "loss": 0.1115, + "step": 32704 + }, + { + "epoch": 89.11444141689373, + "grad_norm": 2.025499105453491, + "learning_rate": 6.150701109864954e-07, + "loss": 0.0258, + "step": 32705 + }, + { + "epoch": 89.11716621253406, + "grad_norm": 2.7911789417266846, + "learning_rate": 6.147654236421174e-07, + "loss": 0.0648, + "step": 32706 + }, + { + "epoch": 89.11989100817439, + "grad_norm": 1.8968440294265747, + "learning_rate": 6.144608093896431e-07, + "loss": 0.0244, + "step": 32707 + }, + { + "epoch": 89.12261580381471, + "grad_norm": 2.548025131225586, + "learning_rate": 6.141562682314473e-07, + "loss": 0.0776, + "step": 32708 + }, + { + "epoch": 89.12534059945504, + "grad_norm": 1.5753182172775269, + "learning_rate": 6.138518001699001e-07, + "loss": 0.0197, + "step": 32709 + }, + { + "epoch": 89.12806539509536, + "grad_norm": 2.8098111152648926, + "learning_rate": 6.135474052073731e-07, + "loss": 0.0239, + "step": 32710 + }, + { + "epoch": 89.1307901907357, + "grad_norm": 2.4336137771606445, + "learning_rate": 6.132430833462344e-07, + "loss": 0.0474, + "step": 32711 + }, + { + "epoch": 89.13351498637603, + "grad_norm": 2.1622588634490967, + "learning_rate": 6.129388345888598e-07, + "loss": 0.0456, + "step": 32712 + }, + { + "epoch": 89.13623978201635, + "grad_norm": 2.102802038192749, + "learning_rate": 6.126346589376142e-07, + "loss": 0.0259, + "step": 32713 + }, + { + "epoch": 89.13896457765668, + "grad_norm": 2.271444082260132, + "learning_rate": 6.123305563948667e-07, + "loss": 0.0731, + "step": 32714 + }, + { + "epoch": 89.141689373297, + "grad_norm": 2.9211630821228027, + "learning_rate": 6.120265269629877e-07, + "loss": 0.1062, + "step": 32715 + }, + { + "epoch": 89.14441416893733, + "grad_norm": 2.3627302646636963, + "learning_rate": 6.117225706443441e-07, + "loss": 0.1202, + "step": 32716 + }, + { + "epoch": 89.14713896457765, + "grad_norm": 2.4656448364257812, + "learning_rate": 6.11418687441302e-07, + "loss": 0.0507, + "step": 32717 + }, + { + "epoch": 89.14986376021798, + "grad_norm": 2.1551454067230225, + "learning_rate": 6.111148773562303e-07, + "loss": 0.0582, + "step": 32718 + }, + { + "epoch": 89.15258855585832, + "grad_norm": 2.709928274154663, + "learning_rate": 6.108111403914919e-07, + "loss": 0.0601, + "step": 32719 + }, + { + "epoch": 89.15531335149863, + "grad_norm": 4.146137237548828, + "learning_rate": 6.105074765494556e-07, + "loss": 0.0416, + "step": 32720 + }, + { + "epoch": 89.15803814713897, + "grad_norm": 4.809267997741699, + "learning_rate": 6.102038858324855e-07, + "loss": 0.0658, + "step": 32721 + }, + { + "epoch": 89.16076294277929, + "grad_norm": 10.87790584564209, + "learning_rate": 6.09900368242945e-07, + "loss": 0.0338, + "step": 32722 + }, + { + "epoch": 89.16348773841962, + "grad_norm": 3.1182589530944824, + "learning_rate": 6.095969237831956e-07, + "loss": 0.0901, + "step": 32723 + }, + { + "epoch": 89.16621253405995, + "grad_norm": 3.3349595069885254, + "learning_rate": 6.092935524556065e-07, + "loss": 0.0775, + "step": 32724 + }, + { + "epoch": 89.16893732970027, + "grad_norm": 2.543630599975586, + "learning_rate": 6.089902542625359e-07, + "loss": 0.0615, + "step": 32725 + }, + { + "epoch": 89.1716621253406, + "grad_norm": 3.363832712173462, + "learning_rate": 6.086870292063473e-07, + "loss": 0.0519, + "step": 32726 + }, + { + "epoch": 89.17438692098092, + "grad_norm": 3.0619161128997803, + "learning_rate": 6.083838772894002e-07, + "loss": 0.0495, + "step": 32727 + }, + { + "epoch": 89.17711171662125, + "grad_norm": 2.945568323135376, + "learning_rate": 6.080807985140591e-07, + "loss": 0.0461, + "step": 32728 + }, + { + "epoch": 89.17983651226157, + "grad_norm": 1.8759384155273438, + "learning_rate": 6.077777928826811e-07, + "loss": 0.025, + "step": 32729 + }, + { + "epoch": 89.1825613079019, + "grad_norm": 2.955927610397339, + "learning_rate": 6.074748603976288e-07, + "loss": 0.0773, + "step": 32730 + }, + { + "epoch": 89.18528610354224, + "grad_norm": 2.0474166870117188, + "learning_rate": 6.07172001061258e-07, + "loss": 0.0966, + "step": 32731 + }, + { + "epoch": 89.18801089918256, + "grad_norm": 4.1849493980407715, + "learning_rate": 6.068692148759314e-07, + "loss": 0.0876, + "step": 32732 + }, + { + "epoch": 89.19073569482289, + "grad_norm": 1.793718695640564, + "learning_rate": 6.065665018440037e-07, + "loss": 0.0181, + "step": 32733 + }, + { + "epoch": 89.19346049046321, + "grad_norm": 2.2312920093536377, + "learning_rate": 6.062638619678352e-07, + "loss": 0.0449, + "step": 32734 + }, + { + "epoch": 89.19618528610354, + "grad_norm": 3.3801324367523193, + "learning_rate": 6.059612952497773e-07, + "loss": 0.0439, + "step": 32735 + }, + { + "epoch": 89.19891008174388, + "grad_norm": 3.0099101066589355, + "learning_rate": 6.056588016921949e-07, + "loss": 0.0379, + "step": 32736 + }, + { + "epoch": 89.2016348773842, + "grad_norm": 2.1082236766815186, + "learning_rate": 6.053563812974384e-07, + "loss": 0.0338, + "step": 32737 + }, + { + "epoch": 89.20435967302453, + "grad_norm": 2.8980274200439453, + "learning_rate": 6.050540340678635e-07, + "loss": 0.0331, + "step": 32738 + }, + { + "epoch": 89.20708446866485, + "grad_norm": 2.985513687133789, + "learning_rate": 6.04751760005825e-07, + "loss": 0.0504, + "step": 32739 + }, + { + "epoch": 89.20980926430518, + "grad_norm": 2.653040647506714, + "learning_rate": 6.044495591136778e-07, + "loss": 0.0242, + "step": 32740 + }, + { + "epoch": 89.2125340599455, + "grad_norm": 2.725943088531494, + "learning_rate": 6.041474313937756e-07, + "loss": 0.0619, + "step": 32741 + }, + { + "epoch": 89.21525885558583, + "grad_norm": 1.5715361833572388, + "learning_rate": 6.038453768484709e-07, + "loss": 0.0226, + "step": 32742 + }, + { + "epoch": 89.21798365122616, + "grad_norm": 1.7930307388305664, + "learning_rate": 6.035433954801151e-07, + "loss": 0.0795, + "step": 32743 + }, + { + "epoch": 89.22070844686648, + "grad_norm": 3.3262786865234375, + "learning_rate": 6.03241487291062e-07, + "loss": 0.0284, + "step": 32744 + }, + { + "epoch": 89.22343324250681, + "grad_norm": 2.5820655822753906, + "learning_rate": 6.029396522836617e-07, + "loss": 0.0195, + "step": 32745 + }, + { + "epoch": 89.22615803814713, + "grad_norm": 18.499683380126953, + "learning_rate": 6.026378904602648e-07, + "loss": 0.0504, + "step": 32746 + }, + { + "epoch": 89.22888283378747, + "grad_norm": 2.052060604095459, + "learning_rate": 6.023362018232193e-07, + "loss": 0.0534, + "step": 32747 + }, + { + "epoch": 89.2316076294278, + "grad_norm": 2.4382376670837402, + "learning_rate": 6.0203458637488e-07, + "loss": 0.0599, + "step": 32748 + }, + { + "epoch": 89.23433242506812, + "grad_norm": 1.8200987577438354, + "learning_rate": 6.017330441175917e-07, + "loss": 0.0282, + "step": 32749 + }, + { + "epoch": 89.23705722070845, + "grad_norm": 2.2123477458953857, + "learning_rate": 6.014315750537048e-07, + "loss": 0.0412, + "step": 32750 + }, + { + "epoch": 89.23978201634877, + "grad_norm": 2.306133270263672, + "learning_rate": 6.011301791855639e-07, + "loss": 0.1808, + "step": 32751 + }, + { + "epoch": 89.2425068119891, + "grad_norm": 3.1010894775390625, + "learning_rate": 6.008288565155196e-07, + "loss": 0.0461, + "step": 32752 + }, + { + "epoch": 89.24523160762942, + "grad_norm": 2.197079658508301, + "learning_rate": 6.005276070459187e-07, + "loss": 0.0397, + "step": 32753 + }, + { + "epoch": 89.24795640326975, + "grad_norm": 4.151401996612549, + "learning_rate": 6.002264307791061e-07, + "loss": 0.0743, + "step": 32754 + }, + { + "epoch": 89.25068119891009, + "grad_norm": 2.712472677230835, + "learning_rate": 5.999253277174255e-07, + "loss": 0.0796, + "step": 32755 + }, + { + "epoch": 89.2534059945504, + "grad_norm": 2.7949860095977783, + "learning_rate": 5.996242978632271e-07, + "loss": 0.041, + "step": 32756 + }, + { + "epoch": 89.25613079019074, + "grad_norm": 2.4863429069519043, + "learning_rate": 5.993233412188504e-07, + "loss": 0.0537, + "step": 32757 + }, + { + "epoch": 89.25885558583106, + "grad_norm": 2.821411609649658, + "learning_rate": 5.990224577866422e-07, + "loss": 0.0728, + "step": 32758 + }, + { + "epoch": 89.26158038147139, + "grad_norm": 2.6806938648223877, + "learning_rate": 5.987216475689428e-07, + "loss": 0.039, + "step": 32759 + }, + { + "epoch": 89.26430517711172, + "grad_norm": 2.995911121368408, + "learning_rate": 5.984209105680972e-07, + "loss": 0.0403, + "step": 32760 + }, + { + "epoch": 89.26702997275204, + "grad_norm": 2.1803905963897705, + "learning_rate": 5.981202467864478e-07, + "loss": 0.0241, + "step": 32761 + }, + { + "epoch": 89.26975476839237, + "grad_norm": 2.5929770469665527, + "learning_rate": 5.97819656226335e-07, + "loss": 0.0323, + "step": 32762 + }, + { + "epoch": 89.2724795640327, + "grad_norm": 2.173696756362915, + "learning_rate": 5.975191388900991e-07, + "loss": 0.0647, + "step": 32763 + }, + { + "epoch": 89.27520435967303, + "grad_norm": 2.4097962379455566, + "learning_rate": 5.972186947800829e-07, + "loss": 0.0335, + "step": 32764 + }, + { + "epoch": 89.27792915531334, + "grad_norm": 3.4600203037261963, + "learning_rate": 5.969183238986243e-07, + "loss": 0.1017, + "step": 32765 + }, + { + "epoch": 89.28065395095368, + "grad_norm": 2.4017767906188965, + "learning_rate": 5.966180262480636e-07, + "loss": 0.0634, + "step": 32766 + }, + { + "epoch": 89.28337874659401, + "grad_norm": 2.3255603313446045, + "learning_rate": 5.96317801830737e-07, + "loss": 0.0643, + "step": 32767 + }, + { + "epoch": 89.28610354223433, + "grad_norm": 2.5896341800689697, + "learning_rate": 5.960176506489868e-07, + "loss": 0.0682, + "step": 32768 + }, + { + "epoch": 89.28882833787466, + "grad_norm": 2.865616798400879, + "learning_rate": 5.957175727051467e-07, + "loss": 0.0579, + "step": 32769 + }, + { + "epoch": 89.29155313351498, + "grad_norm": 2.599228858947754, + "learning_rate": 5.954175680015572e-07, + "loss": 0.0493, + "step": 32770 + }, + { + "epoch": 89.29427792915531, + "grad_norm": 2.905381679534912, + "learning_rate": 5.951176365405531e-07, + "loss": 0.1078, + "step": 32771 + }, + { + "epoch": 89.29700272479565, + "grad_norm": 2.6210904121398926, + "learning_rate": 5.948177783244691e-07, + "loss": 0.0334, + "step": 32772 + }, + { + "epoch": 89.29972752043597, + "grad_norm": 2.3333895206451416, + "learning_rate": 5.945179933556422e-07, + "loss": 0.1201, + "step": 32773 + }, + { + "epoch": 89.3024523160763, + "grad_norm": 2.521071672439575, + "learning_rate": 5.942182816364061e-07, + "loss": 0.0431, + "step": 32774 + }, + { + "epoch": 89.30517711171662, + "grad_norm": 3.2333972454071045, + "learning_rate": 5.939186431690957e-07, + "loss": 0.0611, + "step": 32775 + }, + { + "epoch": 89.30790190735695, + "grad_norm": 1.64311683177948, + "learning_rate": 5.936190779560435e-07, + "loss": 0.081, + "step": 32776 + }, + { + "epoch": 89.31062670299727, + "grad_norm": 2.312652349472046, + "learning_rate": 5.933195859995833e-07, + "loss": 0.0696, + "step": 32777 + }, + { + "epoch": 89.3133514986376, + "grad_norm": 2.7373828887939453, + "learning_rate": 5.930201673020486e-07, + "loss": 0.1133, + "step": 32778 + }, + { + "epoch": 89.31607629427793, + "grad_norm": 2.6825835704803467, + "learning_rate": 5.927208218657676e-07, + "loss": 0.1092, + "step": 32779 + }, + { + "epoch": 89.31880108991825, + "grad_norm": 2.91965913772583, + "learning_rate": 5.924215496930763e-07, + "loss": 0.0297, + "step": 32780 + }, + { + "epoch": 89.32152588555859, + "grad_norm": 1.9278688430786133, + "learning_rate": 5.921223507863028e-07, + "loss": 0.0203, + "step": 32781 + }, + { + "epoch": 89.3242506811989, + "grad_norm": 2.232983350753784, + "learning_rate": 5.918232251477784e-07, + "loss": 0.1147, + "step": 32782 + }, + { + "epoch": 89.32697547683924, + "grad_norm": 2.1401584148406982, + "learning_rate": 5.915241727798293e-07, + "loss": 0.029, + "step": 32783 + }, + { + "epoch": 89.32970027247957, + "grad_norm": 3.384432792663574, + "learning_rate": 5.91225193684789e-07, + "loss": 0.033, + "step": 32784 + }, + { + "epoch": 89.33242506811989, + "grad_norm": 2.4877140522003174, + "learning_rate": 5.909262878649846e-07, + "loss": 0.0331, + "step": 32785 + }, + { + "epoch": 89.33514986376022, + "grad_norm": 2.889374256134033, + "learning_rate": 5.90627455322742e-07, + "loss": 0.0335, + "step": 32786 + }, + { + "epoch": 89.33787465940054, + "grad_norm": 2.776301860809326, + "learning_rate": 5.903286960603905e-07, + "loss": 0.0567, + "step": 32787 + }, + { + "epoch": 89.34059945504087, + "grad_norm": 2.3320226669311523, + "learning_rate": 5.900300100802558e-07, + "loss": 0.0274, + "step": 32788 + }, + { + "epoch": 89.34332425068119, + "grad_norm": 2.927804946899414, + "learning_rate": 5.897313973846652e-07, + "loss": 0.1109, + "step": 32789 + }, + { + "epoch": 89.34604904632153, + "grad_norm": 1.7589563131332397, + "learning_rate": 5.894328579759434e-07, + "loss": 0.0797, + "step": 32790 + }, + { + "epoch": 89.34877384196186, + "grad_norm": 3.696570873260498, + "learning_rate": 5.891343918564163e-07, + "loss": 0.1422, + "step": 32791 + }, + { + "epoch": 89.35149863760218, + "grad_norm": 1.8898727893829346, + "learning_rate": 5.888359990284065e-07, + "loss": 0.0294, + "step": 32792 + }, + { + "epoch": 89.35422343324251, + "grad_norm": 1.7833526134490967, + "learning_rate": 5.885376794942399e-07, + "loss": 0.0138, + "step": 32793 + }, + { + "epoch": 89.35694822888283, + "grad_norm": 2.947908639907837, + "learning_rate": 5.882394332562392e-07, + "loss": 0.035, + "step": 32794 + }, + { + "epoch": 89.35967302452316, + "grad_norm": 1.8422151803970337, + "learning_rate": 5.879412603167267e-07, + "loss": 0.0899, + "step": 32795 + }, + { + "epoch": 89.3623978201635, + "grad_norm": 2.5154712200164795, + "learning_rate": 5.87643160678023e-07, + "loss": 0.1249, + "step": 32796 + }, + { + "epoch": 89.36512261580381, + "grad_norm": 4.435185432434082, + "learning_rate": 5.87345134342453e-07, + "loss": 0.0288, + "step": 32797 + }, + { + "epoch": 89.36784741144415, + "grad_norm": 2.7728612422943115, + "learning_rate": 5.870471813123368e-07, + "loss": 0.1315, + "step": 32798 + }, + { + "epoch": 89.37057220708446, + "grad_norm": 3.42110538482666, + "learning_rate": 5.867493015899916e-07, + "loss": 0.0632, + "step": 32799 + }, + { + "epoch": 89.3732970027248, + "grad_norm": 3.111011266708374, + "learning_rate": 5.864514951777423e-07, + "loss": 0.0719, + "step": 32800 + }, + { + "epoch": 89.37602179836512, + "grad_norm": 1.8426586389541626, + "learning_rate": 5.861537620779056e-07, + "loss": 0.0244, + "step": 32801 + }, + { + "epoch": 89.37874659400545, + "grad_norm": 3.0814948081970215, + "learning_rate": 5.858561022928e-07, + "loss": 0.112, + "step": 32802 + }, + { + "epoch": 89.38147138964578, + "grad_norm": 2.558114528656006, + "learning_rate": 5.855585158247434e-07, + "loss": 0.0428, + "step": 32803 + }, + { + "epoch": 89.3841961852861, + "grad_norm": 2.08484148979187, + "learning_rate": 5.852610026760541e-07, + "loss": 0.027, + "step": 32804 + }, + { + "epoch": 89.38692098092643, + "grad_norm": 3.1211516857147217, + "learning_rate": 5.849635628490502e-07, + "loss": 0.117, + "step": 32805 + }, + { + "epoch": 89.38964577656675, + "grad_norm": 1.9015812873840332, + "learning_rate": 5.846661963460465e-07, + "loss": 0.1303, + "step": 32806 + }, + { + "epoch": 89.39237057220708, + "grad_norm": 1.7309904098510742, + "learning_rate": 5.8436890316936e-07, + "loss": 0.0252, + "step": 32807 + }, + { + "epoch": 89.39509536784742, + "grad_norm": 1.7384289503097534, + "learning_rate": 5.840716833213033e-07, + "loss": 0.0389, + "step": 32808 + }, + { + "epoch": 89.39782016348774, + "grad_norm": 2.4681620597839355, + "learning_rate": 5.837745368041958e-07, + "loss": 0.0398, + "step": 32809 + }, + { + "epoch": 89.40054495912807, + "grad_norm": 2.519777774810791, + "learning_rate": 5.834774636203488e-07, + "loss": 0.0523, + "step": 32810 + }, + { + "epoch": 89.40326975476839, + "grad_norm": 1.971938133239746, + "learning_rate": 5.831804637720762e-07, + "loss": 0.0243, + "step": 32811 + }, + { + "epoch": 89.40599455040872, + "grad_norm": 4.039462089538574, + "learning_rate": 5.828835372616892e-07, + "loss": 0.0792, + "step": 32812 + }, + { + "epoch": 89.40871934604904, + "grad_norm": 2.5203163623809814, + "learning_rate": 5.82586684091504e-07, + "loss": 0.1002, + "step": 32813 + }, + { + "epoch": 89.41144414168937, + "grad_norm": 1.8804906606674194, + "learning_rate": 5.822899042638297e-07, + "loss": 0.1174, + "step": 32814 + }, + { + "epoch": 89.4141689373297, + "grad_norm": 3.847694158554077, + "learning_rate": 5.8199319778098e-07, + "loss": 0.0779, + "step": 32815 + }, + { + "epoch": 89.41689373297002, + "grad_norm": 2.758211612701416, + "learning_rate": 5.816965646452622e-07, + "loss": 0.0592, + "step": 32816 + }, + { + "epoch": 89.41961852861036, + "grad_norm": 2.610078811645508, + "learning_rate": 5.814000048589896e-07, + "loss": 0.0995, + "step": 32817 + }, + { + "epoch": 89.42234332425068, + "grad_norm": 4.977338790893555, + "learning_rate": 5.811035184244706e-07, + "loss": 0.0934, + "step": 32818 + }, + { + "epoch": 89.42506811989101, + "grad_norm": 4.272146701812744, + "learning_rate": 5.808071053440145e-07, + "loss": 0.0891, + "step": 32819 + }, + { + "epoch": 89.42779291553134, + "grad_norm": 1.384609341621399, + "learning_rate": 5.805107656199272e-07, + "loss": 0.0177, + "step": 32820 + }, + { + "epoch": 89.43051771117166, + "grad_norm": 2.0737600326538086, + "learning_rate": 5.8021449925452e-07, + "loss": 0.016, + "step": 32821 + }, + { + "epoch": 89.433242506812, + "grad_norm": 3.2330639362335205, + "learning_rate": 5.799183062501001e-07, + "loss": 0.069, + "step": 32822 + }, + { + "epoch": 89.43596730245231, + "grad_norm": 2.6659324169158936, + "learning_rate": 5.796221866089735e-07, + "loss": 0.0446, + "step": 32823 + }, + { + "epoch": 89.43869209809264, + "grad_norm": 3.4410345554351807, + "learning_rate": 5.79326140333445e-07, + "loss": 0.0375, + "step": 32824 + }, + { + "epoch": 89.44141689373296, + "grad_norm": 3.1975862979888916, + "learning_rate": 5.790301674258214e-07, + "loss": 0.0577, + "step": 32825 + }, + { + "epoch": 89.4441416893733, + "grad_norm": 2.658019781112671, + "learning_rate": 5.787342678884089e-07, + "loss": 0.1726, + "step": 32826 + }, + { + "epoch": 89.44686648501363, + "grad_norm": 1.9277862310409546, + "learning_rate": 5.784384417235101e-07, + "loss": 0.0254, + "step": 32827 + }, + { + "epoch": 89.44959128065395, + "grad_norm": 3.593170166015625, + "learning_rate": 5.781426889334285e-07, + "loss": 0.0748, + "step": 32828 + }, + { + "epoch": 89.45231607629428, + "grad_norm": 2.957268714904785, + "learning_rate": 5.778470095204691e-07, + "loss": 0.0733, + "step": 32829 + }, + { + "epoch": 89.4550408719346, + "grad_norm": 3.954479217529297, + "learning_rate": 5.775514034869345e-07, + "loss": 0.0798, + "step": 32830 + }, + { + "epoch": 89.45776566757493, + "grad_norm": 2.9770193099975586, + "learning_rate": 5.772558708351262e-07, + "loss": 0.0762, + "step": 32831 + }, + { + "epoch": 89.46049046321527, + "grad_norm": 2.866166591644287, + "learning_rate": 5.769604115673444e-07, + "loss": 0.0399, + "step": 32832 + }, + { + "epoch": 89.46321525885558, + "grad_norm": 2.224769353866577, + "learning_rate": 5.76665025685893e-07, + "loss": 0.0307, + "step": 32833 + }, + { + "epoch": 89.46594005449592, + "grad_norm": 2.5665481090545654, + "learning_rate": 5.763697131930712e-07, + "loss": 0.0352, + "step": 32834 + }, + { + "epoch": 89.46866485013624, + "grad_norm": 1.5102972984313965, + "learning_rate": 5.760744740911794e-07, + "loss": 0.0183, + "step": 32835 + }, + { + "epoch": 89.47138964577657, + "grad_norm": 2.10481595993042, + "learning_rate": 5.757793083825147e-07, + "loss": 0.0552, + "step": 32836 + }, + { + "epoch": 89.47411444141689, + "grad_norm": 4.771435260772705, + "learning_rate": 5.754842160693785e-07, + "loss": 0.0833, + "step": 32837 + }, + { + "epoch": 89.47683923705722, + "grad_norm": 2.789193868637085, + "learning_rate": 5.751891971540658e-07, + "loss": 0.0639, + "step": 32838 + }, + { + "epoch": 89.47956403269755, + "grad_norm": 2.961798906326294, + "learning_rate": 5.748942516388789e-07, + "loss": 0.1006, + "step": 32839 + }, + { + "epoch": 89.48228882833787, + "grad_norm": 3.6757514476776123, + "learning_rate": 5.745993795261096e-07, + "loss": 0.0284, + "step": 32840 + }, + { + "epoch": 89.4850136239782, + "grad_norm": 2.3897275924682617, + "learning_rate": 5.743045808180592e-07, + "loss": 0.0339, + "step": 32841 + }, + { + "epoch": 89.48773841961852, + "grad_norm": 2.893338918685913, + "learning_rate": 5.740098555170215e-07, + "loss": 0.1059, + "step": 32842 + }, + { + "epoch": 89.49046321525886, + "grad_norm": 2.3885364532470703, + "learning_rate": 5.737152036252914e-07, + "loss": 0.1679, + "step": 32843 + }, + { + "epoch": 89.49318801089919, + "grad_norm": 2.1282293796539307, + "learning_rate": 5.734206251451624e-07, + "loss": 0.0418, + "step": 32844 + }, + { + "epoch": 89.49591280653951, + "grad_norm": 2.4373741149902344, + "learning_rate": 5.731261200789318e-07, + "loss": 0.0537, + "step": 32845 + }, + { + "epoch": 89.49863760217984, + "grad_norm": 3.325336217880249, + "learning_rate": 5.728316884288909e-07, + "loss": 0.0233, + "step": 32846 + }, + { + "epoch": 89.50136239782016, + "grad_norm": 2.2183892726898193, + "learning_rate": 5.725373301973336e-07, + "loss": 0.0456, + "step": 32847 + }, + { + "epoch": 89.50408719346049, + "grad_norm": 1.9245525598526, + "learning_rate": 5.722430453865513e-07, + "loss": 0.0171, + "step": 32848 + }, + { + "epoch": 89.50681198910081, + "grad_norm": 1.6682052612304688, + "learning_rate": 5.719488339988378e-07, + "loss": 0.0232, + "step": 32849 + }, + { + "epoch": 89.50953678474114, + "grad_norm": 2.2161269187927246, + "learning_rate": 5.716546960364844e-07, + "loss": 0.0538, + "step": 32850 + }, + { + "epoch": 89.51226158038148, + "grad_norm": 14.691620826721191, + "learning_rate": 5.713606315017794e-07, + "loss": 0.0448, + "step": 32851 + }, + { + "epoch": 89.5149863760218, + "grad_norm": 2.354126453399658, + "learning_rate": 5.710666403970133e-07, + "loss": 0.0698, + "step": 32852 + }, + { + "epoch": 89.51771117166213, + "grad_norm": 3.4341745376586914, + "learning_rate": 5.707727227244786e-07, + "loss": 0.0202, + "step": 32853 + }, + { + "epoch": 89.52043596730245, + "grad_norm": 2.4215874671936035, + "learning_rate": 5.704788784864612e-07, + "loss": 0.1346, + "step": 32854 + }, + { + "epoch": 89.52316076294278, + "grad_norm": 2.959627628326416, + "learning_rate": 5.701851076852504e-07, + "loss": 0.1062, + "step": 32855 + }, + { + "epoch": 89.52588555858311, + "grad_norm": 1.748242735862732, + "learning_rate": 5.698914103231357e-07, + "loss": 0.0253, + "step": 32856 + }, + { + "epoch": 89.52861035422343, + "grad_norm": 3.1157803535461426, + "learning_rate": 5.695977864024016e-07, + "loss": 0.226, + "step": 32857 + }, + { + "epoch": 89.53133514986376, + "grad_norm": 3.9220938682556152, + "learning_rate": 5.693042359253387e-07, + "loss": 0.0638, + "step": 32858 + }, + { + "epoch": 89.53405994550408, + "grad_norm": 3.532024621963501, + "learning_rate": 5.690107588942306e-07, + "loss": 0.1261, + "step": 32859 + }, + { + "epoch": 89.53678474114442, + "grad_norm": 2.2799363136291504, + "learning_rate": 5.687173553113623e-07, + "loss": 0.0352, + "step": 32860 + }, + { + "epoch": 89.53950953678473, + "grad_norm": 2.646981954574585, + "learning_rate": 5.684240251790186e-07, + "loss": 0.0389, + "step": 32861 + }, + { + "epoch": 89.54223433242507, + "grad_norm": 2.868276357650757, + "learning_rate": 5.681307684994874e-07, + "loss": 0.0541, + "step": 32862 + }, + { + "epoch": 89.5449591280654, + "grad_norm": 3.010094165802002, + "learning_rate": 5.678375852750496e-07, + "loss": 0.1429, + "step": 32863 + }, + { + "epoch": 89.54768392370572, + "grad_norm": 2.4626591205596924, + "learning_rate": 5.675444755079873e-07, + "loss": 0.0528, + "step": 32864 + }, + { + "epoch": 89.55040871934605, + "grad_norm": 5.357175350189209, + "learning_rate": 5.672514392005868e-07, + "loss": 0.2043, + "step": 32865 + }, + { + "epoch": 89.55313351498637, + "grad_norm": 2.567004919052124, + "learning_rate": 5.669584763551284e-07, + "loss": 0.0909, + "step": 32866 + }, + { + "epoch": 89.5558583106267, + "grad_norm": 5.483394622802734, + "learning_rate": 5.666655869738935e-07, + "loss": 0.0738, + "step": 32867 + }, + { + "epoch": 89.55858310626704, + "grad_norm": 2.470198154449463, + "learning_rate": 5.663727710591627e-07, + "loss": 0.0701, + "step": 32868 + }, + { + "epoch": 89.56130790190736, + "grad_norm": 3.3590195178985596, + "learning_rate": 5.660800286132173e-07, + "loss": 0.2203, + "step": 32869 + }, + { + "epoch": 89.56403269754769, + "grad_norm": 2.435865640640259, + "learning_rate": 5.657873596383378e-07, + "loss": 0.1519, + "step": 32870 + }, + { + "epoch": 89.566757493188, + "grad_norm": 2.570725202560425, + "learning_rate": 5.654947641368036e-07, + "loss": 0.0366, + "step": 32871 + }, + { + "epoch": 89.56948228882834, + "grad_norm": 1.5694717168807983, + "learning_rate": 5.652022421108894e-07, + "loss": 0.024, + "step": 32872 + }, + { + "epoch": 89.57220708446866, + "grad_norm": 2.274602174758911, + "learning_rate": 5.649097935628778e-07, + "loss": 0.0638, + "step": 32873 + }, + { + "epoch": 89.57493188010899, + "grad_norm": 2.2057981491088867, + "learning_rate": 5.646174184950459e-07, + "loss": 0.0829, + "step": 32874 + }, + { + "epoch": 89.57765667574932, + "grad_norm": 3.423875570297241, + "learning_rate": 5.643251169096698e-07, + "loss": 0.1163, + "step": 32875 + }, + { + "epoch": 89.58038147138964, + "grad_norm": 1.4155492782592773, + "learning_rate": 5.640328888090263e-07, + "loss": 0.0162, + "step": 32876 + }, + { + "epoch": 89.58310626702998, + "grad_norm": 2.519733190536499, + "learning_rate": 5.637407341953893e-07, + "loss": 0.0652, + "step": 32877 + }, + { + "epoch": 89.5858310626703, + "grad_norm": 2.3193299770355225, + "learning_rate": 5.634486530710382e-07, + "loss": 0.0406, + "step": 32878 + }, + { + "epoch": 89.58855585831063, + "grad_norm": 3.3823933601379395, + "learning_rate": 5.631566454382442e-07, + "loss": 0.022, + "step": 32879 + }, + { + "epoch": 89.59128065395096, + "grad_norm": 2.3177411556243896, + "learning_rate": 5.628647112992824e-07, + "loss": 0.0357, + "step": 32880 + }, + { + "epoch": 89.59400544959128, + "grad_norm": 2.8449323177337646, + "learning_rate": 5.625728506564254e-07, + "loss": 0.0537, + "step": 32881 + }, + { + "epoch": 89.59673024523161, + "grad_norm": 3.5362963676452637, + "learning_rate": 5.622810635119491e-07, + "loss": 0.1477, + "step": 32882 + }, + { + "epoch": 89.59945504087193, + "grad_norm": 3.34096622467041, + "learning_rate": 5.61989349868124e-07, + "loss": 0.0932, + "step": 32883 + }, + { + "epoch": 89.60217983651226, + "grad_norm": 2.2542879581451416, + "learning_rate": 5.616977097272214e-07, + "loss": 0.0302, + "step": 32884 + }, + { + "epoch": 89.60490463215258, + "grad_norm": 2.017786741256714, + "learning_rate": 5.614061430915118e-07, + "loss": 0.0296, + "step": 32885 + }, + { + "epoch": 89.60762942779292, + "grad_norm": 2.867518186569214, + "learning_rate": 5.611146499632692e-07, + "loss": 0.0371, + "step": 32886 + }, + { + "epoch": 89.61035422343325, + "grad_norm": 2.4117448329925537, + "learning_rate": 5.608232303447625e-07, + "loss": 0.051, + "step": 32887 + }, + { + "epoch": 89.61307901907357, + "grad_norm": 4.533914566040039, + "learning_rate": 5.605318842382589e-07, + "loss": 0.0869, + "step": 32888 + }, + { + "epoch": 89.6158038147139, + "grad_norm": 2.6035053730010986, + "learning_rate": 5.60240611646029e-07, + "loss": 0.0285, + "step": 32889 + }, + { + "epoch": 89.61852861035422, + "grad_norm": 1.7373334169387817, + "learning_rate": 5.599494125703431e-07, + "loss": 0.0671, + "step": 32890 + }, + { + "epoch": 89.62125340599455, + "grad_norm": 4.364772796630859, + "learning_rate": 5.59658287013467e-07, + "loss": 0.0485, + "step": 32891 + }, + { + "epoch": 89.62397820163488, + "grad_norm": 3.0294835567474365, + "learning_rate": 5.59367234977668e-07, + "loss": 0.0429, + "step": 32892 + }, + { + "epoch": 89.6267029972752, + "grad_norm": 2.105394124984741, + "learning_rate": 5.590762564652119e-07, + "loss": 0.1594, + "step": 32893 + }, + { + "epoch": 89.62942779291554, + "grad_norm": 2.268779754638672, + "learning_rate": 5.587853514783681e-07, + "loss": 0.0267, + "step": 32894 + }, + { + "epoch": 89.63215258855585, + "grad_norm": 1.684410572052002, + "learning_rate": 5.584945200193992e-07, + "loss": 0.0327, + "step": 32895 + }, + { + "epoch": 89.63487738419619, + "grad_norm": 2.1431210041046143, + "learning_rate": 5.582037620905723e-07, + "loss": 0.025, + "step": 32896 + }, + { + "epoch": 89.6376021798365, + "grad_norm": 3.0194146633148193, + "learning_rate": 5.579130776941488e-07, + "loss": 0.0322, + "step": 32897 + }, + { + "epoch": 89.64032697547684, + "grad_norm": 1.8627034425735474, + "learning_rate": 5.576224668323949e-07, + "loss": 0.0215, + "step": 32898 + }, + { + "epoch": 89.64305177111717, + "grad_norm": 1.5820367336273193, + "learning_rate": 5.57331929507574e-07, + "loss": 0.0902, + "step": 32899 + }, + { + "epoch": 89.64577656675749, + "grad_norm": 5.083982467651367, + "learning_rate": 5.570414657219481e-07, + "loss": 0.021, + "step": 32900 + }, + { + "epoch": 89.64850136239782, + "grad_norm": 1.6487438678741455, + "learning_rate": 5.567510754777782e-07, + "loss": 0.0175, + "step": 32901 + }, + { + "epoch": 89.65122615803814, + "grad_norm": 2.657700538635254, + "learning_rate": 5.564607587773274e-07, + "loss": 0.0336, + "step": 32902 + }, + { + "epoch": 89.65395095367847, + "grad_norm": 2.9634604454040527, + "learning_rate": 5.561705156228569e-07, + "loss": 0.0368, + "step": 32903 + }, + { + "epoch": 89.65667574931881, + "grad_norm": 1.4109307527542114, + "learning_rate": 5.558803460166274e-07, + "loss": 0.0159, + "step": 32904 + }, + { + "epoch": 89.65940054495913, + "grad_norm": 3.901301383972168, + "learning_rate": 5.555902499608956e-07, + "loss": 0.0363, + "step": 32905 + }, + { + "epoch": 89.66212534059946, + "grad_norm": 2.360651731491089, + "learning_rate": 5.553002274579244e-07, + "loss": 0.0452, + "step": 32906 + }, + { + "epoch": 89.66485013623978, + "grad_norm": 3.332643508911133, + "learning_rate": 5.550102785099687e-07, + "loss": 0.0926, + "step": 32907 + }, + { + "epoch": 89.66757493188011, + "grad_norm": 3.7273032665252686, + "learning_rate": 5.547204031192921e-07, + "loss": 0.1203, + "step": 32908 + }, + { + "epoch": 89.67029972752043, + "grad_norm": 2.0486652851104736, + "learning_rate": 5.544306012881462e-07, + "loss": 0.2535, + "step": 32909 + }, + { + "epoch": 89.67302452316076, + "grad_norm": 3.2788918018341064, + "learning_rate": 5.541408730187925e-07, + "loss": 0.0579, + "step": 32910 + }, + { + "epoch": 89.6757493188011, + "grad_norm": 2.957430601119995, + "learning_rate": 5.538512183134859e-07, + "loss": 0.1201, + "step": 32911 + }, + { + "epoch": 89.67847411444141, + "grad_norm": 5.769819259643555, + "learning_rate": 5.535616371744823e-07, + "loss": 0.0732, + "step": 32912 + }, + { + "epoch": 89.68119891008175, + "grad_norm": 2.5564122200012207, + "learning_rate": 5.532721296040344e-07, + "loss": 0.0898, + "step": 32913 + }, + { + "epoch": 89.68392370572207, + "grad_norm": 2.6478564739227295, + "learning_rate": 5.529826956044016e-07, + "loss": 0.0967, + "step": 32914 + }, + { + "epoch": 89.6866485013624, + "grad_norm": 2.3558647632598877, + "learning_rate": 5.526933351778352e-07, + "loss": 0.0333, + "step": 32915 + }, + { + "epoch": 89.68937329700273, + "grad_norm": 2.0492758750915527, + "learning_rate": 5.52404048326588e-07, + "loss": 0.0197, + "step": 32916 + }, + { + "epoch": 89.69209809264305, + "grad_norm": 1.885439157485962, + "learning_rate": 5.521148350529137e-07, + "loss": 0.0267, + "step": 32917 + }, + { + "epoch": 89.69482288828338, + "grad_norm": 2.625890016555786, + "learning_rate": 5.518256953590661e-07, + "loss": 0.083, + "step": 32918 + }, + { + "epoch": 89.6975476839237, + "grad_norm": 2.996981382369995, + "learning_rate": 5.515366292472956e-07, + "loss": 0.1002, + "step": 32919 + }, + { + "epoch": 89.70027247956403, + "grad_norm": 2.68178653717041, + "learning_rate": 5.512476367198538e-07, + "loss": 0.0501, + "step": 32920 + }, + { + "epoch": 89.70299727520435, + "grad_norm": 2.323176860809326, + "learning_rate": 5.509587177789911e-07, + "loss": 0.0574, + "step": 32921 + }, + { + "epoch": 89.70572207084469, + "grad_norm": 2.613534927368164, + "learning_rate": 5.506698724269577e-07, + "loss": 0.0295, + "step": 32922 + }, + { + "epoch": 89.70844686648502, + "grad_norm": 2.291454315185547, + "learning_rate": 5.503811006660032e-07, + "loss": 0.1754, + "step": 32923 + }, + { + "epoch": 89.71117166212534, + "grad_norm": 2.5666966438293457, + "learning_rate": 5.500924024983756e-07, + "loss": 0.0284, + "step": 32924 + }, + { + "epoch": 89.71389645776567, + "grad_norm": 2.7875821590423584, + "learning_rate": 5.498037779263265e-07, + "loss": 0.1326, + "step": 32925 + }, + { + "epoch": 89.71662125340599, + "grad_norm": 2.7814249992370605, + "learning_rate": 5.495152269520987e-07, + "loss": 0.097, + "step": 32926 + }, + { + "epoch": 89.71934604904632, + "grad_norm": 4.380067348480225, + "learning_rate": 5.492267495779447e-07, + "loss": 0.0491, + "step": 32927 + }, + { + "epoch": 89.72207084468666, + "grad_norm": 2.6277806758880615, + "learning_rate": 5.489383458061071e-07, + "loss": 0.0769, + "step": 32928 + }, + { + "epoch": 89.72479564032697, + "grad_norm": 3.794962167739868, + "learning_rate": 5.48650015638833e-07, + "loss": 0.0611, + "step": 32929 + }, + { + "epoch": 89.7275204359673, + "grad_norm": 2.078131914138794, + "learning_rate": 5.483617590783696e-07, + "loss": 0.1018, + "step": 32930 + }, + { + "epoch": 89.73024523160763, + "grad_norm": 2.3437399864196777, + "learning_rate": 5.480735761269607e-07, + "loss": 0.0845, + "step": 32931 + }, + { + "epoch": 89.73297002724796, + "grad_norm": 3.3094420433044434, + "learning_rate": 5.477854667868509e-07, + "loss": 0.1088, + "step": 32932 + }, + { + "epoch": 89.73569482288828, + "grad_norm": 5.927574634552002, + "learning_rate": 5.474974310602821e-07, + "loss": 0.0262, + "step": 32933 + }, + { + "epoch": 89.73841961852861, + "grad_norm": 2.4199492931365967, + "learning_rate": 5.472094689495e-07, + "loss": 0.039, + "step": 32934 + }, + { + "epoch": 89.74114441416894, + "grad_norm": 2.1367902755737305, + "learning_rate": 5.469215804567474e-07, + "loss": 0.033, + "step": 32935 + }, + { + "epoch": 89.74386920980926, + "grad_norm": 2.1038002967834473, + "learning_rate": 5.466337655842647e-07, + "loss": 0.0301, + "step": 32936 + }, + { + "epoch": 89.7465940054496, + "grad_norm": 1.8601211309432983, + "learning_rate": 5.463460243342922e-07, + "loss": 0.0213, + "step": 32937 + }, + { + "epoch": 89.74931880108991, + "grad_norm": 2.783090114593506, + "learning_rate": 5.460583567090738e-07, + "loss": 0.0622, + "step": 32938 + }, + { + "epoch": 89.75204359673025, + "grad_norm": 2.488863229751587, + "learning_rate": 5.457707627108489e-07, + "loss": 0.0536, + "step": 32939 + }, + { + "epoch": 89.75476839237058, + "grad_norm": 2.3114936351776123, + "learning_rate": 5.454832423418577e-07, + "loss": 0.1343, + "step": 32940 + }, + { + "epoch": 89.7574931880109, + "grad_norm": 2.3771212100982666, + "learning_rate": 5.451957956043363e-07, + "loss": 0.0267, + "step": 32941 + }, + { + "epoch": 89.76021798365123, + "grad_norm": 2.1391761302948, + "learning_rate": 5.449084225005263e-07, + "loss": 0.026, + "step": 32942 + }, + { + "epoch": 89.76294277929155, + "grad_norm": 3.2617347240448, + "learning_rate": 5.44621123032667e-07, + "loss": 0.2307, + "step": 32943 + }, + { + "epoch": 89.76566757493188, + "grad_norm": 1.751294493675232, + "learning_rate": 5.443338972029932e-07, + "loss": 0.0131, + "step": 32944 + }, + { + "epoch": 89.7683923705722, + "grad_norm": 3.4908711910247803, + "learning_rate": 5.440467450137432e-07, + "loss": 0.1128, + "step": 32945 + }, + { + "epoch": 89.77111716621253, + "grad_norm": 2.7195677757263184, + "learning_rate": 5.437596664671518e-07, + "loss": 0.0578, + "step": 32946 + }, + { + "epoch": 89.77384196185287, + "grad_norm": 3.3138933181762695, + "learning_rate": 5.434726615654562e-07, + "loss": 0.1062, + "step": 32947 + }, + { + "epoch": 89.77656675749319, + "grad_norm": 2.702662467956543, + "learning_rate": 5.431857303108923e-07, + "loss": 0.0457, + "step": 32948 + }, + { + "epoch": 89.77929155313352, + "grad_norm": 2.3171818256378174, + "learning_rate": 5.428988727056928e-07, + "loss": 0.081, + "step": 32949 + }, + { + "epoch": 89.78201634877384, + "grad_norm": 4.419804573059082, + "learning_rate": 5.426120887520914e-07, + "loss": 0.1153, + "step": 32950 + }, + { + "epoch": 89.78474114441417, + "grad_norm": 2.3891665935516357, + "learning_rate": 5.423253784523241e-07, + "loss": 0.0311, + "step": 32951 + }, + { + "epoch": 89.7874659400545, + "grad_norm": 2.4410691261291504, + "learning_rate": 5.420387418086215e-07, + "loss": 0.0289, + "step": 32952 + }, + { + "epoch": 89.79019073569482, + "grad_norm": 2.494887351989746, + "learning_rate": 5.417521788232161e-07, + "loss": 0.0427, + "step": 32953 + }, + { + "epoch": 89.79291553133515, + "grad_norm": 2.5476417541503906, + "learning_rate": 5.414656894983416e-07, + "loss": 0.0401, + "step": 32954 + }, + { + "epoch": 89.79564032697547, + "grad_norm": 3.26421856880188, + "learning_rate": 5.411792738362275e-07, + "loss": 0.1295, + "step": 32955 + }, + { + "epoch": 89.7983651226158, + "grad_norm": 2.7946064472198486, + "learning_rate": 5.408929318391054e-07, + "loss": 0.0589, + "step": 32956 + }, + { + "epoch": 89.80108991825612, + "grad_norm": 1.8081120252609253, + "learning_rate": 5.406066635092034e-07, + "loss": 0.0244, + "step": 32957 + }, + { + "epoch": 89.80381471389646, + "grad_norm": 1.8078542947769165, + "learning_rate": 5.403204688487517e-07, + "loss": 0.0253, + "step": 32958 + }, + { + "epoch": 89.80653950953679, + "grad_norm": 1.895068883895874, + "learning_rate": 5.400343478599812e-07, + "loss": 0.0264, + "step": 32959 + }, + { + "epoch": 89.80926430517711, + "grad_norm": 2.275346040725708, + "learning_rate": 5.397483005451199e-07, + "loss": 0.0461, + "step": 32960 + }, + { + "epoch": 89.81198910081744, + "grad_norm": 4.531795024871826, + "learning_rate": 5.394623269063926e-07, + "loss": 0.0252, + "step": 32961 + }, + { + "epoch": 89.81471389645776, + "grad_norm": 3.631432294845581, + "learning_rate": 5.391764269460276e-07, + "loss": 0.1023, + "step": 32962 + }, + { + "epoch": 89.8174386920981, + "grad_norm": 3.0109949111938477, + "learning_rate": 5.388906006662542e-07, + "loss": 0.0214, + "step": 32963 + }, + { + "epoch": 89.82016348773843, + "grad_norm": 3.0166165828704834, + "learning_rate": 5.386048480692952e-07, + "loss": 0.0717, + "step": 32964 + }, + { + "epoch": 89.82288828337875, + "grad_norm": 1.6970953941345215, + "learning_rate": 5.383191691573775e-07, + "loss": 0.0299, + "step": 32965 + }, + { + "epoch": 89.82561307901908, + "grad_norm": 2.4598007202148438, + "learning_rate": 5.380335639327238e-07, + "loss": 0.0297, + "step": 32966 + }, + { + "epoch": 89.8283378746594, + "grad_norm": 2.238889694213867, + "learning_rate": 5.377480323975626e-07, + "loss": 0.0941, + "step": 32967 + }, + { + "epoch": 89.83106267029973, + "grad_norm": 2.525719165802002, + "learning_rate": 5.37462574554114e-07, + "loss": 0.112, + "step": 32968 + }, + { + "epoch": 89.83378746594005, + "grad_norm": 1.9318571090698242, + "learning_rate": 5.37177190404603e-07, + "loss": 0.0241, + "step": 32969 + }, + { + "epoch": 89.83651226158038, + "grad_norm": 2.7263565063476562, + "learning_rate": 5.368918799512502e-07, + "loss": 0.089, + "step": 32970 + }, + { + "epoch": 89.83923705722071, + "grad_norm": 2.8696954250335693, + "learning_rate": 5.366066431962802e-07, + "loss": 0.151, + "step": 32971 + }, + { + "epoch": 89.84196185286103, + "grad_norm": 2.8988192081451416, + "learning_rate": 5.363214801419126e-07, + "loss": 0.1698, + "step": 32972 + }, + { + "epoch": 89.84468664850137, + "grad_norm": 2.658188581466675, + "learning_rate": 5.360363907903676e-07, + "loss": 0.1053, + "step": 32973 + }, + { + "epoch": 89.84741144414168, + "grad_norm": 3.5899264812469482, + "learning_rate": 5.357513751438682e-07, + "loss": 0.0692, + "step": 32974 + }, + { + "epoch": 89.85013623978202, + "grad_norm": 2.681520938873291, + "learning_rate": 5.354664332046311e-07, + "loss": 0.0356, + "step": 32975 + }, + { + "epoch": 89.85286103542235, + "grad_norm": 2.867356300354004, + "learning_rate": 5.351815649748782e-07, + "loss": 0.0275, + "step": 32976 + }, + { + "epoch": 89.85558583106267, + "grad_norm": 2.661987543106079, + "learning_rate": 5.348967704568265e-07, + "loss": 0.0327, + "step": 32977 + }, + { + "epoch": 89.858310626703, + "grad_norm": 3.018894910812378, + "learning_rate": 5.34612049652693e-07, + "loss": 0.1273, + "step": 32978 + }, + { + "epoch": 89.86103542234332, + "grad_norm": 2.4152638912200928, + "learning_rate": 5.343274025646972e-07, + "loss": 0.0289, + "step": 32979 + }, + { + "epoch": 89.86376021798365, + "grad_norm": 2.1353743076324463, + "learning_rate": 5.34042829195055e-07, + "loss": 0.0716, + "step": 32980 + }, + { + "epoch": 89.86648501362397, + "grad_norm": 2.2595503330230713, + "learning_rate": 5.337583295459825e-07, + "loss": 0.1349, + "step": 32981 + }, + { + "epoch": 89.8692098092643, + "grad_norm": 2.7043895721435547, + "learning_rate": 5.334739036196945e-07, + "loss": 0.0464, + "step": 32982 + }, + { + "epoch": 89.87193460490464, + "grad_norm": 1.942264199256897, + "learning_rate": 5.331895514184083e-07, + "loss": 0.0253, + "step": 32983 + }, + { + "epoch": 89.87465940054496, + "grad_norm": 1.7817914485931396, + "learning_rate": 5.329052729443363e-07, + "loss": 0.0239, + "step": 32984 + }, + { + "epoch": 89.87738419618529, + "grad_norm": 2.8188374042510986, + "learning_rate": 5.326210681996947e-07, + "loss": 0.054, + "step": 32985 + }, + { + "epoch": 89.88010899182561, + "grad_norm": 3.5125081539154053, + "learning_rate": 5.323369371866926e-07, + "loss": 0.04, + "step": 32986 + }, + { + "epoch": 89.88283378746594, + "grad_norm": 2.6244945526123047, + "learning_rate": 5.320528799075486e-07, + "loss": 0.0191, + "step": 32987 + }, + { + "epoch": 89.88555858310627, + "grad_norm": 3.1844279766082764, + "learning_rate": 5.317688963644718e-07, + "loss": 0.1572, + "step": 32988 + }, + { + "epoch": 89.88828337874659, + "grad_norm": 4.102267742156982, + "learning_rate": 5.314849865596738e-07, + "loss": 0.0503, + "step": 32989 + }, + { + "epoch": 89.89100817438693, + "grad_norm": 3.608659029006958, + "learning_rate": 5.312011504953641e-07, + "loss": 0.0674, + "step": 32990 + }, + { + "epoch": 89.89373297002724, + "grad_norm": 2.702633857727051, + "learning_rate": 5.309173881737573e-07, + "loss": 0.0263, + "step": 32991 + }, + { + "epoch": 89.89645776566758, + "grad_norm": 3.237031936645508, + "learning_rate": 5.306336995970607e-07, + "loss": 0.0351, + "step": 32992 + }, + { + "epoch": 89.8991825613079, + "grad_norm": 2.228076219558716, + "learning_rate": 5.303500847674825e-07, + "loss": 0.1762, + "step": 32993 + }, + { + "epoch": 89.90190735694823, + "grad_norm": 2.669952630996704, + "learning_rate": 5.300665436872332e-07, + "loss": 0.0774, + "step": 32994 + }, + { + "epoch": 89.90463215258856, + "grad_norm": 1.98214852809906, + "learning_rate": 5.297830763585221e-07, + "loss": 0.0528, + "step": 32995 + }, + { + "epoch": 89.90735694822888, + "grad_norm": 2.620363473892212, + "learning_rate": 5.294996827835564e-07, + "loss": 0.0258, + "step": 32996 + }, + { + "epoch": 89.91008174386921, + "grad_norm": 2.039790153503418, + "learning_rate": 5.292163629645419e-07, + "loss": 0.0275, + "step": 32997 + }, + { + "epoch": 89.91280653950953, + "grad_norm": 2.1500163078308105, + "learning_rate": 5.289331169036838e-07, + "loss": 0.035, + "step": 32998 + }, + { + "epoch": 89.91553133514986, + "grad_norm": 1.4995557069778442, + "learning_rate": 5.286499446031912e-07, + "loss": 0.016, + "step": 32999 + }, + { + "epoch": 89.9182561307902, + "grad_norm": 3.5196704864501953, + "learning_rate": 5.28366846065268e-07, + "loss": 0.1035, + "step": 33000 + }, + { + "epoch": 89.92098092643052, + "grad_norm": 2.2869179248809814, + "learning_rate": 5.280838212921192e-07, + "loss": 0.0532, + "step": 33001 + }, + { + "epoch": 89.92370572207085, + "grad_norm": 2.1659247875213623, + "learning_rate": 5.278008702859471e-07, + "loss": 0.0358, + "step": 33002 + }, + { + "epoch": 89.92643051771117, + "grad_norm": 2.7991530895233154, + "learning_rate": 5.275179930489593e-07, + "loss": 0.0675, + "step": 33003 + }, + { + "epoch": 89.9291553133515, + "grad_norm": 3.941906452178955, + "learning_rate": 5.272351895833561e-07, + "loss": 0.187, + "step": 33004 + }, + { + "epoch": 89.93188010899182, + "grad_norm": 2.4331722259521484, + "learning_rate": 5.2695245989134e-07, + "loss": 0.0365, + "step": 33005 + }, + { + "epoch": 89.93460490463215, + "grad_norm": 2.5806493759155273, + "learning_rate": 5.266698039751117e-07, + "loss": 0.0153, + "step": 33006 + }, + { + "epoch": 89.93732970027249, + "grad_norm": 2.010847568511963, + "learning_rate": 5.263872218368759e-07, + "loss": 0.0286, + "step": 33007 + }, + { + "epoch": 89.9400544959128, + "grad_norm": 1.869657039642334, + "learning_rate": 5.261047134788311e-07, + "loss": 0.034, + "step": 33008 + }, + { + "epoch": 89.94277929155314, + "grad_norm": 6.215493202209473, + "learning_rate": 5.258222789031775e-07, + "loss": 0.0331, + "step": 33009 + }, + { + "epoch": 89.94550408719346, + "grad_norm": 3.4132604598999023, + "learning_rate": 5.255399181121146e-07, + "loss": 0.0513, + "step": 33010 + }, + { + "epoch": 89.94822888283379, + "grad_norm": 2.238222360610962, + "learning_rate": 5.252576311078417e-07, + "loss": 0.0507, + "step": 33011 + }, + { + "epoch": 89.95095367847412, + "grad_norm": 2.523106336593628, + "learning_rate": 5.249754178925581e-07, + "loss": 0.029, + "step": 33012 + }, + { + "epoch": 89.95367847411444, + "grad_norm": 2.9947681427001953, + "learning_rate": 5.246932784684622e-07, + "loss": 0.0417, + "step": 33013 + }, + { + "epoch": 89.95640326975477, + "grad_norm": 3.382309913635254, + "learning_rate": 5.244112128377477e-07, + "loss": 0.0535, + "step": 33014 + }, + { + "epoch": 89.95912806539509, + "grad_norm": 1.5899206399917603, + "learning_rate": 5.241292210026161e-07, + "loss": 0.1373, + "step": 33015 + }, + { + "epoch": 89.96185286103542, + "grad_norm": 1.6889121532440186, + "learning_rate": 5.238473029652602e-07, + "loss": 0.0222, + "step": 33016 + }, + { + "epoch": 89.96457765667574, + "grad_norm": 2.2443130016326904, + "learning_rate": 5.235654587278771e-07, + "loss": 0.0392, + "step": 33017 + }, + { + "epoch": 89.96730245231608, + "grad_norm": 2.3111021518707275, + "learning_rate": 5.232836882926596e-07, + "loss": 0.0418, + "step": 33018 + }, + { + "epoch": 89.97002724795641, + "grad_norm": 2.983551263809204, + "learning_rate": 5.230019916618046e-07, + "loss": 0.0503, + "step": 33019 + }, + { + "epoch": 89.97275204359673, + "grad_norm": 2.7868733406066895, + "learning_rate": 5.227203688375049e-07, + "loss": 0.1354, + "step": 33020 + }, + { + "epoch": 89.97547683923706, + "grad_norm": 2.1836066246032715, + "learning_rate": 5.224388198219554e-07, + "loss": 0.0221, + "step": 33021 + }, + { + "epoch": 89.97820163487738, + "grad_norm": 3.358785629272461, + "learning_rate": 5.221573446173444e-07, + "loss": 0.0671, + "step": 33022 + }, + { + "epoch": 89.98092643051771, + "grad_norm": 3.126645803451538, + "learning_rate": 5.218759432258691e-07, + "loss": 0.0469, + "step": 33023 + }, + { + "epoch": 89.98365122615803, + "grad_norm": 2.0958292484283447, + "learning_rate": 5.215946156497187e-07, + "loss": 0.018, + "step": 33024 + }, + { + "epoch": 89.98637602179836, + "grad_norm": 2.102900505065918, + "learning_rate": 5.213133618910849e-07, + "loss": 0.0749, + "step": 33025 + }, + { + "epoch": 89.9891008174387, + "grad_norm": 1.6311944723129272, + "learning_rate": 5.210321819521558e-07, + "loss": 0.032, + "step": 33026 + }, + { + "epoch": 89.99182561307902, + "grad_norm": 1.8994883298873901, + "learning_rate": 5.207510758351231e-07, + "loss": 0.0353, + "step": 33027 + }, + { + "epoch": 89.99455040871935, + "grad_norm": 1.4795035123825073, + "learning_rate": 5.204700435421772e-07, + "loss": 0.0137, + "step": 33028 + }, + { + "epoch": 89.99727520435967, + "grad_norm": 2.647529363632202, + "learning_rate": 5.201890850755054e-07, + "loss": 0.0511, + "step": 33029 + }, + { + "epoch": 90.0, + "grad_norm": 2.3613972663879395, + "learning_rate": 5.199082004372958e-07, + "loss": 0.0328, + "step": 33030 + }, + { + "epoch": 90.00272479564033, + "grad_norm": 2.134033679962158, + "learning_rate": 5.196273896297354e-07, + "loss": 0.0479, + "step": 33031 + }, + { + "epoch": 90.00544959128065, + "grad_norm": 2.578030824661255, + "learning_rate": 5.193466526550117e-07, + "loss": 0.0362, + "step": 33032 + }, + { + "epoch": 90.00817438692098, + "grad_norm": 3.1712164878845215, + "learning_rate": 5.190659895153127e-07, + "loss": 0.0901, + "step": 33033 + }, + { + "epoch": 90.0108991825613, + "grad_norm": 2.9159908294677734, + "learning_rate": 5.187854002128223e-07, + "loss": 0.0516, + "step": 33034 + }, + { + "epoch": 90.01362397820164, + "grad_norm": 6.015149116516113, + "learning_rate": 5.185048847497242e-07, + "loss": 0.0363, + "step": 33035 + }, + { + "epoch": 90.01634877384195, + "grad_norm": 2.3716206550598145, + "learning_rate": 5.182244431282058e-07, + "loss": 0.0229, + "step": 33036 + }, + { + "epoch": 90.01907356948229, + "grad_norm": 3.414368152618408, + "learning_rate": 5.179440753504517e-07, + "loss": 0.0395, + "step": 33037 + }, + { + "epoch": 90.02179836512262, + "grad_norm": 2.8145992755889893, + "learning_rate": 5.176637814186414e-07, + "loss": 0.0249, + "step": 33038 + }, + { + "epoch": 90.02452316076294, + "grad_norm": 3.2736363410949707, + "learning_rate": 5.17383561334962e-07, + "loss": 0.0338, + "step": 33039 + }, + { + "epoch": 90.02724795640327, + "grad_norm": 2.978874921798706, + "learning_rate": 5.171034151015941e-07, + "loss": 0.0396, + "step": 33040 + }, + { + "epoch": 90.02997275204359, + "grad_norm": 2.7185943126678467, + "learning_rate": 5.168233427207204e-07, + "loss": 0.084, + "step": 33041 + }, + { + "epoch": 90.03269754768392, + "grad_norm": 2.609410285949707, + "learning_rate": 5.165433441945189e-07, + "loss": 0.0838, + "step": 33042 + }, + { + "epoch": 90.03542234332426, + "grad_norm": 1.7382959127426147, + "learning_rate": 5.162634195251748e-07, + "loss": 0.0211, + "step": 33043 + }, + { + "epoch": 90.03814713896458, + "grad_norm": 2.75905179977417, + "learning_rate": 5.15983568714864e-07, + "loss": 0.034, + "step": 33044 + }, + { + "epoch": 90.04087193460491, + "grad_norm": 1.7357958555221558, + "learning_rate": 5.157037917657692e-07, + "loss": 0.0248, + "step": 33045 + }, + { + "epoch": 90.04359673024523, + "grad_norm": 2.1174702644348145, + "learning_rate": 5.154240886800688e-07, + "loss": 0.0367, + "step": 33046 + }, + { + "epoch": 90.04632152588556, + "grad_norm": 6.2968878746032715, + "learning_rate": 5.151444594599386e-07, + "loss": 0.05, + "step": 33047 + }, + { + "epoch": 90.04904632152588, + "grad_norm": 1.8036682605743408, + "learning_rate": 5.148649041075593e-07, + "loss": 0.0173, + "step": 33048 + }, + { + "epoch": 90.05177111716621, + "grad_norm": 2.6650938987731934, + "learning_rate": 5.145854226251068e-07, + "loss": 0.057, + "step": 33049 + }, + { + "epoch": 90.05449591280654, + "grad_norm": 27.12366485595703, + "learning_rate": 5.143060150147583e-07, + "loss": 0.0246, + "step": 33050 + }, + { + "epoch": 90.05722070844686, + "grad_norm": 2.7090585231781006, + "learning_rate": 5.140266812786865e-07, + "loss": 0.035, + "step": 33051 + }, + { + "epoch": 90.0599455040872, + "grad_norm": 2.360356569290161, + "learning_rate": 5.137474214190719e-07, + "loss": 0.081, + "step": 33052 + }, + { + "epoch": 90.06267029972751, + "grad_norm": 2.3694264888763428, + "learning_rate": 5.134682354380871e-07, + "loss": 0.0348, + "step": 33053 + }, + { + "epoch": 90.06539509536785, + "grad_norm": 2.62050199508667, + "learning_rate": 5.131891233379071e-07, + "loss": 0.0666, + "step": 33054 + }, + { + "epoch": 90.06811989100818, + "grad_norm": 11.05138874053955, + "learning_rate": 5.129100851207025e-07, + "loss": 0.321, + "step": 33055 + }, + { + "epoch": 90.0708446866485, + "grad_norm": 3.2369446754455566, + "learning_rate": 5.126311207886503e-07, + "loss": 0.1585, + "step": 33056 + }, + { + "epoch": 90.07356948228883, + "grad_norm": 3.03149676322937, + "learning_rate": 5.123522303439222e-07, + "loss": 0.0489, + "step": 33057 + }, + { + "epoch": 90.07629427792915, + "grad_norm": 3.8002331256866455, + "learning_rate": 5.120734137886884e-07, + "loss": 0.0504, + "step": 33058 + }, + { + "epoch": 90.07901907356948, + "grad_norm": 2.704076051712036, + "learning_rate": 5.117946711251209e-07, + "loss": 0.0787, + "step": 33059 + }, + { + "epoch": 90.0817438692098, + "grad_norm": 3.1726512908935547, + "learning_rate": 5.115160023553922e-07, + "loss": 0.1538, + "step": 33060 + }, + { + "epoch": 90.08446866485014, + "grad_norm": 2.7844386100769043, + "learning_rate": 5.112374074816706e-07, + "loss": 0.0571, + "step": 33061 + }, + { + "epoch": 90.08719346049047, + "grad_norm": 3.116177797317505, + "learning_rate": 5.109588865061277e-07, + "loss": 0.0287, + "step": 33062 + }, + { + "epoch": 90.08991825613079, + "grad_norm": 2.319117307662964, + "learning_rate": 5.106804394309306e-07, + "loss": 0.0217, + "step": 33063 + }, + { + "epoch": 90.09264305177112, + "grad_norm": 2.8059732913970947, + "learning_rate": 5.104020662582499e-07, + "loss": 0.0293, + "step": 33064 + }, + { + "epoch": 90.09536784741144, + "grad_norm": 2.308300733566284, + "learning_rate": 5.101237669902526e-07, + "loss": 0.1803, + "step": 33065 + }, + { + "epoch": 90.09809264305177, + "grad_norm": 2.789944887161255, + "learning_rate": 5.09845541629106e-07, + "loss": 0.0535, + "step": 33066 + }, + { + "epoch": 90.1008174386921, + "grad_norm": 2.59648060798645, + "learning_rate": 5.095673901769749e-07, + "loss": 0.1116, + "step": 33067 + }, + { + "epoch": 90.10354223433242, + "grad_norm": 1.695949673652649, + "learning_rate": 5.092893126360288e-07, + "loss": 0.0651, + "step": 33068 + }, + { + "epoch": 90.10626702997276, + "grad_norm": 2.5341873168945312, + "learning_rate": 5.090113090084325e-07, + "loss": 0.0886, + "step": 33069 + }, + { + "epoch": 90.10899182561307, + "grad_norm": 6.12711763381958, + "learning_rate": 5.087333792963512e-07, + "loss": 0.0248, + "step": 33070 + }, + { + "epoch": 90.11171662125341, + "grad_norm": 3.309462547302246, + "learning_rate": 5.084555235019473e-07, + "loss": 0.1271, + "step": 33071 + }, + { + "epoch": 90.11444141689373, + "grad_norm": 2.403449535369873, + "learning_rate": 5.081777416273869e-07, + "loss": 0.0511, + "step": 33072 + }, + { + "epoch": 90.11716621253406, + "grad_norm": 3.0937139987945557, + "learning_rate": 5.079000336748341e-07, + "loss": 0.0382, + "step": 33073 + }, + { + "epoch": 90.11989100817439, + "grad_norm": 5.334840774536133, + "learning_rate": 5.076223996464491e-07, + "loss": 0.0422, + "step": 33074 + }, + { + "epoch": 90.12261580381471, + "grad_norm": 3.4917781352996826, + "learning_rate": 5.073448395443948e-07, + "loss": 0.131, + "step": 33075 + }, + { + "epoch": 90.12534059945504, + "grad_norm": 2.161721706390381, + "learning_rate": 5.070673533708337e-07, + "loss": 0.0455, + "step": 33076 + }, + { + "epoch": 90.12806539509536, + "grad_norm": 2.2415032386779785, + "learning_rate": 5.067899411279276e-07, + "loss": 0.0374, + "step": 33077 + }, + { + "epoch": 90.1307901907357, + "grad_norm": 3.1583940982818604, + "learning_rate": 5.065126028178357e-07, + "loss": 0.081, + "step": 33078 + }, + { + "epoch": 90.13351498637603, + "grad_norm": 2.8492276668548584, + "learning_rate": 5.062353384427144e-07, + "loss": 0.0925, + "step": 33079 + }, + { + "epoch": 90.13623978201635, + "grad_norm": 3.782942295074463, + "learning_rate": 5.059581480047304e-07, + "loss": 0.1233, + "step": 33080 + }, + { + "epoch": 90.13896457765668, + "grad_norm": 2.2050328254699707, + "learning_rate": 5.05681031506039e-07, + "loss": 0.0781, + "step": 33081 + }, + { + "epoch": 90.141689373297, + "grad_norm": 2.3911116123199463, + "learning_rate": 5.054039889487972e-07, + "loss": 0.0867, + "step": 33082 + }, + { + "epoch": 90.14441416893733, + "grad_norm": 2.5510473251342773, + "learning_rate": 5.051270203351632e-07, + "loss": 0.0259, + "step": 33083 + }, + { + "epoch": 90.14713896457765, + "grad_norm": 2.6050610542297363, + "learning_rate": 5.048501256672955e-07, + "loss": 0.198, + "step": 33084 + }, + { + "epoch": 90.14986376021798, + "grad_norm": 4.228565692901611, + "learning_rate": 5.045733049473489e-07, + "loss": 0.0959, + "step": 33085 + }, + { + "epoch": 90.15258855585832, + "grad_norm": 2.5402660369873047, + "learning_rate": 5.042965581774794e-07, + "loss": 0.1167, + "step": 33086 + }, + { + "epoch": 90.15531335149863, + "grad_norm": 2.778419256210327, + "learning_rate": 5.040198853598421e-07, + "loss": 0.0978, + "step": 33087 + }, + { + "epoch": 90.15803814713897, + "grad_norm": 3.5623526573181152, + "learning_rate": 5.037432864965941e-07, + "loss": 0.0295, + "step": 33088 + }, + { + "epoch": 90.16076294277929, + "grad_norm": 2.1568751335144043, + "learning_rate": 5.034667615898869e-07, + "loss": 0.0753, + "step": 33089 + }, + { + "epoch": 90.16348773841962, + "grad_norm": 3.8411865234375, + "learning_rate": 5.031903106418756e-07, + "loss": 0.0773, + "step": 33090 + }, + { + "epoch": 90.16621253405995, + "grad_norm": 2.954439163208008, + "learning_rate": 5.029139336547106e-07, + "loss": 0.1143, + "step": 33091 + }, + { + "epoch": 90.16893732970027, + "grad_norm": 3.459062099456787, + "learning_rate": 5.02637630630548e-07, + "loss": 0.0978, + "step": 33092 + }, + { + "epoch": 90.1716621253406, + "grad_norm": 2.2669992446899414, + "learning_rate": 5.023614015715372e-07, + "loss": 0.0756, + "step": 33093 + }, + { + "epoch": 90.17438692098092, + "grad_norm": 2.870089530944824, + "learning_rate": 5.020852464798309e-07, + "loss": 0.0579, + "step": 33094 + }, + { + "epoch": 90.17711171662125, + "grad_norm": 2.030543565750122, + "learning_rate": 5.018091653575774e-07, + "loss": 0.0234, + "step": 33095 + }, + { + "epoch": 90.17983651226157, + "grad_norm": 3.0314953327178955, + "learning_rate": 5.015331582069282e-07, + "loss": 0.0378, + "step": 33096 + }, + { + "epoch": 90.1825613079019, + "grad_norm": 2.4393393993377686, + "learning_rate": 5.01257225030034e-07, + "loss": 0.0844, + "step": 33097 + }, + { + "epoch": 90.18528610354224, + "grad_norm": 3.483377456665039, + "learning_rate": 5.009813658290441e-07, + "loss": 0.0524, + "step": 33098 + }, + { + "epoch": 90.18801089918256, + "grad_norm": 3.7955992221832275, + "learning_rate": 5.007055806061045e-07, + "loss": 0.0236, + "step": 33099 + }, + { + "epoch": 90.19073569482289, + "grad_norm": 2.5338237285614014, + "learning_rate": 5.004298693633625e-07, + "loss": 0.046, + "step": 33100 + }, + { + "epoch": 90.19346049046321, + "grad_norm": 2.2801761627197266, + "learning_rate": 5.001542321029695e-07, + "loss": 0.0709, + "step": 33101 + }, + { + "epoch": 90.19618528610354, + "grad_norm": 2.7014200687408447, + "learning_rate": 4.998786688270685e-07, + "loss": 0.0285, + "step": 33102 + }, + { + "epoch": 90.19891008174388, + "grad_norm": 2.956639289855957, + "learning_rate": 4.996031795378065e-07, + "loss": 0.0345, + "step": 33103 + }, + { + "epoch": 90.2016348773842, + "grad_norm": 2.349761486053467, + "learning_rate": 4.993277642373296e-07, + "loss": 0.1865, + "step": 33104 + }, + { + "epoch": 90.20435967302453, + "grad_norm": 1.7927157878875732, + "learning_rate": 4.990524229277826e-07, + "loss": 0.0331, + "step": 33105 + }, + { + "epoch": 90.20708446866485, + "grad_norm": 1.8765418529510498, + "learning_rate": 4.987771556113096e-07, + "loss": 0.0277, + "step": 33106 + }, + { + "epoch": 90.20980926430518, + "grad_norm": 1.8036874532699585, + "learning_rate": 4.985019622900522e-07, + "loss": 0.0833, + "step": 33107 + }, + { + "epoch": 90.2125340599455, + "grad_norm": 3.2392690181732178, + "learning_rate": 4.982268429661575e-07, + "loss": 0.0361, + "step": 33108 + }, + { + "epoch": 90.21525885558583, + "grad_norm": 3.99721622467041, + "learning_rate": 4.979517976417669e-07, + "loss": 0.0561, + "step": 33109 + }, + { + "epoch": 90.21798365122616, + "grad_norm": 2.079462766647339, + "learning_rate": 4.976768263190212e-07, + "loss": 0.0234, + "step": 33110 + }, + { + "epoch": 90.22070844686648, + "grad_norm": 1.9858804941177368, + "learning_rate": 4.97401929000062e-07, + "loss": 0.1116, + "step": 33111 + }, + { + "epoch": 90.22343324250681, + "grad_norm": 2.7112207412719727, + "learning_rate": 4.971271056870308e-07, + "loss": 0.1189, + "step": 33112 + }, + { + "epoch": 90.22615803814713, + "grad_norm": 2.296314001083374, + "learning_rate": 4.968523563820682e-07, + "loss": 0.0404, + "step": 33113 + }, + { + "epoch": 90.22888283378747, + "grad_norm": 2.176239252090454, + "learning_rate": 4.965776810873135e-07, + "loss": 0.0473, + "step": 33114 + }, + { + "epoch": 90.2316076294278, + "grad_norm": 2.048495292663574, + "learning_rate": 4.963030798049063e-07, + "loss": 0.0205, + "step": 33115 + }, + { + "epoch": 90.23433242506812, + "grad_norm": 2.07379412651062, + "learning_rate": 4.960285525369834e-07, + "loss": 0.0272, + "step": 33116 + }, + { + "epoch": 90.23705722070845, + "grad_norm": 2.025475025177002, + "learning_rate": 4.957540992856869e-07, + "loss": 0.0797, + "step": 33117 + }, + { + "epoch": 90.23978201634877, + "grad_norm": 2.2327964305877686, + "learning_rate": 4.954797200531502e-07, + "loss": 0.0743, + "step": 33118 + }, + { + "epoch": 90.2425068119891, + "grad_norm": 2.112105131149292, + "learning_rate": 4.95205414841512e-07, + "loss": 0.044, + "step": 33119 + }, + { + "epoch": 90.24523160762942, + "grad_norm": 2.899749755859375, + "learning_rate": 4.949311836529059e-07, + "loss": 0.0462, + "step": 33120 + }, + { + "epoch": 90.24795640326975, + "grad_norm": 2.9915671348571777, + "learning_rate": 4.946570264894724e-07, + "loss": 0.0679, + "step": 33121 + }, + { + "epoch": 90.25068119891009, + "grad_norm": 3.773315668106079, + "learning_rate": 4.943829433533431e-07, + "loss": 0.1619, + "step": 33122 + }, + { + "epoch": 90.2534059945504, + "grad_norm": 2.1987504959106445, + "learning_rate": 4.941089342466543e-07, + "loss": 0.0253, + "step": 33123 + }, + { + "epoch": 90.25613079019074, + "grad_norm": 1.9298509359359741, + "learning_rate": 4.938349991715375e-07, + "loss": 0.0744, + "step": 33124 + }, + { + "epoch": 90.25885558583106, + "grad_norm": 2.095750570297241, + "learning_rate": 4.935611381301298e-07, + "loss": 0.0176, + "step": 33125 + }, + { + "epoch": 90.26158038147139, + "grad_norm": 2.950507402420044, + "learning_rate": 4.932873511245606e-07, + "loss": 0.027, + "step": 33126 + }, + { + "epoch": 90.26430517711172, + "grad_norm": 1.4579638242721558, + "learning_rate": 4.930136381569628e-07, + "loss": 0.1051, + "step": 33127 + }, + { + "epoch": 90.26702997275204, + "grad_norm": 1.8372451066970825, + "learning_rate": 4.927399992294701e-07, + "loss": 0.1445, + "step": 33128 + }, + { + "epoch": 90.26975476839237, + "grad_norm": 2.2512099742889404, + "learning_rate": 4.924664343442132e-07, + "loss": 0.0766, + "step": 33129 + }, + { + "epoch": 90.2724795640327, + "grad_norm": 2.2136800289154053, + "learning_rate": 4.92192943503319e-07, + "loss": 0.0802, + "step": 33130 + }, + { + "epoch": 90.27520435967303, + "grad_norm": 3.093181848526001, + "learning_rate": 4.919195267089227e-07, + "loss": 0.0328, + "step": 33131 + }, + { + "epoch": 90.27792915531334, + "grad_norm": 2.9186415672302246, + "learning_rate": 4.916461839631492e-07, + "loss": 0.1646, + "step": 33132 + }, + { + "epoch": 90.28065395095368, + "grad_norm": 2.292050838470459, + "learning_rate": 4.913729152681302e-07, + "loss": 0.0657, + "step": 33133 + }, + { + "epoch": 90.28337874659401, + "grad_norm": 2.6327805519104004, + "learning_rate": 4.910997206259927e-07, + "loss": 0.0357, + "step": 33134 + }, + { + "epoch": 90.28610354223433, + "grad_norm": 1.9433643817901611, + "learning_rate": 4.908266000388651e-07, + "loss": 0.0195, + "step": 33135 + }, + { + "epoch": 90.28882833787466, + "grad_norm": 2.821531057357788, + "learning_rate": 4.905535535088724e-07, + "loss": 0.0333, + "step": 33136 + }, + { + "epoch": 90.29155313351498, + "grad_norm": 2.54772686958313, + "learning_rate": 4.902805810381439e-07, + "loss": 0.0794, + "step": 33137 + }, + { + "epoch": 90.29427792915531, + "grad_norm": 1.4708597660064697, + "learning_rate": 4.900076826288047e-07, + "loss": 0.0215, + "step": 33138 + }, + { + "epoch": 90.29700272479565, + "grad_norm": 1.879388451576233, + "learning_rate": 4.897348582829797e-07, + "loss": 0.0272, + "step": 33139 + }, + { + "epoch": 90.29972752043597, + "grad_norm": 14.01826000213623, + "learning_rate": 4.894621080027906e-07, + "loss": 0.0364, + "step": 33140 + }, + { + "epoch": 90.3024523160763, + "grad_norm": 2.1911098957061768, + "learning_rate": 4.891894317903678e-07, + "loss": 0.1552, + "step": 33141 + }, + { + "epoch": 90.30517711171662, + "grad_norm": 2.230325222015381, + "learning_rate": 4.889168296478309e-07, + "loss": 0.093, + "step": 33142 + }, + { + "epoch": 90.30790190735695, + "grad_norm": 3.2192161083221436, + "learning_rate": 4.886443015773023e-07, + "loss": 0.0432, + "step": 33143 + }, + { + "epoch": 90.31062670299727, + "grad_norm": 2.402613878250122, + "learning_rate": 4.883718475809063e-07, + "loss": 0.0865, + "step": 33144 + }, + { + "epoch": 90.3133514986376, + "grad_norm": 3.3279948234558105, + "learning_rate": 4.880994676607642e-07, + "loss": 0.1136, + "step": 33145 + }, + { + "epoch": 90.31607629427793, + "grad_norm": 2.0511176586151123, + "learning_rate": 4.878271618189978e-07, + "loss": 0.0278, + "step": 33146 + }, + { + "epoch": 90.31880108991825, + "grad_norm": 3.2558493614196777, + "learning_rate": 4.875549300577264e-07, + "loss": 0.0614, + "step": 33147 + }, + { + "epoch": 90.32152588555859, + "grad_norm": 2.5872344970703125, + "learning_rate": 4.872827723790707e-07, + "loss": 0.1026, + "step": 33148 + }, + { + "epoch": 90.3242506811989, + "grad_norm": 3.384432077407837, + "learning_rate": 4.870106887851522e-07, + "loss": 0.0583, + "step": 33149 + }, + { + "epoch": 90.32697547683924, + "grad_norm": 3.299123764038086, + "learning_rate": 4.867386792780882e-07, + "loss": 0.0501, + "step": 33150 + }, + { + "epoch": 90.32970027247957, + "grad_norm": 2.722965955734253, + "learning_rate": 4.864667438599968e-07, + "loss": 0.0472, + "step": 33151 + }, + { + "epoch": 90.33242506811989, + "grad_norm": 2.200094699859619, + "learning_rate": 4.861948825329954e-07, + "loss": 0.0862, + "step": 33152 + }, + { + "epoch": 90.33514986376022, + "grad_norm": 2.139737844467163, + "learning_rate": 4.859230952992022e-07, + "loss": 0.0257, + "step": 33153 + }, + { + "epoch": 90.33787465940054, + "grad_norm": 3.265510082244873, + "learning_rate": 4.856513821607356e-07, + "loss": 0.1213, + "step": 33154 + }, + { + "epoch": 90.34059945504087, + "grad_norm": 2.391695976257324, + "learning_rate": 4.853797431197082e-07, + "loss": 0.1046, + "step": 33155 + }, + { + "epoch": 90.34332425068119, + "grad_norm": 2.397998571395874, + "learning_rate": 4.851081781782363e-07, + "loss": 0.0173, + "step": 33156 + }, + { + "epoch": 90.34604904632153, + "grad_norm": 2.9855945110321045, + "learning_rate": 4.84836687338438e-07, + "loss": 0.0661, + "step": 33157 + }, + { + "epoch": 90.34877384196186, + "grad_norm": 3.025181293487549, + "learning_rate": 4.84565270602424e-07, + "loss": 0.194, + "step": 33158 + }, + { + "epoch": 90.35149863760218, + "grad_norm": 3.4120302200317383, + "learning_rate": 4.842939279723102e-07, + "loss": 0.0836, + "step": 33159 + }, + { + "epoch": 90.35422343324251, + "grad_norm": 2.47977876663208, + "learning_rate": 4.840226594502073e-07, + "loss": 0.1062, + "step": 33160 + }, + { + "epoch": 90.35694822888283, + "grad_norm": 3.055844306945801, + "learning_rate": 4.837514650382313e-07, + "loss": 0.0697, + "step": 33161 + }, + { + "epoch": 90.35967302452316, + "grad_norm": 4.376160144805908, + "learning_rate": 4.834803447384917e-07, + "loss": 0.0312, + "step": 33162 + }, + { + "epoch": 90.3623978201635, + "grad_norm": 3.98852276802063, + "learning_rate": 4.832092985531023e-07, + "loss": 0.1487, + "step": 33163 + }, + { + "epoch": 90.36512261580381, + "grad_norm": 2.69901442527771, + "learning_rate": 4.829383264841703e-07, + "loss": 0.0318, + "step": 33164 + }, + { + "epoch": 90.36784741144415, + "grad_norm": 1.9195072650909424, + "learning_rate": 4.826674285338085e-07, + "loss": 0.029, + "step": 33165 + }, + { + "epoch": 90.37057220708446, + "grad_norm": 13.976252555847168, + "learning_rate": 4.823966047041273e-07, + "loss": 0.036, + "step": 33166 + }, + { + "epoch": 90.3732970027248, + "grad_norm": 1.4326947927474976, + "learning_rate": 4.821258549972363e-07, + "loss": 0.017, + "step": 33167 + }, + { + "epoch": 90.37602179836512, + "grad_norm": 1.6718900203704834, + "learning_rate": 4.818551794152404e-07, + "loss": 0.0183, + "step": 33168 + }, + { + "epoch": 90.37874659400545, + "grad_norm": 2.5900321006774902, + "learning_rate": 4.815845779602512e-07, + "loss": 0.0364, + "step": 33169 + }, + { + "epoch": 90.38147138964578, + "grad_norm": 1.4867286682128906, + "learning_rate": 4.813140506343761e-07, + "loss": 0.0152, + "step": 33170 + }, + { + "epoch": 90.3841961852861, + "grad_norm": 2.70233416557312, + "learning_rate": 4.810435974397199e-07, + "loss": 0.0428, + "step": 33171 + }, + { + "epoch": 90.38692098092643, + "grad_norm": 2.667961359024048, + "learning_rate": 4.807732183783886e-07, + "loss": 0.0329, + "step": 33172 + }, + { + "epoch": 90.38964577656675, + "grad_norm": 8.53109073638916, + "learning_rate": 4.805029134524908e-07, + "loss": 0.0294, + "step": 33173 + }, + { + "epoch": 90.39237057220708, + "grad_norm": 2.219076633453369, + "learning_rate": 4.80232682664129e-07, + "loss": 0.0242, + "step": 33174 + }, + { + "epoch": 90.39509536784742, + "grad_norm": 2.394843578338623, + "learning_rate": 4.799625260154095e-07, + "loss": 0.0703, + "step": 33175 + }, + { + "epoch": 90.39782016348774, + "grad_norm": 2.4840338230133057, + "learning_rate": 4.796924435084338e-07, + "loss": 0.1506, + "step": 33176 + }, + { + "epoch": 90.40054495912807, + "grad_norm": 2.4439096450805664, + "learning_rate": 4.794224351453092e-07, + "loss": 0.0293, + "step": 33177 + }, + { + "epoch": 90.40326975476839, + "grad_norm": 2.4611148834228516, + "learning_rate": 4.79152500928135e-07, + "loss": 0.0281, + "step": 33178 + }, + { + "epoch": 90.40599455040872, + "grad_norm": 2.7731146812438965, + "learning_rate": 4.788826408590153e-07, + "loss": 0.1032, + "step": 33179 + }, + { + "epoch": 90.40871934604904, + "grad_norm": 3.252362012863159, + "learning_rate": 4.786128549400492e-07, + "loss": 0.1381, + "step": 33180 + }, + { + "epoch": 90.41144414168937, + "grad_norm": 2.8525171279907227, + "learning_rate": 4.783431431733421e-07, + "loss": 0.057, + "step": 33181 + }, + { + "epoch": 90.4141689373297, + "grad_norm": 3.271495819091797, + "learning_rate": 4.780735055609908e-07, + "loss": 0.0342, + "step": 33182 + }, + { + "epoch": 90.41689373297002, + "grad_norm": 2.9020233154296875, + "learning_rate": 4.778039421050973e-07, + "loss": 0.0522, + "step": 33183 + }, + { + "epoch": 90.41961852861036, + "grad_norm": 2.4161126613616943, + "learning_rate": 4.775344528077596e-07, + "loss": 0.0938, + "step": 33184 + }, + { + "epoch": 90.42234332425068, + "grad_norm": 2.141167640686035, + "learning_rate": 4.772650376710775e-07, + "loss": 0.0195, + "step": 33185 + }, + { + "epoch": 90.42506811989101, + "grad_norm": 2.094120502471924, + "learning_rate": 4.76995696697149e-07, + "loss": 0.0517, + "step": 33186 + }, + { + "epoch": 90.42779291553134, + "grad_norm": 2.9432313442230225, + "learning_rate": 4.767264298880714e-07, + "loss": 0.0285, + "step": 33187 + }, + { + "epoch": 90.43051771117166, + "grad_norm": 2.2481791973114014, + "learning_rate": 4.7645723724594084e-07, + "loss": 0.0209, + "step": 33188 + }, + { + "epoch": 90.433242506812, + "grad_norm": 2.260496139526367, + "learning_rate": 4.7618811877285566e-07, + "loss": 0.1094, + "step": 33189 + }, + { + "epoch": 90.43596730245231, + "grad_norm": 1.7597731351852417, + "learning_rate": 4.759190744709119e-07, + "loss": 0.0279, + "step": 33190 + }, + { + "epoch": 90.43869209809264, + "grad_norm": 1.820627212524414, + "learning_rate": 4.756501043422024e-07, + "loss": 0.0206, + "step": 33191 + }, + { + "epoch": 90.44141689373296, + "grad_norm": 1.9359986782073975, + "learning_rate": 4.7538120838882317e-07, + "loss": 0.0673, + "step": 33192 + }, + { + "epoch": 90.4441416893733, + "grad_norm": 1.9540246725082397, + "learning_rate": 4.751123866128693e-07, + "loss": 0.0265, + "step": 33193 + }, + { + "epoch": 90.44686648501363, + "grad_norm": 1.3852287530899048, + "learning_rate": 4.748436390164346e-07, + "loss": 0.0168, + "step": 33194 + }, + { + "epoch": 90.44959128065395, + "grad_norm": 2.3974239826202393, + "learning_rate": 4.7457496560160966e-07, + "loss": 0.0339, + "step": 33195 + }, + { + "epoch": 90.45231607629428, + "grad_norm": 3.4479024410247803, + "learning_rate": 4.743063663704883e-07, + "loss": 0.0371, + "step": 33196 + }, + { + "epoch": 90.4550408719346, + "grad_norm": 2.633267402648926, + "learning_rate": 4.740378413251634e-07, + "loss": 0.0262, + "step": 33197 + }, + { + "epoch": 90.45776566757493, + "grad_norm": 2.8179562091827393, + "learning_rate": 4.737693904677243e-07, + "loss": 0.0523, + "step": 33198 + }, + { + "epoch": 90.46049046321527, + "grad_norm": 4.019863128662109, + "learning_rate": 4.735010138002616e-07, + "loss": 0.0303, + "step": 33199 + }, + { + "epoch": 90.46321525885558, + "grad_norm": 3.3150060176849365, + "learning_rate": 4.7323271132486805e-07, + "loss": 0.0812, + "step": 33200 + }, + { + "epoch": 90.46594005449592, + "grad_norm": 2.257672071456909, + "learning_rate": 4.7296448304363086e-07, + "loss": 0.1424, + "step": 33201 + }, + { + "epoch": 90.46866485013624, + "grad_norm": 1.8890174627304077, + "learning_rate": 4.726963289586395e-07, + "loss": 0.0244, + "step": 33202 + }, + { + "epoch": 90.47138964577657, + "grad_norm": 2.707345962524414, + "learning_rate": 4.7242824907198335e-07, + "loss": 0.0507, + "step": 33203 + }, + { + "epoch": 90.47411444141689, + "grad_norm": 2.1585302352905273, + "learning_rate": 4.721602433857497e-07, + "loss": 0.0332, + "step": 33204 + }, + { + "epoch": 90.47683923705722, + "grad_norm": 3.414416790008545, + "learning_rate": 4.7189231190202353e-07, + "loss": 0.0402, + "step": 33205 + }, + { + "epoch": 90.47956403269755, + "grad_norm": 3.5887913703918457, + "learning_rate": 4.716244546228943e-07, + "loss": 0.1115, + "step": 33206 + }, + { + "epoch": 90.48228882833787, + "grad_norm": 2.6446781158447266, + "learning_rate": 4.7135667155044807e-07, + "loss": 0.0781, + "step": 33207 + }, + { + "epoch": 90.4850136239782, + "grad_norm": 2.568363904953003, + "learning_rate": 4.710889626867687e-07, + "loss": 0.0355, + "step": 33208 + }, + { + "epoch": 90.48773841961852, + "grad_norm": 3.135401725769043, + "learning_rate": 4.7082132803394133e-07, + "loss": 0.1715, + "step": 33209 + }, + { + "epoch": 90.49046321525886, + "grad_norm": 2.086153030395508, + "learning_rate": 4.7055376759405083e-07, + "loss": 0.0418, + "step": 33210 + }, + { + "epoch": 90.49318801089919, + "grad_norm": 2.0694377422332764, + "learning_rate": 4.702862813691822e-07, + "loss": 0.032, + "step": 33211 + }, + { + "epoch": 90.49591280653951, + "grad_norm": 3.0108795166015625, + "learning_rate": 4.700188693614149e-07, + "loss": 0.0358, + "step": 33212 + }, + { + "epoch": 90.49863760217984, + "grad_norm": 2.128230333328247, + "learning_rate": 4.6975153157283624e-07, + "loss": 0.0269, + "step": 33213 + }, + { + "epoch": 90.50136239782016, + "grad_norm": 2.0283594131469727, + "learning_rate": 4.6948426800552447e-07, + "loss": 0.0262, + "step": 33214 + }, + { + "epoch": 90.50408719346049, + "grad_norm": 2.122006416320801, + "learning_rate": 4.692170786615635e-07, + "loss": 0.0266, + "step": 33215 + }, + { + "epoch": 90.50681198910081, + "grad_norm": 2.366952896118164, + "learning_rate": 4.689499635430317e-07, + "loss": 0.0328, + "step": 33216 + }, + { + "epoch": 90.50953678474114, + "grad_norm": 4.551375865936279, + "learning_rate": 4.6868292265201176e-07, + "loss": 0.1529, + "step": 33217 + }, + { + "epoch": 90.51226158038148, + "grad_norm": 3.2515320777893066, + "learning_rate": 4.684159559905821e-07, + "loss": 0.089, + "step": 33218 + }, + { + "epoch": 90.5149863760218, + "grad_norm": 2.7918386459350586, + "learning_rate": 4.681490635608232e-07, + "loss": 0.0421, + "step": 33219 + }, + { + "epoch": 90.51771117166213, + "grad_norm": 2.5816855430603027, + "learning_rate": 4.678822453648124e-07, + "loss": 0.1112, + "step": 33220 + }, + { + "epoch": 90.52043596730245, + "grad_norm": 3.7270753383636475, + "learning_rate": 4.676155014046269e-07, + "loss": 0.0949, + "step": 33221 + }, + { + "epoch": 90.52316076294278, + "grad_norm": 1.7641098499298096, + "learning_rate": 4.6734883168234603e-07, + "loss": 0.0251, + "step": 33222 + }, + { + "epoch": 90.52588555858311, + "grad_norm": 2.6046302318573, + "learning_rate": 4.67082236200046e-07, + "loss": 0.2202, + "step": 33223 + }, + { + "epoch": 90.52861035422343, + "grad_norm": 2.0669286251068115, + "learning_rate": 4.6681571495980184e-07, + "loss": 0.0338, + "step": 33224 + }, + { + "epoch": 90.53133514986376, + "grad_norm": 2.0476019382476807, + "learning_rate": 4.665492679636896e-07, + "loss": 0.0939, + "step": 33225 + }, + { + "epoch": 90.53405994550408, + "grad_norm": 1.4179803133010864, + "learning_rate": 4.6628289521378543e-07, + "loss": 0.0189, + "step": 33226 + }, + { + "epoch": 90.53678474114442, + "grad_norm": 1.2024822235107422, + "learning_rate": 4.6601659671216325e-07, + "loss": 0.0137, + "step": 33227 + }, + { + "epoch": 90.53950953678473, + "grad_norm": 2.3939061164855957, + "learning_rate": 4.6575037246089807e-07, + "loss": 0.0314, + "step": 33228 + }, + { + "epoch": 90.54223433242507, + "grad_norm": 3.4228403568267822, + "learning_rate": 4.6548422246206036e-07, + "loss": 0.0695, + "step": 33229 + }, + { + "epoch": 90.5449591280654, + "grad_norm": 3.3970940113067627, + "learning_rate": 4.6521814671772525e-07, + "loss": 0.0558, + "step": 33230 + }, + { + "epoch": 90.54768392370572, + "grad_norm": 2.596010446548462, + "learning_rate": 4.6495214522996435e-07, + "loss": 0.0431, + "step": 33231 + }, + { + "epoch": 90.55040871934605, + "grad_norm": 2.1344926357269287, + "learning_rate": 4.6468621800085043e-07, + "loss": 0.0554, + "step": 33232 + }, + { + "epoch": 90.55313351498637, + "grad_norm": 2.735389232635498, + "learning_rate": 4.644203650324508e-07, + "loss": 0.0426, + "step": 33233 + }, + { + "epoch": 90.5558583106267, + "grad_norm": 2.161064624786377, + "learning_rate": 4.641545863268393e-07, + "loss": 0.0639, + "step": 33234 + }, + { + "epoch": 90.55858310626704, + "grad_norm": 1.9047894477844238, + "learning_rate": 4.6388888188608537e-07, + "loss": 0.169, + "step": 33235 + }, + { + "epoch": 90.56130790190736, + "grad_norm": 2.8913934230804443, + "learning_rate": 4.636232517122585e-07, + "loss": 0.0823, + "step": 33236 + }, + { + "epoch": 90.56403269754769, + "grad_norm": 3.5276243686676025, + "learning_rate": 4.6335769580742594e-07, + "loss": 0.0984, + "step": 33237 + }, + { + "epoch": 90.566757493188, + "grad_norm": 3.1056935787200928, + "learning_rate": 4.6309221417365826e-07, + "loss": 0.0543, + "step": 33238 + }, + { + "epoch": 90.56948228882834, + "grad_norm": 2.3912622928619385, + "learning_rate": 4.6282680681302037e-07, + "loss": 0.0452, + "step": 33239 + }, + { + "epoch": 90.57220708446866, + "grad_norm": 2.9406867027282715, + "learning_rate": 4.6256147372758074e-07, + "loss": 0.0303, + "step": 33240 + }, + { + "epoch": 90.57493188010899, + "grad_norm": 2.1630442142486572, + "learning_rate": 4.622962149194044e-07, + "loss": 0.0268, + "step": 33241 + }, + { + "epoch": 90.57765667574932, + "grad_norm": 2.3760886192321777, + "learning_rate": 4.620310303905584e-07, + "loss": 0.0304, + "step": 33242 + }, + { + "epoch": 90.58038147138964, + "grad_norm": 1.802119255065918, + "learning_rate": 4.617659201431091e-07, + "loss": 0.0811, + "step": 33243 + }, + { + "epoch": 90.58310626702998, + "grad_norm": 1.9501885175704956, + "learning_rate": 4.6150088417911907e-07, + "loss": 0.0422, + "step": 33244 + }, + { + "epoch": 90.5858310626703, + "grad_norm": 2.0498251914978027, + "learning_rate": 4.612359225006524e-07, + "loss": 0.0322, + "step": 33245 + }, + { + "epoch": 90.58855585831063, + "grad_norm": 2.3923566341400146, + "learning_rate": 4.60971035109774e-07, + "loss": 0.024, + "step": 33246 + }, + { + "epoch": 90.59128065395096, + "grad_norm": 1.9519447088241577, + "learning_rate": 4.6070622200854673e-07, + "loss": 0.0396, + "step": 33247 + }, + { + "epoch": 90.59400544959128, + "grad_norm": 5.094139575958252, + "learning_rate": 4.6044148319903225e-07, + "loss": 0.0344, + "step": 33248 + }, + { + "epoch": 90.59673024523161, + "grad_norm": 1.788164496421814, + "learning_rate": 4.6017681868329114e-07, + "loss": 0.0995, + "step": 33249 + }, + { + "epoch": 90.59945504087193, + "grad_norm": 2.2989003658294678, + "learning_rate": 4.5991222846338724e-07, + "loss": 0.1095, + "step": 33250 + }, + { + "epoch": 90.60217983651226, + "grad_norm": 2.3944873809814453, + "learning_rate": 4.5964771254137785e-07, + "loss": 0.0313, + "step": 33251 + }, + { + "epoch": 90.60490463215258, + "grad_norm": 3.388947010040283, + "learning_rate": 4.5938327091932687e-07, + "loss": 0.1775, + "step": 33252 + }, + { + "epoch": 90.60762942779292, + "grad_norm": 3.04106068611145, + "learning_rate": 4.591189035992916e-07, + "loss": 0.1037, + "step": 33253 + }, + { + "epoch": 90.61035422343325, + "grad_norm": 3.9841744899749756, + "learning_rate": 4.5885461058333137e-07, + "loss": 0.0915, + "step": 33254 + }, + { + "epoch": 90.61307901907357, + "grad_norm": 2.1753439903259277, + "learning_rate": 4.585903918735046e-07, + "loss": 0.0271, + "step": 33255 + }, + { + "epoch": 90.6158038147139, + "grad_norm": 2.460171937942505, + "learning_rate": 4.583262474718686e-07, + "loss": 0.0358, + "step": 33256 + }, + { + "epoch": 90.61852861035422, + "grad_norm": 1.941246747970581, + "learning_rate": 4.5806217738047944e-07, + "loss": 0.0189, + "step": 33257 + }, + { + "epoch": 90.62125340599455, + "grad_norm": 2.2588279247283936, + "learning_rate": 4.5779818160139657e-07, + "loss": 0.0527, + "step": 33258 + }, + { + "epoch": 90.62397820163488, + "grad_norm": 2.660083293914795, + "learning_rate": 4.575342601366739e-07, + "loss": 0.1105, + "step": 33259 + }, + { + "epoch": 90.6267029972752, + "grad_norm": 2.6605067253112793, + "learning_rate": 4.572704129883676e-07, + "loss": 0.1001, + "step": 33260 + }, + { + "epoch": 90.62942779291554, + "grad_norm": 3.0070695877075195, + "learning_rate": 4.5700664015853045e-07, + "loss": 0.045, + "step": 33261 + }, + { + "epoch": 90.63215258855585, + "grad_norm": 2.5714046955108643, + "learning_rate": 4.567429416492208e-07, + "loss": 0.0329, + "step": 33262 + }, + { + "epoch": 90.63487738419619, + "grad_norm": 2.4974591732025146, + "learning_rate": 4.564793174624893e-07, + "loss": 0.0388, + "step": 33263 + }, + { + "epoch": 90.6376021798365, + "grad_norm": 2.819182872772217, + "learning_rate": 4.5621576760038975e-07, + "loss": 0.0227, + "step": 33264 + }, + { + "epoch": 90.64032697547684, + "grad_norm": 2.4309027194976807, + "learning_rate": 4.5595229206497283e-07, + "loss": 0.0433, + "step": 33265 + }, + { + "epoch": 90.64305177111717, + "grad_norm": 2.3355817794799805, + "learning_rate": 4.556888908582946e-07, + "loss": 0.0586, + "step": 33266 + }, + { + "epoch": 90.64577656675749, + "grad_norm": 3.9397144317626953, + "learning_rate": 4.5542556398240347e-07, + "loss": 0.0755, + "step": 33267 + }, + { + "epoch": 90.64850136239782, + "grad_norm": 2.4091289043426514, + "learning_rate": 4.5516231143935e-07, + "loss": 0.0391, + "step": 33268 + }, + { + "epoch": 90.65122615803814, + "grad_norm": 1.3573044538497925, + "learning_rate": 4.5489913323118585e-07, + "loss": 0.0272, + "step": 33269 + }, + { + "epoch": 90.65395095367847, + "grad_norm": 1.8493995666503906, + "learning_rate": 4.546360293599594e-07, + "loss": 0.0203, + "step": 33270 + }, + { + "epoch": 90.65667574931881, + "grad_norm": 4.400302410125732, + "learning_rate": 4.543729998277213e-07, + "loss": 0.0481, + "step": 33271 + }, + { + "epoch": 90.65940054495913, + "grad_norm": 2.390752077102661, + "learning_rate": 4.5411004463651877e-07, + "loss": 0.1424, + "step": 33272 + }, + { + "epoch": 90.66212534059946, + "grad_norm": 2.43003511428833, + "learning_rate": 4.538471637884001e-07, + "loss": 0.0527, + "step": 33273 + }, + { + "epoch": 90.66485013623978, + "grad_norm": 2.8040931224823, + "learning_rate": 4.535843572854115e-07, + "loss": 0.0502, + "step": 33274 + }, + { + "epoch": 90.66757493188011, + "grad_norm": 2.7672746181488037, + "learning_rate": 4.5332162512960245e-07, + "loss": 0.0543, + "step": 33275 + }, + { + "epoch": 90.67029972752043, + "grad_norm": 2.0645103454589844, + "learning_rate": 4.5305896732301566e-07, + "loss": 0.0863, + "step": 33276 + }, + { + "epoch": 90.67302452316076, + "grad_norm": 4.056310653686523, + "learning_rate": 4.527963838676985e-07, + "loss": 0.0236, + "step": 33277 + }, + { + "epoch": 90.6757493188011, + "grad_norm": 1.9052339792251587, + "learning_rate": 4.525338747656971e-07, + "loss": 0.0204, + "step": 33278 + }, + { + "epoch": 90.67847411444141, + "grad_norm": 3.4017715454101562, + "learning_rate": 4.522714400190542e-07, + "loss": 0.1799, + "step": 33279 + }, + { + "epoch": 90.68119891008175, + "grad_norm": 1.9250975847244263, + "learning_rate": 4.5200907962981376e-07, + "loss": 0.0192, + "step": 33280 + }, + { + "epoch": 90.68392370572207, + "grad_norm": 2.553457260131836, + "learning_rate": 4.517467936000186e-07, + "loss": 0.0503, + "step": 33281 + }, + { + "epoch": 90.6866485013624, + "grad_norm": 2.4489798545837402, + "learning_rate": 4.5148458193171264e-07, + "loss": 0.0429, + "step": 33282 + }, + { + "epoch": 90.68937329700273, + "grad_norm": 2.2490460872650146, + "learning_rate": 4.5122244462693865e-07, + "loss": 0.0753, + "step": 33283 + }, + { + "epoch": 90.69209809264305, + "grad_norm": 2.6086504459381104, + "learning_rate": 4.5096038168773613e-07, + "loss": 0.1151, + "step": 33284 + }, + { + "epoch": 90.69482288828338, + "grad_norm": 2.2189416885375977, + "learning_rate": 4.506983931161457e-07, + "loss": 0.1018, + "step": 33285 + }, + { + "epoch": 90.6975476839237, + "grad_norm": 1.7940874099731445, + "learning_rate": 4.5043647891420794e-07, + "loss": 0.0262, + "step": 33286 + }, + { + "epoch": 90.70027247956403, + "grad_norm": 1.604964256286621, + "learning_rate": 4.5017463908396564e-07, + "loss": 0.015, + "step": 33287 + }, + { + "epoch": 90.70299727520435, + "grad_norm": 2.4309797286987305, + "learning_rate": 4.4991287362745604e-07, + "loss": 0.051, + "step": 33288 + }, + { + "epoch": 90.70572207084469, + "grad_norm": 2.2586495876312256, + "learning_rate": 4.496511825467176e-07, + "loss": 0.0343, + "step": 33289 + }, + { + "epoch": 90.70844686648502, + "grad_norm": 3.711592197418213, + "learning_rate": 4.493895658437875e-07, + "loss": 0.0437, + "step": 33290 + }, + { + "epoch": 90.71117166212534, + "grad_norm": 2.5330240726470947, + "learning_rate": 4.4912802352070406e-07, + "loss": 0.0431, + "step": 33291 + }, + { + "epoch": 90.71389645776567, + "grad_norm": 2.8791136741638184, + "learning_rate": 4.4886655557950576e-07, + "loss": 0.0315, + "step": 33292 + }, + { + "epoch": 90.71662125340599, + "grad_norm": 2.8156704902648926, + "learning_rate": 4.486051620222265e-07, + "loss": 0.0554, + "step": 33293 + }, + { + "epoch": 90.71934604904632, + "grad_norm": 1.548614501953125, + "learning_rate": 4.4834384285090126e-07, + "loss": 0.027, + "step": 33294 + }, + { + "epoch": 90.72207084468666, + "grad_norm": 2.3263797760009766, + "learning_rate": 4.480825980675685e-07, + "loss": 0.0552, + "step": 33295 + }, + { + "epoch": 90.72479564032697, + "grad_norm": 1.9418562650680542, + "learning_rate": 4.47821427674261e-07, + "loss": 0.2023, + "step": 33296 + }, + { + "epoch": 90.7275204359673, + "grad_norm": 3.4640796184539795, + "learning_rate": 4.475603316730115e-07, + "loss": 0.0359, + "step": 33297 + }, + { + "epoch": 90.73024523160763, + "grad_norm": 2.2104876041412354, + "learning_rate": 4.4729931006585514e-07, + "loss": 0.0195, + "step": 33298 + }, + { + "epoch": 90.73297002724796, + "grad_norm": 2.9146504402160645, + "learning_rate": 4.470383628548247e-07, + "loss": 0.0797, + "step": 33299 + }, + { + "epoch": 90.73569482288828, + "grad_norm": 2.01104736328125, + "learning_rate": 4.4677749004195305e-07, + "loss": 0.0232, + "step": 33300 + }, + { + "epoch": 90.73841961852861, + "grad_norm": 2.4689102172851562, + "learning_rate": 4.4651669162926847e-07, + "loss": 0.0239, + "step": 33301 + }, + { + "epoch": 90.74114441416894, + "grad_norm": 2.313556671142578, + "learning_rate": 4.4625596761880496e-07, + "loss": 0.0345, + "step": 33302 + }, + { + "epoch": 90.74386920980926, + "grad_norm": 3.654481887817383, + "learning_rate": 4.459953180125931e-07, + "loss": 0.0701, + "step": 33303 + }, + { + "epoch": 90.7465940054496, + "grad_norm": 3.117694616317749, + "learning_rate": 4.457347428126635e-07, + "loss": 0.0298, + "step": 33304 + }, + { + "epoch": 90.74931880108991, + "grad_norm": 2.7887511253356934, + "learning_rate": 4.454742420210434e-07, + "loss": 0.0302, + "step": 33305 + }, + { + "epoch": 90.75204359673025, + "grad_norm": 1.46806001663208, + "learning_rate": 4.452138156397612e-07, + "loss": 0.0195, + "step": 33306 + }, + { + "epoch": 90.75476839237058, + "grad_norm": 2.515507459640503, + "learning_rate": 4.449534636708475e-07, + "loss": 0.1116, + "step": 33307 + }, + { + "epoch": 90.7574931880109, + "grad_norm": 2.274747848510742, + "learning_rate": 4.446931861163284e-07, + "loss": 0.0289, + "step": 33308 + }, + { + "epoch": 90.76021798365123, + "grad_norm": 1.96199631690979, + "learning_rate": 4.4443298297823124e-07, + "loss": 0.0757, + "step": 33309 + }, + { + "epoch": 90.76294277929155, + "grad_norm": 2.8164730072021484, + "learning_rate": 4.4417285425858213e-07, + "loss": 0.0958, + "step": 33310 + }, + { + "epoch": 90.76566757493188, + "grad_norm": 2.6038970947265625, + "learning_rate": 4.4391279995940727e-07, + "loss": 0.1446, + "step": 33311 + }, + { + "epoch": 90.7683923705722, + "grad_norm": 4.647005081176758, + "learning_rate": 4.436528200827328e-07, + "loss": 0.0769, + "step": 33312 + }, + { + "epoch": 90.77111716621253, + "grad_norm": 2.5276827812194824, + "learning_rate": 4.4339291463058266e-07, + "loss": 0.0724, + "step": 33313 + }, + { + "epoch": 90.77384196185287, + "grad_norm": 2.7569687366485596, + "learning_rate": 4.4313308360497855e-07, + "loss": 0.0411, + "step": 33314 + }, + { + "epoch": 90.77656675749319, + "grad_norm": 3.9350979328155518, + "learning_rate": 4.428733270079488e-07, + "loss": 0.0261, + "step": 33315 + }, + { + "epoch": 90.77929155313352, + "grad_norm": 3.995311737060547, + "learning_rate": 4.4261364484151416e-07, + "loss": 0.0485, + "step": 33316 + }, + { + "epoch": 90.78201634877384, + "grad_norm": 2.352081775665283, + "learning_rate": 4.423540371076962e-07, + "loss": 0.0359, + "step": 33317 + }, + { + "epoch": 90.78474114441417, + "grad_norm": 1.513340950012207, + "learning_rate": 4.420945038085156e-07, + "loss": 0.1367, + "step": 33318 + }, + { + "epoch": 90.7874659400545, + "grad_norm": 2.9075117111206055, + "learning_rate": 4.418350449459974e-07, + "loss": 0.0439, + "step": 33319 + }, + { + "epoch": 90.79019073569482, + "grad_norm": 2.7996304035186768, + "learning_rate": 4.4157566052215885e-07, + "loss": 0.0388, + "step": 33320 + }, + { + "epoch": 90.79291553133515, + "grad_norm": 2.642317533493042, + "learning_rate": 4.413163505390228e-07, + "loss": 0.0463, + "step": 33321 + }, + { + "epoch": 90.79564032697547, + "grad_norm": 2.271878957748413, + "learning_rate": 4.410571149986065e-07, + "loss": 0.0385, + "step": 33322 + }, + { + "epoch": 90.7983651226158, + "grad_norm": 3.982398271560669, + "learning_rate": 4.4079795390293057e-07, + "loss": 0.062, + "step": 33323 + }, + { + "epoch": 90.80108991825612, + "grad_norm": 2.5257749557495117, + "learning_rate": 4.405388672540123e-07, + "loss": 0.1699, + "step": 33324 + }, + { + "epoch": 90.80381471389646, + "grad_norm": 1.8141134977340698, + "learning_rate": 4.4027985505387005e-07, + "loss": 0.0563, + "step": 33325 + }, + { + "epoch": 90.80653950953679, + "grad_norm": 2.4545209407806396, + "learning_rate": 4.400209173045189e-07, + "loss": 0.061, + "step": 33326 + }, + { + "epoch": 90.80926430517711, + "grad_norm": 2.4928431510925293, + "learning_rate": 4.397620540079794e-07, + "loss": 0.1313, + "step": 33327 + }, + { + "epoch": 90.81198910081744, + "grad_norm": 2.2530672550201416, + "learning_rate": 4.395032651662645e-07, + "loss": 0.1197, + "step": 33328 + }, + { + "epoch": 90.81471389645776, + "grad_norm": 3.323392152786255, + "learning_rate": 4.3924455078139027e-07, + "loss": 0.0545, + "step": 33329 + }, + { + "epoch": 90.8174386920981, + "grad_norm": 3.538079261779785, + "learning_rate": 4.389859108553707e-07, + "loss": 0.043, + "step": 33330 + }, + { + "epoch": 90.82016348773843, + "grad_norm": 2.706392526626587, + "learning_rate": 4.38727345390223e-07, + "loss": 0.1092, + "step": 33331 + }, + { + "epoch": 90.82288828337875, + "grad_norm": 2.1860039234161377, + "learning_rate": 4.384688543879578e-07, + "loss": 0.0803, + "step": 33332 + }, + { + "epoch": 90.82561307901908, + "grad_norm": 2.5086474418640137, + "learning_rate": 4.382104378505903e-07, + "loss": 0.0513, + "step": 33333 + }, + { + "epoch": 90.8283378746594, + "grad_norm": 2.532987356185913, + "learning_rate": 4.3795209578013085e-07, + "loss": 0.0891, + "step": 33334 + }, + { + "epoch": 90.83106267029973, + "grad_norm": 3.6119742393493652, + "learning_rate": 4.3769382817859363e-07, + "loss": 0.1391, + "step": 33335 + }, + { + "epoch": 90.83378746594005, + "grad_norm": 2.609095335006714, + "learning_rate": 4.3743563504799027e-07, + "loss": 0.0496, + "step": 33336 + }, + { + "epoch": 90.83651226158038, + "grad_norm": 2.4013712406158447, + "learning_rate": 4.37177516390328e-07, + "loss": 0.0557, + "step": 33337 + }, + { + "epoch": 90.83923705722071, + "grad_norm": 2.670222043991089, + "learning_rate": 4.3691947220762087e-07, + "loss": 0.0429, + "step": 33338 + }, + { + "epoch": 90.84196185286103, + "grad_norm": 2.525219202041626, + "learning_rate": 4.366615025018761e-07, + "loss": 0.0419, + "step": 33339 + }, + { + "epoch": 90.84468664850137, + "grad_norm": 1.774667501449585, + "learning_rate": 4.364036072751043e-07, + "loss": 0.0353, + "step": 33340 + }, + { + "epoch": 90.84741144414168, + "grad_norm": 2.6277847290039062, + "learning_rate": 4.361457865293139e-07, + "loss": 0.089, + "step": 33341 + }, + { + "epoch": 90.85013623978202, + "grad_norm": 3.0051229000091553, + "learning_rate": 4.358880402665111e-07, + "loss": 0.0772, + "step": 33342 + }, + { + "epoch": 90.85286103542235, + "grad_norm": 2.5538885593414307, + "learning_rate": 4.3563036848870535e-07, + "loss": 0.0836, + "step": 33343 + }, + { + "epoch": 90.85558583106267, + "grad_norm": 2.340928077697754, + "learning_rate": 4.353727711979028e-07, + "loss": 0.0471, + "step": 33344 + }, + { + "epoch": 90.858310626703, + "grad_norm": 2.7762279510498047, + "learning_rate": 4.351152483961096e-07, + "loss": 0.0334, + "step": 33345 + }, + { + "epoch": 90.86103542234332, + "grad_norm": 3.309253215789795, + "learning_rate": 4.3485780008532987e-07, + "loss": 0.2737, + "step": 33346 + }, + { + "epoch": 90.86376021798365, + "grad_norm": 1.7336481809616089, + "learning_rate": 4.346004262675707e-07, + "loss": 0.0176, + "step": 33347 + }, + { + "epoch": 90.86648501362397, + "grad_norm": 3.786724805831909, + "learning_rate": 4.3434312694483504e-07, + "loss": 0.1904, + "step": 33348 + }, + { + "epoch": 90.8692098092643, + "grad_norm": 2.521250009536743, + "learning_rate": 4.3408590211912793e-07, + "loss": 0.0308, + "step": 33349 + }, + { + "epoch": 90.87193460490464, + "grad_norm": 4.147480010986328, + "learning_rate": 4.3382875179244997e-07, + "loss": 0.0684, + "step": 33350 + }, + { + "epoch": 90.87465940054496, + "grad_norm": 3.3927242755889893, + "learning_rate": 4.335716759668074e-07, + "loss": 0.0555, + "step": 33351 + }, + { + "epoch": 90.87738419618529, + "grad_norm": 3.3246638774871826, + "learning_rate": 4.3331467464420076e-07, + "loss": 0.0367, + "step": 33352 + }, + { + "epoch": 90.88010899182561, + "grad_norm": 3.043524742126465, + "learning_rate": 4.330577478266318e-07, + "loss": 0.0418, + "step": 33353 + }, + { + "epoch": 90.88283378746594, + "grad_norm": 2.6775705814361572, + "learning_rate": 4.3280089551609895e-07, + "loss": 0.0372, + "step": 33354 + }, + { + "epoch": 90.88555858310627, + "grad_norm": 2.337829351425171, + "learning_rate": 4.3254411771460616e-07, + "loss": 0.0257, + "step": 33355 + }, + { + "epoch": 90.88828337874659, + "grad_norm": 2.7748048305511475, + "learning_rate": 4.322874144241518e-07, + "loss": 0.0877, + "step": 33356 + }, + { + "epoch": 90.89100817438693, + "grad_norm": 2.3835325241088867, + "learning_rate": 4.320307856467365e-07, + "loss": 0.0485, + "step": 33357 + }, + { + "epoch": 90.89373297002724, + "grad_norm": 3.358006477355957, + "learning_rate": 4.317742313843565e-07, + "loss": 0.0338, + "step": 33358 + }, + { + "epoch": 90.89645776566758, + "grad_norm": 2.6560401916503906, + "learning_rate": 4.315177516390101e-07, + "loss": 0.0605, + "step": 33359 + }, + { + "epoch": 90.8991825613079, + "grad_norm": 1.7317368984222412, + "learning_rate": 4.312613464126958e-07, + "loss": 0.0275, + "step": 33360 + }, + { + "epoch": 90.90190735694823, + "grad_norm": 3.597325086593628, + "learning_rate": 4.310050157074108e-07, + "loss": 0.1089, + "step": 33361 + }, + { + "epoch": 90.90463215258856, + "grad_norm": 1.9957163333892822, + "learning_rate": 4.307487595251503e-07, + "loss": 0.0344, + "step": 33362 + }, + { + "epoch": 90.90735694822888, + "grad_norm": 2.671257734298706, + "learning_rate": 4.304925778679103e-07, + "loss": 0.029, + "step": 33363 + }, + { + "epoch": 90.91008174386921, + "grad_norm": 2.490180730819702, + "learning_rate": 4.3023647073768716e-07, + "loss": 0.0937, + "step": 33364 + }, + { + "epoch": 90.91280653950953, + "grad_norm": 3.191882848739624, + "learning_rate": 4.299804381364736e-07, + "loss": 0.0824, + "step": 33365 + }, + { + "epoch": 90.91553133514986, + "grad_norm": 2.27536678314209, + "learning_rate": 4.2972448006626366e-07, + "loss": 0.0944, + "step": 33366 + }, + { + "epoch": 90.9182561307902, + "grad_norm": 1.630289912223816, + "learning_rate": 4.294685965290535e-07, + "loss": 0.02, + "step": 33367 + }, + { + "epoch": 90.92098092643052, + "grad_norm": 2.409642219543457, + "learning_rate": 4.292127875268326e-07, + "loss": 0.054, + "step": 33368 + }, + { + "epoch": 90.92370572207085, + "grad_norm": 2.299753189086914, + "learning_rate": 4.2895705306159497e-07, + "loss": 0.0938, + "step": 33369 + }, + { + "epoch": 90.92643051771117, + "grad_norm": 2.03139066696167, + "learning_rate": 4.2870139313533013e-07, + "loss": 0.0332, + "step": 33370 + }, + { + "epoch": 90.9291553133515, + "grad_norm": 2.4000296592712402, + "learning_rate": 4.284458077500309e-07, + "loss": 0.0326, + "step": 33371 + }, + { + "epoch": 90.93188010899182, + "grad_norm": 2.0949079990386963, + "learning_rate": 4.2819029690768896e-07, + "loss": 0.0334, + "step": 33372 + }, + { + "epoch": 90.93460490463215, + "grad_norm": 1.8479863405227661, + "learning_rate": 4.27934860610294e-07, + "loss": 0.0391, + "step": 33373 + }, + { + "epoch": 90.93732970027249, + "grad_norm": 3.3907392024993896, + "learning_rate": 4.2767949885983316e-07, + "loss": 0.0548, + "step": 33374 + }, + { + "epoch": 90.9400544959128, + "grad_norm": 5.232072830200195, + "learning_rate": 4.27424211658295e-07, + "loss": 0.0527, + "step": 33375 + }, + { + "epoch": 90.94277929155314, + "grad_norm": 6.1928277015686035, + "learning_rate": 4.2716899900766994e-07, + "loss": 0.0623, + "step": 33376 + }, + { + "epoch": 90.94550408719346, + "grad_norm": 2.1101908683776855, + "learning_rate": 4.2691386090994545e-07, + "loss": 0.0787, + "step": 33377 + }, + { + "epoch": 90.94822888283379, + "grad_norm": 2.824894666671753, + "learning_rate": 4.266587973671077e-07, + "loss": 0.0559, + "step": 33378 + }, + { + "epoch": 90.95095367847412, + "grad_norm": 2.098055839538574, + "learning_rate": 4.264038083811417e-07, + "loss": 0.0314, + "step": 33379 + }, + { + "epoch": 90.95367847411444, + "grad_norm": 1.8382599353790283, + "learning_rate": 4.261488939540348e-07, + "loss": 0.0219, + "step": 33380 + }, + { + "epoch": 90.95640326975477, + "grad_norm": 1.9304697513580322, + "learning_rate": 4.2589405408777426e-07, + "loss": 0.041, + "step": 33381 + }, + { + "epoch": 90.95912806539509, + "grad_norm": 1.5916671752929688, + "learning_rate": 4.256392887843408e-07, + "loss": 0.0181, + "step": 33382 + }, + { + "epoch": 90.96185286103542, + "grad_norm": 3.523991584777832, + "learning_rate": 4.2538459804572053e-07, + "loss": 0.0605, + "step": 33383 + }, + { + "epoch": 90.96457765667574, + "grad_norm": 2.8593709468841553, + "learning_rate": 4.251299818738974e-07, + "loss": 0.0684, + "step": 33384 + }, + { + "epoch": 90.96730245231608, + "grad_norm": 1.5864038467407227, + "learning_rate": 4.2487544027085435e-07, + "loss": 0.021, + "step": 33385 + }, + { + "epoch": 90.97002724795641, + "grad_norm": 2.613136053085327, + "learning_rate": 4.246209732385709e-07, + "loss": 0.0299, + "step": 33386 + }, + { + "epoch": 90.97275204359673, + "grad_norm": 2.5730583667755127, + "learning_rate": 4.2436658077903316e-07, + "loss": 0.0347, + "step": 33387 + }, + { + "epoch": 90.97547683923706, + "grad_norm": 2.8248631954193115, + "learning_rate": 4.2411226289421846e-07, + "loss": 0.0812, + "step": 33388 + }, + { + "epoch": 90.97820163487738, + "grad_norm": 1.930606484413147, + "learning_rate": 4.2385801958611196e-07, + "loss": 0.0202, + "step": 33389 + }, + { + "epoch": 90.98092643051771, + "grad_norm": 2.477756977081299, + "learning_rate": 4.2360385085668976e-07, + "loss": 0.083, + "step": 33390 + }, + { + "epoch": 90.98365122615803, + "grad_norm": 2.007246494293213, + "learning_rate": 4.2334975670793145e-07, + "loss": 0.093, + "step": 33391 + }, + { + "epoch": 90.98637602179836, + "grad_norm": 2.4395124912261963, + "learning_rate": 4.2309573714181763e-07, + "loss": 0.0392, + "step": 33392 + }, + { + "epoch": 90.9891008174387, + "grad_norm": 1.9157994985580444, + "learning_rate": 4.2284179216032675e-07, + "loss": 0.0248, + "step": 33393 + }, + { + "epoch": 90.99182561307902, + "grad_norm": 2.822202444076538, + "learning_rate": 4.2258792176543604e-07, + "loss": 0.0293, + "step": 33394 + }, + { + "epoch": 90.99455040871935, + "grad_norm": 2.7082839012145996, + "learning_rate": 4.223341259591207e-07, + "loss": 0.1149, + "step": 33395 + }, + { + "epoch": 90.99727520435967, + "grad_norm": 1.8892465829849243, + "learning_rate": 4.220804047433602e-07, + "loss": 0.0301, + "step": 33396 + }, + { + "epoch": 91.0, + "grad_norm": 2.780186653137207, + "learning_rate": 4.218267581201296e-07, + "loss": 0.0568, + "step": 33397 + }, + { + "epoch": 91.00272479564033, + "grad_norm": 1.4437553882598877, + "learning_rate": 4.2157318609140407e-07, + "loss": 0.0134, + "step": 33398 + }, + { + "epoch": 91.00544959128065, + "grad_norm": 3.407665491104126, + "learning_rate": 4.213196886591564e-07, + "loss": 0.0875, + "step": 33399 + }, + { + "epoch": 91.00817438692098, + "grad_norm": 2.379626512527466, + "learning_rate": 4.2106626582536394e-07, + "loss": 0.0695, + "step": 33400 + }, + { + "epoch": 91.0108991825613, + "grad_norm": 2.8182828426361084, + "learning_rate": 4.208129175919995e-07, + "loss": 0.0438, + "step": 33401 + }, + { + "epoch": 91.01362397820164, + "grad_norm": 3.4735851287841797, + "learning_rate": 4.205596439610349e-07, + "loss": 0.0233, + "step": 33402 + }, + { + "epoch": 91.01634877384195, + "grad_norm": 2.151665687561035, + "learning_rate": 4.2030644493444294e-07, + "loss": 0.0711, + "step": 33403 + }, + { + "epoch": 91.01907356948229, + "grad_norm": 2.8269784450531006, + "learning_rate": 4.200533205141977e-07, + "loss": 0.0331, + "step": 33404 + }, + { + "epoch": 91.02179836512262, + "grad_norm": 2.588975191116333, + "learning_rate": 4.1980027070226857e-07, + "loss": 0.1352, + "step": 33405 + }, + { + "epoch": 91.02452316076294, + "grad_norm": 2.4744315147399902, + "learning_rate": 4.195472955006252e-07, + "loss": 0.1165, + "step": 33406 + }, + { + "epoch": 91.02724795640327, + "grad_norm": 3.606994867324829, + "learning_rate": 4.1929439491123936e-07, + "loss": 0.0979, + "step": 33407 + }, + { + "epoch": 91.02997275204359, + "grad_norm": 2.223158359527588, + "learning_rate": 4.190415689360816e-07, + "loss": 0.0704, + "step": 33408 + }, + { + "epoch": 91.03269754768392, + "grad_norm": 2.95735502243042, + "learning_rate": 4.187888175771193e-07, + "loss": 0.1644, + "step": 33409 + }, + { + "epoch": 91.03542234332426, + "grad_norm": 2.433638095855713, + "learning_rate": 4.1853614083632197e-07, + "loss": 0.144, + "step": 33410 + }, + { + "epoch": 91.03814713896458, + "grad_norm": 2.4552266597747803, + "learning_rate": 4.1828353871565473e-07, + "loss": 0.0506, + "step": 33411 + }, + { + "epoch": 91.04087193460491, + "grad_norm": 3.9573609828948975, + "learning_rate": 4.180310112170882e-07, + "loss": 0.1673, + "step": 33412 + }, + { + "epoch": 91.04359673024523, + "grad_norm": 3.0006465911865234, + "learning_rate": 4.177785583425886e-07, + "loss": 0.0325, + "step": 33413 + }, + { + "epoch": 91.04632152588556, + "grad_norm": 2.318074941635132, + "learning_rate": 4.1752618009412105e-07, + "loss": 0.1645, + "step": 33414 + }, + { + "epoch": 91.04904632152588, + "grad_norm": 3.8660340309143066, + "learning_rate": 4.1727387647364945e-07, + "loss": 0.0506, + "step": 33415 + }, + { + "epoch": 91.05177111716621, + "grad_norm": 2.045443296432495, + "learning_rate": 4.1702164748314236e-07, + "loss": 0.0262, + "step": 33416 + }, + { + "epoch": 91.05449591280654, + "grad_norm": 2.0326268672943115, + "learning_rate": 4.167694931245614e-07, + "loss": 0.0406, + "step": 33417 + }, + { + "epoch": 91.05722070844686, + "grad_norm": 2.635942220687866, + "learning_rate": 4.165174133998717e-07, + "loss": 0.0441, + "step": 33418 + }, + { + "epoch": 91.0599455040872, + "grad_norm": 2.3526809215545654, + "learning_rate": 4.1626540831103513e-07, + "loss": 0.1848, + "step": 33419 + }, + { + "epoch": 91.06267029972751, + "grad_norm": 2.0343103408813477, + "learning_rate": 4.1601347786001557e-07, + "loss": 0.0459, + "step": 33420 + }, + { + "epoch": 91.06539509536785, + "grad_norm": 2.195220947265625, + "learning_rate": 4.1576162204877477e-07, + "loss": 0.0446, + "step": 33421 + }, + { + "epoch": 91.06811989100818, + "grad_norm": 2.0926713943481445, + "learning_rate": 4.155098408792735e-07, + "loss": 0.0235, + "step": 33422 + }, + { + "epoch": 91.0708446866485, + "grad_norm": 2.789863109588623, + "learning_rate": 4.152581343534734e-07, + "loss": 0.0288, + "step": 33423 + }, + { + "epoch": 91.07356948228883, + "grad_norm": 3.174238920211792, + "learning_rate": 4.1500650247333294e-07, + "loss": 0.131, + "step": 33424 + }, + { + "epoch": 91.07629427792915, + "grad_norm": 2.6352181434631348, + "learning_rate": 4.1475494524081504e-07, + "loss": 0.1396, + "step": 33425 + }, + { + "epoch": 91.07901907356948, + "grad_norm": 2.5747056007385254, + "learning_rate": 4.14503462657877e-07, + "loss": 0.0291, + "step": 33426 + }, + { + "epoch": 91.0817438692098, + "grad_norm": 1.8077361583709717, + "learning_rate": 4.142520547264772e-07, + "loss": 0.0832, + "step": 33427 + }, + { + "epoch": 91.08446866485014, + "grad_norm": 5.838677406311035, + "learning_rate": 4.140007214485742e-07, + "loss": 0.0286, + "step": 33428 + }, + { + "epoch": 91.08719346049047, + "grad_norm": 2.1196765899658203, + "learning_rate": 4.1374946282612517e-07, + "loss": 0.0281, + "step": 33429 + }, + { + "epoch": 91.08991825613079, + "grad_norm": 2.8270084857940674, + "learning_rate": 4.134982788610875e-07, + "loss": 0.1324, + "step": 33430 + }, + { + "epoch": 91.09264305177112, + "grad_norm": 2.859435796737671, + "learning_rate": 4.132471695554141e-07, + "loss": 0.0835, + "step": 33431 + }, + { + "epoch": 91.09536784741144, + "grad_norm": 1.551326036453247, + "learning_rate": 4.1299613491106563e-07, + "loss": 0.057, + "step": 33432 + }, + { + "epoch": 91.09809264305177, + "grad_norm": 2.9040513038635254, + "learning_rate": 4.127451749299938e-07, + "loss": 0.1105, + "step": 33433 + }, + { + "epoch": 91.1008174386921, + "grad_norm": 3.816948175430298, + "learning_rate": 4.1249428961415485e-07, + "loss": 0.0303, + "step": 33434 + }, + { + "epoch": 91.10354223433242, + "grad_norm": 2.374884605407715, + "learning_rate": 4.122434789655005e-07, + "loss": 0.0507, + "step": 33435 + }, + { + "epoch": 91.10626702997276, + "grad_norm": 2.461409330368042, + "learning_rate": 4.11992742985986e-07, + "loss": 0.1273, + "step": 33436 + }, + { + "epoch": 91.10899182561307, + "grad_norm": 2.029978036880493, + "learning_rate": 4.1174208167756414e-07, + "loss": 0.0329, + "step": 33437 + }, + { + "epoch": 91.11171662125341, + "grad_norm": 2.182032823562622, + "learning_rate": 4.1149149504218553e-07, + "loss": 0.0626, + "step": 33438 + }, + { + "epoch": 91.11444141689373, + "grad_norm": 2.0493831634521484, + "learning_rate": 4.1124098308180204e-07, + "loss": 0.0948, + "step": 33439 + }, + { + "epoch": 91.11716621253406, + "grad_norm": 5.559768199920654, + "learning_rate": 4.109905457983643e-07, + "loss": 0.0607, + "step": 33440 + }, + { + "epoch": 91.11989100817439, + "grad_norm": 3.1644163131713867, + "learning_rate": 4.1074018319382513e-07, + "loss": 0.0151, + "step": 33441 + }, + { + "epoch": 91.12261580381471, + "grad_norm": 2.7557992935180664, + "learning_rate": 4.1048989527013306e-07, + "loss": 0.0219, + "step": 33442 + }, + { + "epoch": 91.12534059945504, + "grad_norm": 2.05183744430542, + "learning_rate": 4.102396820292376e-07, + "loss": 0.0322, + "step": 33443 + }, + { + "epoch": 91.12806539509536, + "grad_norm": 2.707655429840088, + "learning_rate": 4.0998954347308496e-07, + "loss": 0.0763, + "step": 33444 + }, + { + "epoch": 91.1307901907357, + "grad_norm": 4.005188941955566, + "learning_rate": 4.0973947960362583e-07, + "loss": 0.1092, + "step": 33445 + }, + { + "epoch": 91.13351498637603, + "grad_norm": 2.3927321434020996, + "learning_rate": 4.094894904228075e-07, + "loss": 0.0331, + "step": 33446 + }, + { + "epoch": 91.13623978201635, + "grad_norm": 2.6593899726867676, + "learning_rate": 4.0923957593257626e-07, + "loss": 0.1845, + "step": 33447 + }, + { + "epoch": 91.13896457765668, + "grad_norm": 5.125622749328613, + "learning_rate": 4.0898973613487714e-07, + "loss": 0.0479, + "step": 33448 + }, + { + "epoch": 91.141689373297, + "grad_norm": 2.3418519496917725, + "learning_rate": 4.0873997103165976e-07, + "loss": 0.0268, + "step": 33449 + }, + { + "epoch": 91.14441416893733, + "grad_norm": 2.0520389080047607, + "learning_rate": 4.084902806248647e-07, + "loss": 0.056, + "step": 33450 + }, + { + "epoch": 91.14713896457765, + "grad_norm": 1.4824223518371582, + "learning_rate": 4.0824066491643944e-07, + "loss": 0.0185, + "step": 33451 + }, + { + "epoch": 91.14986376021798, + "grad_norm": 1.5708297491073608, + "learning_rate": 4.079911239083267e-07, + "loss": 0.0176, + "step": 33452 + }, + { + "epoch": 91.15258855585832, + "grad_norm": 2.229505777359009, + "learning_rate": 4.0774165760247177e-07, + "loss": 0.0347, + "step": 33453 + }, + { + "epoch": 91.15531335149863, + "grad_norm": 2.8612000942230225, + "learning_rate": 4.0749226600081513e-07, + "loss": 0.1015, + "step": 33454 + }, + { + "epoch": 91.15803814713897, + "grad_norm": 6.5360002517700195, + "learning_rate": 4.0724294910529873e-07, + "loss": 0.0984, + "step": 33455 + }, + { + "epoch": 91.16076294277929, + "grad_norm": 2.2636289596557617, + "learning_rate": 4.069937069178675e-07, + "loss": 0.0405, + "step": 33456 + }, + { + "epoch": 91.16348773841962, + "grad_norm": 2.311821699142456, + "learning_rate": 4.06744539440459e-07, + "loss": 0.0265, + "step": 33457 + }, + { + "epoch": 91.16621253405995, + "grad_norm": 2.3678250312805176, + "learning_rate": 4.0649544667501595e-07, + "loss": 0.0243, + "step": 33458 + }, + { + "epoch": 91.16893732970027, + "grad_norm": 2.6175408363342285, + "learning_rate": 4.0624642862347796e-07, + "loss": 0.1141, + "step": 33459 + }, + { + "epoch": 91.1716621253406, + "grad_norm": 2.510948896408081, + "learning_rate": 4.059974852877824e-07, + "loss": 0.0226, + "step": 33460 + }, + { + "epoch": 91.17438692098092, + "grad_norm": 5.691770553588867, + "learning_rate": 4.057486166698721e-07, + "loss": 0.0702, + "step": 33461 + }, + { + "epoch": 91.17711171662125, + "grad_norm": 2.44684100151062, + "learning_rate": 4.054998227716822e-07, + "loss": 0.0304, + "step": 33462 + }, + { + "epoch": 91.17983651226157, + "grad_norm": 5.354679584503174, + "learning_rate": 4.0525110359515005e-07, + "loss": 0.0891, + "step": 33463 + }, + { + "epoch": 91.1825613079019, + "grad_norm": 2.2572429180145264, + "learning_rate": 4.0500245914221303e-07, + "loss": 0.0472, + "step": 33464 + }, + { + "epoch": 91.18528610354224, + "grad_norm": 2.445316791534424, + "learning_rate": 4.0475388941480955e-07, + "loss": 0.099, + "step": 33465 + }, + { + "epoch": 91.18801089918256, + "grad_norm": 2.737708568572998, + "learning_rate": 4.045053944148736e-07, + "loss": 0.1087, + "step": 33466 + }, + { + "epoch": 91.19073569482289, + "grad_norm": 7.153319835662842, + "learning_rate": 4.0425697414434027e-07, + "loss": 0.0616, + "step": 33467 + }, + { + "epoch": 91.19346049046321, + "grad_norm": 3.299309730529785, + "learning_rate": 4.0400862860514366e-07, + "loss": 0.0564, + "step": 33468 + }, + { + "epoch": 91.19618528610354, + "grad_norm": 1.737561583518982, + "learning_rate": 4.037603577992211e-07, + "loss": 0.0378, + "step": 33469 + }, + { + "epoch": 91.19891008174388, + "grad_norm": 3.6247615814208984, + "learning_rate": 4.035121617285032e-07, + "loss": 0.1782, + "step": 33470 + }, + { + "epoch": 91.2016348773842, + "grad_norm": 1.6658930778503418, + "learning_rate": 4.0326404039492283e-07, + "loss": 0.0205, + "step": 33471 + }, + { + "epoch": 91.20435967302453, + "grad_norm": 2.3101959228515625, + "learning_rate": 4.030159938004141e-07, + "loss": 0.052, + "step": 33472 + }, + { + "epoch": 91.20708446866485, + "grad_norm": 3.1363327503204346, + "learning_rate": 4.027680219469088e-07, + "loss": 0.0296, + "step": 33473 + }, + { + "epoch": 91.20980926430518, + "grad_norm": 2.6599698066711426, + "learning_rate": 4.025201248363353e-07, + "loss": 0.0759, + "step": 33474 + }, + { + "epoch": 91.2125340599455, + "grad_norm": 3.1961421966552734, + "learning_rate": 4.0227230247062765e-07, + "loss": 0.0918, + "step": 33475 + }, + { + "epoch": 91.21525885558583, + "grad_norm": 2.746758222579956, + "learning_rate": 4.020245548517132e-07, + "loss": 0.0485, + "step": 33476 + }, + { + "epoch": 91.21798365122616, + "grad_norm": 1.916736125946045, + "learning_rate": 4.017768819815238e-07, + "loss": 0.0269, + "step": 33477 + }, + { + "epoch": 91.22070844686648, + "grad_norm": 2.2074666023254395, + "learning_rate": 4.0152928386198775e-07, + "loss": 0.0681, + "step": 33478 + }, + { + "epoch": 91.22343324250681, + "grad_norm": 2.259948968887329, + "learning_rate": 4.0128176049503145e-07, + "loss": 0.0316, + "step": 33479 + }, + { + "epoch": 91.22615803814713, + "grad_norm": 2.186495780944824, + "learning_rate": 4.0103431188258324e-07, + "loss": 0.0496, + "step": 33480 + }, + { + "epoch": 91.22888283378747, + "grad_norm": 2.4739370346069336, + "learning_rate": 4.0078693802657273e-07, + "loss": 0.0324, + "step": 33481 + }, + { + "epoch": 91.2316076294278, + "grad_norm": 2.4121856689453125, + "learning_rate": 4.00539638928924e-07, + "loss": 0.0351, + "step": 33482 + }, + { + "epoch": 91.23433242506812, + "grad_norm": 1.9716999530792236, + "learning_rate": 4.002924145915632e-07, + "loss": 0.0273, + "step": 33483 + }, + { + "epoch": 91.23705722070845, + "grad_norm": 8.593786239624023, + "learning_rate": 4.000452650164155e-07, + "loss": 0.0512, + "step": 33484 + }, + { + "epoch": 91.23978201634877, + "grad_norm": 2.205383777618408, + "learning_rate": 3.997981902054071e-07, + "loss": 0.0648, + "step": 33485 + }, + { + "epoch": 91.2425068119891, + "grad_norm": 2.3848838806152344, + "learning_rate": 3.9955119016046206e-07, + "loss": 0.0469, + "step": 33486 + }, + { + "epoch": 91.24523160762942, + "grad_norm": 2.675579071044922, + "learning_rate": 3.9930426488350215e-07, + "loss": 0.0393, + "step": 33487 + }, + { + "epoch": 91.24795640326975, + "grad_norm": 2.5658624172210693, + "learning_rate": 3.990574143764514e-07, + "loss": 0.061, + "step": 33488 + }, + { + "epoch": 91.25068119891009, + "grad_norm": 4.218019485473633, + "learning_rate": 3.988106386412338e-07, + "loss": 0.1922, + "step": 33489 + }, + { + "epoch": 91.2534059945504, + "grad_norm": 4.758276462554932, + "learning_rate": 3.9856393767976896e-07, + "loss": 0.0652, + "step": 33490 + }, + { + "epoch": 91.25613079019074, + "grad_norm": 2.8237547874450684, + "learning_rate": 3.983173114939798e-07, + "loss": 0.147, + "step": 33491 + }, + { + "epoch": 91.25885558583106, + "grad_norm": 3.6301066875457764, + "learning_rate": 3.980707600857847e-07, + "loss": 0.0747, + "step": 33492 + }, + { + "epoch": 91.26158038147139, + "grad_norm": 3.5691137313842773, + "learning_rate": 3.9782428345710665e-07, + "loss": 0.0587, + "step": 33493 + }, + { + "epoch": 91.26430517711172, + "grad_norm": 1.843849778175354, + "learning_rate": 3.9757788160986524e-07, + "loss": 0.0175, + "step": 33494 + }, + { + "epoch": 91.26702997275204, + "grad_norm": 2.163905143737793, + "learning_rate": 3.9733155454597774e-07, + "loss": 0.0555, + "step": 33495 + }, + { + "epoch": 91.26975476839237, + "grad_norm": 2.266207456588745, + "learning_rate": 3.970853022673615e-07, + "loss": 0.0617, + "step": 33496 + }, + { + "epoch": 91.2724795640327, + "grad_norm": 2.2678987979888916, + "learning_rate": 3.9683912477593734e-07, + "loss": 0.1042, + "step": 33497 + }, + { + "epoch": 91.27520435967303, + "grad_norm": 3.014303684234619, + "learning_rate": 3.965930220736203e-07, + "loss": 0.099, + "step": 33498 + }, + { + "epoch": 91.27792915531334, + "grad_norm": 2.7640128135681152, + "learning_rate": 3.963469941623288e-07, + "loss": 0.0359, + "step": 33499 + }, + { + "epoch": 91.28065395095368, + "grad_norm": 3.1587300300598145, + "learning_rate": 3.9610104104397586e-07, + "loss": 0.0582, + "step": 33500 + }, + { + "epoch": 91.28337874659401, + "grad_norm": 2.873241901397705, + "learning_rate": 3.9585516272047984e-07, + "loss": 0.051, + "step": 33501 + }, + { + "epoch": 91.28610354223433, + "grad_norm": 1.3458555936813354, + "learning_rate": 3.9560935919375597e-07, + "loss": 0.0152, + "step": 33502 + }, + { + "epoch": 91.28882833787466, + "grad_norm": 1.8848713636398315, + "learning_rate": 3.95363630465716e-07, + "loss": 0.0282, + "step": 33503 + }, + { + "epoch": 91.29155313351498, + "grad_norm": 3.7567384243011475, + "learning_rate": 3.95117976538274e-07, + "loss": 0.0269, + "step": 33504 + }, + { + "epoch": 91.29427792915531, + "grad_norm": 1.807776689529419, + "learning_rate": 3.9487239741334615e-07, + "loss": 0.0602, + "step": 33505 + }, + { + "epoch": 91.29700272479565, + "grad_norm": 2.626446485519409, + "learning_rate": 3.946268930928421e-07, + "loss": 0.035, + "step": 33506 + }, + { + "epoch": 91.29972752043597, + "grad_norm": 2.3312532901763916, + "learning_rate": 3.9438146357867467e-07, + "loss": 0.0379, + "step": 33507 + }, + { + "epoch": 91.3024523160763, + "grad_norm": 2.165179967880249, + "learning_rate": 3.9413610887275466e-07, + "loss": 0.0512, + "step": 33508 + }, + { + "epoch": 91.30517711171662, + "grad_norm": 6.76454496383667, + "learning_rate": 3.938908289769927e-07, + "loss": 0.0985, + "step": 33509 + }, + { + "epoch": 91.30790190735695, + "grad_norm": 1.9388389587402344, + "learning_rate": 3.9364562389330174e-07, + "loss": 0.0325, + "step": 33510 + }, + { + "epoch": 91.31062670299727, + "grad_norm": 3.389204978942871, + "learning_rate": 3.934004936235891e-07, + "loss": 0.1059, + "step": 33511 + }, + { + "epoch": 91.3133514986376, + "grad_norm": 3.885791540145874, + "learning_rate": 3.9315543816976444e-07, + "loss": 0.1031, + "step": 33512 + }, + { + "epoch": 91.31607629427793, + "grad_norm": 5.326609134674072, + "learning_rate": 3.92910457533735e-07, + "loss": 0.0411, + "step": 33513 + }, + { + "epoch": 91.31880108991825, + "grad_norm": 3.149608850479126, + "learning_rate": 3.926655517174105e-07, + "loss": 0.0509, + "step": 33514 + }, + { + "epoch": 91.32152588555859, + "grad_norm": 2.390986919403076, + "learning_rate": 3.924207207226971e-07, + "loss": 0.0467, + "step": 33515 + }, + { + "epoch": 91.3242506811989, + "grad_norm": 4.05216121673584, + "learning_rate": 3.9217596455150107e-07, + "loss": 0.0544, + "step": 33516 + }, + { + "epoch": 91.32697547683924, + "grad_norm": 2.684932231903076, + "learning_rate": 3.9193128320573095e-07, + "loss": 0.036, + "step": 33517 + }, + { + "epoch": 91.32970027247957, + "grad_norm": 3.469726085662842, + "learning_rate": 3.916866766872907e-07, + "loss": 0.0539, + "step": 33518 + }, + { + "epoch": 91.33242506811989, + "grad_norm": 4.65806245803833, + "learning_rate": 3.914421449980854e-07, + "loss": 0.1012, + "step": 33519 + }, + { + "epoch": 91.33514986376022, + "grad_norm": 1.6177089214324951, + "learning_rate": 3.9119768814001813e-07, + "loss": 0.0148, + "step": 33520 + }, + { + "epoch": 91.33787465940054, + "grad_norm": 2.87542462348938, + "learning_rate": 3.9095330611499506e-07, + "loss": 0.0337, + "step": 33521 + }, + { + "epoch": 91.34059945504087, + "grad_norm": 2.579695701599121, + "learning_rate": 3.90708998924918e-07, + "loss": 0.0322, + "step": 33522 + }, + { + "epoch": 91.34332425068119, + "grad_norm": 1.7988877296447754, + "learning_rate": 3.9046476657168985e-07, + "loss": 0.018, + "step": 33523 + }, + { + "epoch": 91.34604904632153, + "grad_norm": 4.781064510345459, + "learning_rate": 3.9022060905721246e-07, + "loss": 0.1467, + "step": 33524 + }, + { + "epoch": 91.34877384196186, + "grad_norm": 3.165649652481079, + "learning_rate": 3.8997652638338876e-07, + "loss": 0.0347, + "step": 33525 + }, + { + "epoch": 91.35149863760218, + "grad_norm": 2.6371865272521973, + "learning_rate": 3.8973251855211726e-07, + "loss": 0.0762, + "step": 33526 + }, + { + "epoch": 91.35422343324251, + "grad_norm": 1.6691075563430786, + "learning_rate": 3.8948858556530077e-07, + "loss": 0.1173, + "step": 33527 + }, + { + "epoch": 91.35694822888283, + "grad_norm": 2.2323529720306396, + "learning_rate": 3.8924472742483785e-07, + "loss": 0.0237, + "step": 33528 + }, + { + "epoch": 91.35967302452316, + "grad_norm": 2.1835381984710693, + "learning_rate": 3.890009441326259e-07, + "loss": 0.1515, + "step": 33529 + }, + { + "epoch": 91.3623978201635, + "grad_norm": 1.8728735446929932, + "learning_rate": 3.887572356905678e-07, + "loss": 0.096, + "step": 33530 + }, + { + "epoch": 91.36512261580381, + "grad_norm": 2.2562313079833984, + "learning_rate": 3.8851360210055755e-07, + "loss": 0.0289, + "step": 33531 + }, + { + "epoch": 91.36784741144415, + "grad_norm": 2.5280210971832275, + "learning_rate": 3.882700433644948e-07, + "loss": 0.0519, + "step": 33532 + }, + { + "epoch": 91.37057220708446, + "grad_norm": 2.778721809387207, + "learning_rate": 3.880265594842747e-07, + "loss": 0.0577, + "step": 33533 + }, + { + "epoch": 91.3732970027248, + "grad_norm": 3.2019004821777344, + "learning_rate": 3.877831504617946e-07, + "loss": 0.0572, + "step": 33534 + }, + { + "epoch": 91.37602179836512, + "grad_norm": 2.290388584136963, + "learning_rate": 3.8753981629895076e-07, + "loss": 0.0806, + "step": 33535 + }, + { + "epoch": 91.37874659400545, + "grad_norm": 8.816770553588867, + "learning_rate": 3.8729655699763613e-07, + "loss": 0.0885, + "step": 33536 + }, + { + "epoch": 91.38147138964578, + "grad_norm": 3.0813393592834473, + "learning_rate": 3.8705337255974697e-07, + "loss": 0.0245, + "step": 33537 + }, + { + "epoch": 91.3841961852861, + "grad_norm": 2.967586040496826, + "learning_rate": 3.8681026298717836e-07, + "loss": 0.0285, + "step": 33538 + }, + { + "epoch": 91.38692098092643, + "grad_norm": 2.6449077129364014, + "learning_rate": 3.8656722828182115e-07, + "loss": 0.0307, + "step": 33539 + }, + { + "epoch": 91.38964577656675, + "grad_norm": 2.673945426940918, + "learning_rate": 3.86324268445567e-07, + "loss": 0.0283, + "step": 33540 + }, + { + "epoch": 91.39237057220708, + "grad_norm": 3.387751579284668, + "learning_rate": 3.860813834803123e-07, + "loss": 0.0396, + "step": 33541 + }, + { + "epoch": 91.39509536784742, + "grad_norm": 2.536093235015869, + "learning_rate": 3.858385733879455e-07, + "loss": 0.0341, + "step": 33542 + }, + { + "epoch": 91.39782016348774, + "grad_norm": 2.1067984104156494, + "learning_rate": 3.855958381703584e-07, + "loss": 0.0208, + "step": 33543 + }, + { + "epoch": 91.40054495912807, + "grad_norm": 2.023822069168091, + "learning_rate": 3.853531778294417e-07, + "loss": 0.024, + "step": 33544 + }, + { + "epoch": 91.40326975476839, + "grad_norm": 14.900796890258789, + "learning_rate": 3.851105923670839e-07, + "loss": 0.024, + "step": 33545 + }, + { + "epoch": 91.40599455040872, + "grad_norm": 1.3199199438095093, + "learning_rate": 3.848680817851769e-07, + "loss": 0.0131, + "step": 33546 + }, + { + "epoch": 91.40871934604904, + "grad_norm": 2.8630051612854004, + "learning_rate": 3.8462564608560793e-07, + "loss": 0.0668, + "step": 33547 + }, + { + "epoch": 91.41144414168937, + "grad_norm": 2.70255970954895, + "learning_rate": 3.8438328527026445e-07, + "loss": 0.1183, + "step": 33548 + }, + { + "epoch": 91.4141689373297, + "grad_norm": 1.9144985675811768, + "learning_rate": 3.8414099934103386e-07, + "loss": 0.0836, + "step": 33549 + }, + { + "epoch": 91.41689373297002, + "grad_norm": 1.8344573974609375, + "learning_rate": 3.8389878829980465e-07, + "loss": 0.028, + "step": 33550 + }, + { + "epoch": 91.41961852861036, + "grad_norm": 2.180424690246582, + "learning_rate": 3.836566521484619e-07, + "loss": 0.0435, + "step": 33551 + }, + { + "epoch": 91.42234332425068, + "grad_norm": 2.846090793609619, + "learning_rate": 3.83414590888892e-07, + "loss": 0.0677, + "step": 33552 + }, + { + "epoch": 91.42506811989101, + "grad_norm": 3.0681021213531494, + "learning_rate": 3.8317260452297776e-07, + "loss": 0.051, + "step": 33553 + }, + { + "epoch": 91.42779291553134, + "grad_norm": 2.614234447479248, + "learning_rate": 3.8293069305260776e-07, + "loss": 0.0422, + "step": 33554 + }, + { + "epoch": 91.43051771117166, + "grad_norm": 2.4826254844665527, + "learning_rate": 3.826888564796638e-07, + "loss": 0.1028, + "step": 33555 + }, + { + "epoch": 91.433242506812, + "grad_norm": 2.5016932487487793, + "learning_rate": 3.824470948060299e-07, + "loss": 0.031, + "step": 33556 + }, + { + "epoch": 91.43596730245231, + "grad_norm": 1.9077481031417847, + "learning_rate": 3.8220540803358687e-07, + "loss": 0.0524, + "step": 33557 + }, + { + "epoch": 91.43869209809264, + "grad_norm": 2.917414426803589, + "learning_rate": 3.8196379616421975e-07, + "loss": 0.1687, + "step": 33558 + }, + { + "epoch": 91.44141689373296, + "grad_norm": 2.3211934566497803, + "learning_rate": 3.817222591998093e-07, + "loss": 0.0548, + "step": 33559 + }, + { + "epoch": 91.4441416893733, + "grad_norm": 1.7042837142944336, + "learning_rate": 3.8148079714223407e-07, + "loss": 0.018, + "step": 33560 + }, + { + "epoch": 91.44686648501363, + "grad_norm": 3.297069549560547, + "learning_rate": 3.812394099933781e-07, + "loss": 0.0708, + "step": 33561 + }, + { + "epoch": 91.44959128065395, + "grad_norm": 2.1418566703796387, + "learning_rate": 3.809980977551209e-07, + "loss": 0.041, + "step": 33562 + }, + { + "epoch": 91.45231607629428, + "grad_norm": 1.7914178371429443, + "learning_rate": 3.80756860429341e-07, + "loss": 0.0184, + "step": 33563 + }, + { + "epoch": 91.4550408719346, + "grad_norm": 2.666574239730835, + "learning_rate": 3.80515698017917e-07, + "loss": 0.168, + "step": 33564 + }, + { + "epoch": 91.45776566757493, + "grad_norm": 2.6954071521759033, + "learning_rate": 3.802746105227251e-07, + "loss": 0.0319, + "step": 33565 + }, + { + "epoch": 91.46049046321527, + "grad_norm": 2.6725752353668213, + "learning_rate": 3.800335979456471e-07, + "loss": 0.0334, + "step": 33566 + }, + { + "epoch": 91.46321525885558, + "grad_norm": 2.1421608924865723, + "learning_rate": 3.797926602885582e-07, + "loss": 0.0235, + "step": 33567 + }, + { + "epoch": 91.46594005449592, + "grad_norm": 2.6930532455444336, + "learning_rate": 3.795517975533336e-07, + "loss": 0.0431, + "step": 33568 + }, + { + "epoch": 91.46866485013624, + "grad_norm": 1.8473962545394897, + "learning_rate": 3.7931100974184843e-07, + "loss": 0.0312, + "step": 33569 + }, + { + "epoch": 91.47138964577657, + "grad_norm": 2.257495641708374, + "learning_rate": 3.790702968559812e-07, + "loss": 0.0495, + "step": 33570 + }, + { + "epoch": 91.47411444141689, + "grad_norm": 5.894565105438232, + "learning_rate": 3.788296588976048e-07, + "loss": 0.1056, + "step": 33571 + }, + { + "epoch": 91.47683923705722, + "grad_norm": 1.855755090713501, + "learning_rate": 3.785890958685945e-07, + "loss": 0.024, + "step": 33572 + }, + { + "epoch": 91.47956403269755, + "grad_norm": 1.4998773336410522, + "learning_rate": 3.783486077708198e-07, + "loss": 0.0202, + "step": 33573 + }, + { + "epoch": 91.48228882833787, + "grad_norm": 2.37126088142395, + "learning_rate": 3.781081946061582e-07, + "loss": 0.075, + "step": 33574 + }, + { + "epoch": 91.4850136239782, + "grad_norm": 2.227522373199463, + "learning_rate": 3.778678563764804e-07, + "loss": 0.0289, + "step": 33575 + }, + { + "epoch": 91.48773841961852, + "grad_norm": 2.0605151653289795, + "learning_rate": 3.7762759308365814e-07, + "loss": 0.0328, + "step": 33576 + }, + { + "epoch": 91.49046321525886, + "grad_norm": 3.265958786010742, + "learning_rate": 3.7738740472956115e-07, + "loss": 0.0554, + "step": 33577 + }, + { + "epoch": 91.49318801089919, + "grad_norm": 2.8525846004486084, + "learning_rate": 3.771472913160612e-07, + "loss": 0.0791, + "step": 33578 + }, + { + "epoch": 91.49591280653951, + "grad_norm": 2.7092018127441406, + "learning_rate": 3.769072528450302e-07, + "loss": 0.1028, + "step": 33579 + }, + { + "epoch": 91.49863760217984, + "grad_norm": 2.29067325592041, + "learning_rate": 3.766672893183354e-07, + "loss": 0.0203, + "step": 33580 + }, + { + "epoch": 91.50136239782016, + "grad_norm": 1.9763702154159546, + "learning_rate": 3.7642740073784435e-07, + "loss": 0.0196, + "step": 33581 + }, + { + "epoch": 91.50408719346049, + "grad_norm": 4.412403583526611, + "learning_rate": 3.761875871054288e-07, + "loss": 0.046, + "step": 33582 + }, + { + "epoch": 91.50681198910081, + "grad_norm": 2.6487820148468018, + "learning_rate": 3.7594784842295505e-07, + "loss": 0.1694, + "step": 33583 + }, + { + "epoch": 91.50953678474114, + "grad_norm": 4.80283260345459, + "learning_rate": 3.7570818469228834e-07, + "loss": 0.1223, + "step": 33584 + }, + { + "epoch": 91.51226158038148, + "grad_norm": 2.7220542430877686, + "learning_rate": 3.754685959152971e-07, + "loss": 0.1134, + "step": 33585 + }, + { + "epoch": 91.5149863760218, + "grad_norm": 3.8485357761383057, + "learning_rate": 3.7522908209384644e-07, + "loss": 0.2028, + "step": 33586 + }, + { + "epoch": 91.51771117166213, + "grad_norm": 2.6554503440856934, + "learning_rate": 3.749896432298017e-07, + "loss": 0.1133, + "step": 33587 + }, + { + "epoch": 91.52043596730245, + "grad_norm": 2.0981926918029785, + "learning_rate": 3.7475027932502904e-07, + "loss": 0.0922, + "step": 33588 + }, + { + "epoch": 91.52316076294278, + "grad_norm": 3.087574005126953, + "learning_rate": 3.7451099038138926e-07, + "loss": 0.0973, + "step": 33589 + }, + { + "epoch": 91.52588555858311, + "grad_norm": 3.2297282218933105, + "learning_rate": 3.742717764007497e-07, + "loss": 0.0312, + "step": 33590 + }, + { + "epoch": 91.52861035422343, + "grad_norm": 3.242899179458618, + "learning_rate": 3.740326373849723e-07, + "loss": 0.0356, + "step": 33591 + }, + { + "epoch": 91.53133514986376, + "grad_norm": 2.4582908153533936, + "learning_rate": 3.737935733359177e-07, + "loss": 0.0553, + "step": 33592 + }, + { + "epoch": 91.53405994550408, + "grad_norm": 3.2118515968322754, + "learning_rate": 3.735545842554489e-07, + "loss": 0.1782, + "step": 33593 + }, + { + "epoch": 91.53678474114442, + "grad_norm": 2.3374011516571045, + "learning_rate": 3.733156701454277e-07, + "loss": 0.0223, + "step": 33594 + }, + { + "epoch": 91.53950953678473, + "grad_norm": 1.7692631483078003, + "learning_rate": 3.7307683100771377e-07, + "loss": 0.0255, + "step": 33595 + }, + { + "epoch": 91.54223433242507, + "grad_norm": 2.864637851715088, + "learning_rate": 3.7283806684416777e-07, + "loss": 0.0542, + "step": 33596 + }, + { + "epoch": 91.5449591280654, + "grad_norm": 3.0823960304260254, + "learning_rate": 3.7259937765664943e-07, + "loss": 0.0928, + "step": 33597 + }, + { + "epoch": 91.54768392370572, + "grad_norm": 2.6931047439575195, + "learning_rate": 3.7236076344701613e-07, + "loss": 0.0545, + "step": 33598 + }, + { + "epoch": 91.55040871934605, + "grad_norm": 3.286928415298462, + "learning_rate": 3.721222242171285e-07, + "loss": 0.1571, + "step": 33599 + }, + { + "epoch": 91.55313351498637, + "grad_norm": 2.4106199741363525, + "learning_rate": 3.7188375996884295e-07, + "loss": 0.027, + "step": 33600 + }, + { + "epoch": 91.5558583106267, + "grad_norm": 2.004592180252075, + "learning_rate": 3.7164537070401573e-07, + "loss": 0.0409, + "step": 33601 + }, + { + "epoch": 91.55858310626704, + "grad_norm": 2.57600998878479, + "learning_rate": 3.7140705642450647e-07, + "loss": 0.0441, + "step": 33602 + }, + { + "epoch": 91.56130790190736, + "grad_norm": 3.2495641708374023, + "learning_rate": 3.711688171321681e-07, + "loss": 0.0579, + "step": 33603 + }, + { + "epoch": 91.56403269754769, + "grad_norm": 2.7735214233398438, + "learning_rate": 3.709306528288581e-07, + "loss": 0.1541, + "step": 33604 + }, + { + "epoch": 91.566757493188, + "grad_norm": 2.1506876945495605, + "learning_rate": 3.7069256351642823e-07, + "loss": 0.0256, + "step": 33605 + }, + { + "epoch": 91.56948228882834, + "grad_norm": 1.6449873447418213, + "learning_rate": 3.7045454919673597e-07, + "loss": 0.0372, + "step": 33606 + }, + { + "epoch": 91.57220708446866, + "grad_norm": 2.3814804553985596, + "learning_rate": 3.702166098716342e-07, + "loss": 0.0548, + "step": 33607 + }, + { + "epoch": 91.57493188010899, + "grad_norm": 2.2766847610473633, + "learning_rate": 3.6997874554297484e-07, + "loss": 0.0293, + "step": 33608 + }, + { + "epoch": 91.57765667574932, + "grad_norm": 2.326969861984253, + "learning_rate": 3.697409562126109e-07, + "loss": 0.0851, + "step": 33609 + }, + { + "epoch": 91.58038147138964, + "grad_norm": 2.594961166381836, + "learning_rate": 3.6950324188239517e-07, + "loss": 0.0711, + "step": 33610 + }, + { + "epoch": 91.58310626702998, + "grad_norm": 3.5385637283325195, + "learning_rate": 3.6926560255417745e-07, + "loss": 0.0458, + "step": 33611 + }, + { + "epoch": 91.5858310626703, + "grad_norm": 2.9375243186950684, + "learning_rate": 3.690280382298095e-07, + "loss": 0.11, + "step": 33612 + }, + { + "epoch": 91.58855585831063, + "grad_norm": 2.3595938682556152, + "learning_rate": 3.68790548911141e-07, + "loss": 0.1431, + "step": 33613 + }, + { + "epoch": 91.59128065395096, + "grad_norm": 3.097893238067627, + "learning_rate": 3.685531346000215e-07, + "loss": 0.1205, + "step": 33614 + }, + { + "epoch": 91.59400544959128, + "grad_norm": 2.1998302936553955, + "learning_rate": 3.6831579529830076e-07, + "loss": 0.0663, + "step": 33615 + }, + { + "epoch": 91.59673024523161, + "grad_norm": 2.487896203994751, + "learning_rate": 3.680785310078272e-07, + "loss": 0.0908, + "step": 33616 + }, + { + "epoch": 91.59945504087193, + "grad_norm": 2.552617311477661, + "learning_rate": 3.6784134173044716e-07, + "loss": 0.1584, + "step": 33617 + }, + { + "epoch": 91.60217983651226, + "grad_norm": 3.077333688735962, + "learning_rate": 3.6760422746800806e-07, + "loss": 0.0641, + "step": 33618 + }, + { + "epoch": 91.60490463215258, + "grad_norm": 2.582639455795288, + "learning_rate": 3.673671882223595e-07, + "loss": 0.0266, + "step": 33619 + }, + { + "epoch": 91.60762942779292, + "grad_norm": 1.9093434810638428, + "learning_rate": 3.671302239953434e-07, + "loss": 0.0241, + "step": 33620 + }, + { + "epoch": 91.61035422343325, + "grad_norm": 2.607896566390991, + "learning_rate": 3.6689333478880816e-07, + "loss": 0.0547, + "step": 33621 + }, + { + "epoch": 91.61307901907357, + "grad_norm": 2.725715398788452, + "learning_rate": 3.6665652060459576e-07, + "loss": 0.0311, + "step": 33622 + }, + { + "epoch": 91.6158038147139, + "grad_norm": 3.2464728355407715, + "learning_rate": 3.664197814445547e-07, + "loss": 0.0368, + "step": 33623 + }, + { + "epoch": 91.61852861035422, + "grad_norm": 2.1419646739959717, + "learning_rate": 3.661831173105257e-07, + "loss": 0.0655, + "step": 33624 + }, + { + "epoch": 91.62125340599455, + "grad_norm": 2.5510311126708984, + "learning_rate": 3.6594652820435064e-07, + "loss": 0.0382, + "step": 33625 + }, + { + "epoch": 91.62397820163488, + "grad_norm": 3.1216113567352295, + "learning_rate": 3.657100141278758e-07, + "loss": 0.1129, + "step": 33626 + }, + { + "epoch": 91.6267029972752, + "grad_norm": 2.985828399658203, + "learning_rate": 3.654735750829408e-07, + "loss": 0.0323, + "step": 33627 + }, + { + "epoch": 91.62942779291554, + "grad_norm": 2.9723455905914307, + "learning_rate": 3.652372110713887e-07, + "loss": 0.0374, + "step": 33628 + }, + { + "epoch": 91.63215258855585, + "grad_norm": 1.8881319761276245, + "learning_rate": 3.650009220950568e-07, + "loss": 0.0244, + "step": 33629 + }, + { + "epoch": 91.63487738419619, + "grad_norm": 3.5544631481170654, + "learning_rate": 3.647647081557881e-07, + "loss": 0.0679, + "step": 33630 + }, + { + "epoch": 91.6376021798365, + "grad_norm": 2.0359060764312744, + "learning_rate": 3.6452856925542235e-07, + "loss": 0.1462, + "step": 33631 + }, + { + "epoch": 91.64032697547684, + "grad_norm": 5.320764541625977, + "learning_rate": 3.642925053957991e-07, + "loss": 0.0766, + "step": 33632 + }, + { + "epoch": 91.64305177111717, + "grad_norm": 3.1832618713378906, + "learning_rate": 3.6405651657875464e-07, + "loss": 0.1352, + "step": 33633 + }, + { + "epoch": 91.64577656675749, + "grad_norm": 2.471998929977417, + "learning_rate": 3.638206028061264e-07, + "loss": 0.0287, + "step": 33634 + }, + { + "epoch": 91.64850136239782, + "grad_norm": 2.826984405517578, + "learning_rate": 3.635847640797552e-07, + "loss": 0.0576, + "step": 33635 + }, + { + "epoch": 91.65122615803814, + "grad_norm": 2.281329393386841, + "learning_rate": 3.6334900040147615e-07, + "loss": 0.0428, + "step": 33636 + }, + { + "epoch": 91.65395095367847, + "grad_norm": 2.644656181335449, + "learning_rate": 3.6311331177312447e-07, + "loss": 0.0397, + "step": 33637 + }, + { + "epoch": 91.65667574931881, + "grad_norm": 2.2187631130218506, + "learning_rate": 3.628776981965343e-07, + "loss": 0.0267, + "step": 33638 + }, + { + "epoch": 91.65940054495913, + "grad_norm": 3.246809720993042, + "learning_rate": 3.626421596735441e-07, + "loss": 0.1343, + "step": 33639 + }, + { + "epoch": 91.66212534059946, + "grad_norm": 3.6670730113983154, + "learning_rate": 3.624066962059869e-07, + "loss": 0.0282, + "step": 33640 + }, + { + "epoch": 91.66485013623978, + "grad_norm": 2.6588709354400635, + "learning_rate": 3.6217130779569565e-07, + "loss": 0.1344, + "step": 33641 + }, + { + "epoch": 91.66757493188011, + "grad_norm": 2.7214791774749756, + "learning_rate": 3.6193599444450335e-07, + "loss": 0.0726, + "step": 33642 + }, + { + "epoch": 91.67029972752043, + "grad_norm": 2.9262428283691406, + "learning_rate": 3.6170075615424407e-07, + "loss": 0.0926, + "step": 33643 + }, + { + "epoch": 91.67302452316076, + "grad_norm": 2.1330814361572266, + "learning_rate": 3.6146559292674967e-07, + "loss": 0.0458, + "step": 33644 + }, + { + "epoch": 91.6757493188011, + "grad_norm": 5.586047172546387, + "learning_rate": 3.612305047638487e-07, + "loss": 0.0862, + "step": 33645 + }, + { + "epoch": 91.67847411444141, + "grad_norm": 4.77297306060791, + "learning_rate": 3.6099549166737527e-07, + "loss": 0.0338, + "step": 33646 + }, + { + "epoch": 91.68119891008175, + "grad_norm": 2.5954415798187256, + "learning_rate": 3.6076055363916005e-07, + "loss": 0.0248, + "step": 33647 + }, + { + "epoch": 91.68392370572207, + "grad_norm": 1.8317947387695312, + "learning_rate": 3.605256906810306e-07, + "loss": 0.053, + "step": 33648 + }, + { + "epoch": 91.6866485013624, + "grad_norm": 2.3642208576202393, + "learning_rate": 3.602909027948176e-07, + "loss": 0.0615, + "step": 33649 + }, + { + "epoch": 91.68937329700273, + "grad_norm": 1.713407278060913, + "learning_rate": 3.6005618998234736e-07, + "loss": 0.02, + "step": 33650 + }, + { + "epoch": 91.69209809264305, + "grad_norm": 2.612757682800293, + "learning_rate": 3.598215522454507e-07, + "loss": 0.0179, + "step": 33651 + }, + { + "epoch": 91.69482288828338, + "grad_norm": 2.575063467025757, + "learning_rate": 3.595869895859527e-07, + "loss": 0.0919, + "step": 33652 + }, + { + "epoch": 91.6975476839237, + "grad_norm": 3.129669189453125, + "learning_rate": 3.593525020056821e-07, + "loss": 0.0883, + "step": 33653 + }, + { + "epoch": 91.70027247956403, + "grad_norm": 2.1432507038116455, + "learning_rate": 3.5911808950646165e-07, + "loss": 0.0318, + "step": 33654 + }, + { + "epoch": 91.70299727520435, + "grad_norm": 2.2757797241210938, + "learning_rate": 3.588837520901212e-07, + "loss": 0.0857, + "step": 33655 + }, + { + "epoch": 91.70572207084469, + "grad_norm": 1.5385581254959106, + "learning_rate": 3.586494897584836e-07, + "loss": 0.0671, + "step": 33656 + }, + { + "epoch": 91.70844686648502, + "grad_norm": 2.107974052429199, + "learning_rate": 3.5841530251337297e-07, + "loss": 0.034, + "step": 33657 + }, + { + "epoch": 91.71117166212534, + "grad_norm": 1.6791565418243408, + "learning_rate": 3.581811903566135e-07, + "loss": 0.0604, + "step": 33658 + }, + { + "epoch": 91.71389645776567, + "grad_norm": 2.79116153717041, + "learning_rate": 3.5794715329002805e-07, + "loss": 0.0358, + "step": 33659 + }, + { + "epoch": 91.71662125340599, + "grad_norm": 1.8962323665618896, + "learning_rate": 3.577131913154419e-07, + "loss": 0.0316, + "step": 33660 + }, + { + "epoch": 91.71934604904632, + "grad_norm": 3.239900827407837, + "learning_rate": 3.574793044346736e-07, + "loss": 0.0465, + "step": 33661 + }, + { + "epoch": 91.72207084468666, + "grad_norm": 2.495074510574341, + "learning_rate": 3.57245492649545e-07, + "loss": 0.0499, + "step": 33662 + }, + { + "epoch": 91.72479564032697, + "grad_norm": 1.73086416721344, + "learning_rate": 3.570117559618802e-07, + "loss": 0.0188, + "step": 33663 + }, + { + "epoch": 91.7275204359673, + "grad_norm": 2.6486928462982178, + "learning_rate": 3.5677809437349554e-07, + "loss": 0.0922, + "step": 33664 + }, + { + "epoch": 91.73024523160763, + "grad_norm": 4.095842361450195, + "learning_rate": 3.565445078862151e-07, + "loss": 0.0817, + "step": 33665 + }, + { + "epoch": 91.73297002724796, + "grad_norm": 2.5894007682800293, + "learning_rate": 3.5631099650185294e-07, + "loss": 0.1523, + "step": 33666 + }, + { + "epoch": 91.73569482288828, + "grad_norm": 3.8926684856414795, + "learning_rate": 3.5607756022223216e-07, + "loss": 0.0471, + "step": 33667 + }, + { + "epoch": 91.73841961852861, + "grad_norm": 1.8081189393997192, + "learning_rate": 3.55844199049169e-07, + "loss": 0.0228, + "step": 33668 + }, + { + "epoch": 91.74114441416894, + "grad_norm": 2.48095703125, + "learning_rate": 3.556109129844809e-07, + "loss": 0.0646, + "step": 33669 + }, + { + "epoch": 91.74386920980926, + "grad_norm": 1.7749342918395996, + "learning_rate": 3.5537770202998314e-07, + "loss": 0.0618, + "step": 33670 + }, + { + "epoch": 91.7465940054496, + "grad_norm": 2.6271684169769287, + "learning_rate": 3.551445661874953e-07, + "loss": 0.0256, + "step": 33671 + }, + { + "epoch": 91.74931880108991, + "grad_norm": 2.2914161682128906, + "learning_rate": 3.5491150545883034e-07, + "loss": 0.0509, + "step": 33672 + }, + { + "epoch": 91.75204359673025, + "grad_norm": 2.0748889446258545, + "learning_rate": 3.546785198458047e-07, + "loss": 0.0317, + "step": 33673 + }, + { + "epoch": 91.75476839237058, + "grad_norm": 3.947211742401123, + "learning_rate": 3.544456093502313e-07, + "loss": 0.0782, + "step": 33674 + }, + { + "epoch": 91.7574931880109, + "grad_norm": 3.420990228652954, + "learning_rate": 3.542127739739254e-07, + "loss": 0.1598, + "step": 33675 + }, + { + "epoch": 91.76021798365123, + "grad_norm": 2.767961263656616, + "learning_rate": 3.5398001371870104e-07, + "loss": 0.1616, + "step": 33676 + }, + { + "epoch": 91.76294277929155, + "grad_norm": 2.000896692276001, + "learning_rate": 3.537473285863691e-07, + "loss": 0.0293, + "step": 33677 + }, + { + "epoch": 91.76566757493188, + "grad_norm": 2.8828723430633545, + "learning_rate": 3.535147185787413e-07, + "loss": 0.0387, + "step": 33678 + }, + { + "epoch": 91.7683923705722, + "grad_norm": 2.0531177520751953, + "learning_rate": 3.532821836976319e-07, + "loss": 0.0248, + "step": 33679 + }, + { + "epoch": 91.77111716621253, + "grad_norm": 2.825890064239502, + "learning_rate": 3.530497239448505e-07, + "loss": 0.0398, + "step": 33680 + }, + { + "epoch": 91.77384196185287, + "grad_norm": 3.0841400623321533, + "learning_rate": 3.5281733932220566e-07, + "loss": 0.079, + "step": 33681 + }, + { + "epoch": 91.77656675749319, + "grad_norm": 2.8627307415008545, + "learning_rate": 3.525850298315103e-07, + "loss": 0.0676, + "step": 33682 + }, + { + "epoch": 91.77929155313352, + "grad_norm": 2.518963575363159, + "learning_rate": 3.523527954745709e-07, + "loss": 0.0749, + "step": 33683 + }, + { + "epoch": 91.78201634877384, + "grad_norm": 3.7561941146850586, + "learning_rate": 3.5212063625319925e-07, + "loss": 0.102, + "step": 33684 + }, + { + "epoch": 91.78474114441417, + "grad_norm": 1.9617749452590942, + "learning_rate": 3.518885521692006e-07, + "loss": 0.0882, + "step": 33685 + }, + { + "epoch": 91.7874659400545, + "grad_norm": 2.847410202026367, + "learning_rate": 3.516565432243824e-07, + "loss": 0.0457, + "step": 33686 + }, + { + "epoch": 91.79019073569482, + "grad_norm": 2.5235135555267334, + "learning_rate": 3.5142460942055424e-07, + "loss": 0.0293, + "step": 33687 + }, + { + "epoch": 91.79291553133515, + "grad_norm": 1.7744661569595337, + "learning_rate": 3.511927507595203e-07, + "loss": 0.0175, + "step": 33688 + }, + { + "epoch": 91.79564032697547, + "grad_norm": 3.418145179748535, + "learning_rate": 3.5096096724308694e-07, + "loss": 0.1074, + "step": 33689 + }, + { + "epoch": 91.7983651226158, + "grad_norm": 3.91782283782959, + "learning_rate": 3.507292588730582e-07, + "loss": 0.0572, + "step": 33690 + }, + { + "epoch": 91.80108991825612, + "grad_norm": 2.7733798027038574, + "learning_rate": 3.5049762565123936e-07, + "loss": 0.0856, + "step": 33691 + }, + { + "epoch": 91.80381471389646, + "grad_norm": 2.2111968994140625, + "learning_rate": 3.502660675794356e-07, + "loss": 0.0317, + "step": 33692 + }, + { + "epoch": 91.80653950953679, + "grad_norm": 2.8142967224121094, + "learning_rate": 3.5003458465944884e-07, + "loss": 0.0327, + "step": 33693 + }, + { + "epoch": 91.80926430517711, + "grad_norm": 3.807567596435547, + "learning_rate": 3.4980317689308094e-07, + "loss": 0.0731, + "step": 33694 + }, + { + "epoch": 91.81198910081744, + "grad_norm": 2.0858969688415527, + "learning_rate": 3.495718442821361e-07, + "loss": 0.0324, + "step": 33695 + }, + { + "epoch": 91.81471389645776, + "grad_norm": 3.3685550689697266, + "learning_rate": 3.493405868284161e-07, + "loss": 0.0615, + "step": 33696 + }, + { + "epoch": 91.8174386920981, + "grad_norm": 2.0874626636505127, + "learning_rate": 3.491094045337196e-07, + "loss": 0.0597, + "step": 33697 + }, + { + "epoch": 91.82016348773843, + "grad_norm": 2.850393295288086, + "learning_rate": 3.4887829739984836e-07, + "loss": 0.0755, + "step": 33698 + }, + { + "epoch": 91.82288828337875, + "grad_norm": 2.832606792449951, + "learning_rate": 3.486472654286022e-07, + "loss": 0.0285, + "step": 33699 + }, + { + "epoch": 91.82561307901908, + "grad_norm": 2.2394144535064697, + "learning_rate": 3.484163086217818e-07, + "loss": 0.0505, + "step": 33700 + }, + { + "epoch": 91.8283378746594, + "grad_norm": 2.5283920764923096, + "learning_rate": 3.481854269811835e-07, + "loss": 0.0438, + "step": 33701 + }, + { + "epoch": 91.83106267029973, + "grad_norm": 2.624202251434326, + "learning_rate": 3.4795462050860704e-07, + "loss": 0.0469, + "step": 33702 + }, + { + "epoch": 91.83378746594005, + "grad_norm": 2.273449182510376, + "learning_rate": 3.4772388920584877e-07, + "loss": 0.0507, + "step": 33703 + }, + { + "epoch": 91.83651226158038, + "grad_norm": 2.364443063735962, + "learning_rate": 3.4749323307470717e-07, + "loss": 0.0252, + "step": 33704 + }, + { + "epoch": 91.83923705722071, + "grad_norm": 1.9928584098815918, + "learning_rate": 3.472626521169775e-07, + "loss": 0.027, + "step": 33705 + }, + { + "epoch": 91.84196185286103, + "grad_norm": 1.871195912361145, + "learning_rate": 3.4703214633445504e-07, + "loss": 0.0257, + "step": 33706 + }, + { + "epoch": 91.84468664850137, + "grad_norm": 3.812786102294922, + "learning_rate": 3.4680171572893494e-07, + "loss": 0.0723, + "step": 33707 + }, + { + "epoch": 91.84741144414168, + "grad_norm": 1.8385227918624878, + "learning_rate": 3.465713603022136e-07, + "loss": 0.0223, + "step": 33708 + }, + { + "epoch": 91.85013623978202, + "grad_norm": 2.821190357208252, + "learning_rate": 3.463410800560829e-07, + "loss": 0.0453, + "step": 33709 + }, + { + "epoch": 91.85286103542235, + "grad_norm": 1.599543809890747, + "learning_rate": 3.4611087499233696e-07, + "loss": 0.0168, + "step": 33710 + }, + { + "epoch": 91.85558583106267, + "grad_norm": 3.0530357360839844, + "learning_rate": 3.458807451127699e-07, + "loss": 0.1428, + "step": 33711 + }, + { + "epoch": 91.858310626703, + "grad_norm": 2.7457163333892822, + "learning_rate": 3.4565069041917256e-07, + "loss": 0.0344, + "step": 33712 + }, + { + "epoch": 91.86103542234332, + "grad_norm": 3.1225500106811523, + "learning_rate": 3.4542071091333674e-07, + "loss": 0.0873, + "step": 33713 + }, + { + "epoch": 91.86376021798365, + "grad_norm": 2.1477506160736084, + "learning_rate": 3.451908065970533e-07, + "loss": 0.0194, + "step": 33714 + }, + { + "epoch": 91.86648501362397, + "grad_norm": 2.862032175064087, + "learning_rate": 3.44960977472113e-07, + "loss": 0.0379, + "step": 33715 + }, + { + "epoch": 91.8692098092643, + "grad_norm": 2.6753666400909424, + "learning_rate": 3.4473122354030663e-07, + "loss": 0.0976, + "step": 33716 + }, + { + "epoch": 91.87193460490464, + "grad_norm": 2.248840093612671, + "learning_rate": 3.445015448034228e-07, + "loss": 0.0481, + "step": 33717 + }, + { + "epoch": 91.87465940054496, + "grad_norm": 3.4635705947875977, + "learning_rate": 3.4427194126325006e-07, + "loss": 0.0485, + "step": 33718 + }, + { + "epoch": 91.87738419618529, + "grad_norm": 3.2419512271881104, + "learning_rate": 3.4404241292157583e-07, + "loss": 0.0752, + "step": 33719 + }, + { + "epoch": 91.88010899182561, + "grad_norm": 2.5881309509277344, + "learning_rate": 3.438129597801898e-07, + "loss": 0.0365, + "step": 33720 + }, + { + "epoch": 91.88283378746594, + "grad_norm": 1.7208349704742432, + "learning_rate": 3.4358358184087727e-07, + "loss": 0.0199, + "step": 33721 + }, + { + "epoch": 91.88555858310627, + "grad_norm": 2.5771822929382324, + "learning_rate": 3.433542791054245e-07, + "loss": 0.0535, + "step": 33722 + }, + { + "epoch": 91.88828337874659, + "grad_norm": 3.0956103801727295, + "learning_rate": 3.4312505157561794e-07, + "loss": 0.0918, + "step": 33723 + }, + { + "epoch": 91.89100817438693, + "grad_norm": 4.567342758178711, + "learning_rate": 3.428958992532427e-07, + "loss": 0.0456, + "step": 33724 + }, + { + "epoch": 91.89373297002724, + "grad_norm": 2.660275936126709, + "learning_rate": 3.4266682214008416e-07, + "loss": 0.0622, + "step": 33725 + }, + { + "epoch": 91.89645776566758, + "grad_norm": 2.371448278427124, + "learning_rate": 3.424378202379253e-07, + "loss": 0.1388, + "step": 33726 + }, + { + "epoch": 91.8991825613079, + "grad_norm": 2.8419129848480225, + "learning_rate": 3.422088935485479e-07, + "loss": 0.0684, + "step": 33727 + }, + { + "epoch": 91.90190735694823, + "grad_norm": 2.1045830249786377, + "learning_rate": 3.419800420737396e-07, + "loss": 0.0243, + "step": 33728 + }, + { + "epoch": 91.90463215258856, + "grad_norm": 2.5817203521728516, + "learning_rate": 3.4175126581527883e-07, + "loss": 0.0577, + "step": 33729 + }, + { + "epoch": 91.90735694822888, + "grad_norm": 3.000640869140625, + "learning_rate": 3.4152256477494874e-07, + "loss": 0.0625, + "step": 33730 + }, + { + "epoch": 91.91008174386921, + "grad_norm": 2.578950881958008, + "learning_rate": 3.412939389545289e-07, + "loss": 0.0262, + "step": 33731 + }, + { + "epoch": 91.91280653950953, + "grad_norm": 3.0867624282836914, + "learning_rate": 3.410653883558002e-07, + "loss": 0.0719, + "step": 33732 + }, + { + "epoch": 91.91553133514986, + "grad_norm": 3.0393404960632324, + "learning_rate": 3.4083691298054556e-07, + "loss": 0.0374, + "step": 33733 + }, + { + "epoch": 91.9182561307902, + "grad_norm": 1.9768339395523071, + "learning_rate": 3.406085128305414e-07, + "loss": 0.1099, + "step": 33734 + }, + { + "epoch": 91.92098092643052, + "grad_norm": 1.7287859916687012, + "learning_rate": 3.4038018790756634e-07, + "loss": 0.0207, + "step": 33735 + }, + { + "epoch": 91.92370572207085, + "grad_norm": 2.799020290374756, + "learning_rate": 3.401519382134011e-07, + "loss": 0.026, + "step": 33736 + }, + { + "epoch": 91.92643051771117, + "grad_norm": 2.3542044162750244, + "learning_rate": 3.3992376374982097e-07, + "loss": 0.0261, + "step": 33737 + }, + { + "epoch": 91.9291553133515, + "grad_norm": 2.599226236343384, + "learning_rate": 3.396956645186045e-07, + "loss": 0.1167, + "step": 33738 + }, + { + "epoch": 91.93188010899182, + "grad_norm": 3.9881465435028076, + "learning_rate": 3.3946764052152583e-07, + "loss": 0.0425, + "step": 33739 + }, + { + "epoch": 91.93460490463215, + "grad_norm": 2.5314364433288574, + "learning_rate": 3.392396917603624e-07, + "loss": 0.096, + "step": 33740 + }, + { + "epoch": 91.93732970027249, + "grad_norm": 3.1245369911193848, + "learning_rate": 3.3901181823689065e-07, + "loss": 0.1295, + "step": 33741 + }, + { + "epoch": 91.9400544959128, + "grad_norm": 2.1980035305023193, + "learning_rate": 3.3878401995288357e-07, + "loss": 0.0631, + "step": 33742 + }, + { + "epoch": 91.94277929155314, + "grad_norm": 4.632396221160889, + "learning_rate": 3.385562969101142e-07, + "loss": 0.0321, + "step": 33743 + }, + { + "epoch": 91.94550408719346, + "grad_norm": 2.9690186977386475, + "learning_rate": 3.3832864911035877e-07, + "loss": 0.0629, + "step": 33744 + }, + { + "epoch": 91.94822888283379, + "grad_norm": 4.375700950622559, + "learning_rate": 3.3810107655538826e-07, + "loss": 0.0235, + "step": 33745 + }, + { + "epoch": 91.95095367847412, + "grad_norm": 2.0469024181365967, + "learning_rate": 3.378735792469756e-07, + "loss": 0.1086, + "step": 33746 + }, + { + "epoch": 91.95367847411444, + "grad_norm": 2.8312370777130127, + "learning_rate": 3.3764615718689273e-07, + "loss": 0.039, + "step": 33747 + }, + { + "epoch": 91.95640326975477, + "grad_norm": 2.2449893951416016, + "learning_rate": 3.374188103769105e-07, + "loss": 0.0656, + "step": 33748 + }, + { + "epoch": 91.95912806539509, + "grad_norm": 1.5328950881958008, + "learning_rate": 3.3719153881879963e-07, + "loss": 0.0206, + "step": 33749 + }, + { + "epoch": 91.96185286103542, + "grad_norm": 2.7683541774749756, + "learning_rate": 3.3696434251432984e-07, + "loss": 0.0481, + "step": 33750 + }, + { + "epoch": 91.96457765667574, + "grad_norm": 2.1966023445129395, + "learning_rate": 3.3673722146526976e-07, + "loss": 0.0204, + "step": 33751 + }, + { + "epoch": 91.96730245231608, + "grad_norm": 2.9148166179656982, + "learning_rate": 3.365101756733913e-07, + "loss": 0.138, + "step": 33752 + }, + { + "epoch": 91.97002724795641, + "grad_norm": 1.3568527698516846, + "learning_rate": 3.3628320514045963e-07, + "loss": 0.0172, + "step": 33753 + }, + { + "epoch": 91.97275204359673, + "grad_norm": 2.014632225036621, + "learning_rate": 3.3605630986824346e-07, + "loss": 0.0262, + "step": 33754 + }, + { + "epoch": 91.97547683923706, + "grad_norm": 2.359649181365967, + "learning_rate": 3.3582948985850904e-07, + "loss": 0.0657, + "step": 33755 + }, + { + "epoch": 91.97820163487738, + "grad_norm": 2.4967103004455566, + "learning_rate": 3.35602745113025e-07, + "loss": 0.0798, + "step": 33756 + }, + { + "epoch": 91.98092643051771, + "grad_norm": 3.5767691135406494, + "learning_rate": 3.3537607563355447e-07, + "loss": 0.1311, + "step": 33757 + }, + { + "epoch": 91.98365122615803, + "grad_norm": 2.6671438217163086, + "learning_rate": 3.3514948142186476e-07, + "loss": 0.0781, + "step": 33758 + }, + { + "epoch": 91.98637602179836, + "grad_norm": 2.795790195465088, + "learning_rate": 3.34922962479719e-07, + "loss": 0.0394, + "step": 33759 + }, + { + "epoch": 91.9891008174387, + "grad_norm": 2.46382737159729, + "learning_rate": 3.3469651880888245e-07, + "loss": 0.0613, + "step": 33760 + }, + { + "epoch": 91.99182561307902, + "grad_norm": 2.0662951469421387, + "learning_rate": 3.344701504111192e-07, + "loss": 0.0232, + "step": 33761 + }, + { + "epoch": 91.99455040871935, + "grad_norm": 3.3746325969696045, + "learning_rate": 3.342438572881912e-07, + "loss": 0.0299, + "step": 33762 + }, + { + "epoch": 91.99727520435967, + "grad_norm": 2.9933717250823975, + "learning_rate": 3.3401763944185927e-07, + "loss": 0.0388, + "step": 33763 + }, + { + "epoch": 92.0, + "grad_norm": 2.1233444213867188, + "learning_rate": 3.3379149687388866e-07, + "loss": 0.0288, + "step": 33764 + }, + { + "epoch": 92.00272479564033, + "grad_norm": 1.8295189142227173, + "learning_rate": 3.33565429586038e-07, + "loss": 0.0429, + "step": 33765 + }, + { + "epoch": 92.00544959128065, + "grad_norm": 2.276864528656006, + "learning_rate": 3.3333943758006914e-07, + "loss": 0.024, + "step": 33766 + }, + { + "epoch": 92.00817438692098, + "grad_norm": 1.9273000955581665, + "learning_rate": 3.331135208577407e-07, + "loss": 0.023, + "step": 33767 + }, + { + "epoch": 92.0108991825613, + "grad_norm": 3.3115742206573486, + "learning_rate": 3.3288767942081244e-07, + "loss": 0.047, + "step": 33768 + }, + { + "epoch": 92.01362397820164, + "grad_norm": 2.849778652191162, + "learning_rate": 3.326619132710451e-07, + "loss": 0.1022, + "step": 33769 + }, + { + "epoch": 92.01634877384195, + "grad_norm": 6.2739152908325195, + "learning_rate": 3.3243622241019623e-07, + "loss": 0.0394, + "step": 33770 + }, + { + "epoch": 92.01907356948229, + "grad_norm": 2.2515010833740234, + "learning_rate": 3.3221060684002217e-07, + "loss": 0.0365, + "step": 33771 + }, + { + "epoch": 92.02179836512262, + "grad_norm": 2.3634426593780518, + "learning_rate": 3.3198506656228037e-07, + "loss": 0.0382, + "step": 33772 + }, + { + "epoch": 92.02452316076294, + "grad_norm": 2.7536566257476807, + "learning_rate": 3.317596015787283e-07, + "loss": 0.1642, + "step": 33773 + }, + { + "epoch": 92.02724795640327, + "grad_norm": 2.3946402072906494, + "learning_rate": 3.3153421189112136e-07, + "loss": 0.0194, + "step": 33774 + }, + { + "epoch": 92.02997275204359, + "grad_norm": 4.876133441925049, + "learning_rate": 3.313088975012135e-07, + "loss": 0.081, + "step": 33775 + }, + { + "epoch": 92.03269754768392, + "grad_norm": 2.2528655529022217, + "learning_rate": 3.310836584107624e-07, + "loss": 0.0558, + "step": 33776 + }, + { + "epoch": 92.03542234332426, + "grad_norm": 4.052096843719482, + "learning_rate": 3.308584946215199e-07, + "loss": 0.1273, + "step": 33777 + }, + { + "epoch": 92.03814713896458, + "grad_norm": 2.179211139678955, + "learning_rate": 3.306334061352401e-07, + "loss": 0.0219, + "step": 33778 + }, + { + "epoch": 92.04087193460491, + "grad_norm": 3.1627750396728516, + "learning_rate": 3.304083929536761e-07, + "loss": 0.0674, + "step": 33779 + }, + { + "epoch": 92.04359673024523, + "grad_norm": 1.9695805311203003, + "learning_rate": 3.3018345507858094e-07, + "loss": 0.0354, + "step": 33780 + }, + { + "epoch": 92.04632152588556, + "grad_norm": 2.447617530822754, + "learning_rate": 3.2995859251170547e-07, + "loss": 0.0315, + "step": 33781 + }, + { + "epoch": 92.04904632152588, + "grad_norm": 2.6950347423553467, + "learning_rate": 3.297338052548016e-07, + "loss": 0.0234, + "step": 33782 + }, + { + "epoch": 92.05177111716621, + "grad_norm": 2.954461097717285, + "learning_rate": 3.295090933096179e-07, + "loss": 0.03, + "step": 33783 + }, + { + "epoch": 92.05449591280654, + "grad_norm": 2.3865628242492676, + "learning_rate": 3.292844566779063e-07, + "loss": 0.0267, + "step": 33784 + }, + { + "epoch": 92.05722070844686, + "grad_norm": 2.331212043762207, + "learning_rate": 3.290598953614177e-07, + "loss": 0.0233, + "step": 33785 + }, + { + "epoch": 92.0599455040872, + "grad_norm": 3.273543357849121, + "learning_rate": 3.288354093618995e-07, + "loss": 0.0275, + "step": 33786 + }, + { + "epoch": 92.06267029972751, + "grad_norm": 2.712019443511963, + "learning_rate": 3.2861099868109924e-07, + "loss": 0.0686, + "step": 33787 + }, + { + "epoch": 92.06539509536785, + "grad_norm": 3.1281256675720215, + "learning_rate": 3.283866633207644e-07, + "loss": 0.0644, + "step": 33788 + }, + { + "epoch": 92.06811989100818, + "grad_norm": 2.5526158809661865, + "learning_rate": 3.281624032826447e-07, + "loss": 0.1136, + "step": 33789 + }, + { + "epoch": 92.0708446866485, + "grad_norm": 7.320584297180176, + "learning_rate": 3.279382185684843e-07, + "loss": 0.1053, + "step": 33790 + }, + { + "epoch": 92.07356948228883, + "grad_norm": 2.609349489212036, + "learning_rate": 3.2771410918002954e-07, + "loss": 0.1718, + "step": 33791 + }, + { + "epoch": 92.07629427792915, + "grad_norm": 3.035057544708252, + "learning_rate": 3.2749007511902463e-07, + "loss": 0.1156, + "step": 33792 + }, + { + "epoch": 92.07901907356948, + "grad_norm": 2.4524147510528564, + "learning_rate": 3.272661163872182e-07, + "loss": 0.0752, + "step": 33793 + }, + { + "epoch": 92.0817438692098, + "grad_norm": 2.105128526687622, + "learning_rate": 3.2704223298635096e-07, + "loss": 0.0281, + "step": 33794 + }, + { + "epoch": 92.08446866485014, + "grad_norm": 1.708139419555664, + "learning_rate": 3.2681842491816716e-07, + "loss": 0.0242, + "step": 33795 + }, + { + "epoch": 92.08719346049047, + "grad_norm": 2.3079190254211426, + "learning_rate": 3.2659469218440986e-07, + "loss": 0.0351, + "step": 33796 + }, + { + "epoch": 92.08991825613079, + "grad_norm": 3.039968967437744, + "learning_rate": 3.263710347868221e-07, + "loss": 0.0407, + "step": 33797 + }, + { + "epoch": 92.09264305177112, + "grad_norm": 1.8194310665130615, + "learning_rate": 3.2614745272714577e-07, + "loss": 0.2152, + "step": 33798 + }, + { + "epoch": 92.09536784741144, + "grad_norm": 2.3963255882263184, + "learning_rate": 3.2592394600712065e-07, + "loss": 0.0882, + "step": 33799 + }, + { + "epoch": 92.09809264305177, + "grad_norm": 2.6452293395996094, + "learning_rate": 3.2570051462848973e-07, + "loss": 0.1105, + "step": 33800 + }, + { + "epoch": 92.1008174386921, + "grad_norm": 4.206119060516357, + "learning_rate": 3.2547715859299055e-07, + "loss": 0.0643, + "step": 33801 + }, + { + "epoch": 92.10354223433242, + "grad_norm": 3.5175535678863525, + "learning_rate": 3.2525387790236507e-07, + "loss": 0.14, + "step": 33802 + }, + { + "epoch": 92.10626702997276, + "grad_norm": 2.516937255859375, + "learning_rate": 3.250306725583507e-07, + "loss": 0.0917, + "step": 33803 + }, + { + "epoch": 92.10899182561307, + "grad_norm": 2.569063186645508, + "learning_rate": 3.248075425626851e-07, + "loss": 0.0828, + "step": 33804 + }, + { + "epoch": 92.11171662125341, + "grad_norm": 4.731888771057129, + "learning_rate": 3.2458448791710786e-07, + "loss": 0.0611, + "step": 33805 + }, + { + "epoch": 92.11444141689373, + "grad_norm": 3.3217012882232666, + "learning_rate": 3.2436150862335536e-07, + "loss": 0.1254, + "step": 33806 + }, + { + "epoch": 92.11716621253406, + "grad_norm": 1.359853982925415, + "learning_rate": 3.2413860468316517e-07, + "loss": 0.0155, + "step": 33807 + }, + { + "epoch": 92.11989100817439, + "grad_norm": 3.0055317878723145, + "learning_rate": 3.239157760982692e-07, + "loss": 0.0317, + "step": 33808 + }, + { + "epoch": 92.12261580381471, + "grad_norm": 2.7368526458740234, + "learning_rate": 3.2369302287040826e-07, + "loss": 0.0179, + "step": 33809 + }, + { + "epoch": 92.12534059945504, + "grad_norm": 2.9150002002716064, + "learning_rate": 3.234703450013132e-07, + "loss": 0.0273, + "step": 33810 + }, + { + "epoch": 92.12806539509536, + "grad_norm": 3.0399937629699707, + "learning_rate": 3.232477424927205e-07, + "loss": 0.03, + "step": 33811 + }, + { + "epoch": 92.1307901907357, + "grad_norm": 2.771402597427368, + "learning_rate": 3.23025215346362e-07, + "loss": 0.0927, + "step": 33812 + }, + { + "epoch": 92.13351498637603, + "grad_norm": 3.0156381130218506, + "learning_rate": 3.22802763563973e-07, + "loss": 0.0229, + "step": 33813 + }, + { + "epoch": 92.13623978201635, + "grad_norm": 4.398390769958496, + "learning_rate": 3.2258038714728436e-07, + "loss": 0.0324, + "step": 33814 + }, + { + "epoch": 92.13896457765668, + "grad_norm": 2.441612958908081, + "learning_rate": 3.22358086098028e-07, + "loss": 0.077, + "step": 33815 + }, + { + "epoch": 92.141689373297, + "grad_norm": 3.5289855003356934, + "learning_rate": 3.2213586041793364e-07, + "loss": 0.0612, + "step": 33816 + }, + { + "epoch": 92.14441416893733, + "grad_norm": 4.272944927215576, + "learning_rate": 3.219137101087355e-07, + "loss": 0.1212, + "step": 33817 + }, + { + "epoch": 92.14713896457765, + "grad_norm": 2.395763874053955, + "learning_rate": 3.2169163517216217e-07, + "loss": 0.0767, + "step": 33818 + }, + { + "epoch": 92.14986376021798, + "grad_norm": 2.5885632038116455, + "learning_rate": 3.2146963560994226e-07, + "loss": 0.0385, + "step": 33819 + }, + { + "epoch": 92.15258855585832, + "grad_norm": 2.7076330184936523, + "learning_rate": 3.212477114238044e-07, + "loss": 0.0864, + "step": 33820 + }, + { + "epoch": 92.15531335149863, + "grad_norm": 1.8669532537460327, + "learning_rate": 3.210258626154794e-07, + "loss": 0.0355, + "step": 33821 + }, + { + "epoch": 92.15803814713897, + "grad_norm": 2.4068408012390137, + "learning_rate": 3.208040891866926e-07, + "loss": 0.085, + "step": 33822 + }, + { + "epoch": 92.16076294277929, + "grad_norm": 1.6939899921417236, + "learning_rate": 3.2058239113917256e-07, + "loss": 0.0219, + "step": 33823 + }, + { + "epoch": 92.16348773841962, + "grad_norm": 2.367842435836792, + "learning_rate": 3.2036076847464457e-07, + "loss": 0.0448, + "step": 33824 + }, + { + "epoch": 92.16621253405995, + "grad_norm": 2.184643030166626, + "learning_rate": 3.201392211948362e-07, + "loss": 0.1056, + "step": 33825 + }, + { + "epoch": 92.16893732970027, + "grad_norm": 1.9597187042236328, + "learning_rate": 3.199177493014716e-07, + "loss": 0.019, + "step": 33826 + }, + { + "epoch": 92.1716621253406, + "grad_norm": 2.8972485065460205, + "learning_rate": 3.196963527962771e-07, + "loss": 0.0623, + "step": 33827 + }, + { + "epoch": 92.17438692098092, + "grad_norm": 1.8783094882965088, + "learning_rate": 3.194750316809736e-07, + "loss": 0.0487, + "step": 33828 + }, + { + "epoch": 92.17711171662125, + "grad_norm": 2.029810905456543, + "learning_rate": 3.192537859572886e-07, + "loss": 0.0499, + "step": 33829 + }, + { + "epoch": 92.17983651226157, + "grad_norm": 1.5199320316314697, + "learning_rate": 3.190326156269441e-07, + "loss": 0.0205, + "step": 33830 + }, + { + "epoch": 92.1825613079019, + "grad_norm": 2.1136865615844727, + "learning_rate": 3.188115206916609e-07, + "loss": 0.0296, + "step": 33831 + }, + { + "epoch": 92.18528610354224, + "grad_norm": 4.115062713623047, + "learning_rate": 3.1859050115316205e-07, + "loss": 0.1639, + "step": 33832 + }, + { + "epoch": 92.18801089918256, + "grad_norm": 2.2568817138671875, + "learning_rate": 3.183695570131695e-07, + "loss": 0.028, + "step": 33833 + }, + { + "epoch": 92.19073569482289, + "grad_norm": 2.664994239807129, + "learning_rate": 3.1814868827340194e-07, + "loss": 0.0336, + "step": 33834 + }, + { + "epoch": 92.19346049046321, + "grad_norm": 2.2303590774536133, + "learning_rate": 3.179278949355824e-07, + "loss": 0.0771, + "step": 33835 + }, + { + "epoch": 92.19618528610354, + "grad_norm": 2.1022610664367676, + "learning_rate": 3.177071770014273e-07, + "loss": 0.0669, + "step": 33836 + }, + { + "epoch": 92.19891008174388, + "grad_norm": 2.6430466175079346, + "learning_rate": 3.1748653447265634e-07, + "loss": 0.1713, + "step": 33837 + }, + { + "epoch": 92.2016348773842, + "grad_norm": 2.0570852756500244, + "learning_rate": 3.1726596735099035e-07, + "loss": 0.0271, + "step": 33838 + }, + { + "epoch": 92.20435967302453, + "grad_norm": 3.03989315032959, + "learning_rate": 3.1704547563814583e-07, + "loss": 0.0814, + "step": 33839 + }, + { + "epoch": 92.20708446866485, + "grad_norm": 2.5764822959899902, + "learning_rate": 3.1682505933583796e-07, + "loss": 0.0468, + "step": 33840 + }, + { + "epoch": 92.20980926430518, + "grad_norm": 1.3078769445419312, + "learning_rate": 3.166047184457854e-07, + "loss": 0.014, + "step": 33841 + }, + { + "epoch": 92.2125340599455, + "grad_norm": 2.423530340194702, + "learning_rate": 3.1638445296970463e-07, + "loss": 0.0674, + "step": 33842 + }, + { + "epoch": 92.21525885558583, + "grad_norm": 2.24601149559021, + "learning_rate": 3.1616426290930977e-07, + "loss": 0.0497, + "step": 33843 + }, + { + "epoch": 92.21798365122616, + "grad_norm": 2.4931259155273438, + "learning_rate": 3.159441482663139e-07, + "loss": 0.0338, + "step": 33844 + }, + { + "epoch": 92.22070844686648, + "grad_norm": 2.9073128700256348, + "learning_rate": 3.1572410904243566e-07, + "loss": 0.025, + "step": 33845 + }, + { + "epoch": 92.22343324250681, + "grad_norm": 2.2473936080932617, + "learning_rate": 3.155041452393859e-07, + "loss": 0.0278, + "step": 33846 + }, + { + "epoch": 92.22615803814713, + "grad_norm": 2.516573429107666, + "learning_rate": 3.1528425685887874e-07, + "loss": 0.0929, + "step": 33847 + }, + { + "epoch": 92.22888283378747, + "grad_norm": 1.886380910873413, + "learning_rate": 3.15064443902624e-07, + "loss": 0.0492, + "step": 33848 + }, + { + "epoch": 92.2316076294278, + "grad_norm": 2.5071778297424316, + "learning_rate": 3.14844706372337e-07, + "loss": 0.0298, + "step": 33849 + }, + { + "epoch": 92.23433242506812, + "grad_norm": 2.0962769985198975, + "learning_rate": 3.146250442697285e-07, + "loss": 0.0935, + "step": 33850 + }, + { + "epoch": 92.23705722070845, + "grad_norm": 1.873889446258545, + "learning_rate": 3.144054575965072e-07, + "loss": 0.131, + "step": 33851 + }, + { + "epoch": 92.23978201634877, + "grad_norm": 2.5482842922210693, + "learning_rate": 3.141859463543839e-07, + "loss": 0.0302, + "step": 33852 + }, + { + "epoch": 92.2425068119891, + "grad_norm": 2.989535331726074, + "learning_rate": 3.1396651054506956e-07, + "loss": 0.0689, + "step": 33853 + }, + { + "epoch": 92.24523160762942, + "grad_norm": 4.189667701721191, + "learning_rate": 3.137471501702727e-07, + "loss": 0.1763, + "step": 33854 + }, + { + "epoch": 92.24795640326975, + "grad_norm": 2.7423295974731445, + "learning_rate": 3.1352786523170085e-07, + "loss": 0.0604, + "step": 33855 + }, + { + "epoch": 92.25068119891009, + "grad_norm": 2.076279640197754, + "learning_rate": 3.1330865573106274e-07, + "loss": 0.0995, + "step": 33856 + }, + { + "epoch": 92.2534059945504, + "grad_norm": 3.0084567070007324, + "learning_rate": 3.130895216700636e-07, + "loss": 0.0348, + "step": 33857 + }, + { + "epoch": 92.25613079019074, + "grad_norm": 2.3064050674438477, + "learning_rate": 3.1287046305041313e-07, + "loss": 0.0329, + "step": 33858 + }, + { + "epoch": 92.25885558583106, + "grad_norm": 2.7155561447143555, + "learning_rate": 3.126514798738156e-07, + "loss": 0.0493, + "step": 33859 + }, + { + "epoch": 92.26158038147139, + "grad_norm": 2.3363630771636963, + "learning_rate": 3.124325721419752e-07, + "loss": 0.1445, + "step": 33860 + }, + { + "epoch": 92.26430517711172, + "grad_norm": 2.6246142387390137, + "learning_rate": 3.122137398565994e-07, + "loss": 0.0325, + "step": 33861 + }, + { + "epoch": 92.26702997275204, + "grad_norm": 2.3935251235961914, + "learning_rate": 3.119949830193902e-07, + "loss": 0.0408, + "step": 33862 + }, + { + "epoch": 92.26975476839237, + "grad_norm": 2.4321534633636475, + "learning_rate": 3.1177630163205406e-07, + "loss": 0.0187, + "step": 33863 + }, + { + "epoch": 92.2724795640327, + "grad_norm": 2.471033811569214, + "learning_rate": 3.115576956962896e-07, + "loss": 0.0168, + "step": 33864 + }, + { + "epoch": 92.27520435967303, + "grad_norm": 3.132131576538086, + "learning_rate": 3.1133916521380427e-07, + "loss": 0.0318, + "step": 33865 + }, + { + "epoch": 92.27792915531334, + "grad_norm": 1.8041948080062866, + "learning_rate": 3.111207101862968e-07, + "loss": 0.1519, + "step": 33866 + }, + { + "epoch": 92.28065395095368, + "grad_norm": 2.8425796031951904, + "learning_rate": 3.1090233061547017e-07, + "loss": 0.0531, + "step": 33867 + }, + { + "epoch": 92.28337874659401, + "grad_norm": 2.4926719665527344, + "learning_rate": 3.106840265030231e-07, + "loss": 0.0273, + "step": 33868 + }, + { + "epoch": 92.28610354223433, + "grad_norm": 2.3687140941619873, + "learning_rate": 3.1046579785065756e-07, + "loss": 0.0198, + "step": 33869 + }, + { + "epoch": 92.28882833787466, + "grad_norm": 2.088261604309082, + "learning_rate": 3.1024764466007106e-07, + "loss": 0.1923, + "step": 33870 + }, + { + "epoch": 92.29155313351498, + "grad_norm": 1.6418927907943726, + "learning_rate": 3.100295669329667e-07, + "loss": 0.0157, + "step": 33871 + }, + { + "epoch": 92.29427792915531, + "grad_norm": 2.099968671798706, + "learning_rate": 3.0981156467103867e-07, + "loss": 0.0943, + "step": 33872 + }, + { + "epoch": 92.29700272479565, + "grad_norm": 2.534358024597168, + "learning_rate": 3.095936378759856e-07, + "loss": 0.0436, + "step": 33873 + }, + { + "epoch": 92.29972752043597, + "grad_norm": 1.4658430814743042, + "learning_rate": 3.0937578654950727e-07, + "loss": 0.0202, + "step": 33874 + }, + { + "epoch": 92.3024523160763, + "grad_norm": 1.372265338897705, + "learning_rate": 3.091580106932979e-07, + "loss": 0.0189, + "step": 33875 + }, + { + "epoch": 92.30517711171662, + "grad_norm": 2.6411492824554443, + "learning_rate": 3.089403103090538e-07, + "loss": 0.0938, + "step": 33876 + }, + { + "epoch": 92.30790190735695, + "grad_norm": 2.502680778503418, + "learning_rate": 3.0872268539846926e-07, + "loss": 0.0486, + "step": 33877 + }, + { + "epoch": 92.31062670299727, + "grad_norm": 2.4906811714172363, + "learning_rate": 3.0850513596324294e-07, + "loss": 0.0482, + "step": 33878 + }, + { + "epoch": 92.3133514986376, + "grad_norm": 2.694629430770874, + "learning_rate": 3.0828766200506563e-07, + "loss": 0.0248, + "step": 33879 + }, + { + "epoch": 92.31607629427793, + "grad_norm": 2.9682085514068604, + "learning_rate": 3.0807026352563273e-07, + "loss": 0.0943, + "step": 33880 + }, + { + "epoch": 92.31880108991825, + "grad_norm": 2.0423824787139893, + "learning_rate": 3.078529405266351e-07, + "loss": 0.0683, + "step": 33881 + }, + { + "epoch": 92.32152588555859, + "grad_norm": 2.5169155597686768, + "learning_rate": 3.0763569300976794e-07, + "loss": 0.0746, + "step": 33882 + }, + { + "epoch": 92.3242506811989, + "grad_norm": 3.171461820602417, + "learning_rate": 3.074185209767222e-07, + "loss": 0.0347, + "step": 33883 + }, + { + "epoch": 92.32697547683924, + "grad_norm": 1.595274567604065, + "learning_rate": 3.0720142442918765e-07, + "loss": 0.0359, + "step": 33884 + }, + { + "epoch": 92.32970027247957, + "grad_norm": 2.9492576122283936, + "learning_rate": 3.069844033688574e-07, + "loss": 0.0247, + "step": 33885 + }, + { + "epoch": 92.33242506811989, + "grad_norm": 2.830124616622925, + "learning_rate": 3.0676745779742114e-07, + "loss": 0.0705, + "step": 33886 + }, + { + "epoch": 92.33514986376022, + "grad_norm": 1.7882606983184814, + "learning_rate": 3.0655058771656755e-07, + "loss": 0.024, + "step": 33887 + }, + { + "epoch": 92.33787465940054, + "grad_norm": 3.2372705936431885, + "learning_rate": 3.0633379312798637e-07, + "loss": 0.1056, + "step": 33888 + }, + { + "epoch": 92.34059945504087, + "grad_norm": 2.8747408390045166, + "learning_rate": 3.061170740333641e-07, + "loss": 0.0396, + "step": 33889 + }, + { + "epoch": 92.34332425068119, + "grad_norm": 3.1066174507141113, + "learning_rate": 3.0590043043439156e-07, + "loss": 0.0566, + "step": 33890 + }, + { + "epoch": 92.34604904632153, + "grad_norm": 2.6151490211486816, + "learning_rate": 3.0568386233275404e-07, + "loss": 0.0434, + "step": 33891 + }, + { + "epoch": 92.34877384196186, + "grad_norm": 2.095111131668091, + "learning_rate": 3.0546736973013915e-07, + "loss": 0.0364, + "step": 33892 + }, + { + "epoch": 92.35149863760218, + "grad_norm": 2.777678966522217, + "learning_rate": 3.05250952628231e-07, + "loss": 0.1083, + "step": 33893 + }, + { + "epoch": 92.35422343324251, + "grad_norm": 4.020278453826904, + "learning_rate": 3.0503461102871836e-07, + "loss": 0.0248, + "step": 33894 + }, + { + "epoch": 92.35694822888283, + "grad_norm": 2.4880988597869873, + "learning_rate": 3.048183449332831e-07, + "loss": 0.1197, + "step": 33895 + }, + { + "epoch": 92.35967302452316, + "grad_norm": 2.075143575668335, + "learning_rate": 3.046021543436106e-07, + "loss": 0.0303, + "step": 33896 + }, + { + "epoch": 92.3623978201635, + "grad_norm": 2.5300533771514893, + "learning_rate": 3.04386039261384e-07, + "loss": 0.0272, + "step": 33897 + }, + { + "epoch": 92.36512261580381, + "grad_norm": 2.7739245891571045, + "learning_rate": 3.0416999968828743e-07, + "loss": 0.0377, + "step": 33898 + }, + { + "epoch": 92.36784741144415, + "grad_norm": 3.773585557937622, + "learning_rate": 3.039540356260029e-07, + "loss": 0.2318, + "step": 33899 + }, + { + "epoch": 92.37057220708446, + "grad_norm": 7.179575443267822, + "learning_rate": 3.037381470762124e-07, + "loss": 0.0426, + "step": 33900 + }, + { + "epoch": 92.3732970027248, + "grad_norm": 3.2828152179718018, + "learning_rate": 3.035223340405957e-07, + "loss": 0.0307, + "step": 33901 + }, + { + "epoch": 92.37602179836512, + "grad_norm": 1.574810266494751, + "learning_rate": 3.033065965208359e-07, + "loss": 0.0183, + "step": 33902 + }, + { + "epoch": 92.37874659400545, + "grad_norm": 3.448099374771118, + "learning_rate": 3.030909345186128e-07, + "loss": 0.0909, + "step": 33903 + }, + { + "epoch": 92.38147138964578, + "grad_norm": 2.6964199542999268, + "learning_rate": 3.028753480356061e-07, + "loss": 0.0343, + "step": 33904 + }, + { + "epoch": 92.3841961852861, + "grad_norm": 3.373821973800659, + "learning_rate": 3.026598370734912e-07, + "loss": 0.0957, + "step": 33905 + }, + { + "epoch": 92.38692098092643, + "grad_norm": 2.0266878604888916, + "learning_rate": 3.0244440163395115e-07, + "loss": 0.0232, + "step": 33906 + }, + { + "epoch": 92.38964577656675, + "grad_norm": 2.847181558609009, + "learning_rate": 3.022290417186624e-07, + "loss": 0.0471, + "step": 33907 + }, + { + "epoch": 92.39237057220708, + "grad_norm": 2.4669415950775146, + "learning_rate": 3.020137573293014e-07, + "loss": 0.0267, + "step": 33908 + }, + { + "epoch": 92.39509536784742, + "grad_norm": 2.3490042686462402, + "learning_rate": 3.0179854846754455e-07, + "loss": 0.1935, + "step": 33909 + }, + { + "epoch": 92.39782016348774, + "grad_norm": 2.1643900871276855, + "learning_rate": 3.015834151350694e-07, + "loss": 0.0982, + "step": 33910 + }, + { + "epoch": 92.40054495912807, + "grad_norm": 2.525986671447754, + "learning_rate": 3.0136835733355017e-07, + "loss": 0.1271, + "step": 33911 + }, + { + "epoch": 92.40326975476839, + "grad_norm": 2.159219264984131, + "learning_rate": 3.0115337506466226e-07, + "loss": 0.034, + "step": 33912 + }, + { + "epoch": 92.40599455040872, + "grad_norm": 1.880326271057129, + "learning_rate": 3.009384683300787e-07, + "loss": 0.0264, + "step": 33913 + }, + { + "epoch": 92.40871934604904, + "grad_norm": 2.5172228813171387, + "learning_rate": 3.007236371314748e-07, + "loss": 0.0838, + "step": 33914 + }, + { + "epoch": 92.41144414168937, + "grad_norm": 2.4819085597991943, + "learning_rate": 3.0050888147052373e-07, + "loss": 0.0646, + "step": 33915 + }, + { + "epoch": 92.4141689373297, + "grad_norm": 2.8474478721618652, + "learning_rate": 3.002942013488974e-07, + "loss": 0.1233, + "step": 33916 + }, + { + "epoch": 92.41689373297002, + "grad_norm": 3.8018252849578857, + "learning_rate": 3.000795967682657e-07, + "loss": 0.0632, + "step": 33917 + }, + { + "epoch": 92.41961852861036, + "grad_norm": 2.0780482292175293, + "learning_rate": 2.9986506773030386e-07, + "loss": 0.0195, + "step": 33918 + }, + { + "epoch": 92.42234332425068, + "grad_norm": 2.081063985824585, + "learning_rate": 2.996506142366795e-07, + "loss": 0.0369, + "step": 33919 + }, + { + "epoch": 92.42506811989101, + "grad_norm": 2.663294553756714, + "learning_rate": 2.994362362890657e-07, + "loss": 0.105, + "step": 33920 + }, + { + "epoch": 92.42779291553134, + "grad_norm": 6.76279354095459, + "learning_rate": 2.992219338891278e-07, + "loss": 0.0461, + "step": 33921 + }, + { + "epoch": 92.43051771117166, + "grad_norm": 7.834489345550537, + "learning_rate": 2.9900770703853774e-07, + "loss": 0.1696, + "step": 33922 + }, + { + "epoch": 92.433242506812, + "grad_norm": 2.504335880279541, + "learning_rate": 2.9879355573896427e-07, + "loss": 0.0169, + "step": 33923 + }, + { + "epoch": 92.43596730245231, + "grad_norm": 3.097688674926758, + "learning_rate": 2.9857947999207493e-07, + "loss": 0.114, + "step": 33924 + }, + { + "epoch": 92.43869209809264, + "grad_norm": 2.420255184173584, + "learning_rate": 2.98365479799535e-07, + "loss": 0.1299, + "step": 33925 + }, + { + "epoch": 92.44141689373296, + "grad_norm": 1.806056261062622, + "learning_rate": 2.981515551630132e-07, + "loss": 0.1179, + "step": 33926 + }, + { + "epoch": 92.4441416893733, + "grad_norm": 2.9265284538269043, + "learning_rate": 2.979377060841748e-07, + "loss": 0.0961, + "step": 33927 + }, + { + "epoch": 92.44686648501363, + "grad_norm": 1.9160208702087402, + "learning_rate": 2.9772393256468634e-07, + "loss": 0.0191, + "step": 33928 + }, + { + "epoch": 92.44959128065395, + "grad_norm": 4.044418811798096, + "learning_rate": 2.9751023460620975e-07, + "loss": 0.0364, + "step": 33929 + }, + { + "epoch": 92.45231607629428, + "grad_norm": 1.8257092237472534, + "learning_rate": 2.972966122104115e-07, + "loss": 0.0263, + "step": 33930 + }, + { + "epoch": 92.4550408719346, + "grad_norm": 4.9430084228515625, + "learning_rate": 2.9708306537895583e-07, + "loss": 0.0443, + "step": 33931 + }, + { + "epoch": 92.45776566757493, + "grad_norm": 2.891047716140747, + "learning_rate": 2.968695941135047e-07, + "loss": 0.0549, + "step": 33932 + }, + { + "epoch": 92.46049046321527, + "grad_norm": 2.730832576751709, + "learning_rate": 2.9665619841572015e-07, + "loss": 0.057, + "step": 33933 + }, + { + "epoch": 92.46321525885558, + "grad_norm": 2.0785939693450928, + "learning_rate": 2.964428782872664e-07, + "loss": 0.0262, + "step": 33934 + }, + { + "epoch": 92.46594005449592, + "grad_norm": 2.5021350383758545, + "learning_rate": 2.9622963372980204e-07, + "loss": 0.1014, + "step": 33935 + }, + { + "epoch": 92.46866485013624, + "grad_norm": 4.288695335388184, + "learning_rate": 2.9601646474498926e-07, + "loss": 0.089, + "step": 33936 + }, + { + "epoch": 92.47138964577657, + "grad_norm": 1.9641176462173462, + "learning_rate": 2.958033713344877e-07, + "loss": 0.0488, + "step": 33937 + }, + { + "epoch": 92.47411444141689, + "grad_norm": 1.865676999092102, + "learning_rate": 2.9559035349995715e-07, + "loss": 0.0206, + "step": 33938 + }, + { + "epoch": 92.47683923705722, + "grad_norm": 3.2440242767333984, + "learning_rate": 2.953774112430563e-07, + "loss": 0.0937, + "step": 33939 + }, + { + "epoch": 92.47956403269755, + "grad_norm": 3.238081932067871, + "learning_rate": 2.9516454456544386e-07, + "loss": 0.0362, + "step": 33940 + }, + { + "epoch": 92.48228882833787, + "grad_norm": 2.4168434143066406, + "learning_rate": 2.9495175346877846e-07, + "loss": 0.0429, + "step": 33941 + }, + { + "epoch": 92.4850136239782, + "grad_norm": 2.8645784854888916, + "learning_rate": 2.9473903795471546e-07, + "loss": 0.0703, + "step": 33942 + }, + { + "epoch": 92.48773841961852, + "grad_norm": 1.7716959714889526, + "learning_rate": 2.9452639802491356e-07, + "loss": 0.1213, + "step": 33943 + }, + { + "epoch": 92.49046321525886, + "grad_norm": 1.8242135047912598, + "learning_rate": 2.9431383368102696e-07, + "loss": 0.0413, + "step": 33944 + }, + { + "epoch": 92.49318801089919, + "grad_norm": 5.517455101013184, + "learning_rate": 2.941013449247132e-07, + "loss": 0.0914, + "step": 33945 + }, + { + "epoch": 92.49591280653951, + "grad_norm": 1.8510369062423706, + "learning_rate": 2.9388893175762325e-07, + "loss": 0.0972, + "step": 33946 + }, + { + "epoch": 92.49863760217984, + "grad_norm": 9.689813613891602, + "learning_rate": 2.936765941814157e-07, + "loss": 0.2035, + "step": 33947 + }, + { + "epoch": 92.50136239782016, + "grad_norm": 4.921730995178223, + "learning_rate": 2.934643321977426e-07, + "loss": 0.0542, + "step": 33948 + }, + { + "epoch": 92.50408719346049, + "grad_norm": 2.1656479835510254, + "learning_rate": 2.932521458082549e-07, + "loss": 0.0777, + "step": 33949 + }, + { + "epoch": 92.50681198910081, + "grad_norm": 1.4755820035934448, + "learning_rate": 2.93040035014609e-07, + "loss": 0.0167, + "step": 33950 + }, + { + "epoch": 92.50953678474114, + "grad_norm": 1.8112258911132812, + "learning_rate": 2.9282799981845464e-07, + "loss": 0.0222, + "step": 33951 + }, + { + "epoch": 92.51226158038148, + "grad_norm": 2.7130534648895264, + "learning_rate": 2.9261604022144397e-07, + "loss": 0.0382, + "step": 33952 + }, + { + "epoch": 92.5149863760218, + "grad_norm": 3.03053879737854, + "learning_rate": 2.9240415622522557e-07, + "loss": 0.0258, + "step": 33953 + }, + { + "epoch": 92.51771117166213, + "grad_norm": 2.6802375316619873, + "learning_rate": 2.9219234783145147e-07, + "loss": 0.042, + "step": 33954 + }, + { + "epoch": 92.52043596730245, + "grad_norm": 1.7798711061477661, + "learning_rate": 2.9198061504177144e-07, + "loss": 0.0275, + "step": 33955 + }, + { + "epoch": 92.52316076294278, + "grad_norm": 2.7639007568359375, + "learning_rate": 2.917689578578331e-07, + "loss": 0.0403, + "step": 33956 + }, + { + "epoch": 92.52588555858311, + "grad_norm": 2.2817227840423584, + "learning_rate": 2.915573762812873e-07, + "loss": 0.0218, + "step": 33957 + }, + { + "epoch": 92.52861035422343, + "grad_norm": 2.4043657779693604, + "learning_rate": 2.9134587031377835e-07, + "loss": 0.037, + "step": 33958 + }, + { + "epoch": 92.53133514986376, + "grad_norm": 2.5717053413391113, + "learning_rate": 2.91134439956956e-07, + "loss": 0.0334, + "step": 33959 + }, + { + "epoch": 92.53405994550408, + "grad_norm": 1.61574387550354, + "learning_rate": 2.909230852124667e-07, + "loss": 0.0585, + "step": 33960 + }, + { + "epoch": 92.53678474114442, + "grad_norm": 5.058300495147705, + "learning_rate": 2.907118060819569e-07, + "loss": 0.0487, + "step": 33961 + }, + { + "epoch": 92.53950953678473, + "grad_norm": 8.652349472045898, + "learning_rate": 2.905006025670687e-07, + "loss": 0.051, + "step": 33962 + }, + { + "epoch": 92.54223433242507, + "grad_norm": 1.8410452604293823, + "learning_rate": 2.902894746694507e-07, + "loss": 0.0222, + "step": 33963 + }, + { + "epoch": 92.5449591280654, + "grad_norm": 2.593010902404785, + "learning_rate": 2.90078422390746e-07, + "loss": 0.1177, + "step": 33964 + }, + { + "epoch": 92.54768392370572, + "grad_norm": 2.5542678833007812, + "learning_rate": 2.898674457325967e-07, + "loss": 0.0236, + "step": 33965 + }, + { + "epoch": 92.55040871934605, + "grad_norm": 2.2600033283233643, + "learning_rate": 2.8965654469664815e-07, + "loss": 0.0518, + "step": 33966 + }, + { + "epoch": 92.55313351498637, + "grad_norm": 3.8037288188934326, + "learning_rate": 2.8944571928454126e-07, + "loss": 0.034, + "step": 33967 + }, + { + "epoch": 92.5558583106267, + "grad_norm": 2.4722979068756104, + "learning_rate": 2.892349694979202e-07, + "loss": 0.0835, + "step": 33968 + }, + { + "epoch": 92.55858310626704, + "grad_norm": 2.584477424621582, + "learning_rate": 2.890242953384237e-07, + "loss": 0.0879, + "step": 33969 + }, + { + "epoch": 92.56130790190736, + "grad_norm": 3.628197431564331, + "learning_rate": 2.888136968076927e-07, + "loss": 0.0753, + "step": 33970 + }, + { + "epoch": 92.56403269754769, + "grad_norm": 4.6860456466674805, + "learning_rate": 2.88603173907368e-07, + "loss": 0.028, + "step": 33971 + }, + { + "epoch": 92.566757493188, + "grad_norm": 2.555469512939453, + "learning_rate": 2.883927266390907e-07, + "loss": 0.1143, + "step": 33972 + }, + { + "epoch": 92.56948228882834, + "grad_norm": 2.003568410873413, + "learning_rate": 2.88182355004496e-07, + "loss": 0.0231, + "step": 33973 + }, + { + "epoch": 92.57220708446866, + "grad_norm": 2.3181540966033936, + "learning_rate": 2.8797205900522594e-07, + "loss": 0.0463, + "step": 33974 + }, + { + "epoch": 92.57493188010899, + "grad_norm": 2.0930943489074707, + "learning_rate": 2.877618386429171e-07, + "loss": 0.0286, + "step": 33975 + }, + { + "epoch": 92.57765667574932, + "grad_norm": 3.4334566593170166, + "learning_rate": 2.875516939192069e-07, + "loss": 0.1159, + "step": 33976 + }, + { + "epoch": 92.58038147138964, + "grad_norm": 2.914374589920044, + "learning_rate": 2.873416248357308e-07, + "loss": 0.0362, + "step": 33977 + }, + { + "epoch": 92.58310626702998, + "grad_norm": 2.764923572540283, + "learning_rate": 2.8713163139412527e-07, + "loss": 0.0882, + "step": 33978 + }, + { + "epoch": 92.5858310626703, + "grad_norm": 2.67028546333313, + "learning_rate": 2.869217135960267e-07, + "loss": 0.0173, + "step": 33979 + }, + { + "epoch": 92.58855585831063, + "grad_norm": 3.2267072200775146, + "learning_rate": 2.8671187144306834e-07, + "loss": 0.1514, + "step": 33980 + }, + { + "epoch": 92.59128065395096, + "grad_norm": 3.0317184925079346, + "learning_rate": 2.8650210493688656e-07, + "loss": 0.0301, + "step": 33981 + }, + { + "epoch": 92.59400544959128, + "grad_norm": 2.4306561946868896, + "learning_rate": 2.862924140791123e-07, + "loss": 0.0282, + "step": 33982 + }, + { + "epoch": 92.59673024523161, + "grad_norm": 3.262852668762207, + "learning_rate": 2.8608279887138103e-07, + "loss": 0.1281, + "step": 33983 + }, + { + "epoch": 92.59945504087193, + "grad_norm": 1.7691593170166016, + "learning_rate": 2.858732593153246e-07, + "loss": 0.0888, + "step": 33984 + }, + { + "epoch": 92.60217983651226, + "grad_norm": 2.297663450241089, + "learning_rate": 2.8566379541257406e-07, + "loss": 0.0638, + "step": 33985 + }, + { + "epoch": 92.60490463215258, + "grad_norm": 2.7999699115753174, + "learning_rate": 2.8545440716476025e-07, + "loss": 0.0363, + "step": 33986 + }, + { + "epoch": 92.60762942779292, + "grad_norm": 2.7875518798828125, + "learning_rate": 2.8524509457351635e-07, + "loss": 0.2239, + "step": 33987 + }, + { + "epoch": 92.61035422343325, + "grad_norm": 2.7598700523376465, + "learning_rate": 2.85035857640471e-07, + "loss": 0.066, + "step": 33988 + }, + { + "epoch": 92.61307901907357, + "grad_norm": 2.471369743347168, + "learning_rate": 2.84826696367253e-07, + "loss": 0.0293, + "step": 33989 + }, + { + "epoch": 92.6158038147139, + "grad_norm": 4.669155597686768, + "learning_rate": 2.846176107554921e-07, + "loss": 0.1098, + "step": 33990 + }, + { + "epoch": 92.61852861035422, + "grad_norm": 3.655745029449463, + "learning_rate": 2.8440860080681587e-07, + "loss": 0.053, + "step": 33991 + }, + { + "epoch": 92.62125340599455, + "grad_norm": 4.2164387702941895, + "learning_rate": 2.8419966652285303e-07, + "loss": 0.0607, + "step": 33992 + }, + { + "epoch": 92.62397820163488, + "grad_norm": 2.9698784351348877, + "learning_rate": 2.8399080790523227e-07, + "loss": 0.0811, + "step": 33993 + }, + { + "epoch": 92.6267029972752, + "grad_norm": 2.3326776027679443, + "learning_rate": 2.837820249555756e-07, + "loss": 0.0591, + "step": 33994 + }, + { + "epoch": 92.62942779291554, + "grad_norm": 2.5954360961914062, + "learning_rate": 2.8357331767551397e-07, + "loss": 0.1233, + "step": 33995 + }, + { + "epoch": 92.63215258855585, + "grad_norm": 2.092036485671997, + "learning_rate": 2.8336468606667057e-07, + "loss": 0.0322, + "step": 33996 + }, + { + "epoch": 92.63487738419619, + "grad_norm": 2.1663055419921875, + "learning_rate": 2.8315613013066954e-07, + "loss": 0.0681, + "step": 33997 + }, + { + "epoch": 92.6376021798365, + "grad_norm": 3.1835341453552246, + "learning_rate": 2.8294764986913524e-07, + "loss": 0.0715, + "step": 33998 + }, + { + "epoch": 92.64032697547684, + "grad_norm": 2.3628365993499756, + "learning_rate": 2.82739245283693e-07, + "loss": 0.0383, + "step": 33999 + }, + { + "epoch": 92.64305177111717, + "grad_norm": 2.6618759632110596, + "learning_rate": 2.8253091637596485e-07, + "loss": 0.0366, + "step": 34000 + }, + { + "epoch": 92.64577656675749, + "grad_norm": 1.9609527587890625, + "learning_rate": 2.8232266314757286e-07, + "loss": 0.0268, + "step": 34001 + }, + { + "epoch": 92.64850136239782, + "grad_norm": 2.5003442764282227, + "learning_rate": 2.8211448560013787e-07, + "loss": 0.0296, + "step": 34002 + }, + { + "epoch": 92.65122615803814, + "grad_norm": 2.237795829772949, + "learning_rate": 2.8190638373528423e-07, + "loss": 0.1536, + "step": 34003 + }, + { + "epoch": 92.65395095367847, + "grad_norm": 1.9150476455688477, + "learning_rate": 2.816983575546306e-07, + "loss": 0.0887, + "step": 34004 + }, + { + "epoch": 92.65667574931881, + "grad_norm": 1.8825595378875732, + "learning_rate": 2.814904070597979e-07, + "loss": 0.0742, + "step": 34005 + }, + { + "epoch": 92.65940054495913, + "grad_norm": 2.8478167057037354, + "learning_rate": 2.8128253225240376e-07, + "loss": 0.0588, + "step": 34006 + }, + { + "epoch": 92.66212534059946, + "grad_norm": 2.597182035446167, + "learning_rate": 2.810747331340691e-07, + "loss": 0.0318, + "step": 34007 + }, + { + "epoch": 92.66485013623978, + "grad_norm": 2.7154324054718018, + "learning_rate": 2.8086700970641034e-07, + "loss": 0.0613, + "step": 34008 + }, + { + "epoch": 92.66757493188011, + "grad_norm": 1.348683476448059, + "learning_rate": 2.806593619710485e-07, + "loss": 0.0579, + "step": 34009 + }, + { + "epoch": 92.67029972752043, + "grad_norm": 2.6856653690338135, + "learning_rate": 2.804517899295978e-07, + "loss": 0.0467, + "step": 34010 + }, + { + "epoch": 92.67302452316076, + "grad_norm": 2.5943455696105957, + "learning_rate": 2.802442935836758e-07, + "loss": 0.0436, + "step": 34011 + }, + { + "epoch": 92.6757493188011, + "grad_norm": 2.033085346221924, + "learning_rate": 2.800368729348979e-07, + "loss": 0.0649, + "step": 34012 + }, + { + "epoch": 92.67847411444141, + "grad_norm": 2.114762783050537, + "learning_rate": 2.798295279848817e-07, + "loss": 0.0651, + "step": 34013 + }, + { + "epoch": 92.68119891008175, + "grad_norm": 1.8358843326568604, + "learning_rate": 2.796222587352382e-07, + "loss": 0.0417, + "step": 34014 + }, + { + "epoch": 92.68392370572207, + "grad_norm": 2.147197961807251, + "learning_rate": 2.7941506518758486e-07, + "loss": 0.0844, + "step": 34015 + }, + { + "epoch": 92.6866485013624, + "grad_norm": 3.4548144340515137, + "learning_rate": 2.7920794734353384e-07, + "loss": 0.1095, + "step": 34016 + }, + { + "epoch": 92.68937329700273, + "grad_norm": 2.261824607849121, + "learning_rate": 2.790009052046994e-07, + "loss": 0.0237, + "step": 34017 + }, + { + "epoch": 92.69209809264305, + "grad_norm": 3.58293080329895, + "learning_rate": 2.787939387726912e-07, + "loss": 0.1708, + "step": 34018 + }, + { + "epoch": 92.69482288828338, + "grad_norm": 2.4535138607025146, + "learning_rate": 2.7858704804912483e-07, + "loss": 0.0762, + "step": 34019 + }, + { + "epoch": 92.6975476839237, + "grad_norm": 2.3390798568725586, + "learning_rate": 2.7838023303560893e-07, + "loss": 0.0258, + "step": 34020 + }, + { + "epoch": 92.70027247956403, + "grad_norm": 3.6526169776916504, + "learning_rate": 2.7817349373375545e-07, + "loss": 0.1148, + "step": 34021 + }, + { + "epoch": 92.70299727520435, + "grad_norm": 3.0535171031951904, + "learning_rate": 2.779668301451721e-07, + "loss": 0.1209, + "step": 34022 + }, + { + "epoch": 92.70572207084469, + "grad_norm": 2.691586971282959, + "learning_rate": 2.7776024227147093e-07, + "loss": 0.1376, + "step": 34023 + }, + { + "epoch": 92.70844686648502, + "grad_norm": 2.9899306297302246, + "learning_rate": 2.775537301142617e-07, + "loss": 0.0464, + "step": 34024 + }, + { + "epoch": 92.71117166212534, + "grad_norm": 2.928201675415039, + "learning_rate": 2.773472936751487e-07, + "loss": 0.0454, + "step": 34025 + }, + { + "epoch": 92.71389645776567, + "grad_norm": 2.3313519954681396, + "learning_rate": 2.7714093295574285e-07, + "loss": 0.0542, + "step": 34026 + }, + { + "epoch": 92.71662125340599, + "grad_norm": 2.7227885723114014, + "learning_rate": 2.769346479576507e-07, + "loss": 0.0309, + "step": 34027 + }, + { + "epoch": 92.71934604904632, + "grad_norm": 2.697957992553711, + "learning_rate": 2.7672843868247865e-07, + "loss": 0.0889, + "step": 34028 + }, + { + "epoch": 92.72207084468666, + "grad_norm": 2.8073959350585938, + "learning_rate": 2.765223051318333e-07, + "loss": 0.0918, + "step": 34029 + }, + { + "epoch": 92.72479564032697, + "grad_norm": 2.9638912677764893, + "learning_rate": 2.7631624730731887e-07, + "loss": 0.0469, + "step": 34030 + }, + { + "epoch": 92.7275204359673, + "grad_norm": 2.047313928604126, + "learning_rate": 2.7611026521053963e-07, + "loss": 0.0369, + "step": 34031 + }, + { + "epoch": 92.73024523160763, + "grad_norm": 2.096829414367676, + "learning_rate": 2.75904358843101e-07, + "loss": 0.178, + "step": 34032 + }, + { + "epoch": 92.73297002724796, + "grad_norm": 1.9505131244659424, + "learning_rate": 2.7569852820660713e-07, + "loss": 0.0207, + "step": 34033 + }, + { + "epoch": 92.73569482288828, + "grad_norm": 2.60426664352417, + "learning_rate": 2.754927733026591e-07, + "loss": 0.0933, + "step": 34034 + }, + { + "epoch": 92.73841961852861, + "grad_norm": 2.333433151245117, + "learning_rate": 2.7528709413286116e-07, + "loss": 0.0694, + "step": 34035 + }, + { + "epoch": 92.74114441416894, + "grad_norm": 5.702267646789551, + "learning_rate": 2.750814906988142e-07, + "loss": 0.0833, + "step": 34036 + }, + { + "epoch": 92.74386920980926, + "grad_norm": 2.6554129123687744, + "learning_rate": 2.748759630021203e-07, + "loss": 0.0762, + "step": 34037 + }, + { + "epoch": 92.7465940054496, + "grad_norm": 2.1196606159210205, + "learning_rate": 2.74670511044377e-07, + "loss": 0.0267, + "step": 34038 + }, + { + "epoch": 92.74931880108991, + "grad_norm": 3.2828564643859863, + "learning_rate": 2.7446513482718874e-07, + "loss": 0.0958, + "step": 34039 + }, + { + "epoch": 92.75204359673025, + "grad_norm": 1.9908270835876465, + "learning_rate": 2.74259834352153e-07, + "loss": 0.0813, + "step": 34040 + }, + { + "epoch": 92.75476839237058, + "grad_norm": 2.8551061153411865, + "learning_rate": 2.740546096208685e-07, + "loss": 0.0485, + "step": 34041 + }, + { + "epoch": 92.7574931880109, + "grad_norm": 2.666900634765625, + "learning_rate": 2.738494606349329e-07, + "loss": 0.1288, + "step": 34042 + }, + { + "epoch": 92.76021798365123, + "grad_norm": 2.8463668823242188, + "learning_rate": 2.736443873959449e-07, + "loss": 0.0801, + "step": 34043 + }, + { + "epoch": 92.76294277929155, + "grad_norm": 2.9144234657287598, + "learning_rate": 2.73439389905501e-07, + "loss": 0.1398, + "step": 34044 + }, + { + "epoch": 92.76566757493188, + "grad_norm": 3.478212833404541, + "learning_rate": 2.7323446816519993e-07, + "loss": 0.0857, + "step": 34045 + }, + { + "epoch": 92.7683923705722, + "grad_norm": 2.7649264335632324, + "learning_rate": 2.7302962217663486e-07, + "loss": 0.0933, + "step": 34046 + }, + { + "epoch": 92.77111716621253, + "grad_norm": 1.8461920022964478, + "learning_rate": 2.728248519414001e-07, + "loss": 0.0556, + "step": 34047 + }, + { + "epoch": 92.77384196185287, + "grad_norm": 1.3719723224639893, + "learning_rate": 2.7262015746109425e-07, + "loss": 0.0191, + "step": 34048 + }, + { + "epoch": 92.77656675749319, + "grad_norm": 1.9794155359268188, + "learning_rate": 2.7241553873730953e-07, + "loss": 0.0377, + "step": 34049 + }, + { + "epoch": 92.77929155313352, + "grad_norm": 2.6414873600006104, + "learning_rate": 2.722109957716401e-07, + "loss": 0.0381, + "step": 34050 + }, + { + "epoch": 92.78201634877384, + "grad_norm": 1.8735049962997437, + "learning_rate": 2.72006528565677e-07, + "loss": 0.0307, + "step": 34051 + }, + { + "epoch": 92.78474114441417, + "grad_norm": 2.5010695457458496, + "learning_rate": 2.7180213712101444e-07, + "loss": 0.0549, + "step": 34052 + }, + { + "epoch": 92.7874659400545, + "grad_norm": 3.3076906204223633, + "learning_rate": 2.715978214392434e-07, + "loss": 0.0963, + "step": 34053 + }, + { + "epoch": 92.79019073569482, + "grad_norm": 2.291006088256836, + "learning_rate": 2.7139358152195707e-07, + "loss": 0.0794, + "step": 34054 + }, + { + "epoch": 92.79291553133515, + "grad_norm": 2.7565507888793945, + "learning_rate": 2.711894173707419e-07, + "loss": 0.0644, + "step": 34055 + }, + { + "epoch": 92.79564032697547, + "grad_norm": 2.482112169265747, + "learning_rate": 2.709853289871922e-07, + "loss": 0.0345, + "step": 34056 + }, + { + "epoch": 92.7983651226158, + "grad_norm": 4.1855974197387695, + "learning_rate": 2.707813163728945e-07, + "loss": 0.0315, + "step": 34057 + }, + { + "epoch": 92.80108991825612, + "grad_norm": 3.153151512145996, + "learning_rate": 2.7057737952943863e-07, + "loss": 0.0973, + "step": 34058 + }, + { + "epoch": 92.80381471389646, + "grad_norm": 2.8204071521759033, + "learning_rate": 2.703735184584133e-07, + "loss": 0.1251, + "step": 34059 + }, + { + "epoch": 92.80653950953679, + "grad_norm": 2.1790354251861572, + "learning_rate": 2.701697331614062e-07, + "loss": 0.0381, + "step": 34060 + }, + { + "epoch": 92.80926430517711, + "grad_norm": 1.5505914688110352, + "learning_rate": 2.699660236400048e-07, + "loss": 0.0189, + "step": 34061 + }, + { + "epoch": 92.81198910081744, + "grad_norm": 2.216620445251465, + "learning_rate": 2.697623898957946e-07, + "loss": 0.037, + "step": 34062 + }, + { + "epoch": 92.81471389645776, + "grad_norm": 2.371647834777832, + "learning_rate": 2.695588319303599e-07, + "loss": 0.0263, + "step": 34063 + }, + { + "epoch": 92.8174386920981, + "grad_norm": 4.299121856689453, + "learning_rate": 2.693553497452905e-07, + "loss": 0.0937, + "step": 34064 + }, + { + "epoch": 92.82016348773843, + "grad_norm": 2.558760643005371, + "learning_rate": 2.6915194334216743e-07, + "loss": 0.1025, + "step": 34065 + }, + { + "epoch": 92.82288828337875, + "grad_norm": 2.4167726039886475, + "learning_rate": 2.68948612722576e-07, + "loss": 0.0633, + "step": 34066 + }, + { + "epoch": 92.82561307901908, + "grad_norm": 5.8445634841918945, + "learning_rate": 2.687453578880983e-07, + "loss": 0.0416, + "step": 34067 + }, + { + "epoch": 92.8283378746594, + "grad_norm": 2.8583555221557617, + "learning_rate": 2.6854217884031974e-07, + "loss": 0.0557, + "step": 34068 + }, + { + "epoch": 92.83106267029973, + "grad_norm": 2.0511131286621094, + "learning_rate": 2.683390755808213e-07, + "loss": 0.0339, + "step": 34069 + }, + { + "epoch": 92.83378746594005, + "grad_norm": 2.37980055809021, + "learning_rate": 2.68136048111185e-07, + "loss": 0.0433, + "step": 34070 + }, + { + "epoch": 92.83651226158038, + "grad_norm": 2.8480749130249023, + "learning_rate": 2.679330964329907e-07, + "loss": 0.0747, + "step": 34071 + }, + { + "epoch": 92.83923705722071, + "grad_norm": 2.049267053604126, + "learning_rate": 2.677302205478216e-07, + "loss": 0.0238, + "step": 34072 + }, + { + "epoch": 92.84196185286103, + "grad_norm": 2.4598608016967773, + "learning_rate": 2.675274204572564e-07, + "loss": 0.0273, + "step": 34073 + }, + { + "epoch": 92.84468664850137, + "grad_norm": 2.6839537620544434, + "learning_rate": 2.6732469616287393e-07, + "loss": 0.043, + "step": 34074 + }, + { + "epoch": 92.84741144414168, + "grad_norm": 1.7694298028945923, + "learning_rate": 2.671220476662528e-07, + "loss": 0.0244, + "step": 34075 + }, + { + "epoch": 92.85013623978202, + "grad_norm": 4.0129547119140625, + "learning_rate": 2.66919474968973e-07, + "loss": 0.0408, + "step": 34076 + }, + { + "epoch": 92.85286103542235, + "grad_norm": 2.5996809005737305, + "learning_rate": 2.667169780726109e-07, + "loss": 0.031, + "step": 34077 + }, + { + "epoch": 92.85558583106267, + "grad_norm": 1.9990999698638916, + "learning_rate": 2.6651455697874306e-07, + "loss": 0.0315, + "step": 34078 + }, + { + "epoch": 92.858310626703, + "grad_norm": 3.263554811477661, + "learning_rate": 2.6631221168894603e-07, + "loss": 0.0862, + "step": 34079 + }, + { + "epoch": 92.86103542234332, + "grad_norm": 3.1881675720214844, + "learning_rate": 2.661099422047986e-07, + "loss": 0.0491, + "step": 34080 + }, + { + "epoch": 92.86376021798365, + "grad_norm": 2.8475282192230225, + "learning_rate": 2.659077485278716e-07, + "loss": 0.1043, + "step": 34081 + }, + { + "epoch": 92.86648501362397, + "grad_norm": 2.2266502380371094, + "learning_rate": 2.6570563065974273e-07, + "loss": 0.0251, + "step": 34082 + }, + { + "epoch": 92.8692098092643, + "grad_norm": 2.85383677482605, + "learning_rate": 2.655035886019841e-07, + "loss": 0.0694, + "step": 34083 + }, + { + "epoch": 92.87193460490464, + "grad_norm": 2.5152273178100586, + "learning_rate": 2.653016223561722e-07, + "loss": 0.0277, + "step": 34084 + }, + { + "epoch": 92.87465940054496, + "grad_norm": 2.0699732303619385, + "learning_rate": 2.650997319238768e-07, + "loss": 0.0297, + "step": 34085 + }, + { + "epoch": 92.87738419618529, + "grad_norm": 2.2521121501922607, + "learning_rate": 2.6489791730667125e-07, + "loss": 0.0556, + "step": 34086 + }, + { + "epoch": 92.88010899182561, + "grad_norm": 4.227232933044434, + "learning_rate": 2.6469617850612637e-07, + "loss": 0.0309, + "step": 34087 + }, + { + "epoch": 92.88283378746594, + "grad_norm": 3.299978494644165, + "learning_rate": 2.6449451552381653e-07, + "loss": 0.042, + "step": 34088 + }, + { + "epoch": 92.88555858310627, + "grad_norm": 1.921689510345459, + "learning_rate": 2.642929283613094e-07, + "loss": 0.0245, + "step": 34089 + }, + { + "epoch": 92.88828337874659, + "grad_norm": 2.025585174560547, + "learning_rate": 2.640914170201747e-07, + "loss": 0.0316, + "step": 34090 + }, + { + "epoch": 92.89100817438693, + "grad_norm": 3.765036106109619, + "learning_rate": 2.6388998150198243e-07, + "loss": 0.0277, + "step": 34091 + }, + { + "epoch": 92.89373297002724, + "grad_norm": 2.3546907901763916, + "learning_rate": 2.6368862180830234e-07, + "loss": 0.0305, + "step": 34092 + }, + { + "epoch": 92.89645776566758, + "grad_norm": 3.1595547199249268, + "learning_rate": 2.6348733794070215e-07, + "loss": 0.0391, + "step": 34093 + }, + { + "epoch": 92.8991825613079, + "grad_norm": 2.0853705406188965, + "learning_rate": 2.632861299007483e-07, + "loss": 0.0227, + "step": 34094 + }, + { + "epoch": 92.90190735694823, + "grad_norm": 2.2090907096862793, + "learning_rate": 2.6308499769000963e-07, + "loss": 0.1551, + "step": 34095 + }, + { + "epoch": 92.90463215258856, + "grad_norm": 2.1396069526672363, + "learning_rate": 2.6288394131005147e-07, + "loss": 0.0316, + "step": 34096 + }, + { + "epoch": 92.90735694822888, + "grad_norm": 1.9962027072906494, + "learning_rate": 2.6268296076243925e-07, + "loss": 0.0397, + "step": 34097 + }, + { + "epoch": 92.91008174386921, + "grad_norm": 3.098529815673828, + "learning_rate": 2.6248205604873955e-07, + "loss": 0.0372, + "step": 34098 + }, + { + "epoch": 92.91280653950953, + "grad_norm": 1.867499828338623, + "learning_rate": 2.622812271705155e-07, + "loss": 0.0802, + "step": 34099 + }, + { + "epoch": 92.91553133514986, + "grad_norm": 3.4928348064422607, + "learning_rate": 2.6208047412933145e-07, + "loss": 0.0863, + "step": 34100 + }, + { + "epoch": 92.9182561307902, + "grad_norm": 2.3808937072753906, + "learning_rate": 2.618797969267528e-07, + "loss": 0.134, + "step": 34101 + }, + { + "epoch": 92.92098092643052, + "grad_norm": 2.0302734375, + "learning_rate": 2.616791955643405e-07, + "loss": 0.0347, + "step": 34102 + }, + { + "epoch": 92.92370572207085, + "grad_norm": 3.0014467239379883, + "learning_rate": 2.614786700436556e-07, + "loss": 0.0685, + "step": 34103 + }, + { + "epoch": 92.92643051771117, + "grad_norm": 2.118467092514038, + "learning_rate": 2.6127822036626337e-07, + "loss": 0.0334, + "step": 34104 + }, + { + "epoch": 92.9291553133515, + "grad_norm": 2.6980319023132324, + "learning_rate": 2.610778465337216e-07, + "loss": 0.0775, + "step": 34105 + }, + { + "epoch": 92.93188010899182, + "grad_norm": 2.85756254196167, + "learning_rate": 2.608775485475934e-07, + "loss": 0.0507, + "step": 34106 + }, + { + "epoch": 92.93460490463215, + "grad_norm": 2.651165723800659, + "learning_rate": 2.606773264094353e-07, + "loss": 0.0421, + "step": 34107 + }, + { + "epoch": 92.93732970027249, + "grad_norm": 2.8043205738067627, + "learning_rate": 2.6047718012081056e-07, + "loss": 0.0273, + "step": 34108 + }, + { + "epoch": 92.9400544959128, + "grad_norm": 1.5109548568725586, + "learning_rate": 2.602771096832757e-07, + "loss": 0.0216, + "step": 34109 + }, + { + "epoch": 92.94277929155314, + "grad_norm": 3.034245491027832, + "learning_rate": 2.600771150983894e-07, + "loss": 0.0412, + "step": 34110 + }, + { + "epoch": 92.94550408719346, + "grad_norm": 1.7956622838974, + "learning_rate": 2.5987719636770824e-07, + "loss": 0.0181, + "step": 34111 + }, + { + "epoch": 92.94822888283379, + "grad_norm": 2.136606216430664, + "learning_rate": 2.5967735349278877e-07, + "loss": 0.0679, + "step": 34112 + }, + { + "epoch": 92.95095367847412, + "grad_norm": 6.898420810699463, + "learning_rate": 2.5947758647519085e-07, + "loss": 0.0742, + "step": 34113 + }, + { + "epoch": 92.95367847411444, + "grad_norm": 2.685142755508423, + "learning_rate": 2.592778953164676e-07, + "loss": 0.0492, + "step": 34114 + }, + { + "epoch": 92.95640326975477, + "grad_norm": 2.132816791534424, + "learning_rate": 2.590782800181746e-07, + "loss": 0.0309, + "step": 34115 + }, + { + "epoch": 92.95912806539509, + "grad_norm": 2.2591047286987305, + "learning_rate": 2.5887874058186604e-07, + "loss": 0.0847, + "step": 34116 + }, + { + "epoch": 92.96185286103542, + "grad_norm": 2.0352091789245605, + "learning_rate": 2.5867927700909624e-07, + "loss": 0.0544, + "step": 34117 + }, + { + "epoch": 92.96457765667574, + "grad_norm": 1.5847419500350952, + "learning_rate": 2.584798893014195e-07, + "loss": 0.0198, + "step": 34118 + }, + { + "epoch": 92.96730245231608, + "grad_norm": 2.906217336654663, + "learning_rate": 2.58280577460388e-07, + "loss": 0.0427, + "step": 34119 + }, + { + "epoch": 92.97002724795641, + "grad_norm": 1.7440987825393677, + "learning_rate": 2.580813414875516e-07, + "loss": 0.0764, + "step": 34120 + }, + { + "epoch": 92.97275204359673, + "grad_norm": 1.9244767427444458, + "learning_rate": 2.578821813844667e-07, + "loss": 0.0396, + "step": 34121 + }, + { + "epoch": 92.97547683923706, + "grad_norm": 2.3534650802612305, + "learning_rate": 2.5768309715268116e-07, + "loss": 0.0735, + "step": 34122 + }, + { + "epoch": 92.97820163487738, + "grad_norm": 3.1908464431762695, + "learning_rate": 2.5748408879374463e-07, + "loss": 0.0278, + "step": 34123 + }, + { + "epoch": 92.98092643051771, + "grad_norm": 2.015676498413086, + "learning_rate": 2.572851563092105e-07, + "loss": 0.0538, + "step": 34124 + }, + { + "epoch": 92.98365122615803, + "grad_norm": 2.5479812622070312, + "learning_rate": 2.5708629970062516e-07, + "loss": 0.0211, + "step": 34125 + }, + { + "epoch": 92.98637602179836, + "grad_norm": 2.6128368377685547, + "learning_rate": 2.5688751896953854e-07, + "loss": 0.0451, + "step": 34126 + }, + { + "epoch": 92.9891008174387, + "grad_norm": 2.622509717941284, + "learning_rate": 2.566888141174972e-07, + "loss": 0.0434, + "step": 34127 + }, + { + "epoch": 92.99182561307902, + "grad_norm": 2.1178672313690186, + "learning_rate": 2.5649018514604995e-07, + "loss": 0.0419, + "step": 34128 + }, + { + "epoch": 92.99455040871935, + "grad_norm": 2.688542604446411, + "learning_rate": 2.5629163205674434e-07, + "loss": 0.0435, + "step": 34129 + }, + { + "epoch": 92.99727520435967, + "grad_norm": 3.2054944038391113, + "learning_rate": 2.5609315485112583e-07, + "loss": 0.0137, + "step": 34130 + }, + { + "epoch": 93.0, + "grad_norm": 2.3210439682006836, + "learning_rate": 2.5589475353073987e-07, + "loss": 0.0262, + "step": 34131 + }, + { + "epoch": 93.00272479564033, + "grad_norm": 4.622258186340332, + "learning_rate": 2.556964280971319e-07, + "loss": 0.0309, + "step": 34132 + }, + { + "epoch": 93.00544959128065, + "grad_norm": 2.673596143722534, + "learning_rate": 2.5549817855184624e-07, + "loss": 0.0432, + "step": 34133 + }, + { + "epoch": 93.00817438692098, + "grad_norm": 1.615040898323059, + "learning_rate": 2.5530000489642823e-07, + "loss": 0.0253, + "step": 34134 + }, + { + "epoch": 93.0108991825613, + "grad_norm": 3.2961864471435547, + "learning_rate": 2.5510190713242014e-07, + "loss": 0.0502, + "step": 34135 + }, + { + "epoch": 93.01362397820164, + "grad_norm": 2.0259194374084473, + "learning_rate": 2.5490388526136387e-07, + "loss": 0.069, + "step": 34136 + }, + { + "epoch": 93.01634877384195, + "grad_norm": 3.0652382373809814, + "learning_rate": 2.547059392848028e-07, + "loss": 0.1025, + "step": 34137 + }, + { + "epoch": 93.01907356948229, + "grad_norm": 1.6499525308609009, + "learning_rate": 2.5450806920427783e-07, + "loss": 0.0217, + "step": 34138 + }, + { + "epoch": 93.02179836512262, + "grad_norm": 2.7060530185699463, + "learning_rate": 2.543102750213311e-07, + "loss": 0.1126, + "step": 34139 + }, + { + "epoch": 93.02452316076294, + "grad_norm": 1.6776399612426758, + "learning_rate": 2.5411255673750137e-07, + "loss": 0.1076, + "step": 34140 + }, + { + "epoch": 93.02724795640327, + "grad_norm": 2.6825172901153564, + "learning_rate": 2.539149143543307e-07, + "loss": 0.1334, + "step": 34141 + }, + { + "epoch": 93.02997275204359, + "grad_norm": 2.8298847675323486, + "learning_rate": 2.5371734787335676e-07, + "loss": 0.0385, + "step": 34142 + }, + { + "epoch": 93.03269754768392, + "grad_norm": 2.77170991897583, + "learning_rate": 2.535198572961173e-07, + "loss": 0.1052, + "step": 34143 + }, + { + "epoch": 93.03542234332426, + "grad_norm": 4.709928512573242, + "learning_rate": 2.5332244262415207e-07, + "loss": 0.1541, + "step": 34144 + }, + { + "epoch": 93.03814713896458, + "grad_norm": 2.9608826637268066, + "learning_rate": 2.5312510385899767e-07, + "loss": 0.0999, + "step": 34145 + }, + { + "epoch": 93.04087193460491, + "grad_norm": 3.854839324951172, + "learning_rate": 2.5292784100219184e-07, + "loss": 0.0419, + "step": 34146 + }, + { + "epoch": 93.04359673024523, + "grad_norm": 2.5647788047790527, + "learning_rate": 2.5273065405526986e-07, + "loss": 0.0319, + "step": 34147 + }, + { + "epoch": 93.04632152588556, + "grad_norm": 2.588716506958008, + "learning_rate": 2.525335430197673e-07, + "loss": 0.0529, + "step": 34148 + }, + { + "epoch": 93.04904632152588, + "grad_norm": 2.4272661209106445, + "learning_rate": 2.5233650789722063e-07, + "loss": 0.0329, + "step": 34149 + }, + { + "epoch": 93.05177111716621, + "grad_norm": 2.615199565887451, + "learning_rate": 2.5213954868916425e-07, + "loss": 0.0225, + "step": 34150 + }, + { + "epoch": 93.05449591280654, + "grad_norm": 1.897565245628357, + "learning_rate": 2.519426653971302e-07, + "loss": 0.074, + "step": 34151 + }, + { + "epoch": 93.05722070844686, + "grad_norm": 2.6388299465179443, + "learning_rate": 2.517458580226528e-07, + "loss": 0.0837, + "step": 34152 + }, + { + "epoch": 93.0599455040872, + "grad_norm": 1.9054664373397827, + "learning_rate": 2.515491265672654e-07, + "loss": 0.0197, + "step": 34153 + }, + { + "epoch": 93.06267029972751, + "grad_norm": 2.1602330207824707, + "learning_rate": 2.513524710324999e-07, + "loss": 0.0283, + "step": 34154 + }, + { + "epoch": 93.06539509536785, + "grad_norm": 2.7745659351348877, + "learning_rate": 2.511558914198875e-07, + "loss": 0.1196, + "step": 34155 + }, + { + "epoch": 93.06811989100818, + "grad_norm": 2.5935699939727783, + "learning_rate": 2.5095938773095906e-07, + "loss": 0.0422, + "step": 34156 + }, + { + "epoch": 93.0708446866485, + "grad_norm": 2.0105862617492676, + "learning_rate": 2.5076295996724454e-07, + "loss": 0.0292, + "step": 34157 + }, + { + "epoch": 93.07356948228883, + "grad_norm": 2.6986520290374756, + "learning_rate": 2.5056660813027603e-07, + "loss": 0.0456, + "step": 34158 + }, + { + "epoch": 93.07629427792915, + "grad_norm": 3.2956032752990723, + "learning_rate": 2.5037033222158003e-07, + "loss": 0.1097, + "step": 34159 + }, + { + "epoch": 93.07901907356948, + "grad_norm": 2.2541451454162598, + "learning_rate": 2.501741322426854e-07, + "loss": 0.0521, + "step": 34160 + }, + { + "epoch": 93.0817438692098, + "grad_norm": 3.0680980682373047, + "learning_rate": 2.4997800819512086e-07, + "loss": 0.1117, + "step": 34161 + }, + { + "epoch": 93.08446866485014, + "grad_norm": 1.7472697496414185, + "learning_rate": 2.497819600804152e-07, + "loss": 0.0215, + "step": 34162 + }, + { + "epoch": 93.08719346049047, + "grad_norm": 2.953049421310425, + "learning_rate": 2.495859879000917e-07, + "loss": 0.0596, + "step": 34163 + }, + { + "epoch": 93.08991825613079, + "grad_norm": 2.394619941711426, + "learning_rate": 2.4939009165567904e-07, + "loss": 0.158, + "step": 34164 + }, + { + "epoch": 93.09264305177112, + "grad_norm": 2.5953469276428223, + "learning_rate": 2.491942713487039e-07, + "loss": 0.0652, + "step": 34165 + }, + { + "epoch": 93.09536784741144, + "grad_norm": 2.1170380115509033, + "learning_rate": 2.4899852698068937e-07, + "loss": 0.0165, + "step": 34166 + }, + { + "epoch": 93.09809264305177, + "grad_norm": 2.6129448413848877, + "learning_rate": 2.48802858553161e-07, + "loss": 0.0543, + "step": 34167 + }, + { + "epoch": 93.1008174386921, + "grad_norm": 2.3921217918395996, + "learning_rate": 2.4860726606764086e-07, + "loss": 0.1412, + "step": 34168 + }, + { + "epoch": 93.10354223433242, + "grad_norm": 2.644024133682251, + "learning_rate": 2.484117495256544e-07, + "loss": 0.1369, + "step": 34169 + }, + { + "epoch": 93.10626702997276, + "grad_norm": 2.567168951034546, + "learning_rate": 2.4821630892872375e-07, + "loss": 0.0346, + "step": 34170 + }, + { + "epoch": 93.10899182561307, + "grad_norm": 2.645113945007324, + "learning_rate": 2.48020944278371e-07, + "loss": 0.0458, + "step": 34171 + }, + { + "epoch": 93.11171662125341, + "grad_norm": 4.088079452514648, + "learning_rate": 2.4782565557611494e-07, + "loss": 0.0426, + "step": 34172 + }, + { + "epoch": 93.11444141689373, + "grad_norm": 3.1976189613342285, + "learning_rate": 2.4763044282348105e-07, + "loss": 0.1211, + "step": 34173 + }, + { + "epoch": 93.11716621253406, + "grad_norm": 1.549565076828003, + "learning_rate": 2.47435306021987e-07, + "loss": 0.056, + "step": 34174 + }, + { + "epoch": 93.11989100817439, + "grad_norm": 2.4160778522491455, + "learning_rate": 2.472402451731526e-07, + "loss": 0.0659, + "step": 34175 + }, + { + "epoch": 93.12261580381471, + "grad_norm": 3.090144395828247, + "learning_rate": 2.4704526027849675e-07, + "loss": 0.0466, + "step": 34176 + }, + { + "epoch": 93.12534059945504, + "grad_norm": 1.9743715524673462, + "learning_rate": 2.4685035133953926e-07, + "loss": 0.1164, + "step": 34177 + }, + { + "epoch": 93.12806539509536, + "grad_norm": 2.8321149349212646, + "learning_rate": 2.466555183577968e-07, + "loss": 0.0461, + "step": 34178 + }, + { + "epoch": 93.1307901907357, + "grad_norm": 3.1648738384246826, + "learning_rate": 2.4646076133478803e-07, + "loss": 0.0556, + "step": 34179 + }, + { + "epoch": 93.13351498637603, + "grad_norm": 1.6319115161895752, + "learning_rate": 2.4626608027202735e-07, + "loss": 0.0174, + "step": 34180 + }, + { + "epoch": 93.13623978201635, + "grad_norm": 2.7480781078338623, + "learning_rate": 2.4607147517103356e-07, + "loss": 0.0356, + "step": 34181 + }, + { + "epoch": 93.13896457765668, + "grad_norm": 3.361598014831543, + "learning_rate": 2.45876946033321e-07, + "loss": 0.1172, + "step": 34182 + }, + { + "epoch": 93.141689373297, + "grad_norm": 2.1728339195251465, + "learning_rate": 2.456824928604051e-07, + "loss": 0.1057, + "step": 34183 + }, + { + "epoch": 93.14441416893733, + "grad_norm": 2.9169201850891113, + "learning_rate": 2.454881156538003e-07, + "loss": 0.073, + "step": 34184 + }, + { + "epoch": 93.14713896457765, + "grad_norm": 1.6619789600372314, + "learning_rate": 2.4529381441501963e-07, + "loss": 0.0222, + "step": 34185 + }, + { + "epoch": 93.14986376021798, + "grad_norm": 3.128669500350952, + "learning_rate": 2.450995891455765e-07, + "loss": 0.0412, + "step": 34186 + }, + { + "epoch": 93.15258855585832, + "grad_norm": 3.3330488204956055, + "learning_rate": 2.449054398469852e-07, + "loss": 0.0367, + "step": 34187 + }, + { + "epoch": 93.15531335149863, + "grad_norm": 2.5604634284973145, + "learning_rate": 2.4471136652075454e-07, + "loss": 0.0289, + "step": 34188 + }, + { + "epoch": 93.15803814713897, + "grad_norm": 3.2581260204315186, + "learning_rate": 2.4451736916839884e-07, + "loss": 0.028, + "step": 34189 + }, + { + "epoch": 93.16076294277929, + "grad_norm": 2.336686134338379, + "learning_rate": 2.44323447791428e-07, + "loss": 0.052, + "step": 34190 + }, + { + "epoch": 93.16348773841962, + "grad_norm": 11.666519165039062, + "learning_rate": 2.44129602391352e-07, + "loss": 0.0311, + "step": 34191 + }, + { + "epoch": 93.16621253405995, + "grad_norm": 4.859091758728027, + "learning_rate": 2.439358329696795e-07, + "loss": 0.0224, + "step": 34192 + }, + { + "epoch": 93.16893732970027, + "grad_norm": 3.556523561477661, + "learning_rate": 2.437421395279216e-07, + "loss": 0.0548, + "step": 34193 + }, + { + "epoch": 93.1716621253406, + "grad_norm": 2.490582227706909, + "learning_rate": 2.4354852206758705e-07, + "loss": 0.1204, + "step": 34194 + }, + { + "epoch": 93.17438692098092, + "grad_norm": 3.8178818225860596, + "learning_rate": 2.4335498059018135e-07, + "loss": 0.0335, + "step": 34195 + }, + { + "epoch": 93.17711171662125, + "grad_norm": 2.508756637573242, + "learning_rate": 2.431615150972133e-07, + "loss": 0.0202, + "step": 34196 + }, + { + "epoch": 93.17983651226157, + "grad_norm": 2.6220171451568604, + "learning_rate": 2.4296812559018835e-07, + "loss": 0.0391, + "step": 34197 + }, + { + "epoch": 93.1825613079019, + "grad_norm": 6.727607727050781, + "learning_rate": 2.4277481207061527e-07, + "loss": 0.0764, + "step": 34198 + }, + { + "epoch": 93.18528610354224, + "grad_norm": 2.875270366668701, + "learning_rate": 2.425815745399973e-07, + "loss": 0.0705, + "step": 34199 + }, + { + "epoch": 93.18801089918256, + "grad_norm": 3.164824962615967, + "learning_rate": 2.4238841299983997e-07, + "loss": 0.1021, + "step": 34200 + }, + { + "epoch": 93.19073569482289, + "grad_norm": 2.8297324180603027, + "learning_rate": 2.421953274516464e-07, + "loss": 0.0582, + "step": 34201 + }, + { + "epoch": 93.19346049046321, + "grad_norm": 2.2060811519622803, + "learning_rate": 2.420023178969233e-07, + "loss": 0.0214, + "step": 34202 + }, + { + "epoch": 93.19618528610354, + "grad_norm": 1.5179919004440308, + "learning_rate": 2.418093843371716e-07, + "loss": 0.0166, + "step": 34203 + }, + { + "epoch": 93.19891008174388, + "grad_norm": 2.476790189743042, + "learning_rate": 2.416165267738946e-07, + "loss": 0.0463, + "step": 34204 + }, + { + "epoch": 93.2016348773842, + "grad_norm": 3.1280102729797363, + "learning_rate": 2.414237452085932e-07, + "loss": 0.2226, + "step": 34205 + }, + { + "epoch": 93.20435967302453, + "grad_norm": 2.301055431365967, + "learning_rate": 2.4123103964277085e-07, + "loss": 0.0308, + "step": 34206 + }, + { + "epoch": 93.20708446866485, + "grad_norm": 2.773564338684082, + "learning_rate": 2.410384100779262e-07, + "loss": 0.0365, + "step": 34207 + }, + { + "epoch": 93.20980926430518, + "grad_norm": 2.866030693054199, + "learning_rate": 2.4084585651556025e-07, + "loss": 0.1479, + "step": 34208 + }, + { + "epoch": 93.2125340599455, + "grad_norm": 1.6615641117095947, + "learning_rate": 2.40653378957173e-07, + "loss": 0.0245, + "step": 34209 + }, + { + "epoch": 93.21525885558583, + "grad_norm": 2.9816291332244873, + "learning_rate": 2.404609774042632e-07, + "loss": 0.0344, + "step": 34210 + }, + { + "epoch": 93.21798365122616, + "grad_norm": 2.267970561981201, + "learning_rate": 2.402686518583297e-07, + "loss": 0.0972, + "step": 34211 + }, + { + "epoch": 93.22070844686648, + "grad_norm": 2.694411516189575, + "learning_rate": 2.4007640232086793e-07, + "loss": 0.0242, + "step": 34212 + }, + { + "epoch": 93.22343324250681, + "grad_norm": 1.6629489660263062, + "learning_rate": 2.398842287933789e-07, + "loss": 0.0738, + "step": 34213 + }, + { + "epoch": 93.22615803814713, + "grad_norm": 2.829502582550049, + "learning_rate": 2.396921312773559e-07, + "loss": 0.0413, + "step": 34214 + }, + { + "epoch": 93.22888283378747, + "grad_norm": 1.7646427154541016, + "learning_rate": 2.395001097742977e-07, + "loss": 0.0263, + "step": 34215 + }, + { + "epoch": 93.2316076294278, + "grad_norm": 3.0148816108703613, + "learning_rate": 2.393081642856976e-07, + "loss": 0.0272, + "step": 34216 + }, + { + "epoch": 93.23433242506812, + "grad_norm": 2.923034191131592, + "learning_rate": 2.39116294813051e-07, + "loss": 0.0519, + "step": 34217 + }, + { + "epoch": 93.23705722070845, + "grad_norm": 3.248408794403076, + "learning_rate": 2.3892450135785447e-07, + "loss": 0.1798, + "step": 34218 + }, + { + "epoch": 93.23978201634877, + "grad_norm": 3.2799253463745117, + "learning_rate": 2.3873278392159806e-07, + "loss": 0.0405, + "step": 34219 + }, + { + "epoch": 93.2425068119891, + "grad_norm": 3.820754289627075, + "learning_rate": 2.385411425057782e-07, + "loss": 0.0569, + "step": 34220 + }, + { + "epoch": 93.24523160762942, + "grad_norm": 2.1387405395507812, + "learning_rate": 2.3834957711188378e-07, + "loss": 0.0413, + "step": 34221 + }, + { + "epoch": 93.24795640326975, + "grad_norm": 2.9989240169525146, + "learning_rate": 2.3815808774141025e-07, + "loss": 0.0516, + "step": 34222 + }, + { + "epoch": 93.25068119891009, + "grad_norm": 2.485605001449585, + "learning_rate": 2.379666743958464e-07, + "loss": 0.0338, + "step": 34223 + }, + { + "epoch": 93.2534059945504, + "grad_norm": 3.5497841835021973, + "learning_rate": 2.3777533707668444e-07, + "loss": 0.1429, + "step": 34224 + }, + { + "epoch": 93.25613079019074, + "grad_norm": 4.257180690765381, + "learning_rate": 2.375840757854131e-07, + "loss": 0.0999, + "step": 34225 + }, + { + "epoch": 93.25885558583106, + "grad_norm": 2.6541223526000977, + "learning_rate": 2.3739289052352344e-07, + "loss": 0.0505, + "step": 34226 + }, + { + "epoch": 93.26158038147139, + "grad_norm": 2.5403902530670166, + "learning_rate": 2.3720178129250425e-07, + "loss": 0.1491, + "step": 34227 + }, + { + "epoch": 93.26430517711172, + "grad_norm": 1.8508092164993286, + "learning_rate": 2.3701074809384327e-07, + "loss": 0.0757, + "step": 34228 + }, + { + "epoch": 93.26702997275204, + "grad_norm": 4.365070819854736, + "learning_rate": 2.3681979092902706e-07, + "loss": 0.0883, + "step": 34229 + }, + { + "epoch": 93.26975476839237, + "grad_norm": 2.5791027545928955, + "learning_rate": 2.3662890979954556e-07, + "loss": 0.0205, + "step": 34230 + }, + { + "epoch": 93.2724795640327, + "grad_norm": 2.260385036468506, + "learning_rate": 2.36438104706882e-07, + "loss": 0.031, + "step": 34231 + }, + { + "epoch": 93.27520435967303, + "grad_norm": 3.0480616092681885, + "learning_rate": 2.362473756525263e-07, + "loss": 0.0362, + "step": 34232 + }, + { + "epoch": 93.27792915531334, + "grad_norm": 2.6555707454681396, + "learning_rate": 2.3605672263796066e-07, + "loss": 0.0336, + "step": 34233 + }, + { + "epoch": 93.28065395095368, + "grad_norm": 5.330408573150635, + "learning_rate": 2.358661456646716e-07, + "loss": 0.0981, + "step": 34234 + }, + { + "epoch": 93.28337874659401, + "grad_norm": 1.8813849687576294, + "learning_rate": 2.3567564473414239e-07, + "loss": 0.0253, + "step": 34235 + }, + { + "epoch": 93.28610354223433, + "grad_norm": 3.5582058429718018, + "learning_rate": 2.3548521984785745e-07, + "loss": 0.0325, + "step": 34236 + }, + { + "epoch": 93.28882833787466, + "grad_norm": 2.186025857925415, + "learning_rate": 2.3529487100729774e-07, + "loss": 0.1027, + "step": 34237 + }, + { + "epoch": 93.29155313351498, + "grad_norm": 1.7551841735839844, + "learning_rate": 2.3510459821394883e-07, + "loss": 0.0227, + "step": 34238 + }, + { + "epoch": 93.29427792915531, + "grad_norm": 5.63027286529541, + "learning_rate": 2.3491440146929168e-07, + "loss": 0.1174, + "step": 34239 + }, + { + "epoch": 93.29700272479565, + "grad_norm": 3.5584611892700195, + "learning_rate": 2.3472428077480625e-07, + "loss": 0.0759, + "step": 34240 + }, + { + "epoch": 93.29972752043597, + "grad_norm": 1.5529555082321167, + "learning_rate": 2.3453423613197245e-07, + "loss": 0.0208, + "step": 34241 + }, + { + "epoch": 93.3024523160763, + "grad_norm": 2.823137044906616, + "learning_rate": 2.3434426754227358e-07, + "loss": 0.0649, + "step": 34242 + }, + { + "epoch": 93.30517711171662, + "grad_norm": 2.305696964263916, + "learning_rate": 2.3415437500718618e-07, + "loss": 0.0302, + "step": 34243 + }, + { + "epoch": 93.30790190735695, + "grad_norm": 2.765134811401367, + "learning_rate": 2.3396455852819133e-07, + "loss": 0.0973, + "step": 34244 + }, + { + "epoch": 93.31062670299727, + "grad_norm": 2.4256081581115723, + "learning_rate": 2.337748181067645e-07, + "loss": 0.0542, + "step": 34245 + }, + { + "epoch": 93.3133514986376, + "grad_norm": 3.1596426963806152, + "learning_rate": 2.335851537443856e-07, + "loss": 0.1633, + "step": 34246 + }, + { + "epoch": 93.31607629427793, + "grad_norm": 2.5621795654296875, + "learning_rate": 2.3339556544253238e-07, + "loss": 0.0685, + "step": 34247 + }, + { + "epoch": 93.31880108991825, + "grad_norm": 2.953115701675415, + "learning_rate": 2.332060532026792e-07, + "loss": 0.0967, + "step": 34248 + }, + { + "epoch": 93.32152588555859, + "grad_norm": 1.5390170812606812, + "learning_rate": 2.3301661702630153e-07, + "loss": 0.023, + "step": 34249 + }, + { + "epoch": 93.3242506811989, + "grad_norm": 3.682244300842285, + "learning_rate": 2.3282725691487817e-07, + "loss": 0.0305, + "step": 34250 + }, + { + "epoch": 93.32697547683924, + "grad_norm": 2.5427091121673584, + "learning_rate": 2.3263797286988132e-07, + "loss": 0.042, + "step": 34251 + }, + { + "epoch": 93.32970027247957, + "grad_norm": 1.9223684072494507, + "learning_rate": 2.3244876489278534e-07, + "loss": 0.0358, + "step": 34252 + }, + { + "epoch": 93.33242506811989, + "grad_norm": 1.8607436418533325, + "learning_rate": 2.3225963298506348e-07, + "loss": 0.0421, + "step": 34253 + }, + { + "epoch": 93.33514986376022, + "grad_norm": 3.368166446685791, + "learning_rate": 2.3207057714819015e-07, + "loss": 0.031, + "step": 34254 + }, + { + "epoch": 93.33787465940054, + "grad_norm": 2.6873717308044434, + "learning_rate": 2.3188159738363637e-07, + "loss": 0.0496, + "step": 34255 + }, + { + "epoch": 93.34059945504087, + "grad_norm": 1.9688893556594849, + "learning_rate": 2.316926936928754e-07, + "loss": 0.0509, + "step": 34256 + }, + { + "epoch": 93.34332425068119, + "grad_norm": 2.0882997512817383, + "learning_rate": 2.3150386607737497e-07, + "loss": 0.0204, + "step": 34257 + }, + { + "epoch": 93.34604904632153, + "grad_norm": 1.618839144706726, + "learning_rate": 2.3131511453861056e-07, + "loss": 0.0216, + "step": 34258 + }, + { + "epoch": 93.34877384196186, + "grad_norm": 2.171215534210205, + "learning_rate": 2.3112643907804877e-07, + "loss": 0.0214, + "step": 34259 + }, + { + "epoch": 93.35149863760218, + "grad_norm": 2.2503678798675537, + "learning_rate": 2.3093783969715954e-07, + "loss": 0.0209, + "step": 34260 + }, + { + "epoch": 93.35422343324251, + "grad_norm": 3.4730801582336426, + "learning_rate": 2.3074931639741172e-07, + "loss": 0.0775, + "step": 34261 + }, + { + "epoch": 93.35694822888283, + "grad_norm": 1.5985684394836426, + "learning_rate": 2.305608691802741e-07, + "loss": 0.018, + "step": 34262 + }, + { + "epoch": 93.35967302452316, + "grad_norm": 2.013010025024414, + "learning_rate": 2.303724980472144e-07, + "loss": 0.0174, + "step": 34263 + }, + { + "epoch": 93.3623978201635, + "grad_norm": 2.307169198989868, + "learning_rate": 2.3018420299969924e-07, + "loss": 0.0526, + "step": 34264 + }, + { + "epoch": 93.36512261580381, + "grad_norm": 3.5073304176330566, + "learning_rate": 2.299959840391941e-07, + "loss": 0.0499, + "step": 34265 + }, + { + "epoch": 93.36784741144415, + "grad_norm": 2.8495914936065674, + "learning_rate": 2.298078411671656e-07, + "loss": 0.0715, + "step": 34266 + }, + { + "epoch": 93.37057220708446, + "grad_norm": 3.1446921825408936, + "learning_rate": 2.2961977438508033e-07, + "loss": 0.0734, + "step": 34267 + }, + { + "epoch": 93.3732970027248, + "grad_norm": 2.7543461322784424, + "learning_rate": 2.2943178369440155e-07, + "loss": 0.1745, + "step": 34268 + }, + { + "epoch": 93.37602179836512, + "grad_norm": 2.799346923828125, + "learning_rate": 2.292438690965937e-07, + "loss": 0.0898, + "step": 34269 + }, + { + "epoch": 93.37874659400545, + "grad_norm": 3.420541524887085, + "learning_rate": 2.2905603059311998e-07, + "loss": 0.0635, + "step": 34270 + }, + { + "epoch": 93.38147138964578, + "grad_norm": 2.3576390743255615, + "learning_rate": 2.2886826818544262e-07, + "loss": 0.0312, + "step": 34271 + }, + { + "epoch": 93.3841961852861, + "grad_norm": 1.5556529760360718, + "learning_rate": 2.2868058187502595e-07, + "loss": 0.0141, + "step": 34272 + }, + { + "epoch": 93.38692098092643, + "grad_norm": 1.5678285360336304, + "learning_rate": 2.2849297166332996e-07, + "loss": 0.0245, + "step": 34273 + }, + { + "epoch": 93.38964577656675, + "grad_norm": 2.376685857772827, + "learning_rate": 2.2830543755181566e-07, + "loss": 0.1673, + "step": 34274 + }, + { + "epoch": 93.39237057220708, + "grad_norm": 2.1394050121307373, + "learning_rate": 2.2811797954194527e-07, + "loss": 0.0282, + "step": 34275 + }, + { + "epoch": 93.39509536784742, + "grad_norm": 2.103039264678955, + "learning_rate": 2.2793059763517756e-07, + "loss": 0.0496, + "step": 34276 + }, + { + "epoch": 93.39782016348774, + "grad_norm": 1.8962243795394897, + "learning_rate": 2.277432918329703e-07, + "loss": 0.0658, + "step": 34277 + }, + { + "epoch": 93.40054495912807, + "grad_norm": 2.451472759246826, + "learning_rate": 2.2755606213678448e-07, + "loss": 0.0565, + "step": 34278 + }, + { + "epoch": 93.40326975476839, + "grad_norm": 2.0736703872680664, + "learning_rate": 2.2736890854807792e-07, + "loss": 0.0239, + "step": 34279 + }, + { + "epoch": 93.40599455040872, + "grad_norm": 3.8964591026306152, + "learning_rate": 2.2718183106830826e-07, + "loss": 0.0884, + "step": 34280 + }, + { + "epoch": 93.40871934604904, + "grad_norm": 3.147368907928467, + "learning_rate": 2.2699482969892994e-07, + "loss": 0.0358, + "step": 34281 + }, + { + "epoch": 93.41144414168937, + "grad_norm": 3.8105955123901367, + "learning_rate": 2.2680790444140287e-07, + "loss": 0.0969, + "step": 34282 + }, + { + "epoch": 93.4141689373297, + "grad_norm": 3.1020357608795166, + "learning_rate": 2.2662105529718036e-07, + "loss": 0.0388, + "step": 34283 + }, + { + "epoch": 93.41689373297002, + "grad_norm": 2.4139652252197266, + "learning_rate": 2.2643428226772013e-07, + "loss": 0.0501, + "step": 34284 + }, + { + "epoch": 93.41961852861036, + "grad_norm": 2.5008866786956787, + "learning_rate": 2.2624758535447432e-07, + "loss": 0.0276, + "step": 34285 + }, + { + "epoch": 93.42234332425068, + "grad_norm": 3.279120683670044, + "learning_rate": 2.2606096455889736e-07, + "loss": 0.1095, + "step": 34286 + }, + { + "epoch": 93.42506811989101, + "grad_norm": 3.0299057960510254, + "learning_rate": 2.2587441988244362e-07, + "loss": 0.0421, + "step": 34287 + }, + { + "epoch": 93.42779291553134, + "grad_norm": 2.426337718963623, + "learning_rate": 2.256879513265653e-07, + "loss": 0.028, + "step": 34288 + }, + { + "epoch": 93.43051771117166, + "grad_norm": 3.697620391845703, + "learning_rate": 2.2550155889271453e-07, + "loss": 0.0427, + "step": 34289 + }, + { + "epoch": 93.433242506812, + "grad_norm": 2.769820213317871, + "learning_rate": 2.2531524258234238e-07, + "loss": 0.0496, + "step": 34290 + }, + { + "epoch": 93.43596730245231, + "grad_norm": 1.7424660921096802, + "learning_rate": 2.2512900239690104e-07, + "loss": 0.1147, + "step": 34291 + }, + { + "epoch": 93.43869209809264, + "grad_norm": 1.9787771701812744, + "learning_rate": 2.2494283833784047e-07, + "loss": 0.0147, + "step": 34292 + }, + { + "epoch": 93.44141689373296, + "grad_norm": 2.9561150074005127, + "learning_rate": 2.247567504066106e-07, + "loss": 0.1082, + "step": 34293 + }, + { + "epoch": 93.4441416893733, + "grad_norm": 3.1463584899902344, + "learning_rate": 2.2457073860466028e-07, + "loss": 0.0487, + "step": 34294 + }, + { + "epoch": 93.44686648501363, + "grad_norm": 1.4194004535675049, + "learning_rate": 2.2438480293343833e-07, + "loss": 0.0172, + "step": 34295 + }, + { + "epoch": 93.44959128065395, + "grad_norm": 3.0458099842071533, + "learning_rate": 2.2419894339439364e-07, + "loss": 0.0996, + "step": 34296 + }, + { + "epoch": 93.45231607629428, + "grad_norm": 2.9101486206054688, + "learning_rate": 2.2401315998897166e-07, + "loss": 0.0496, + "step": 34297 + }, + { + "epoch": 93.4550408719346, + "grad_norm": 1.791276216506958, + "learning_rate": 2.2382745271862128e-07, + "loss": 0.0283, + "step": 34298 + }, + { + "epoch": 93.45776566757493, + "grad_norm": 2.2020905017852783, + "learning_rate": 2.2364182158478797e-07, + "loss": 0.0927, + "step": 34299 + }, + { + "epoch": 93.46049046321527, + "grad_norm": 3.559235095977783, + "learning_rate": 2.2345626658891728e-07, + "loss": 0.0484, + "step": 34300 + }, + { + "epoch": 93.46321525885558, + "grad_norm": 2.6800601482391357, + "learning_rate": 2.232707877324547e-07, + "loss": 0.1808, + "step": 34301 + }, + { + "epoch": 93.46594005449592, + "grad_norm": 2.735093832015991, + "learning_rate": 2.2308538501684464e-07, + "loss": 0.0293, + "step": 34302 + }, + { + "epoch": 93.46866485013624, + "grad_norm": 1.8304994106292725, + "learning_rate": 2.2290005844353145e-07, + "loss": 0.0239, + "step": 34303 + }, + { + "epoch": 93.47138964577657, + "grad_norm": 1.9497863054275513, + "learning_rate": 2.227148080139574e-07, + "loss": 0.0234, + "step": 34304 + }, + { + "epoch": 93.47411444141689, + "grad_norm": 2.7205569744110107, + "learning_rate": 2.2252963372956572e-07, + "loss": 0.0502, + "step": 34305 + }, + { + "epoch": 93.47683923705722, + "grad_norm": 3.152188301086426, + "learning_rate": 2.2234453559179858e-07, + "loss": 0.056, + "step": 34306 + }, + { + "epoch": 93.47956403269755, + "grad_norm": 3.2019495964050293, + "learning_rate": 2.221595136020971e-07, + "loss": 0.0511, + "step": 34307 + }, + { + "epoch": 93.48228882833787, + "grad_norm": 2.1643855571746826, + "learning_rate": 2.219745677619034e-07, + "loss": 0.0601, + "step": 34308 + }, + { + "epoch": 93.4850136239782, + "grad_norm": 3.378383159637451, + "learning_rate": 2.217896980726575e-07, + "loss": 0.0843, + "step": 34309 + }, + { + "epoch": 93.48773841961852, + "grad_norm": 1.9036085605621338, + "learning_rate": 2.2160490453579707e-07, + "loss": 0.0252, + "step": 34310 + }, + { + "epoch": 93.49046321525886, + "grad_norm": 2.122843027114868, + "learning_rate": 2.2142018715276437e-07, + "loss": 0.0597, + "step": 34311 + }, + { + "epoch": 93.49318801089919, + "grad_norm": 2.473475694656372, + "learning_rate": 2.2123554592499598e-07, + "loss": 0.0629, + "step": 34312 + }, + { + "epoch": 93.49591280653951, + "grad_norm": 2.287557363510132, + "learning_rate": 2.2105098085393073e-07, + "loss": 0.0385, + "step": 34313 + }, + { + "epoch": 93.49863760217984, + "grad_norm": 3.523827075958252, + "learning_rate": 2.208664919410053e-07, + "loss": 0.0415, + "step": 34314 + }, + { + "epoch": 93.50136239782016, + "grad_norm": 1.7135145664215088, + "learning_rate": 2.2068207918765738e-07, + "loss": 0.0199, + "step": 34315 + }, + { + "epoch": 93.50408719346049, + "grad_norm": 2.7096970081329346, + "learning_rate": 2.2049774259532253e-07, + "loss": 0.1068, + "step": 34316 + }, + { + "epoch": 93.50681198910081, + "grad_norm": 2.7034780979156494, + "learning_rate": 2.2031348216543514e-07, + "loss": 0.0798, + "step": 34317 + }, + { + "epoch": 93.50953678474114, + "grad_norm": 2.822631359100342, + "learning_rate": 2.2012929789943183e-07, + "loss": 0.0187, + "step": 34318 + }, + { + "epoch": 93.51226158038148, + "grad_norm": 1.7559870481491089, + "learning_rate": 2.1994518979874812e-07, + "loss": 0.0385, + "step": 34319 + }, + { + "epoch": 93.5149863760218, + "grad_norm": 3.9192328453063965, + "learning_rate": 2.197611578648162e-07, + "loss": 0.0231, + "step": 34320 + }, + { + "epoch": 93.51771117166213, + "grad_norm": 2.06367826461792, + "learning_rate": 2.195772020990705e-07, + "loss": 0.0432, + "step": 34321 + }, + { + "epoch": 93.52043596730245, + "grad_norm": 2.2036385536193848, + "learning_rate": 2.19393322502941e-07, + "loss": 0.0238, + "step": 34322 + }, + { + "epoch": 93.52316076294278, + "grad_norm": 2.166105270385742, + "learning_rate": 2.1920951907786204e-07, + "loss": 0.1484, + "step": 34323 + }, + { + "epoch": 93.52588555858311, + "grad_norm": 2.125516653060913, + "learning_rate": 2.1902579182526584e-07, + "loss": 0.0339, + "step": 34324 + }, + { + "epoch": 93.52861035422343, + "grad_norm": 2.5359044075012207, + "learning_rate": 2.1884214074658127e-07, + "loss": 0.061, + "step": 34325 + }, + { + "epoch": 93.53133514986376, + "grad_norm": 4.177691459655762, + "learning_rate": 2.186585658432383e-07, + "loss": 0.1618, + "step": 34326 + }, + { + "epoch": 93.53405994550408, + "grad_norm": 4.603385925292969, + "learning_rate": 2.18475067116668e-07, + "loss": 0.0564, + "step": 34327 + }, + { + "epoch": 93.53678474114442, + "grad_norm": 3.4245223999023438, + "learning_rate": 2.1829164456829922e-07, + "loss": 0.0345, + "step": 34328 + }, + { + "epoch": 93.53950953678473, + "grad_norm": 4.157337665557861, + "learning_rate": 2.181082981995608e-07, + "loss": 0.0201, + "step": 34329 + }, + { + "epoch": 93.54223433242507, + "grad_norm": 2.2463536262512207, + "learning_rate": 2.1792502801187944e-07, + "loss": 0.0282, + "step": 34330 + }, + { + "epoch": 93.5449591280654, + "grad_norm": 3.085951805114746, + "learning_rate": 2.177418340066839e-07, + "loss": 0.0392, + "step": 34331 + }, + { + "epoch": 93.54768392370572, + "grad_norm": 2.7970926761627197, + "learning_rate": 2.1755871618539981e-07, + "loss": 0.0347, + "step": 34332 + }, + { + "epoch": 93.55040871934605, + "grad_norm": 3.0887789726257324, + "learning_rate": 2.1737567454945374e-07, + "loss": 0.0295, + "step": 34333 + }, + { + "epoch": 93.55313351498637, + "grad_norm": 2.192136526107788, + "learning_rate": 2.1719270910027013e-07, + "loss": 0.0428, + "step": 34334 + }, + { + "epoch": 93.5558583106267, + "grad_norm": 1.9388835430145264, + "learning_rate": 2.1700981983927448e-07, + "loss": 0.0249, + "step": 34335 + }, + { + "epoch": 93.55858310626704, + "grad_norm": 2.0230979919433594, + "learning_rate": 2.1682700676789236e-07, + "loss": 0.0259, + "step": 34336 + }, + { + "epoch": 93.56130790190736, + "grad_norm": 2.2906877994537354, + "learning_rate": 2.1664426988754705e-07, + "loss": 0.0628, + "step": 34337 + }, + { + "epoch": 93.56403269754769, + "grad_norm": 3.3800113201141357, + "learning_rate": 2.1646160919966076e-07, + "loss": 0.1021, + "step": 34338 + }, + { + "epoch": 93.566757493188, + "grad_norm": 1.5669342279434204, + "learning_rate": 2.1627902470565675e-07, + "loss": 0.1427, + "step": 34339 + }, + { + "epoch": 93.56948228882834, + "grad_norm": 3.2367019653320312, + "learning_rate": 2.1609651640695727e-07, + "loss": 0.0375, + "step": 34340 + }, + { + "epoch": 93.57220708446866, + "grad_norm": 2.5182316303253174, + "learning_rate": 2.159140843049834e-07, + "loss": 0.0315, + "step": 34341 + }, + { + "epoch": 93.57493188010899, + "grad_norm": 3.962669610977173, + "learning_rate": 2.1573172840115397e-07, + "loss": 0.0244, + "step": 34342 + }, + { + "epoch": 93.57765667574932, + "grad_norm": 2.234757423400879, + "learning_rate": 2.155494486968923e-07, + "loss": 0.0802, + "step": 34343 + }, + { + "epoch": 93.58038147138964, + "grad_norm": 4.146871566772461, + "learning_rate": 2.153672451936173e-07, + "loss": 0.188, + "step": 34344 + }, + { + "epoch": 93.58310626702998, + "grad_norm": 3.737558603286743, + "learning_rate": 2.1518511789274666e-07, + "loss": 0.0419, + "step": 34345 + }, + { + "epoch": 93.5858310626703, + "grad_norm": 2.5635979175567627, + "learning_rate": 2.1500306679569816e-07, + "loss": 0.0322, + "step": 34346 + }, + { + "epoch": 93.58855585831063, + "grad_norm": 2.7324888706207275, + "learning_rate": 2.1482109190389178e-07, + "loss": 0.0655, + "step": 34347 + }, + { + "epoch": 93.59128065395096, + "grad_norm": 2.9860117435455322, + "learning_rate": 2.1463919321874415e-07, + "loss": 0.1257, + "step": 34348 + }, + { + "epoch": 93.59400544959128, + "grad_norm": 6.02388334274292, + "learning_rate": 2.1445737074167194e-07, + "loss": 0.1173, + "step": 34349 + }, + { + "epoch": 93.59673024523161, + "grad_norm": 2.5729589462280273, + "learning_rate": 2.1427562447408957e-07, + "loss": 0.095, + "step": 34350 + }, + { + "epoch": 93.59945504087193, + "grad_norm": 6.943117141723633, + "learning_rate": 2.1409395441741477e-07, + "loss": 0.0283, + "step": 34351 + }, + { + "epoch": 93.60217983651226, + "grad_norm": 3.964367151260376, + "learning_rate": 2.1391236057305974e-07, + "loss": 0.072, + "step": 34352 + }, + { + "epoch": 93.60490463215258, + "grad_norm": 2.762946605682373, + "learning_rate": 2.1373084294244118e-07, + "loss": 0.0445, + "step": 34353 + }, + { + "epoch": 93.60762942779292, + "grad_norm": 2.5655124187469482, + "learning_rate": 2.1354940152697234e-07, + "loss": 0.0266, + "step": 34354 + }, + { + "epoch": 93.61035422343325, + "grad_norm": 1.9681520462036133, + "learning_rate": 2.1336803632806436e-07, + "loss": 0.0277, + "step": 34355 + }, + { + "epoch": 93.61307901907357, + "grad_norm": 2.3756961822509766, + "learning_rate": 2.1318674734713273e-07, + "loss": 0.093, + "step": 34356 + }, + { + "epoch": 93.6158038147139, + "grad_norm": 4.2671918869018555, + "learning_rate": 2.130055345855875e-07, + "loss": 0.107, + "step": 34357 + }, + { + "epoch": 93.61852861035422, + "grad_norm": 4.12216854095459, + "learning_rate": 2.1282439804483966e-07, + "loss": 0.0344, + "step": 34358 + }, + { + "epoch": 93.62125340599455, + "grad_norm": 2.038247585296631, + "learning_rate": 2.126433377263004e-07, + "loss": 0.1056, + "step": 34359 + }, + { + "epoch": 93.62397820163488, + "grad_norm": 2.291226863861084, + "learning_rate": 2.1246235363137968e-07, + "loss": 0.0285, + "step": 34360 + }, + { + "epoch": 93.6267029972752, + "grad_norm": 4.159404277801514, + "learning_rate": 2.1228144576148857e-07, + "loss": 0.055, + "step": 34361 + }, + { + "epoch": 93.62942779291554, + "grad_norm": 2.844003438949585, + "learning_rate": 2.1210061411803262e-07, + "loss": 0.0615, + "step": 34362 + }, + { + "epoch": 93.63215258855585, + "grad_norm": 2.2398364543914795, + "learning_rate": 2.1191985870242293e-07, + "loss": 0.0427, + "step": 34363 + }, + { + "epoch": 93.63487738419619, + "grad_norm": 3.2485857009887695, + "learning_rate": 2.1173917951606615e-07, + "loss": 0.019, + "step": 34364 + }, + { + "epoch": 93.6376021798365, + "grad_norm": 2.3822646141052246, + "learning_rate": 2.1155857656037004e-07, + "loss": 0.029, + "step": 34365 + }, + { + "epoch": 93.64032697547684, + "grad_norm": 1.5049999952316284, + "learning_rate": 2.1137804983674014e-07, + "loss": 0.0185, + "step": 34366 + }, + { + "epoch": 93.64305177111717, + "grad_norm": 2.549562692642212, + "learning_rate": 2.1119759934658313e-07, + "loss": 0.0777, + "step": 34367 + }, + { + "epoch": 93.64577656675749, + "grad_norm": 1.8893696069717407, + "learning_rate": 2.110172250913045e-07, + "loss": 0.0235, + "step": 34368 + }, + { + "epoch": 93.64850136239782, + "grad_norm": 6.346429824829102, + "learning_rate": 2.1083692707230763e-07, + "loss": 0.0666, + "step": 34369 + }, + { + "epoch": 93.65122615803814, + "grad_norm": 2.1284542083740234, + "learning_rate": 2.1065670529099914e-07, + "loss": 0.0283, + "step": 34370 + }, + { + "epoch": 93.65395095367847, + "grad_norm": 3.1872403621673584, + "learning_rate": 2.1047655974878012e-07, + "loss": 0.0365, + "step": 34371 + }, + { + "epoch": 93.65667574931881, + "grad_norm": 4.941776752471924, + "learning_rate": 2.10296490447055e-07, + "loss": 0.1092, + "step": 34372 + }, + { + "epoch": 93.65940054495913, + "grad_norm": 2.912961959838867, + "learning_rate": 2.1011649738722606e-07, + "loss": 0.0403, + "step": 34373 + }, + { + "epoch": 93.66212534059946, + "grad_norm": 2.130218267440796, + "learning_rate": 2.0993658057069432e-07, + "loss": 0.0346, + "step": 34374 + }, + { + "epoch": 93.66485013623978, + "grad_norm": 2.6625425815582275, + "learning_rate": 2.0975673999886093e-07, + "loss": 0.0248, + "step": 34375 + }, + { + "epoch": 93.66757493188011, + "grad_norm": 1.9598931074142456, + "learning_rate": 2.0957697567312807e-07, + "loss": 0.0479, + "step": 34376 + }, + { + "epoch": 93.67029972752043, + "grad_norm": 5.38246488571167, + "learning_rate": 2.0939728759489463e-07, + "loss": 0.0697, + "step": 34377 + }, + { + "epoch": 93.67302452316076, + "grad_norm": 1.8101924657821655, + "learning_rate": 2.0921767576555952e-07, + "loss": 0.113, + "step": 34378 + }, + { + "epoch": 93.6757493188011, + "grad_norm": 2.1005547046661377, + "learning_rate": 2.0903814018652047e-07, + "loss": 0.0214, + "step": 34379 + }, + { + "epoch": 93.67847411444141, + "grad_norm": 4.3197855949401855, + "learning_rate": 2.088586808591797e-07, + "loss": 0.1892, + "step": 34380 + }, + { + "epoch": 93.68119891008175, + "grad_norm": 2.731203556060791, + "learning_rate": 2.0867929778493167e-07, + "loss": 0.038, + "step": 34381 + }, + { + "epoch": 93.68392370572207, + "grad_norm": 2.2792117595672607, + "learning_rate": 2.0849999096517304e-07, + "loss": 0.0729, + "step": 34382 + }, + { + "epoch": 93.6866485013624, + "grad_norm": 3.9346883296966553, + "learning_rate": 2.0832076040130267e-07, + "loss": 0.0845, + "step": 34383 + }, + { + "epoch": 93.68937329700273, + "grad_norm": 2.5368058681488037, + "learning_rate": 2.08141606094715e-07, + "loss": 0.0493, + "step": 34384 + }, + { + "epoch": 93.69209809264305, + "grad_norm": 2.3298025131225586, + "learning_rate": 2.079625280468045e-07, + "loss": 0.0607, + "step": 34385 + }, + { + "epoch": 93.69482288828338, + "grad_norm": 2.9570140838623047, + "learning_rate": 2.077835262589667e-07, + "loss": 0.0229, + "step": 34386 + }, + { + "epoch": 93.6975476839237, + "grad_norm": 2.169262170791626, + "learning_rate": 2.0760460073259603e-07, + "loss": 0.0641, + "step": 34387 + }, + { + "epoch": 93.70027247956403, + "grad_norm": 2.960768938064575, + "learning_rate": 2.0742575146908583e-07, + "loss": 0.0899, + "step": 34388 + }, + { + "epoch": 93.70299727520435, + "grad_norm": 3.048086404800415, + "learning_rate": 2.0724697846982832e-07, + "loss": 0.2102, + "step": 34389 + }, + { + "epoch": 93.70572207084469, + "grad_norm": 5.074772357940674, + "learning_rate": 2.0706828173621684e-07, + "loss": 0.1722, + "step": 34390 + }, + { + "epoch": 93.70844686648502, + "grad_norm": 3.0789027214050293, + "learning_rate": 2.0688966126964138e-07, + "loss": 0.0328, + "step": 34391 + }, + { + "epoch": 93.71117166212534, + "grad_norm": 2.1476850509643555, + "learning_rate": 2.0671111707149416e-07, + "loss": 0.0343, + "step": 34392 + }, + { + "epoch": 93.71389645776567, + "grad_norm": 2.010178804397583, + "learning_rate": 2.065326491431663e-07, + "loss": 0.1128, + "step": 34393 + }, + { + "epoch": 93.71662125340599, + "grad_norm": 2.3575823307037354, + "learning_rate": 2.0635425748604664e-07, + "loss": 0.0239, + "step": 34394 + }, + { + "epoch": 93.71934604904632, + "grad_norm": 2.0335638523101807, + "learning_rate": 2.0617594210152413e-07, + "loss": 0.0266, + "step": 34395 + }, + { + "epoch": 93.72207084468666, + "grad_norm": 3.2877469062805176, + "learning_rate": 2.0599770299098987e-07, + "loss": 0.146, + "step": 34396 + }, + { + "epoch": 93.72479564032697, + "grad_norm": 2.5627589225769043, + "learning_rate": 2.058195401558294e-07, + "loss": 0.0241, + "step": 34397 + }, + { + "epoch": 93.7275204359673, + "grad_norm": 2.51062273979187, + "learning_rate": 2.0564145359743048e-07, + "loss": 0.0372, + "step": 34398 + }, + { + "epoch": 93.73024523160763, + "grad_norm": 2.7507593631744385, + "learning_rate": 2.0546344331718092e-07, + "loss": 0.0503, + "step": 34399 + }, + { + "epoch": 93.73297002724796, + "grad_norm": 2.953214645385742, + "learning_rate": 2.052855093164674e-07, + "loss": 0.0551, + "step": 34400 + }, + { + "epoch": 93.73569482288828, + "grad_norm": 3.533792734146118, + "learning_rate": 2.0510765159667546e-07, + "loss": 0.1486, + "step": 34401 + }, + { + "epoch": 93.73841961852861, + "grad_norm": 2.928157091140747, + "learning_rate": 2.049298701591884e-07, + "loss": 0.0521, + "step": 34402 + }, + { + "epoch": 93.74114441416894, + "grad_norm": 5.785929203033447, + "learning_rate": 2.0475216500539298e-07, + "loss": 0.033, + "step": 34403 + }, + { + "epoch": 93.74386920980926, + "grad_norm": 2.49468731880188, + "learning_rate": 2.0457453613667134e-07, + "loss": 0.0869, + "step": 34404 + }, + { + "epoch": 93.7465940054496, + "grad_norm": 1.9557398557662964, + "learning_rate": 2.043969835544102e-07, + "loss": 0.0263, + "step": 34405 + }, + { + "epoch": 93.74931880108991, + "grad_norm": 1.865979552268982, + "learning_rate": 2.042195072599884e-07, + "loss": 0.0207, + "step": 34406 + }, + { + "epoch": 93.75204359673025, + "grad_norm": 10.877952575683594, + "learning_rate": 2.0404210725479046e-07, + "loss": 0.0242, + "step": 34407 + }, + { + "epoch": 93.75476839237058, + "grad_norm": 2.2763140201568604, + "learning_rate": 2.0386478354019745e-07, + "loss": 0.0702, + "step": 34408 + }, + { + "epoch": 93.7574931880109, + "grad_norm": 2.745971202850342, + "learning_rate": 2.0368753611759052e-07, + "loss": 0.065, + "step": 34409 + }, + { + "epoch": 93.76021798365123, + "grad_norm": 2.8336164951324463, + "learning_rate": 2.0351036498834965e-07, + "loss": 0.1588, + "step": 34410 + }, + { + "epoch": 93.76294277929155, + "grad_norm": 2.2845332622528076, + "learning_rate": 2.0333327015385373e-07, + "loss": 0.0428, + "step": 34411 + }, + { + "epoch": 93.76566757493188, + "grad_norm": 1.7977302074432373, + "learning_rate": 2.0315625161548392e-07, + "loss": 0.0799, + "step": 34412 + }, + { + "epoch": 93.7683923705722, + "grad_norm": 2.4740443229675293, + "learning_rate": 2.0297930937461685e-07, + "loss": 0.0457, + "step": 34413 + }, + { + "epoch": 93.77111716621253, + "grad_norm": 2.2012076377868652, + "learning_rate": 2.0280244343263366e-07, + "loss": 0.034, + "step": 34414 + }, + { + "epoch": 93.77384196185287, + "grad_norm": 1.926122784614563, + "learning_rate": 2.026256537909077e-07, + "loss": 0.034, + "step": 34415 + }, + { + "epoch": 93.77656675749319, + "grad_norm": 1.7271753549575806, + "learning_rate": 2.0244894045081898e-07, + "loss": 0.0214, + "step": 34416 + }, + { + "epoch": 93.77929155313352, + "grad_norm": 2.1036386489868164, + "learning_rate": 2.0227230341374194e-07, + "loss": 0.0583, + "step": 34417 + }, + { + "epoch": 93.78201634877384, + "grad_norm": 2.506817102432251, + "learning_rate": 2.0209574268105324e-07, + "loss": 0.0401, + "step": 34418 + }, + { + "epoch": 93.78474114441417, + "grad_norm": 2.632697820663452, + "learning_rate": 2.0191925825412739e-07, + "loss": 0.0306, + "step": 34419 + }, + { + "epoch": 93.7874659400545, + "grad_norm": 2.7037792205810547, + "learning_rate": 2.017428501343388e-07, + "loss": 0.0372, + "step": 34420 + }, + { + "epoch": 93.79019073569482, + "grad_norm": 2.159956216812134, + "learning_rate": 2.0156651832306085e-07, + "loss": 0.0497, + "step": 34421 + }, + { + "epoch": 93.79291553133515, + "grad_norm": 2.0200798511505127, + "learning_rate": 2.0139026282166908e-07, + "loss": 0.0236, + "step": 34422 + }, + { + "epoch": 93.79564032697547, + "grad_norm": 1.5987173318862915, + "learning_rate": 2.012140836315335e-07, + "loss": 0.0349, + "step": 34423 + }, + { + "epoch": 93.7983651226158, + "grad_norm": 4.3370680809021, + "learning_rate": 2.0103798075402747e-07, + "loss": 0.1231, + "step": 34424 + }, + { + "epoch": 93.80108991825612, + "grad_norm": 1.7332193851470947, + "learning_rate": 2.0086195419052323e-07, + "loss": 0.0479, + "step": 34425 + }, + { + "epoch": 93.80381471389646, + "grad_norm": 2.297229766845703, + "learning_rate": 2.0068600394238968e-07, + "loss": 0.0286, + "step": 34426 + }, + { + "epoch": 93.80653950953679, + "grad_norm": 1.7435134649276733, + "learning_rate": 2.0051013001099794e-07, + "loss": 0.078, + "step": 34427 + }, + { + "epoch": 93.80926430517711, + "grad_norm": 2.4305944442749023, + "learning_rate": 2.0033433239771803e-07, + "loss": 0.0347, + "step": 34428 + }, + { + "epoch": 93.81198910081744, + "grad_norm": 2.4918837547302246, + "learning_rate": 2.0015861110392e-07, + "loss": 0.0374, + "step": 34429 + }, + { + "epoch": 93.81471389645776, + "grad_norm": 2.407262086868286, + "learning_rate": 1.9998296613097046e-07, + "loss": 0.027, + "step": 34430 + }, + { + "epoch": 93.8174386920981, + "grad_norm": 2.703068256378174, + "learning_rate": 1.9980739748023837e-07, + "loss": 0.0343, + "step": 34431 + }, + { + "epoch": 93.82016348773843, + "grad_norm": 3.4068539142608643, + "learning_rate": 1.9963190515309038e-07, + "loss": 0.0329, + "step": 34432 + }, + { + "epoch": 93.82288828337875, + "grad_norm": 2.6142091751098633, + "learning_rate": 1.9945648915089432e-07, + "loss": 0.0707, + "step": 34433 + }, + { + "epoch": 93.82561307901908, + "grad_norm": 1.7220866680145264, + "learning_rate": 1.9928114947501577e-07, + "loss": 0.0222, + "step": 34434 + }, + { + "epoch": 93.8283378746594, + "grad_norm": 2.0930206775665283, + "learning_rate": 1.9910588612681914e-07, + "loss": 0.0268, + "step": 34435 + }, + { + "epoch": 93.83106267029973, + "grad_norm": 1.6667646169662476, + "learning_rate": 1.9893069910767117e-07, + "loss": 0.0158, + "step": 34436 + }, + { + "epoch": 93.83378746594005, + "grad_norm": 3.9746711254119873, + "learning_rate": 1.9875558841893627e-07, + "loss": 0.046, + "step": 34437 + }, + { + "epoch": 93.83651226158038, + "grad_norm": 2.515366554260254, + "learning_rate": 1.9858055406197562e-07, + "loss": 0.1202, + "step": 34438 + }, + { + "epoch": 93.83923705722071, + "grad_norm": 3.2645912170410156, + "learning_rate": 1.984055960381559e-07, + "loss": 0.0312, + "step": 34439 + }, + { + "epoch": 93.84196185286103, + "grad_norm": 2.400242328643799, + "learning_rate": 1.98230714348836e-07, + "loss": 0.0531, + "step": 34440 + }, + { + "epoch": 93.84468664850137, + "grad_norm": 2.1673269271850586, + "learning_rate": 1.9805590899538152e-07, + "loss": 0.0214, + "step": 34441 + }, + { + "epoch": 93.84741144414168, + "grad_norm": 3.565842628479004, + "learning_rate": 1.9788117997915136e-07, + "loss": 0.122, + "step": 34442 + }, + { + "epoch": 93.85013623978202, + "grad_norm": 1.8552443981170654, + "learning_rate": 1.9770652730150775e-07, + "loss": 0.0175, + "step": 34443 + }, + { + "epoch": 93.85286103542235, + "grad_norm": 3.700861692428589, + "learning_rate": 1.9753195096380962e-07, + "loss": 0.1114, + "step": 34444 + }, + { + "epoch": 93.85558583106267, + "grad_norm": 3.854320764541626, + "learning_rate": 1.973574509674181e-07, + "loss": 0.0952, + "step": 34445 + }, + { + "epoch": 93.858310626703, + "grad_norm": 3.0832605361938477, + "learning_rate": 1.9718302731368988e-07, + "loss": 0.0577, + "step": 34446 + }, + { + "epoch": 93.86103542234332, + "grad_norm": 3.7628276348114014, + "learning_rate": 1.97008680003985e-07, + "loss": 0.0654, + "step": 34447 + }, + { + "epoch": 93.86376021798365, + "grad_norm": 2.3134407997131348, + "learning_rate": 1.9683440903966123e-07, + "loss": 0.0609, + "step": 34448 + }, + { + "epoch": 93.86648501362397, + "grad_norm": 3.2816579341888428, + "learning_rate": 1.9666021442207638e-07, + "loss": 0.0334, + "step": 34449 + }, + { + "epoch": 93.8692098092643, + "grad_norm": 3.8966357707977295, + "learning_rate": 1.9648609615258606e-07, + "loss": 0.1089, + "step": 34450 + }, + { + "epoch": 93.87193460490464, + "grad_norm": 2.2153778076171875, + "learning_rate": 1.9631205423254586e-07, + "loss": 0.0731, + "step": 34451 + }, + { + "epoch": 93.87465940054496, + "grad_norm": 2.281461000442505, + "learning_rate": 1.961380886633113e-07, + "loss": 0.0522, + "step": 34452 + }, + { + "epoch": 93.87738419618529, + "grad_norm": 2.045767307281494, + "learning_rate": 1.959641994462391e-07, + "loss": 0.0919, + "step": 34453 + }, + { + "epoch": 93.88010899182561, + "grad_norm": 3.1510367393493652, + "learning_rate": 1.9579038658268157e-07, + "loss": 0.0767, + "step": 34454 + }, + { + "epoch": 93.88283378746594, + "grad_norm": 2.3584213256835938, + "learning_rate": 1.9561665007399312e-07, + "loss": 0.0968, + "step": 34455 + }, + { + "epoch": 93.88555858310627, + "grad_norm": 2.3251776695251465, + "learning_rate": 1.95442989921526e-07, + "loss": 0.0256, + "step": 34456 + }, + { + "epoch": 93.88828337874659, + "grad_norm": 1.996802806854248, + "learning_rate": 1.9526940612663359e-07, + "loss": 0.054, + "step": 34457 + }, + { + "epoch": 93.89100817438693, + "grad_norm": 2.232168436050415, + "learning_rate": 1.9509589869066814e-07, + "loss": 0.0228, + "step": 34458 + }, + { + "epoch": 93.89373297002724, + "grad_norm": 4.788763046264648, + "learning_rate": 1.9492246761497967e-07, + "loss": 0.0692, + "step": 34459 + }, + { + "epoch": 93.89645776566758, + "grad_norm": 2.8546571731567383, + "learning_rate": 1.9474911290091936e-07, + "loss": 0.0291, + "step": 34460 + }, + { + "epoch": 93.8991825613079, + "grad_norm": 2.0369200706481934, + "learning_rate": 1.9457583454983719e-07, + "loss": 0.0261, + "step": 34461 + }, + { + "epoch": 93.90190735694823, + "grad_norm": 3.6039161682128906, + "learning_rate": 1.9440263256308433e-07, + "loss": 0.0405, + "step": 34462 + }, + { + "epoch": 93.90463215258856, + "grad_norm": 2.0535991191864014, + "learning_rate": 1.942295069420075e-07, + "loss": 0.0367, + "step": 34463 + }, + { + "epoch": 93.90735694822888, + "grad_norm": 1.9097617864608765, + "learning_rate": 1.9405645768795446e-07, + "loss": 0.0474, + "step": 34464 + }, + { + "epoch": 93.91008174386921, + "grad_norm": 1.9148390293121338, + "learning_rate": 1.9388348480227525e-07, + "loss": 0.0228, + "step": 34465 + }, + { + "epoch": 93.91280653950953, + "grad_norm": 3.3699679374694824, + "learning_rate": 1.937105882863155e-07, + "loss": 0.2528, + "step": 34466 + }, + { + "epoch": 93.91553133514986, + "grad_norm": 2.8437659740448, + "learning_rate": 1.935377681414219e-07, + "loss": 0.0644, + "step": 34467 + }, + { + "epoch": 93.9182561307902, + "grad_norm": 1.9749023914337158, + "learning_rate": 1.933650243689411e-07, + "loss": 0.0271, + "step": 34468 + }, + { + "epoch": 93.92098092643052, + "grad_norm": 2.847459316253662, + "learning_rate": 1.9319235697021766e-07, + "loss": 0.0997, + "step": 34469 + }, + { + "epoch": 93.92370572207085, + "grad_norm": 2.587817907333374, + "learning_rate": 1.93019765946596e-07, + "loss": 0.0269, + "step": 34470 + }, + { + "epoch": 93.92643051771117, + "grad_norm": 1.9004254341125488, + "learning_rate": 1.928472512994206e-07, + "loss": 0.1499, + "step": 34471 + }, + { + "epoch": 93.9291553133515, + "grad_norm": 2.5846543312072754, + "learning_rate": 1.9267481303003487e-07, + "loss": 0.0754, + "step": 34472 + }, + { + "epoch": 93.93188010899182, + "grad_norm": 2.302259922027588, + "learning_rate": 1.9250245113978329e-07, + "loss": 0.0876, + "step": 34473 + }, + { + "epoch": 93.93460490463215, + "grad_norm": 1.8402637243270874, + "learning_rate": 1.9233016563000695e-07, + "loss": 0.1349, + "step": 34474 + }, + { + "epoch": 93.93732970027249, + "grad_norm": 3.4466936588287354, + "learning_rate": 1.9215795650204817e-07, + "loss": 0.072, + "step": 34475 + }, + { + "epoch": 93.9400544959128, + "grad_norm": 2.3628551959991455, + "learning_rate": 1.9198582375724584e-07, + "loss": 0.0607, + "step": 34476 + }, + { + "epoch": 93.94277929155314, + "grad_norm": 2.3989202976226807, + "learning_rate": 1.9181376739694336e-07, + "loss": 0.1096, + "step": 34477 + }, + { + "epoch": 93.94550408719346, + "grad_norm": 1.715238094329834, + "learning_rate": 1.9164178742247964e-07, + "loss": 0.0213, + "step": 34478 + }, + { + "epoch": 93.94822888283379, + "grad_norm": 2.344977855682373, + "learning_rate": 1.914698838351936e-07, + "loss": 0.1036, + "step": 34479 + }, + { + "epoch": 93.95095367847412, + "grad_norm": 2.1506311893463135, + "learning_rate": 1.912980566364231e-07, + "loss": 0.073, + "step": 34480 + }, + { + "epoch": 93.95367847411444, + "grad_norm": 2.3233208656311035, + "learning_rate": 1.9112630582750924e-07, + "loss": 0.0492, + "step": 34481 + }, + { + "epoch": 93.95640326975477, + "grad_norm": 2.677304267883301, + "learning_rate": 1.9095463140978876e-07, + "loss": 0.1065, + "step": 34482 + }, + { + "epoch": 93.95912806539509, + "grad_norm": 3.472522735595703, + "learning_rate": 1.9078303338459725e-07, + "loss": 0.0603, + "step": 34483 + }, + { + "epoch": 93.96185286103542, + "grad_norm": 2.663081169128418, + "learning_rate": 1.906115117532703e-07, + "loss": 0.068, + "step": 34484 + }, + { + "epoch": 93.96457765667574, + "grad_norm": 2.479199171066284, + "learning_rate": 1.9044006651714686e-07, + "loss": 0.1596, + "step": 34485 + }, + { + "epoch": 93.96730245231608, + "grad_norm": 2.600506544113159, + "learning_rate": 1.902686976775603e-07, + "loss": 0.0496, + "step": 34486 + }, + { + "epoch": 93.97002724795641, + "grad_norm": 3.1799991130828857, + "learning_rate": 1.9009740523584507e-07, + "loss": 0.0471, + "step": 34487 + }, + { + "epoch": 93.97275204359673, + "grad_norm": 2.479637861251831, + "learning_rate": 1.899261891933346e-07, + "loss": 0.097, + "step": 34488 + }, + { + "epoch": 93.97547683923706, + "grad_norm": 2.694652795791626, + "learning_rate": 1.897550495513645e-07, + "loss": 0.1886, + "step": 34489 + }, + { + "epoch": 93.97820163487738, + "grad_norm": 3.3574304580688477, + "learning_rate": 1.8958398631126586e-07, + "loss": 0.0381, + "step": 34490 + }, + { + "epoch": 93.98092643051771, + "grad_norm": 2.4085183143615723, + "learning_rate": 1.8941299947437098e-07, + "loss": 0.0169, + "step": 34491 + }, + { + "epoch": 93.98365122615803, + "grad_norm": 2.778902292251587, + "learning_rate": 1.8924208904201215e-07, + "loss": 0.1611, + "step": 34492 + }, + { + "epoch": 93.98637602179836, + "grad_norm": 2.933116912841797, + "learning_rate": 1.890712550155205e-07, + "loss": 0.0443, + "step": 34493 + }, + { + "epoch": 93.9891008174387, + "grad_norm": 2.296523094177246, + "learning_rate": 1.8890049739622606e-07, + "loss": 0.0734, + "step": 34494 + }, + { + "epoch": 93.99182561307902, + "grad_norm": 1.8806663751602173, + "learning_rate": 1.8872981618545894e-07, + "loss": 0.0219, + "step": 34495 + }, + { + "epoch": 93.99455040871935, + "grad_norm": 3.0775694847106934, + "learning_rate": 1.8855921138454802e-07, + "loss": 0.0251, + "step": 34496 + }, + { + "epoch": 93.99727520435967, + "grad_norm": 3.0466701984405518, + "learning_rate": 1.8838868299482227e-07, + "loss": 0.0656, + "step": 34497 + }, + { + "epoch": 94.0, + "grad_norm": 2.0074522495269775, + "learning_rate": 1.8821823101760949e-07, + "loss": 0.024, + "step": 34498 + }, + { + "epoch": 94.00272479564033, + "grad_norm": 2.8768908977508545, + "learning_rate": 1.8804785545423753e-07, + "loss": 0.0665, + "step": 34499 + }, + { + "epoch": 94.00544959128065, + "grad_norm": 3.1508963108062744, + "learning_rate": 1.878775563060331e-07, + "loss": 0.0528, + "step": 34500 + }, + { + "epoch": 94.00817438692098, + "grad_norm": 2.9554028511047363, + "learning_rate": 1.8770733357432293e-07, + "loss": 0.0806, + "step": 34501 + }, + { + "epoch": 94.0108991825613, + "grad_norm": 2.331803560256958, + "learning_rate": 1.8753718726043146e-07, + "loss": 0.0652, + "step": 34502 + }, + { + "epoch": 94.01362397820164, + "grad_norm": 2.272080898284912, + "learning_rate": 1.8736711736568547e-07, + "loss": 0.0625, + "step": 34503 + }, + { + "epoch": 94.01634877384195, + "grad_norm": 3.1528565883636475, + "learning_rate": 1.871971238914072e-07, + "loss": 0.0565, + "step": 34504 + }, + { + "epoch": 94.01907356948229, + "grad_norm": 1.681414246559143, + "learning_rate": 1.870272068389223e-07, + "loss": 0.1208, + "step": 34505 + }, + { + "epoch": 94.02179836512262, + "grad_norm": 3.2219901084899902, + "learning_rate": 1.868573662095541e-07, + "loss": 0.069, + "step": 34506 + }, + { + "epoch": 94.02452316076294, + "grad_norm": 3.2177181243896484, + "learning_rate": 1.8668760200462488e-07, + "loss": 0.1558, + "step": 34507 + }, + { + "epoch": 94.02724795640327, + "grad_norm": 1.7715153694152832, + "learning_rate": 1.8651791422545697e-07, + "loss": 0.0177, + "step": 34508 + }, + { + "epoch": 94.02997275204359, + "grad_norm": 2.3313074111938477, + "learning_rate": 1.8634830287337036e-07, + "loss": 0.034, + "step": 34509 + }, + { + "epoch": 94.03269754768392, + "grad_norm": 1.9339600801467896, + "learning_rate": 1.861787679496885e-07, + "loss": 0.0208, + "step": 34510 + }, + { + "epoch": 94.03542234332426, + "grad_norm": 2.1006815433502197, + "learning_rate": 1.8600930945573027e-07, + "loss": 0.1225, + "step": 34511 + }, + { + "epoch": 94.03814713896458, + "grad_norm": 1.6775445938110352, + "learning_rate": 1.8583992739281577e-07, + "loss": 0.0198, + "step": 34512 + }, + { + "epoch": 94.04087193460491, + "grad_norm": 2.6415295600891113, + "learning_rate": 1.8567062176226393e-07, + "loss": 0.0387, + "step": 34513 + }, + { + "epoch": 94.04359673024523, + "grad_norm": 1.607471227645874, + "learning_rate": 1.8550139256539368e-07, + "loss": 0.0159, + "step": 34514 + }, + { + "epoch": 94.04632152588556, + "grad_norm": 2.5552589893341064, + "learning_rate": 1.8533223980352288e-07, + "loss": 0.1056, + "step": 34515 + }, + { + "epoch": 94.04904632152588, + "grad_norm": 2.36251163482666, + "learning_rate": 1.8516316347796826e-07, + "loss": 0.1004, + "step": 34516 + }, + { + "epoch": 94.05177111716621, + "grad_norm": 2.898721218109131, + "learning_rate": 1.8499416359004763e-07, + "loss": 0.1699, + "step": 34517 + }, + { + "epoch": 94.05449591280654, + "grad_norm": 9.90404224395752, + "learning_rate": 1.848252401410755e-07, + "loss": 0.185, + "step": 34518 + }, + { + "epoch": 94.05722070844686, + "grad_norm": 2.253108024597168, + "learning_rate": 1.846563931323697e-07, + "loss": 0.0209, + "step": 34519 + }, + { + "epoch": 94.0599455040872, + "grad_norm": 2.2060775756835938, + "learning_rate": 1.8448762256524256e-07, + "loss": 0.047, + "step": 34520 + }, + { + "epoch": 94.06267029972751, + "grad_norm": 2.2302207946777344, + "learning_rate": 1.8431892844101183e-07, + "loss": 0.0645, + "step": 34521 + }, + { + "epoch": 94.06539509536785, + "grad_norm": 1.3667473793029785, + "learning_rate": 1.8415031076098767e-07, + "loss": 0.0154, + "step": 34522 + }, + { + "epoch": 94.06811989100818, + "grad_norm": 1.537326693534851, + "learning_rate": 1.8398176952648672e-07, + "loss": 0.0214, + "step": 34523 + }, + { + "epoch": 94.0708446866485, + "grad_norm": 2.7625930309295654, + "learning_rate": 1.8381330473881797e-07, + "loss": 0.0634, + "step": 34524 + }, + { + "epoch": 94.07356948228883, + "grad_norm": 2.4522831439971924, + "learning_rate": 1.836449163992948e-07, + "loss": 0.0379, + "step": 34525 + }, + { + "epoch": 94.07629427792915, + "grad_norm": 5.569437026977539, + "learning_rate": 1.8347660450923066e-07, + "loss": 0.046, + "step": 34526 + }, + { + "epoch": 94.07901907356948, + "grad_norm": 3.3365516662597656, + "learning_rate": 1.8330836906993443e-07, + "loss": 0.0771, + "step": 34527 + }, + { + "epoch": 94.0817438692098, + "grad_norm": 5.334017753601074, + "learning_rate": 1.8314021008271732e-07, + "loss": 0.1219, + "step": 34528 + }, + { + "epoch": 94.08446866485014, + "grad_norm": 1.5066051483154297, + "learning_rate": 1.8297212754888716e-07, + "loss": 0.0149, + "step": 34529 + }, + { + "epoch": 94.08719346049047, + "grad_norm": 2.745513916015625, + "learning_rate": 1.8280412146975512e-07, + "loss": 0.0592, + "step": 34530 + }, + { + "epoch": 94.08991825613079, + "grad_norm": 3.194516897201538, + "learning_rate": 1.8263619184662796e-07, + "loss": 0.0473, + "step": 34531 + }, + { + "epoch": 94.09264305177112, + "grad_norm": 2.812309503555298, + "learning_rate": 1.8246833868081348e-07, + "loss": 0.0649, + "step": 34532 + }, + { + "epoch": 94.09536784741144, + "grad_norm": 3.361938714981079, + "learning_rate": 1.8230056197362068e-07, + "loss": 0.0297, + "step": 34533 + }, + { + "epoch": 94.09809264305177, + "grad_norm": 2.9348504543304443, + "learning_rate": 1.8213286172635514e-07, + "loss": 0.0749, + "step": 34534 + }, + { + "epoch": 94.1008174386921, + "grad_norm": 2.29144024848938, + "learning_rate": 1.819652379403225e-07, + "loss": 0.0453, + "step": 34535 + }, + { + "epoch": 94.10354223433242, + "grad_norm": 2.3790197372436523, + "learning_rate": 1.8179769061682838e-07, + "loss": 0.0277, + "step": 34536 + }, + { + "epoch": 94.10626702997276, + "grad_norm": 3.2483694553375244, + "learning_rate": 1.8163021975717841e-07, + "loss": 0.0656, + "step": 34537 + }, + { + "epoch": 94.10899182561307, + "grad_norm": 2.4094700813293457, + "learning_rate": 1.8146282536267602e-07, + "loss": 0.0263, + "step": 34538 + }, + { + "epoch": 94.11171662125341, + "grad_norm": 2.520822525024414, + "learning_rate": 1.8129550743462565e-07, + "loss": 0.032, + "step": 34539 + }, + { + "epoch": 94.11444141689373, + "grad_norm": 1.7595480680465698, + "learning_rate": 1.8112826597432854e-07, + "loss": 0.0228, + "step": 34540 + }, + { + "epoch": 94.11716621253406, + "grad_norm": 2.2441720962524414, + "learning_rate": 1.8096110098308917e-07, + "loss": 0.0673, + "step": 34541 + }, + { + "epoch": 94.11989100817439, + "grad_norm": 2.098578929901123, + "learning_rate": 1.8079401246220874e-07, + "loss": 0.0374, + "step": 34542 + }, + { + "epoch": 94.12261580381471, + "grad_norm": 2.2614755630493164, + "learning_rate": 1.8062700041298952e-07, + "loss": 0.1671, + "step": 34543 + }, + { + "epoch": 94.12534059945504, + "grad_norm": 3.3669607639312744, + "learning_rate": 1.8046006483673052e-07, + "loss": 0.0585, + "step": 34544 + }, + { + "epoch": 94.12806539509536, + "grad_norm": 2.245502233505249, + "learning_rate": 1.8029320573473063e-07, + "loss": 0.1347, + "step": 34545 + }, + { + "epoch": 94.1307901907357, + "grad_norm": 3.2562201023101807, + "learning_rate": 1.801264231082933e-07, + "loss": 0.022, + "step": 34546 + }, + { + "epoch": 94.13351498637603, + "grad_norm": 4.390142917633057, + "learning_rate": 1.7995971695871528e-07, + "loss": 0.0534, + "step": 34547 + }, + { + "epoch": 94.13623978201635, + "grad_norm": 3.1623430252075195, + "learning_rate": 1.7979308728729438e-07, + "loss": 0.0414, + "step": 34548 + }, + { + "epoch": 94.13896457765668, + "grad_norm": 3.983569622039795, + "learning_rate": 1.7962653409532848e-07, + "loss": 0.0453, + "step": 34549 + }, + { + "epoch": 94.141689373297, + "grad_norm": 1.9424781799316406, + "learning_rate": 1.7946005738411654e-07, + "loss": 0.0469, + "step": 34550 + }, + { + "epoch": 94.14441416893733, + "grad_norm": 2.724827527999878, + "learning_rate": 1.7929365715495305e-07, + "loss": 0.1282, + "step": 34551 + }, + { + "epoch": 94.14713896457765, + "grad_norm": 1.7867093086242676, + "learning_rate": 1.791273334091337e-07, + "loss": 0.0156, + "step": 34552 + }, + { + "epoch": 94.14986376021798, + "grad_norm": 2.4984583854675293, + "learning_rate": 1.7896108614795406e-07, + "loss": 0.0294, + "step": 34553 + }, + { + "epoch": 94.15258855585832, + "grad_norm": 2.506727695465088, + "learning_rate": 1.7879491537271087e-07, + "loss": 0.0465, + "step": 34554 + }, + { + "epoch": 94.15531335149863, + "grad_norm": 2.2438740730285645, + "learning_rate": 1.7862882108469648e-07, + "loss": 0.0544, + "step": 34555 + }, + { + "epoch": 94.15803814713897, + "grad_norm": 4.8143086433410645, + "learning_rate": 1.7846280328520428e-07, + "loss": 0.0566, + "step": 34556 + }, + { + "epoch": 94.16076294277929, + "grad_norm": 2.9258768558502197, + "learning_rate": 1.7829686197552766e-07, + "loss": 0.0673, + "step": 34557 + }, + { + "epoch": 94.16348773841962, + "grad_norm": 2.362107515335083, + "learning_rate": 1.7813099715695892e-07, + "loss": 0.1055, + "step": 34558 + }, + { + "epoch": 94.16621253405995, + "grad_norm": 2.643925905227661, + "learning_rate": 1.7796520883079038e-07, + "loss": 0.03, + "step": 34559 + }, + { + "epoch": 94.16893732970027, + "grad_norm": 3.002138137817383, + "learning_rate": 1.7779949699831212e-07, + "loss": 0.0386, + "step": 34560 + }, + { + "epoch": 94.1716621253406, + "grad_norm": 2.3722450733184814, + "learning_rate": 1.776338616608153e-07, + "loss": 0.04, + "step": 34561 + }, + { + "epoch": 94.17438692098092, + "grad_norm": 2.956449270248413, + "learning_rate": 1.7746830281959005e-07, + "loss": 0.0302, + "step": 34562 + }, + { + "epoch": 94.17711171662125, + "grad_norm": 2.5882420539855957, + "learning_rate": 1.7730282047592528e-07, + "loss": 0.0322, + "step": 34563 + }, + { + "epoch": 94.17983651226157, + "grad_norm": 2.4424173831939697, + "learning_rate": 1.7713741463111112e-07, + "loss": 0.0422, + "step": 34564 + }, + { + "epoch": 94.1825613079019, + "grad_norm": 2.284702777862549, + "learning_rate": 1.7697208528643316e-07, + "loss": 0.0971, + "step": 34565 + }, + { + "epoch": 94.18528610354224, + "grad_norm": 1.9086081981658936, + "learning_rate": 1.7680683244318154e-07, + "loss": 0.0183, + "step": 34566 + }, + { + "epoch": 94.18801089918256, + "grad_norm": 4.8580403327941895, + "learning_rate": 1.7664165610264184e-07, + "loss": 0.0258, + "step": 34567 + }, + { + "epoch": 94.19073569482289, + "grad_norm": 1.9023826122283936, + "learning_rate": 1.7647655626610083e-07, + "loss": 0.0848, + "step": 34568 + }, + { + "epoch": 94.19346049046321, + "grad_norm": 2.0843896865844727, + "learning_rate": 1.7631153293484305e-07, + "loss": 0.1473, + "step": 34569 + }, + { + "epoch": 94.19618528610354, + "grad_norm": 0.9969910979270935, + "learning_rate": 1.7614658611015635e-07, + "loss": 0.0124, + "step": 34570 + }, + { + "epoch": 94.19891008174388, + "grad_norm": 1.8536566495895386, + "learning_rate": 1.75981715793323e-07, + "loss": 0.0433, + "step": 34571 + }, + { + "epoch": 94.2016348773842, + "grad_norm": 2.623291015625, + "learning_rate": 1.758169219856287e-07, + "loss": 0.0685, + "step": 34572 + }, + { + "epoch": 94.20435967302453, + "grad_norm": 3.871629238128662, + "learning_rate": 1.7565220468835465e-07, + "loss": 0.0569, + "step": 34573 + }, + { + "epoch": 94.20708446866485, + "grad_norm": 1.906101107597351, + "learning_rate": 1.7548756390278642e-07, + "loss": 0.0122, + "step": 34574 + }, + { + "epoch": 94.20980926430518, + "grad_norm": 2.549010992050171, + "learning_rate": 1.7532299963020417e-07, + "loss": 0.0999, + "step": 34575 + }, + { + "epoch": 94.2125340599455, + "grad_norm": 3.426013469696045, + "learning_rate": 1.7515851187189015e-07, + "loss": 0.0925, + "step": 34576 + }, + { + "epoch": 94.21525885558583, + "grad_norm": 1.9996252059936523, + "learning_rate": 1.749941006291245e-07, + "loss": 0.0175, + "step": 34577 + }, + { + "epoch": 94.21798365122616, + "grad_norm": 5.493715763092041, + "learning_rate": 1.7482976590319058e-07, + "loss": 0.0508, + "step": 34578 + }, + { + "epoch": 94.22070844686648, + "grad_norm": 3.023439645767212, + "learning_rate": 1.7466550769536516e-07, + "loss": 0.0948, + "step": 34579 + }, + { + "epoch": 94.22343324250681, + "grad_norm": 3.408459424972534, + "learning_rate": 1.7450132600692947e-07, + "loss": 0.1383, + "step": 34580 + }, + { + "epoch": 94.22615803814713, + "grad_norm": 1.7766079902648926, + "learning_rate": 1.7433722083915915e-07, + "loss": 0.0212, + "step": 34581 + }, + { + "epoch": 94.22888283378747, + "grad_norm": 2.550326108932495, + "learning_rate": 1.741731921933365e-07, + "loss": 0.0548, + "step": 34582 + }, + { + "epoch": 94.2316076294278, + "grad_norm": 1.5890072584152222, + "learning_rate": 1.7400924007073604e-07, + "loss": 0.0243, + "step": 34583 + }, + { + "epoch": 94.23433242506812, + "grad_norm": 1.7090826034545898, + "learning_rate": 1.7384536447263457e-07, + "loss": 0.0283, + "step": 34584 + }, + { + "epoch": 94.23705722070845, + "grad_norm": 2.8559112548828125, + "learning_rate": 1.736815654003099e-07, + "loss": 0.0353, + "step": 34585 + }, + { + "epoch": 94.23978201634877, + "grad_norm": 3.16033673286438, + "learning_rate": 1.7351784285503658e-07, + "loss": 0.0755, + "step": 34586 + }, + { + "epoch": 94.2425068119891, + "grad_norm": 2.2204842567443848, + "learning_rate": 1.733541968380914e-07, + "loss": 0.0777, + "step": 34587 + }, + { + "epoch": 94.24523160762942, + "grad_norm": 3.550560235977173, + "learning_rate": 1.7319062735074666e-07, + "loss": 0.0356, + "step": 34588 + }, + { + "epoch": 94.24795640326975, + "grad_norm": 2.5729455947875977, + "learning_rate": 1.7302713439427577e-07, + "loss": 0.0206, + "step": 34589 + }, + { + "epoch": 94.25068119891009, + "grad_norm": 2.397031784057617, + "learning_rate": 1.7286371796995438e-07, + "loss": 0.0401, + "step": 34590 + }, + { + "epoch": 94.2534059945504, + "grad_norm": 2.22430419921875, + "learning_rate": 1.7270037807905372e-07, + "loss": 0.0473, + "step": 34591 + }, + { + "epoch": 94.25613079019074, + "grad_norm": 2.6075212955474854, + "learning_rate": 1.7253711472284717e-07, + "loss": 0.0376, + "step": 34592 + }, + { + "epoch": 94.25885558583106, + "grad_norm": 2.732367992401123, + "learning_rate": 1.7237392790260377e-07, + "loss": 0.0377, + "step": 34593 + }, + { + "epoch": 94.26158038147139, + "grad_norm": 2.5315537452697754, + "learning_rate": 1.722108176195958e-07, + "loss": 0.053, + "step": 34594 + }, + { + "epoch": 94.26430517711172, + "grad_norm": 2.3362369537353516, + "learning_rate": 1.7204778387509559e-07, + "loss": 0.1016, + "step": 34595 + }, + { + "epoch": 94.26702997275204, + "grad_norm": 2.551574230194092, + "learning_rate": 1.7188482667036986e-07, + "loss": 0.0376, + "step": 34596 + }, + { + "epoch": 94.26975476839237, + "grad_norm": 1.8957818746566772, + "learning_rate": 1.7172194600668767e-07, + "loss": 0.0707, + "step": 34597 + }, + { + "epoch": 94.2724795640327, + "grad_norm": 1.700167179107666, + "learning_rate": 1.715591418853202e-07, + "loss": 0.0179, + "step": 34598 + }, + { + "epoch": 94.27520435967303, + "grad_norm": 1.6797950267791748, + "learning_rate": 1.7139641430753419e-07, + "loss": 0.0238, + "step": 34599 + }, + { + "epoch": 94.27792915531334, + "grad_norm": 2.126771926879883, + "learning_rate": 1.712337632745964e-07, + "loss": 0.0237, + "step": 34600 + }, + { + "epoch": 94.28065395095368, + "grad_norm": 1.526766061782837, + "learning_rate": 1.7107118878777251e-07, + "loss": 0.0227, + "step": 34601 + }, + { + "epoch": 94.28337874659401, + "grad_norm": 2.9766311645507812, + "learning_rate": 1.709086908483304e-07, + "loss": 0.1157, + "step": 34602 + }, + { + "epoch": 94.28610354223433, + "grad_norm": 2.0408859252929688, + "learning_rate": 1.707462694575357e-07, + "loss": 0.0818, + "step": 34603 + }, + { + "epoch": 94.28882833787466, + "grad_norm": 2.0950992107391357, + "learning_rate": 1.7058392461665185e-07, + "loss": 0.0423, + "step": 34604 + }, + { + "epoch": 94.29155313351498, + "grad_norm": 2.3778860569000244, + "learning_rate": 1.704216563269434e-07, + "loss": 0.0412, + "step": 34605 + }, + { + "epoch": 94.29427792915531, + "grad_norm": 2.916978597640991, + "learning_rate": 1.7025946458967602e-07, + "loss": 0.0325, + "step": 34606 + }, + { + "epoch": 94.29700272479565, + "grad_norm": 3.0695154666900635, + "learning_rate": 1.70097349406112e-07, + "loss": 0.0301, + "step": 34607 + }, + { + "epoch": 94.29972752043597, + "grad_norm": 2.0341145992279053, + "learning_rate": 1.6993531077751256e-07, + "loss": 0.0266, + "step": 34608 + }, + { + "epoch": 94.3024523160763, + "grad_norm": 3.028540849685669, + "learning_rate": 1.6977334870514007e-07, + "loss": 0.0536, + "step": 34609 + }, + { + "epoch": 94.30517711171662, + "grad_norm": 2.2184524536132812, + "learning_rate": 1.696114631902568e-07, + "loss": 0.0932, + "step": 34610 + }, + { + "epoch": 94.30790190735695, + "grad_norm": 3.4266767501831055, + "learning_rate": 1.6944965423412286e-07, + "loss": 0.1048, + "step": 34611 + }, + { + "epoch": 94.31062670299727, + "grad_norm": 2.3393688201904297, + "learning_rate": 1.6928792183799948e-07, + "loss": 0.0234, + "step": 34612 + }, + { + "epoch": 94.3133514986376, + "grad_norm": 1.8931456804275513, + "learning_rate": 1.6912626600314452e-07, + "loss": 0.0588, + "step": 34613 + }, + { + "epoch": 94.31607629427793, + "grad_norm": 2.8492913246154785, + "learning_rate": 1.6896468673081812e-07, + "loss": 0.0502, + "step": 34614 + }, + { + "epoch": 94.31880108991825, + "grad_norm": 3.497866153717041, + "learning_rate": 1.6880318402227814e-07, + "loss": 0.0441, + "step": 34615 + }, + { + "epoch": 94.32152588555859, + "grad_norm": 2.6030144691467285, + "learning_rate": 1.6864175787878244e-07, + "loss": 0.0354, + "step": 34616 + }, + { + "epoch": 94.3242506811989, + "grad_norm": 1.3896472454071045, + "learning_rate": 1.6848040830158895e-07, + "loss": 0.0108, + "step": 34617 + }, + { + "epoch": 94.32697547683924, + "grad_norm": 2.356647253036499, + "learning_rate": 1.683191352919533e-07, + "loss": 0.049, + "step": 34618 + }, + { + "epoch": 94.32970027247957, + "grad_norm": 2.475054979324341, + "learning_rate": 1.681579388511323e-07, + "loss": 0.0868, + "step": 34619 + }, + { + "epoch": 94.33242506811989, + "grad_norm": 4.608496189117432, + "learning_rate": 1.6799681898038044e-07, + "loss": 0.0525, + "step": 34620 + }, + { + "epoch": 94.33514986376022, + "grad_norm": 2.7545180320739746, + "learning_rate": 1.6783577568095123e-07, + "loss": 0.1164, + "step": 34621 + }, + { + "epoch": 94.33787465940054, + "grad_norm": 5.152946472167969, + "learning_rate": 1.6767480895410248e-07, + "loss": 0.0321, + "step": 34622 + }, + { + "epoch": 94.34059945504087, + "grad_norm": 2.800403356552124, + "learning_rate": 1.6751391880108548e-07, + "loss": 0.0271, + "step": 34623 + }, + { + "epoch": 94.34332425068119, + "grad_norm": 4.446054458618164, + "learning_rate": 1.6735310522315473e-07, + "loss": 0.0853, + "step": 34624 + }, + { + "epoch": 94.34604904632153, + "grad_norm": 3.2290141582489014, + "learning_rate": 1.6719236822155927e-07, + "loss": 0.0699, + "step": 34625 + }, + { + "epoch": 94.34877384196186, + "grad_norm": 2.38934588432312, + "learning_rate": 1.6703170779755474e-07, + "loss": 0.0337, + "step": 34626 + }, + { + "epoch": 94.35149863760218, + "grad_norm": 2.058783531188965, + "learning_rate": 1.6687112395239014e-07, + "loss": 0.0264, + "step": 34627 + }, + { + "epoch": 94.35422343324251, + "grad_norm": 2.4210948944091797, + "learning_rate": 1.667106166873167e-07, + "loss": 0.0656, + "step": 34628 + }, + { + "epoch": 94.35694822888283, + "grad_norm": 2.59696626663208, + "learning_rate": 1.6655018600358452e-07, + "loss": 0.0207, + "step": 34629 + }, + { + "epoch": 94.35967302452316, + "grad_norm": 2.635974407196045, + "learning_rate": 1.6638983190244374e-07, + "loss": 0.0218, + "step": 34630 + }, + { + "epoch": 94.3623978201635, + "grad_norm": 2.3381271362304688, + "learning_rate": 1.6622955438514111e-07, + "loss": 0.068, + "step": 34631 + }, + { + "epoch": 94.36512261580381, + "grad_norm": 2.0427045822143555, + "learning_rate": 1.6606935345292785e-07, + "loss": 0.041, + "step": 34632 + }, + { + "epoch": 94.36784741144415, + "grad_norm": 1.729866623878479, + "learning_rate": 1.6590922910704966e-07, + "loss": 0.0193, + "step": 34633 + }, + { + "epoch": 94.37057220708446, + "grad_norm": 1.777673602104187, + "learning_rate": 1.6574918134875216e-07, + "loss": 0.0764, + "step": 34634 + }, + { + "epoch": 94.3732970027248, + "grad_norm": 2.5636448860168457, + "learning_rate": 1.6558921017928554e-07, + "loss": 0.0331, + "step": 34635 + }, + { + "epoch": 94.37602179836512, + "grad_norm": 3.057037830352783, + "learning_rate": 1.6542931559989316e-07, + "loss": 0.0802, + "step": 34636 + }, + { + "epoch": 94.37874659400545, + "grad_norm": 1.9381567239761353, + "learning_rate": 1.6526949761182076e-07, + "loss": 0.0238, + "step": 34637 + }, + { + "epoch": 94.38147138964578, + "grad_norm": 2.2974367141723633, + "learning_rate": 1.6510975621631177e-07, + "loss": 0.028, + "step": 34638 + }, + { + "epoch": 94.3841961852861, + "grad_norm": 2.2948877811431885, + "learning_rate": 1.6495009141461293e-07, + "loss": 0.0575, + "step": 34639 + }, + { + "epoch": 94.38692098092643, + "grad_norm": 2.0891711711883545, + "learning_rate": 1.6479050320796552e-07, + "loss": 0.0268, + "step": 34640 + }, + { + "epoch": 94.38964577656675, + "grad_norm": 2.469036340713501, + "learning_rate": 1.646309915976141e-07, + "loss": 0.0417, + "step": 34641 + }, + { + "epoch": 94.39237057220708, + "grad_norm": 2.298543930053711, + "learning_rate": 1.6447155658479763e-07, + "loss": 0.0302, + "step": 34642 + }, + { + "epoch": 94.39509536784742, + "grad_norm": 2.1329193115234375, + "learning_rate": 1.6431219817076182e-07, + "loss": 0.0637, + "step": 34643 + }, + { + "epoch": 94.39782016348774, + "grad_norm": 1.99644136428833, + "learning_rate": 1.6415291635674567e-07, + "loss": 0.016, + "step": 34644 + }, + { + "epoch": 94.40054495912807, + "grad_norm": 3.191816806793213, + "learning_rate": 1.6399371114399043e-07, + "loss": 0.0399, + "step": 34645 + }, + { + "epoch": 94.40326975476839, + "grad_norm": 2.9646823406219482, + "learning_rate": 1.6383458253373508e-07, + "loss": 0.1386, + "step": 34646 + }, + { + "epoch": 94.40599455040872, + "grad_norm": 2.5656116008758545, + "learning_rate": 1.6367553052721973e-07, + "loss": 0.0417, + "step": 34647 + }, + { + "epoch": 94.40871934604904, + "grad_norm": 2.7245559692382812, + "learning_rate": 1.6351655512568343e-07, + "loss": 0.0449, + "step": 34648 + }, + { + "epoch": 94.41144414168937, + "grad_norm": 3.228842258453369, + "learning_rate": 1.6335765633036294e-07, + "loss": 0.0432, + "step": 34649 + }, + { + "epoch": 94.4141689373297, + "grad_norm": 3.2125754356384277, + "learning_rate": 1.6319883414249615e-07, + "loss": 0.0931, + "step": 34650 + }, + { + "epoch": 94.41689373297002, + "grad_norm": 7.564841270446777, + "learning_rate": 1.63040088563321e-07, + "loss": 0.0781, + "step": 34651 + }, + { + "epoch": 94.41961852861036, + "grad_norm": 1.8873380422592163, + "learning_rate": 1.62881419594072e-07, + "loss": 0.1736, + "step": 34652 + }, + { + "epoch": 94.42234332425068, + "grad_norm": 2.9355266094207764, + "learning_rate": 1.6272282723598709e-07, + "loss": 0.0941, + "step": 34653 + }, + { + "epoch": 94.42506811989101, + "grad_norm": 1.7448080778121948, + "learning_rate": 1.625643114902986e-07, + "loss": 0.0231, + "step": 34654 + }, + { + "epoch": 94.42779291553134, + "grad_norm": 2.837740182876587, + "learning_rate": 1.6240587235824445e-07, + "loss": 0.1172, + "step": 34655 + }, + { + "epoch": 94.43051771117166, + "grad_norm": 2.8005638122558594, + "learning_rate": 1.6224750984105586e-07, + "loss": 0.0266, + "step": 34656 + }, + { + "epoch": 94.433242506812, + "grad_norm": 2.181720733642578, + "learning_rate": 1.620892239399674e-07, + "loss": 0.0925, + "step": 34657 + }, + { + "epoch": 94.43596730245231, + "grad_norm": 1.8403340578079224, + "learning_rate": 1.6193101465621031e-07, + "loss": 0.0208, + "step": 34658 + }, + { + "epoch": 94.43869209809264, + "grad_norm": 1.3620636463165283, + "learning_rate": 1.6177288199101915e-07, + "loss": 0.014, + "step": 34659 + }, + { + "epoch": 94.44141689373296, + "grad_norm": 2.899869918823242, + "learning_rate": 1.6161482594562404e-07, + "loss": 0.0623, + "step": 34660 + }, + { + "epoch": 94.4441416893733, + "grad_norm": 3.126708745956421, + "learning_rate": 1.6145684652125625e-07, + "loss": 0.0266, + "step": 34661 + }, + { + "epoch": 94.44686648501363, + "grad_norm": 2.637641668319702, + "learning_rate": 1.6129894371914368e-07, + "loss": 0.1349, + "step": 34662 + }, + { + "epoch": 94.44959128065395, + "grad_norm": 1.7988773584365845, + "learning_rate": 1.6114111754051976e-07, + "loss": 0.0491, + "step": 34663 + }, + { + "epoch": 94.45231607629428, + "grad_norm": 2.367905616760254, + "learning_rate": 1.609833679866124e-07, + "loss": 0.0518, + "step": 34664 + }, + { + "epoch": 94.4550408719346, + "grad_norm": 2.809880018234253, + "learning_rate": 1.6082569505865064e-07, + "loss": 0.0969, + "step": 34665 + }, + { + "epoch": 94.45776566757493, + "grad_norm": 1.9134714603424072, + "learning_rate": 1.6066809875786016e-07, + "loss": 0.0241, + "step": 34666 + }, + { + "epoch": 94.46049046321527, + "grad_norm": 5.269023418426514, + "learning_rate": 1.6051057908546997e-07, + "loss": 0.0367, + "step": 34667 + }, + { + "epoch": 94.46321525885558, + "grad_norm": 1.4486260414123535, + "learning_rate": 1.6035313604270798e-07, + "loss": 0.026, + "step": 34668 + }, + { + "epoch": 94.46594005449592, + "grad_norm": 2.5442888736724854, + "learning_rate": 1.6019576963079875e-07, + "loss": 0.1106, + "step": 34669 + }, + { + "epoch": 94.46866485013624, + "grad_norm": 1.3832812309265137, + "learning_rate": 1.6003847985096687e-07, + "loss": 0.1066, + "step": 34670 + }, + { + "epoch": 94.47138964577657, + "grad_norm": 2.9172377586364746, + "learning_rate": 1.5988126670444026e-07, + "loss": 0.0438, + "step": 34671 + }, + { + "epoch": 94.47411444141689, + "grad_norm": 1.9467462301254272, + "learning_rate": 1.5972413019244014e-07, + "loss": 0.0671, + "step": 34672 + }, + { + "epoch": 94.47683923705722, + "grad_norm": 2.916339159011841, + "learning_rate": 1.5956707031619333e-07, + "loss": 0.1237, + "step": 34673 + }, + { + "epoch": 94.47956403269755, + "grad_norm": 2.2039833068847656, + "learning_rate": 1.5941008707691996e-07, + "loss": 0.0389, + "step": 34674 + }, + { + "epoch": 94.48228882833787, + "grad_norm": 3.202559232711792, + "learning_rate": 1.592531804758446e-07, + "loss": 0.0786, + "step": 34675 + }, + { + "epoch": 94.4850136239782, + "grad_norm": 1.8219290971755981, + "learning_rate": 1.590963505141896e-07, + "loss": 0.0706, + "step": 34676 + }, + { + "epoch": 94.48773841961852, + "grad_norm": 3.4272594451904297, + "learning_rate": 1.589395971931751e-07, + "loss": 0.1694, + "step": 34677 + }, + { + "epoch": 94.49046321525886, + "grad_norm": 3.208918333053589, + "learning_rate": 1.5878292051402123e-07, + "loss": 0.159, + "step": 34678 + }, + { + "epoch": 94.49318801089919, + "grad_norm": 2.3203773498535156, + "learning_rate": 1.5862632047795033e-07, + "loss": 0.0333, + "step": 34679 + }, + { + "epoch": 94.49591280653951, + "grad_norm": 2.039985418319702, + "learning_rate": 1.5846979708618038e-07, + "loss": 0.089, + "step": 34680 + }, + { + "epoch": 94.49863760217984, + "grad_norm": 4.308788299560547, + "learning_rate": 1.5831335033993144e-07, + "loss": 0.0241, + "step": 34681 + }, + { + "epoch": 94.50136239782016, + "grad_norm": 2.6852211952209473, + "learning_rate": 1.5815698024042147e-07, + "loss": 0.0672, + "step": 34682 + }, + { + "epoch": 94.50408719346049, + "grad_norm": 3.191239833831787, + "learning_rate": 1.5800068678886726e-07, + "loss": 0.0601, + "step": 34683 + }, + { + "epoch": 94.50681198910081, + "grad_norm": 2.4062161445617676, + "learning_rate": 1.5784446998648784e-07, + "loss": 0.0248, + "step": 34684 + }, + { + "epoch": 94.50953678474114, + "grad_norm": 2.261762857437134, + "learning_rate": 1.5768832983449888e-07, + "loss": 0.0362, + "step": 34685 + }, + { + "epoch": 94.51226158038148, + "grad_norm": 2.3534913063049316, + "learning_rate": 1.57532266334115e-07, + "loss": 0.1233, + "step": 34686 + }, + { + "epoch": 94.5149863760218, + "grad_norm": 4.368196964263916, + "learning_rate": 1.573762794865541e-07, + "loss": 0.3018, + "step": 34687 + }, + { + "epoch": 94.51771117166213, + "grad_norm": 2.6892006397247314, + "learning_rate": 1.5722036929303075e-07, + "loss": 0.0598, + "step": 34688 + }, + { + "epoch": 94.52043596730245, + "grad_norm": 2.1162848472595215, + "learning_rate": 1.5706453575475733e-07, + "loss": 0.0225, + "step": 34689 + }, + { + "epoch": 94.52316076294278, + "grad_norm": 3.426241874694824, + "learning_rate": 1.5690877887294843e-07, + "loss": 0.0446, + "step": 34690 + }, + { + "epoch": 94.52588555858311, + "grad_norm": 5.542628288269043, + "learning_rate": 1.567530986488186e-07, + "loss": 0.0381, + "step": 34691 + }, + { + "epoch": 94.52861035422343, + "grad_norm": 1.7282050848007202, + "learning_rate": 1.5659749508357802e-07, + "loss": 0.028, + "step": 34692 + }, + { + "epoch": 94.53133514986376, + "grad_norm": 3.235380172729492, + "learning_rate": 1.5644196817843904e-07, + "loss": 0.0677, + "step": 34693 + }, + { + "epoch": 94.53405994550408, + "grad_norm": 2.2509677410125732, + "learning_rate": 1.5628651793461292e-07, + "loss": 0.0837, + "step": 34694 + }, + { + "epoch": 94.53678474114442, + "grad_norm": 2.4903781414031982, + "learning_rate": 1.561311443533109e-07, + "loss": 0.0388, + "step": 34695 + }, + { + "epoch": 94.53950953678473, + "grad_norm": 2.4005839824676514, + "learning_rate": 1.55975847435742e-07, + "loss": 0.1346, + "step": 34696 + }, + { + "epoch": 94.54223433242507, + "grad_norm": 2.1250245571136475, + "learning_rate": 1.558206271831175e-07, + "loss": 0.1697, + "step": 34697 + }, + { + "epoch": 94.5449591280654, + "grad_norm": 2.4313042163848877, + "learning_rate": 1.5566548359664423e-07, + "loss": 0.0278, + "step": 34698 + }, + { + "epoch": 94.54768392370572, + "grad_norm": 2.4750702381134033, + "learning_rate": 1.555104166775323e-07, + "loss": 0.1176, + "step": 34699 + }, + { + "epoch": 94.55040871934605, + "grad_norm": 2.4606995582580566, + "learning_rate": 1.5535542642698742e-07, + "loss": 0.0412, + "step": 34700 + }, + { + "epoch": 94.55313351498637, + "grad_norm": 2.120288848876953, + "learning_rate": 1.5520051284621862e-07, + "loss": 0.0402, + "step": 34701 + }, + { + "epoch": 94.5558583106267, + "grad_norm": 2.3898894786834717, + "learning_rate": 1.550456759364316e-07, + "loss": 0.0478, + "step": 34702 + }, + { + "epoch": 94.55858310626704, + "grad_norm": 1.8887131214141846, + "learning_rate": 1.5489091569882986e-07, + "loss": 0.0418, + "step": 34703 + }, + { + "epoch": 94.56130790190736, + "grad_norm": 2.0389652252197266, + "learning_rate": 1.547362321346224e-07, + "loss": 0.0515, + "step": 34704 + }, + { + "epoch": 94.56403269754769, + "grad_norm": 1.8987900018692017, + "learning_rate": 1.5458162524501274e-07, + "loss": 0.0426, + "step": 34705 + }, + { + "epoch": 94.566757493188, + "grad_norm": 2.3834776878356934, + "learning_rate": 1.5442709503120322e-07, + "loss": 0.0643, + "step": 34706 + }, + { + "epoch": 94.56948228882834, + "grad_norm": 2.5971760749816895, + "learning_rate": 1.5427264149439957e-07, + "loss": 0.0614, + "step": 34707 + }, + { + "epoch": 94.57220708446866, + "grad_norm": 3.2082934379577637, + "learning_rate": 1.5411826463580414e-07, + "loss": 0.0374, + "step": 34708 + }, + { + "epoch": 94.57493188010899, + "grad_norm": 1.9501131772994995, + "learning_rate": 1.5396396445661822e-07, + "loss": 0.0257, + "step": 34709 + }, + { + "epoch": 94.57765667574932, + "grad_norm": 2.9001870155334473, + "learning_rate": 1.5380974095804303e-07, + "loss": 0.0464, + "step": 34710 + }, + { + "epoch": 94.58038147138964, + "grad_norm": 4.064499855041504, + "learning_rate": 1.5365559414128207e-07, + "loss": 0.0391, + "step": 34711 + }, + { + "epoch": 94.58310626702998, + "grad_norm": 3.1410655975341797, + "learning_rate": 1.5350152400753326e-07, + "loss": 0.0931, + "step": 34712 + }, + { + "epoch": 94.5858310626703, + "grad_norm": 3.293938636779785, + "learning_rate": 1.533475305579979e-07, + "loss": 0.189, + "step": 34713 + }, + { + "epoch": 94.58855585831063, + "grad_norm": 3.631631851196289, + "learning_rate": 1.5319361379387609e-07, + "loss": 0.0344, + "step": 34714 + }, + { + "epoch": 94.59128065395096, + "grad_norm": 2.9691922664642334, + "learning_rate": 1.530397737163647e-07, + "loss": 0.1473, + "step": 34715 + }, + { + "epoch": 94.59400544959128, + "grad_norm": 2.1044015884399414, + "learning_rate": 1.5288601032666272e-07, + "loss": 0.0305, + "step": 34716 + }, + { + "epoch": 94.59673024523161, + "grad_norm": 2.1065657138824463, + "learning_rate": 1.5273232362596812e-07, + "loss": 0.0323, + "step": 34717 + }, + { + "epoch": 94.59945504087193, + "grad_norm": 4.500377655029297, + "learning_rate": 1.525787136154766e-07, + "loss": 0.0367, + "step": 34718 + }, + { + "epoch": 94.60217983651226, + "grad_norm": 2.984140157699585, + "learning_rate": 1.52425180296385e-07, + "loss": 0.0672, + "step": 34719 + }, + { + "epoch": 94.60490463215258, + "grad_norm": 1.8051056861877441, + "learning_rate": 1.5227172366989006e-07, + "loss": 0.0218, + "step": 34720 + }, + { + "epoch": 94.60762942779292, + "grad_norm": 2.263307571411133, + "learning_rate": 1.5211834373718536e-07, + "loss": 0.0372, + "step": 34721 + }, + { + "epoch": 94.61035422343325, + "grad_norm": 2.80877423286438, + "learning_rate": 1.519650404994666e-07, + "loss": 0.0327, + "step": 34722 + }, + { + "epoch": 94.61307901907357, + "grad_norm": 2.9288394451141357, + "learning_rate": 1.518118139579261e-07, + "loss": 0.0445, + "step": 34723 + }, + { + "epoch": 94.6158038147139, + "grad_norm": 2.3656704425811768, + "learning_rate": 1.516586641137585e-07, + "loss": 0.064, + "step": 34724 + }, + { + "epoch": 94.61852861035422, + "grad_norm": 2.8486154079437256, + "learning_rate": 1.515055909681562e-07, + "loss": 0.0574, + "step": 34725 + }, + { + "epoch": 94.62125340599455, + "grad_norm": 3.6664655208587646, + "learning_rate": 1.5135259452231265e-07, + "loss": 0.0231, + "step": 34726 + }, + { + "epoch": 94.62397820163488, + "grad_norm": 2.1733145713806152, + "learning_rate": 1.5119967477741694e-07, + "loss": 0.0218, + "step": 34727 + }, + { + "epoch": 94.6267029972752, + "grad_norm": 2.5935847759246826, + "learning_rate": 1.5104683173466139e-07, + "loss": 0.1029, + "step": 34728 + }, + { + "epoch": 94.62942779291554, + "grad_norm": 2.7075705528259277, + "learning_rate": 1.508940653952362e-07, + "loss": 0.0567, + "step": 34729 + }, + { + "epoch": 94.63215258855585, + "grad_norm": 3.5815441608428955, + "learning_rate": 1.5074137576033044e-07, + "loss": 0.0384, + "step": 34730 + }, + { + "epoch": 94.63487738419619, + "grad_norm": 1.7786641120910645, + "learning_rate": 1.5058876283113423e-07, + "loss": 0.047, + "step": 34731 + }, + { + "epoch": 94.6376021798365, + "grad_norm": 2.469461441040039, + "learning_rate": 1.504362266088355e-07, + "loss": 0.0628, + "step": 34732 + }, + { + "epoch": 94.64032697547684, + "grad_norm": 2.8403401374816895, + "learning_rate": 1.5028376709462335e-07, + "loss": 0.1161, + "step": 34733 + }, + { + "epoch": 94.64305177111717, + "grad_norm": 2.908555746078491, + "learning_rate": 1.5013138428968344e-07, + "loss": 0.0575, + "step": 34734 + }, + { + "epoch": 94.64577656675749, + "grad_norm": 2.3483283519744873, + "learning_rate": 1.4997907819520373e-07, + "loss": 0.0565, + "step": 34735 + }, + { + "epoch": 94.64850136239782, + "grad_norm": 6.889547824859619, + "learning_rate": 1.4982684881236996e-07, + "loss": 0.081, + "step": 34736 + }, + { + "epoch": 94.65122615803814, + "grad_norm": 2.152317762374878, + "learning_rate": 1.4967469614236673e-07, + "loss": 0.0224, + "step": 34737 + }, + { + "epoch": 94.65395095367847, + "grad_norm": 1.7832682132720947, + "learning_rate": 1.4952262018638087e-07, + "loss": 0.0297, + "step": 34738 + }, + { + "epoch": 94.65667574931881, + "grad_norm": 2.1328957080841064, + "learning_rate": 1.4937062094559584e-07, + "loss": 0.0452, + "step": 34739 + }, + { + "epoch": 94.65940054495913, + "grad_norm": 4.166618824005127, + "learning_rate": 1.4921869842119518e-07, + "loss": 0.0283, + "step": 34740 + }, + { + "epoch": 94.66212534059946, + "grad_norm": 2.2828242778778076, + "learning_rate": 1.4906685261436238e-07, + "loss": 0.1821, + "step": 34741 + }, + { + "epoch": 94.66485013623978, + "grad_norm": 5.564267158508301, + "learning_rate": 1.4891508352627982e-07, + "loss": 0.0812, + "step": 34742 + }, + { + "epoch": 94.66757493188011, + "grad_norm": 2.802478551864624, + "learning_rate": 1.4876339115812878e-07, + "loss": 0.0782, + "step": 34743 + }, + { + "epoch": 94.67029972752043, + "grad_norm": 2.5819175243377686, + "learning_rate": 1.4861177551109273e-07, + "loss": 0.0679, + "step": 34744 + }, + { + "epoch": 94.67302452316076, + "grad_norm": 2.0222177505493164, + "learning_rate": 1.4846023658634967e-07, + "loss": 0.0399, + "step": 34745 + }, + { + "epoch": 94.6757493188011, + "grad_norm": 3.721381187438965, + "learning_rate": 1.4830877438508308e-07, + "loss": 0.096, + "step": 34746 + }, + { + "epoch": 94.67847411444141, + "grad_norm": 2.32200026512146, + "learning_rate": 1.4815738890846864e-07, + "loss": 0.0876, + "step": 34747 + }, + { + "epoch": 94.68119891008175, + "grad_norm": 2.822448492050171, + "learning_rate": 1.4800608015768768e-07, + "loss": 0.1562, + "step": 34748 + }, + { + "epoch": 94.68392370572207, + "grad_norm": 2.120591640472412, + "learning_rate": 1.4785484813391927e-07, + "loss": 0.0304, + "step": 34749 + }, + { + "epoch": 94.6866485013624, + "grad_norm": 2.949368476867676, + "learning_rate": 1.477036928383402e-07, + "loss": 0.0335, + "step": 34750 + }, + { + "epoch": 94.68937329700273, + "grad_norm": 2.3968918323516846, + "learning_rate": 1.475526142721262e-07, + "loss": 0.0876, + "step": 34751 + }, + { + "epoch": 94.69209809264305, + "grad_norm": 2.2223854064941406, + "learning_rate": 1.4740161243645634e-07, + "loss": 0.1126, + "step": 34752 + }, + { + "epoch": 94.69482288828338, + "grad_norm": 2.491565465927124, + "learning_rate": 1.4725068733250636e-07, + "loss": 0.0706, + "step": 34753 + }, + { + "epoch": 94.6975476839237, + "grad_norm": 2.282160758972168, + "learning_rate": 1.4709983896145085e-07, + "loss": 0.0501, + "step": 34754 + }, + { + "epoch": 94.70027247956403, + "grad_norm": 2.711899757385254, + "learning_rate": 1.4694906732446334e-07, + "loss": 0.0634, + "step": 34755 + }, + { + "epoch": 94.70299727520435, + "grad_norm": 2.785217523574829, + "learning_rate": 1.4679837242272065e-07, + "loss": 0.0427, + "step": 34756 + }, + { + "epoch": 94.70572207084469, + "grad_norm": 2.9921822547912598, + "learning_rate": 1.4664775425739408e-07, + "loss": 0.1068, + "step": 34757 + }, + { + "epoch": 94.70844686648502, + "grad_norm": 3.676082134246826, + "learning_rate": 1.4649721282965934e-07, + "loss": 0.0345, + "step": 34758 + }, + { + "epoch": 94.71117166212534, + "grad_norm": 2.53202486038208, + "learning_rate": 1.463467481406855e-07, + "loss": 0.0923, + "step": 34759 + }, + { + "epoch": 94.71389645776567, + "grad_norm": 2.301422357559204, + "learning_rate": 1.4619636019164608e-07, + "loss": 0.0299, + "step": 34760 + }, + { + "epoch": 94.71662125340599, + "grad_norm": 3.420034170150757, + "learning_rate": 1.4604604898371344e-07, + "loss": 0.12, + "step": 34761 + }, + { + "epoch": 94.71934604904632, + "grad_norm": 3.044668436050415, + "learning_rate": 1.4589581451805666e-07, + "loss": 0.0365, + "step": 34762 + }, + { + "epoch": 94.72207084468666, + "grad_norm": 2.417459726333618, + "learning_rate": 1.4574565679584485e-07, + "loss": 0.0298, + "step": 34763 + }, + { + "epoch": 94.72479564032697, + "grad_norm": 3.5302438735961914, + "learning_rate": 1.4559557581825034e-07, + "loss": 0.0893, + "step": 34764 + }, + { + "epoch": 94.7275204359673, + "grad_norm": 3.776052951812744, + "learning_rate": 1.4544557158643892e-07, + "loss": 0.1533, + "step": 34765 + }, + { + "epoch": 94.73024523160763, + "grad_norm": 2.5752294063568115, + "learning_rate": 1.452956441015807e-07, + "loss": 0.0309, + "step": 34766 + }, + { + "epoch": 94.73297002724796, + "grad_norm": 2.660784959793091, + "learning_rate": 1.4514579336484368e-07, + "loss": 0.0954, + "step": 34767 + }, + { + "epoch": 94.73569482288828, + "grad_norm": 2.7385683059692383, + "learning_rate": 1.4499601937739249e-07, + "loss": 0.0214, + "step": 34768 + }, + { + "epoch": 94.73841961852861, + "grad_norm": 4.5096354484558105, + "learning_rate": 1.448463221403962e-07, + "loss": 0.0708, + "step": 34769 + }, + { + "epoch": 94.74114441416894, + "grad_norm": 3.276843786239624, + "learning_rate": 1.4469670165502047e-07, + "loss": 0.1191, + "step": 34770 + }, + { + "epoch": 94.74386920980926, + "grad_norm": 1.9798550605773926, + "learning_rate": 1.445471579224278e-07, + "loss": 0.0333, + "step": 34771 + }, + { + "epoch": 94.7465940054496, + "grad_norm": 13.764991760253906, + "learning_rate": 1.4439769094378498e-07, + "loss": 0.1301, + "step": 34772 + }, + { + "epoch": 94.74931880108991, + "grad_norm": 2.390716791152954, + "learning_rate": 1.4424830072025664e-07, + "loss": 0.0536, + "step": 34773 + }, + { + "epoch": 94.75204359673025, + "grad_norm": 1.7884615659713745, + "learning_rate": 1.440989872530052e-07, + "loss": 0.023, + "step": 34774 + }, + { + "epoch": 94.75476839237058, + "grad_norm": 2.6902616024017334, + "learning_rate": 1.4394975054319305e-07, + "loss": 0.0813, + "step": 34775 + }, + { + "epoch": 94.7574931880109, + "grad_norm": 3.49226450920105, + "learning_rate": 1.438005905919837e-07, + "loss": 0.1183, + "step": 34776 + }, + { + "epoch": 94.76021798365123, + "grad_norm": 3.289321184158325, + "learning_rate": 1.4365150740053735e-07, + "loss": 0.0721, + "step": 34777 + }, + { + "epoch": 94.76294277929155, + "grad_norm": 2.1775777339935303, + "learning_rate": 1.435025009700175e-07, + "loss": 0.0245, + "step": 34778 + }, + { + "epoch": 94.76566757493188, + "grad_norm": 2.1738474369049072, + "learning_rate": 1.43353571301581e-07, + "loss": 0.0346, + "step": 34779 + }, + { + "epoch": 94.7683923705722, + "grad_norm": 2.144057273864746, + "learning_rate": 1.4320471839639027e-07, + "loss": 0.1144, + "step": 34780 + }, + { + "epoch": 94.77111716621253, + "grad_norm": 2.4447195529937744, + "learning_rate": 1.4305594225560438e-07, + "loss": 0.0375, + "step": 34781 + }, + { + "epoch": 94.77384196185287, + "grad_norm": 2.6953911781311035, + "learning_rate": 1.4290724288038016e-07, + "loss": 0.0446, + "step": 34782 + }, + { + "epoch": 94.77656675749319, + "grad_norm": 2.8725662231445312, + "learning_rate": 1.4275862027187893e-07, + "loss": 0.0365, + "step": 34783 + }, + { + "epoch": 94.77929155313352, + "grad_norm": 2.246803045272827, + "learning_rate": 1.4261007443125418e-07, + "loss": 0.0665, + "step": 34784 + }, + { + "epoch": 94.78201634877384, + "grad_norm": 3.250502586364746, + "learning_rate": 1.4246160535966725e-07, + "loss": 0.0291, + "step": 34785 + }, + { + "epoch": 94.78474114441417, + "grad_norm": 2.5454702377319336, + "learning_rate": 1.423132130582705e-07, + "loss": 0.0901, + "step": 34786 + }, + { + "epoch": 94.7874659400545, + "grad_norm": 4.991804122924805, + "learning_rate": 1.4216489752822192e-07, + "loss": 0.1351, + "step": 34787 + }, + { + "epoch": 94.79019073569482, + "grad_norm": 2.541097640991211, + "learning_rate": 1.4201665877067615e-07, + "loss": 0.0225, + "step": 34788 + }, + { + "epoch": 94.79291553133515, + "grad_norm": 2.268462896347046, + "learning_rate": 1.418684967867867e-07, + "loss": 0.0845, + "step": 34789 + }, + { + "epoch": 94.79564032697547, + "grad_norm": 3.6317033767700195, + "learning_rate": 1.4172041157770822e-07, + "loss": 0.1054, + "step": 34790 + }, + { + "epoch": 94.7983651226158, + "grad_norm": 3.203853130340576, + "learning_rate": 1.415724031445942e-07, + "loss": 0.0231, + "step": 34791 + }, + { + "epoch": 94.80108991825612, + "grad_norm": 1.9054230451583862, + "learning_rate": 1.4142447148859706e-07, + "loss": 0.0158, + "step": 34792 + }, + { + "epoch": 94.80381471389646, + "grad_norm": 2.7306485176086426, + "learning_rate": 1.412766166108681e-07, + "loss": 0.0643, + "step": 34793 + }, + { + "epoch": 94.80653950953679, + "grad_norm": 2.510159730911255, + "learning_rate": 1.4112883851256088e-07, + "loss": 0.0526, + "step": 34794 + }, + { + "epoch": 94.80926430517711, + "grad_norm": 2.6023669242858887, + "learning_rate": 1.4098113719482333e-07, + "loss": 0.0602, + "step": 34795 + }, + { + "epoch": 94.81198910081744, + "grad_norm": 2.7218353748321533, + "learning_rate": 1.4083351265880786e-07, + "loss": 0.0315, + "step": 34796 + }, + { + "epoch": 94.81471389645776, + "grad_norm": 2.2368712425231934, + "learning_rate": 1.4068596490566467e-07, + "loss": 0.0282, + "step": 34797 + }, + { + "epoch": 94.8174386920981, + "grad_norm": 2.698629379272461, + "learning_rate": 1.405384939365406e-07, + "loss": 0.1544, + "step": 34798 + }, + { + "epoch": 94.82016348773843, + "grad_norm": 2.3174290657043457, + "learning_rate": 1.403910997525859e-07, + "loss": 0.0643, + "step": 34799 + }, + { + "epoch": 94.82288828337875, + "grad_norm": 2.633542537689209, + "learning_rate": 1.402437823549474e-07, + "loss": 0.106, + "step": 34800 + }, + { + "epoch": 94.82561307901908, + "grad_norm": 3.1691648960113525, + "learning_rate": 1.4009654174477417e-07, + "loss": 0.0706, + "step": 34801 + }, + { + "epoch": 94.8283378746594, + "grad_norm": 2.363712787628174, + "learning_rate": 1.3994937792321085e-07, + "loss": 0.0458, + "step": 34802 + }, + { + "epoch": 94.83106267029973, + "grad_norm": 2.7807717323303223, + "learning_rate": 1.398022908914054e-07, + "loss": 0.0264, + "step": 34803 + }, + { + "epoch": 94.83378746594005, + "grad_norm": 1.9537835121154785, + "learning_rate": 1.3965528065050137e-07, + "loss": 0.0303, + "step": 34804 + }, + { + "epoch": 94.83651226158038, + "grad_norm": 3.4546995162963867, + "learning_rate": 1.3950834720164453e-07, + "loss": 0.0301, + "step": 34805 + }, + { + "epoch": 94.83923705722071, + "grad_norm": 1.9009343385696411, + "learning_rate": 1.3936149054598058e-07, + "loss": 0.2329, + "step": 34806 + }, + { + "epoch": 94.84196185286103, + "grad_norm": 7.271117210388184, + "learning_rate": 1.3921471068465085e-07, + "loss": 0.0348, + "step": 34807 + }, + { + "epoch": 94.84468664850137, + "grad_norm": 1.2325505018234253, + "learning_rate": 1.390680076188e-07, + "loss": 0.014, + "step": 34808 + }, + { + "epoch": 94.84741144414168, + "grad_norm": 3.228151798248291, + "learning_rate": 1.3892138134957045e-07, + "loss": 0.0402, + "step": 34809 + }, + { + "epoch": 94.85013623978202, + "grad_norm": 2.0668442249298096, + "learning_rate": 1.3877483187810348e-07, + "loss": 0.0264, + "step": 34810 + }, + { + "epoch": 94.85286103542235, + "grad_norm": 2.6093668937683105, + "learning_rate": 1.386283592055404e-07, + "loss": 0.0447, + "step": 34811 + }, + { + "epoch": 94.85558583106267, + "grad_norm": 2.0860109329223633, + "learning_rate": 1.3848196333302255e-07, + "loss": 0.0235, + "step": 34812 + }, + { + "epoch": 94.858310626703, + "grad_norm": 2.5715420246124268, + "learning_rate": 1.383356442616901e-07, + "loss": 0.0397, + "step": 34813 + }, + { + "epoch": 94.86103542234332, + "grad_norm": 2.8539466857910156, + "learning_rate": 1.3818940199268216e-07, + "loss": 0.0655, + "step": 34814 + }, + { + "epoch": 94.86376021798365, + "grad_norm": 2.208131790161133, + "learning_rate": 1.380432365271378e-07, + "loss": 0.0873, + "step": 34815 + }, + { + "epoch": 94.86648501362397, + "grad_norm": 3.4260189533233643, + "learning_rate": 1.378971478661939e-07, + "loss": 0.0779, + "step": 34816 + }, + { + "epoch": 94.8692098092643, + "grad_norm": 2.421434164047241, + "learning_rate": 1.3775113601099067e-07, + "loss": 0.1207, + "step": 34817 + }, + { + "epoch": 94.87193460490464, + "grad_norm": 2.585602283477783, + "learning_rate": 1.3760520096266494e-07, + "loss": 0.0743, + "step": 34818 + }, + { + "epoch": 94.87465940054496, + "grad_norm": 2.9377658367156982, + "learning_rate": 1.374593427223514e-07, + "loss": 0.1534, + "step": 34819 + }, + { + "epoch": 94.87738419618529, + "grad_norm": 2.74346661567688, + "learning_rate": 1.373135612911869e-07, + "loss": 0.041, + "step": 34820 + }, + { + "epoch": 94.88010899182561, + "grad_norm": 2.9906270503997803, + "learning_rate": 1.371678566703083e-07, + "loss": 0.0464, + "step": 34821 + }, + { + "epoch": 94.88283378746594, + "grad_norm": 1.8314659595489502, + "learning_rate": 1.3702222886084803e-07, + "loss": 0.155, + "step": 34822 + }, + { + "epoch": 94.88555858310627, + "grad_norm": 1.394993782043457, + "learning_rate": 1.3687667786394188e-07, + "loss": 0.0141, + "step": 34823 + }, + { + "epoch": 94.88828337874659, + "grad_norm": 3.0631768703460693, + "learning_rate": 1.3673120368072224e-07, + "loss": 0.0293, + "step": 34824 + }, + { + "epoch": 94.89100817438693, + "grad_norm": 3.240985870361328, + "learning_rate": 1.3658580631232266e-07, + "loss": 0.0798, + "step": 34825 + }, + { + "epoch": 94.89373297002724, + "grad_norm": 1.8917561769485474, + "learning_rate": 1.3644048575987557e-07, + "loss": 0.0424, + "step": 34826 + }, + { + "epoch": 94.89645776566758, + "grad_norm": 2.289652109146118, + "learning_rate": 1.3629524202451228e-07, + "loss": 0.0411, + "step": 34827 + }, + { + "epoch": 94.8991825613079, + "grad_norm": 2.186800003051758, + "learning_rate": 1.36150075107363e-07, + "loss": 0.0278, + "step": 34828 + }, + { + "epoch": 94.90190735694823, + "grad_norm": 3.771892547607422, + "learning_rate": 1.3600498500956129e-07, + "loss": 0.0681, + "step": 34829 + }, + { + "epoch": 94.90463215258856, + "grad_norm": 2.043431282043457, + "learning_rate": 1.3585997173223396e-07, + "loss": 0.0308, + "step": 34830 + }, + { + "epoch": 94.90735694822888, + "grad_norm": 2.3939459323883057, + "learning_rate": 1.3571503527651352e-07, + "loss": 0.0374, + "step": 34831 + }, + { + "epoch": 94.91008174386921, + "grad_norm": 3.482168197631836, + "learning_rate": 1.355701756435246e-07, + "loss": 0.1204, + "step": 34832 + }, + { + "epoch": 94.91280653950953, + "grad_norm": 1.9421875476837158, + "learning_rate": 1.3542539283439959e-07, + "loss": 0.0264, + "step": 34833 + }, + { + "epoch": 94.91553133514986, + "grad_norm": 2.034855842590332, + "learning_rate": 1.3528068685026208e-07, + "loss": 0.0312, + "step": 34834 + }, + { + "epoch": 94.9182561307902, + "grad_norm": 3.001547336578369, + "learning_rate": 1.3513605769224225e-07, + "loss": 0.0714, + "step": 34835 + }, + { + "epoch": 94.92098092643052, + "grad_norm": 4.648657321929932, + "learning_rate": 1.3499150536146588e-07, + "loss": 0.1142, + "step": 34836 + }, + { + "epoch": 94.92370572207085, + "grad_norm": 1.7883365154266357, + "learning_rate": 1.3484702985905763e-07, + "loss": 0.0209, + "step": 34837 + }, + { + "epoch": 94.92643051771117, + "grad_norm": 2.4563634395599365, + "learning_rate": 1.3470263118614324e-07, + "loss": 0.0313, + "step": 34838 + }, + { + "epoch": 94.9291553133515, + "grad_norm": 3.1272811889648438, + "learning_rate": 1.345583093438474e-07, + "loss": 0.0541, + "step": 34839 + }, + { + "epoch": 94.93188010899182, + "grad_norm": 2.5367186069488525, + "learning_rate": 1.3441406433329362e-07, + "loss": 0.0364, + "step": 34840 + }, + { + "epoch": 94.93460490463215, + "grad_norm": 2.2692346572875977, + "learning_rate": 1.3426989615560548e-07, + "loss": 0.0676, + "step": 34841 + }, + { + "epoch": 94.93732970027249, + "grad_norm": 1.523105263710022, + "learning_rate": 1.3412580481190651e-07, + "loss": 0.0242, + "step": 34842 + }, + { + "epoch": 94.9400544959128, + "grad_norm": 2.6941287517547607, + "learning_rate": 1.3398179030331805e-07, + "loss": 0.1296, + "step": 34843 + }, + { + "epoch": 94.94277929155314, + "grad_norm": 3.5964252948760986, + "learning_rate": 1.3383785263096138e-07, + "loss": 0.0895, + "step": 34844 + }, + { + "epoch": 94.94550408719346, + "grad_norm": 2.8641791343688965, + "learning_rate": 1.3369399179595787e-07, + "loss": 0.0594, + "step": 34845 + }, + { + "epoch": 94.94822888283379, + "grad_norm": 3.23000168800354, + "learning_rate": 1.3355020779942883e-07, + "loss": 0.0459, + "step": 34846 + }, + { + "epoch": 94.95095367847412, + "grad_norm": 2.3119685649871826, + "learning_rate": 1.3340650064249337e-07, + "loss": 0.0358, + "step": 34847 + }, + { + "epoch": 94.95367847411444, + "grad_norm": 2.7140254974365234, + "learning_rate": 1.3326287032626838e-07, + "loss": 0.2672, + "step": 34848 + }, + { + "epoch": 94.95640326975477, + "grad_norm": 1.8845314979553223, + "learning_rate": 1.331193168518774e-07, + "loss": 0.0227, + "step": 34849 + }, + { + "epoch": 94.95912806539509, + "grad_norm": 3.730475664138794, + "learning_rate": 1.3297584022043396e-07, + "loss": 0.0285, + "step": 34850 + }, + { + "epoch": 94.96185286103542, + "grad_norm": 1.4961528778076172, + "learning_rate": 1.328324404330572e-07, + "loss": 0.0202, + "step": 34851 + }, + { + "epoch": 94.96457765667574, + "grad_norm": 2.212015151977539, + "learning_rate": 1.32689117490864e-07, + "loss": 0.0771, + "step": 34852 + }, + { + "epoch": 94.96730245231608, + "grad_norm": 2.486266851425171, + "learning_rate": 1.325458713949701e-07, + "loss": 0.0441, + "step": 34853 + }, + { + "epoch": 94.97002724795641, + "grad_norm": 2.460434675216675, + "learning_rate": 1.3240270214649242e-07, + "loss": 0.0419, + "step": 34854 + }, + { + "epoch": 94.97275204359673, + "grad_norm": 3.0918476581573486, + "learning_rate": 1.322596097465445e-07, + "loss": 0.1347, + "step": 34855 + }, + { + "epoch": 94.97547683923706, + "grad_norm": 3.1286609172821045, + "learning_rate": 1.3211659419624102e-07, + "loss": 0.0341, + "step": 34856 + }, + { + "epoch": 94.97820163487738, + "grad_norm": 2.5470151901245117, + "learning_rate": 1.319736554966955e-07, + "loss": 0.0253, + "step": 34857 + }, + { + "epoch": 94.98092643051771, + "grad_norm": 1.877874493598938, + "learning_rate": 1.3183079364902153e-07, + "loss": 0.0297, + "step": 34858 + }, + { + "epoch": 94.98365122615803, + "grad_norm": 2.961230516433716, + "learning_rate": 1.3168800865433262e-07, + "loss": 0.0691, + "step": 34859 + }, + { + "epoch": 94.98637602179836, + "grad_norm": 2.6252262592315674, + "learning_rate": 1.3154530051373904e-07, + "loss": 0.0482, + "step": 34860 + }, + { + "epoch": 94.9891008174387, + "grad_norm": 3.1088922023773193, + "learning_rate": 1.3140266922835322e-07, + "loss": 0.1247, + "step": 34861 + }, + { + "epoch": 94.99182561307902, + "grad_norm": 2.101668119430542, + "learning_rate": 1.3126011479928646e-07, + "loss": 0.0299, + "step": 34862 + }, + { + "epoch": 94.99455040871935, + "grad_norm": 2.313483476638794, + "learning_rate": 1.3111763722764792e-07, + "loss": 0.0253, + "step": 34863 + }, + { + "epoch": 94.99727520435967, + "grad_norm": 2.9240059852600098, + "learning_rate": 1.3097523651454668e-07, + "loss": 0.0541, + "step": 34864 + }, + { + "epoch": 95.0, + "grad_norm": 3.7429819107055664, + "learning_rate": 1.30832912661093e-07, + "loss": 0.0527, + "step": 34865 + }, + { + "epoch": 95.00272479564033, + "grad_norm": 2.7895829677581787, + "learning_rate": 1.3069066566839594e-07, + "loss": 0.1409, + "step": 34866 + }, + { + "epoch": 95.00544959128065, + "grad_norm": 2.324601888656616, + "learning_rate": 1.3054849553756243e-07, + "loss": 0.03, + "step": 34867 + }, + { + "epoch": 95.00817438692098, + "grad_norm": 2.12203049659729, + "learning_rate": 1.3040640226969824e-07, + "loss": 0.0517, + "step": 34868 + }, + { + "epoch": 95.0108991825613, + "grad_norm": 3.364262104034424, + "learning_rate": 1.3026438586591138e-07, + "loss": 0.0823, + "step": 34869 + }, + { + "epoch": 95.01362397820164, + "grad_norm": 2.6119232177734375, + "learning_rate": 1.3012244632730876e-07, + "loss": 0.0527, + "step": 34870 + }, + { + "epoch": 95.01634877384195, + "grad_norm": 2.1571426391601562, + "learning_rate": 1.29980583654995e-07, + "loss": 0.0944, + "step": 34871 + }, + { + "epoch": 95.01907356948229, + "grad_norm": 1.6402757167816162, + "learning_rate": 1.298387978500737e-07, + "loss": 0.0158, + "step": 34872 + }, + { + "epoch": 95.02179836512262, + "grad_norm": 2.856287956237793, + "learning_rate": 1.2969708891365063e-07, + "loss": 0.0481, + "step": 34873 + }, + { + "epoch": 95.02452316076294, + "grad_norm": 3.9047768115997314, + "learning_rate": 1.2955545684682935e-07, + "loss": 0.0425, + "step": 34874 + }, + { + "epoch": 95.02724795640327, + "grad_norm": 2.873523473739624, + "learning_rate": 1.2941390165071232e-07, + "loss": 0.0315, + "step": 34875 + }, + { + "epoch": 95.02997275204359, + "grad_norm": 2.794736862182617, + "learning_rate": 1.292724233264031e-07, + "loss": 0.04, + "step": 34876 + }, + { + "epoch": 95.03269754768392, + "grad_norm": 1.4680901765823364, + "learning_rate": 1.2913102187500083e-07, + "loss": 0.0192, + "step": 34877 + }, + { + "epoch": 95.03542234332426, + "grad_norm": 2.1529393196105957, + "learning_rate": 1.2898969729760903e-07, + "loss": 0.2289, + "step": 34878 + }, + { + "epoch": 95.03814713896458, + "grad_norm": 3.5629093647003174, + "learning_rate": 1.2884844959532795e-07, + "loss": 0.0351, + "step": 34879 + }, + { + "epoch": 95.04087193460491, + "grad_norm": 4.032271862030029, + "learning_rate": 1.287072787692567e-07, + "loss": 0.1118, + "step": 34880 + }, + { + "epoch": 95.04359673024523, + "grad_norm": 2.075810670852661, + "learning_rate": 1.2856618482049664e-07, + "loss": 0.1547, + "step": 34881 + }, + { + "epoch": 95.04632152588556, + "grad_norm": 1.9002879858016968, + "learning_rate": 1.284251677501458e-07, + "loss": 0.0226, + "step": 34882 + }, + { + "epoch": 95.04904632152588, + "grad_norm": 3.5459165573120117, + "learning_rate": 1.2828422755930103e-07, + "loss": 0.0554, + "step": 34883 + }, + { + "epoch": 95.05177111716621, + "grad_norm": 2.863830089569092, + "learning_rate": 1.2814336424906038e-07, + "loss": 0.0791, + "step": 34884 + }, + { + "epoch": 95.05449591280654, + "grad_norm": 3.0242042541503906, + "learning_rate": 1.2800257782052183e-07, + "loss": 0.0974, + "step": 34885 + }, + { + "epoch": 95.05722070844686, + "grad_norm": 1.5003838539123535, + "learning_rate": 1.2786186827478231e-07, + "loss": 0.0198, + "step": 34886 + }, + { + "epoch": 95.0599455040872, + "grad_norm": 2.3934693336486816, + "learning_rate": 1.2772123561293648e-07, + "loss": 0.0198, + "step": 34887 + }, + { + "epoch": 95.06267029972751, + "grad_norm": 2.5218911170959473, + "learning_rate": 1.2758067983608013e-07, + "loss": 0.0914, + "step": 34888 + }, + { + "epoch": 95.06539509536785, + "grad_norm": 3.184844493865967, + "learning_rate": 1.2744020094530684e-07, + "loss": 0.1183, + "step": 34889 + }, + { + "epoch": 95.06811989100818, + "grad_norm": 4.118417739868164, + "learning_rate": 1.272997989417124e-07, + "loss": 0.124, + "step": 34890 + }, + { + "epoch": 95.0708446866485, + "grad_norm": 4.425246238708496, + "learning_rate": 1.2715947382638927e-07, + "loss": 0.0249, + "step": 34891 + }, + { + "epoch": 95.07356948228883, + "grad_norm": 2.5153684616088867, + "learning_rate": 1.27019225600431e-07, + "loss": 0.089, + "step": 34892 + }, + { + "epoch": 95.07629427792915, + "grad_norm": 2.478933572769165, + "learning_rate": 1.2687905426492786e-07, + "loss": 0.1829, + "step": 34893 + }, + { + "epoch": 95.07901907356948, + "grad_norm": 3.415781259536743, + "learning_rate": 1.267389598209734e-07, + "loss": 0.0884, + "step": 34894 + }, + { + "epoch": 95.0817438692098, + "grad_norm": 2.6993184089660645, + "learning_rate": 1.2659894226965896e-07, + "loss": 0.0449, + "step": 34895 + }, + { + "epoch": 95.08446866485014, + "grad_norm": 3.928115129470825, + "learning_rate": 1.264590016120737e-07, + "loss": 0.1692, + "step": 34896 + }, + { + "epoch": 95.08719346049047, + "grad_norm": 2.283688545227051, + "learning_rate": 1.2631913784930673e-07, + "loss": 0.0338, + "step": 34897 + }, + { + "epoch": 95.08991825613079, + "grad_norm": 2.976043939590454, + "learning_rate": 1.261793509824505e-07, + "loss": 0.0985, + "step": 34898 + }, + { + "epoch": 95.09264305177112, + "grad_norm": 3.0505940914154053, + "learning_rate": 1.260396410125908e-07, + "loss": 0.0369, + "step": 34899 + }, + { + "epoch": 95.09536784741144, + "grad_norm": 2.1225483417510986, + "learning_rate": 1.2590000794081681e-07, + "loss": 0.0746, + "step": 34900 + }, + { + "epoch": 95.09809264305177, + "grad_norm": 2.9096975326538086, + "learning_rate": 1.2576045176821429e-07, + "loss": 0.1006, + "step": 34901 + }, + { + "epoch": 95.1008174386921, + "grad_norm": 3.1333768367767334, + "learning_rate": 1.2562097249587235e-07, + "loss": 0.0552, + "step": 34902 + }, + { + "epoch": 95.10354223433242, + "grad_norm": 2.8274359703063965, + "learning_rate": 1.2548157012487684e-07, + "loss": 0.0454, + "step": 34903 + }, + { + "epoch": 95.10626702997276, + "grad_norm": 2.766693353652954, + "learning_rate": 1.253422446563135e-07, + "loss": 0.1045, + "step": 34904 + }, + { + "epoch": 95.10899182561307, + "grad_norm": 2.684654474258423, + "learning_rate": 1.2520299609126597e-07, + "loss": 0.1276, + "step": 34905 + }, + { + "epoch": 95.11171662125341, + "grad_norm": 2.9204459190368652, + "learning_rate": 1.250638244308211e-07, + "loss": 0.0339, + "step": 34906 + }, + { + "epoch": 95.11444141689373, + "grad_norm": 2.671907901763916, + "learning_rate": 1.2492472967606028e-07, + "loss": 0.0387, + "step": 34907 + }, + { + "epoch": 95.11716621253406, + "grad_norm": 2.584839105606079, + "learning_rate": 1.247857118280682e-07, + "loss": 0.0333, + "step": 34908 + }, + { + "epoch": 95.11989100817439, + "grad_norm": 1.9556174278259277, + "learning_rate": 1.246467708879262e-07, + "loss": 0.0238, + "step": 34909 + }, + { + "epoch": 95.12261580381471, + "grad_norm": 2.7594969272613525, + "learning_rate": 1.2450790685671898e-07, + "loss": 0.0455, + "step": 34910 + }, + { + "epoch": 95.12534059945504, + "grad_norm": 2.3766114711761475, + "learning_rate": 1.2436911973552567e-07, + "loss": 0.0196, + "step": 34911 + }, + { + "epoch": 95.12806539509536, + "grad_norm": 2.2204349040985107, + "learning_rate": 1.2423040952542764e-07, + "loss": 0.0708, + "step": 34912 + }, + { + "epoch": 95.1307901907357, + "grad_norm": 1.9182202816009521, + "learning_rate": 1.2409177622750511e-07, + "loss": 0.0375, + "step": 34913 + }, + { + "epoch": 95.13351498637603, + "grad_norm": 1.9348313808441162, + "learning_rate": 1.2395321984283836e-07, + "loss": 0.0236, + "step": 34914 + }, + { + "epoch": 95.13623978201635, + "grad_norm": 2.7442848682403564, + "learning_rate": 1.238147403725054e-07, + "loss": 0.0482, + "step": 34915 + }, + { + "epoch": 95.13896457765668, + "grad_norm": 2.229963779449463, + "learning_rate": 1.236763378175865e-07, + "loss": 0.0523, + "step": 34916 + }, + { + "epoch": 95.141689373297, + "grad_norm": 2.6778433322906494, + "learning_rate": 1.235380121791574e-07, + "loss": 0.0208, + "step": 34917 + }, + { + "epoch": 95.14441416893733, + "grad_norm": 2.4531588554382324, + "learning_rate": 1.233997634582973e-07, + "loss": 0.0577, + "step": 34918 + }, + { + "epoch": 95.14713896457765, + "grad_norm": 2.508636474609375, + "learning_rate": 1.2326159165608086e-07, + "loss": 0.0738, + "step": 34919 + }, + { + "epoch": 95.14986376021798, + "grad_norm": 2.7733452320098877, + "learning_rate": 1.2312349677358615e-07, + "loss": 0.0658, + "step": 34920 + }, + { + "epoch": 95.15258855585832, + "grad_norm": 2.0371108055114746, + "learning_rate": 1.2298547881188672e-07, + "loss": 0.0215, + "step": 34921 + }, + { + "epoch": 95.15531335149863, + "grad_norm": 2.1744349002838135, + "learning_rate": 1.228475377720595e-07, + "loss": 0.0386, + "step": 34922 + }, + { + "epoch": 95.15803814713897, + "grad_norm": 2.2133798599243164, + "learning_rate": 1.2270967365517694e-07, + "loss": 0.0324, + "step": 34923 + }, + { + "epoch": 95.16076294277929, + "grad_norm": 2.2831597328186035, + "learning_rate": 1.2257188646231487e-07, + "loss": 0.0644, + "step": 34924 + }, + { + "epoch": 95.16348773841962, + "grad_norm": 2.0685505867004395, + "learning_rate": 1.2243417619454356e-07, + "loss": 0.0373, + "step": 34925 + }, + { + "epoch": 95.16621253405995, + "grad_norm": 2.232891321182251, + "learning_rate": 1.2229654285293767e-07, + "loss": 0.0218, + "step": 34926 + }, + { + "epoch": 95.16893732970027, + "grad_norm": 2.931797981262207, + "learning_rate": 1.221589864385686e-07, + "loss": 0.0796, + "step": 34927 + }, + { + "epoch": 95.1716621253406, + "grad_norm": 1.7469284534454346, + "learning_rate": 1.220215069525077e-07, + "loss": 0.021, + "step": 34928 + }, + { + "epoch": 95.17438692098092, + "grad_norm": 1.9482605457305908, + "learning_rate": 1.218841043958241e-07, + "loss": 0.0509, + "step": 34929 + }, + { + "epoch": 95.17711171662125, + "grad_norm": 1.85743248462677, + "learning_rate": 1.217467787695903e-07, + "loss": 0.0395, + "step": 34930 + }, + { + "epoch": 95.17983651226157, + "grad_norm": 3.2541394233703613, + "learning_rate": 1.216095300748743e-07, + "loss": 0.1675, + "step": 34931 + }, + { + "epoch": 95.1825613079019, + "grad_norm": 4.0061421394348145, + "learning_rate": 1.214723583127464e-07, + "loss": 0.0344, + "step": 34932 + }, + { + "epoch": 95.18528610354224, + "grad_norm": 1.9873977899551392, + "learning_rate": 1.2133526348427237e-07, + "loss": 0.147, + "step": 34933 + }, + { + "epoch": 95.18801089918256, + "grad_norm": 3.1552674770355225, + "learning_rate": 1.211982455905214e-07, + "loss": 0.0817, + "step": 34934 + }, + { + "epoch": 95.19073569482289, + "grad_norm": 3.555838108062744, + "learning_rate": 1.210613046325615e-07, + "loss": 0.0433, + "step": 34935 + }, + { + "epoch": 95.19346049046321, + "grad_norm": 5.451581954956055, + "learning_rate": 1.2092444061145737e-07, + "loss": 0.0562, + "step": 34936 + }, + { + "epoch": 95.19618528610354, + "grad_norm": 2.656935453414917, + "learning_rate": 1.2078765352827591e-07, + "loss": 0.0331, + "step": 34937 + }, + { + "epoch": 95.19891008174388, + "grad_norm": 1.7232446670532227, + "learning_rate": 1.206509433840819e-07, + "loss": 0.0239, + "step": 34938 + }, + { + "epoch": 95.2016348773842, + "grad_norm": 2.219930410385132, + "learning_rate": 1.205143101799411e-07, + "loss": 0.0266, + "step": 34939 + }, + { + "epoch": 95.20435967302453, + "grad_norm": 2.011101722717285, + "learning_rate": 1.2037775391691708e-07, + "loss": 0.0352, + "step": 34940 + }, + { + "epoch": 95.20708446866485, + "grad_norm": 3.57807993888855, + "learning_rate": 1.2024127459607237e-07, + "loss": 0.0253, + "step": 34941 + }, + { + "epoch": 95.20980926430518, + "grad_norm": 4.179675102233887, + "learning_rate": 1.2010487221847056e-07, + "loss": 0.0483, + "step": 34942 + }, + { + "epoch": 95.2125340599455, + "grad_norm": 2.4080264568328857, + "learning_rate": 1.199685467851741e-07, + "loss": 0.0838, + "step": 34943 + }, + { + "epoch": 95.21525885558583, + "grad_norm": 4.186582088470459, + "learning_rate": 1.1983229829724552e-07, + "loss": 0.1244, + "step": 34944 + }, + { + "epoch": 95.21798365122616, + "grad_norm": 2.866173267364502, + "learning_rate": 1.1969612675574394e-07, + "loss": 0.0232, + "step": 34945 + }, + { + "epoch": 95.22070844686648, + "grad_norm": 3.340458869934082, + "learning_rate": 1.1956003216173184e-07, + "loss": 0.0741, + "step": 34946 + }, + { + "epoch": 95.22343324250681, + "grad_norm": 1.252720832824707, + "learning_rate": 1.194240145162673e-07, + "loss": 0.0143, + "step": 34947 + }, + { + "epoch": 95.22615803814713, + "grad_norm": 2.7562851905822754, + "learning_rate": 1.1928807382041163e-07, + "loss": 0.0262, + "step": 34948 + }, + { + "epoch": 95.22888283378747, + "grad_norm": 2.7015018463134766, + "learning_rate": 1.1915221007522182e-07, + "loss": 0.0258, + "step": 34949 + }, + { + "epoch": 95.2316076294278, + "grad_norm": 3.2789742946624756, + "learning_rate": 1.1901642328175589e-07, + "loss": 0.1718, + "step": 34950 + }, + { + "epoch": 95.23433242506812, + "grad_norm": 2.6375033855438232, + "learning_rate": 1.1888071344107299e-07, + "loss": 0.0342, + "step": 34951 + }, + { + "epoch": 95.23705722070845, + "grad_norm": 1.6955173015594482, + "learning_rate": 1.1874508055422895e-07, + "loss": 0.0219, + "step": 34952 + }, + { + "epoch": 95.23978201634877, + "grad_norm": 2.1850240230560303, + "learning_rate": 1.1860952462227959e-07, + "loss": 0.2059, + "step": 34953 + }, + { + "epoch": 95.2425068119891, + "grad_norm": 3.0885190963745117, + "learning_rate": 1.1847404564628185e-07, + "loss": 0.2006, + "step": 34954 + }, + { + "epoch": 95.24523160762942, + "grad_norm": 5.636951923370361, + "learning_rate": 1.1833864362729042e-07, + "loss": 0.1476, + "step": 34955 + }, + { + "epoch": 95.24795640326975, + "grad_norm": 2.7337357997894287, + "learning_rate": 1.1820331856635891e-07, + "loss": 0.0357, + "step": 34956 + }, + { + "epoch": 95.25068119891009, + "grad_norm": 2.0418336391448975, + "learning_rate": 1.1806807046454205e-07, + "loss": 0.0322, + "step": 34957 + }, + { + "epoch": 95.2534059945504, + "grad_norm": 4.560342311859131, + "learning_rate": 1.1793289932289343e-07, + "loss": 0.0235, + "step": 34958 + }, + { + "epoch": 95.25613079019074, + "grad_norm": 2.69103741645813, + "learning_rate": 1.1779780514246442e-07, + "loss": 0.0459, + "step": 34959 + }, + { + "epoch": 95.25885558583106, + "grad_norm": 4.488551139831543, + "learning_rate": 1.1766278792430974e-07, + "loss": 0.0322, + "step": 34960 + }, + { + "epoch": 95.26158038147139, + "grad_norm": 2.9406447410583496, + "learning_rate": 1.1752784766947744e-07, + "loss": 0.071, + "step": 34961 + }, + { + "epoch": 95.26430517711172, + "grad_norm": 3.2513558864593506, + "learning_rate": 1.1739298437902114e-07, + "loss": 0.0599, + "step": 34962 + }, + { + "epoch": 95.26702997275204, + "grad_norm": 1.8449701070785522, + "learning_rate": 1.1725819805398997e-07, + "loss": 0.0858, + "step": 34963 + }, + { + "epoch": 95.26975476839237, + "grad_norm": 2.264432668685913, + "learning_rate": 1.1712348869543421e-07, + "loss": 0.0307, + "step": 34964 + }, + { + "epoch": 95.2724795640327, + "grad_norm": 3.0598464012145996, + "learning_rate": 1.1698885630440193e-07, + "loss": 0.127, + "step": 34965 + }, + { + "epoch": 95.27520435967303, + "grad_norm": 5.287500858306885, + "learning_rate": 1.1685430088194227e-07, + "loss": 0.0581, + "step": 34966 + }, + { + "epoch": 95.27792915531334, + "grad_norm": 2.593297004699707, + "learning_rate": 1.167198224291044e-07, + "loss": 0.0199, + "step": 34967 + }, + { + "epoch": 95.28065395095368, + "grad_norm": 3.269404411315918, + "learning_rate": 1.1658542094693415e-07, + "loss": 0.159, + "step": 34968 + }, + { + "epoch": 95.28337874659401, + "grad_norm": 2.7901294231414795, + "learning_rate": 1.1645109643647734e-07, + "loss": 0.0303, + "step": 34969 + }, + { + "epoch": 95.28610354223433, + "grad_norm": 1.7133756875991821, + "learning_rate": 1.1631684889878203e-07, + "loss": 0.157, + "step": 34970 + }, + { + "epoch": 95.28882833787466, + "grad_norm": 2.4325482845306396, + "learning_rate": 1.1618267833489294e-07, + "loss": 0.0488, + "step": 34971 + }, + { + "epoch": 95.29155313351498, + "grad_norm": 2.3382508754730225, + "learning_rate": 1.160485847458559e-07, + "loss": 0.0534, + "step": 34972 + }, + { + "epoch": 95.29427792915531, + "grad_norm": 1.6980870962142944, + "learning_rate": 1.159145681327134e-07, + "loss": 0.025, + "step": 34973 + }, + { + "epoch": 95.29700272479565, + "grad_norm": 3.9710137844085693, + "learning_rate": 1.1578062849651017e-07, + "loss": 0.0851, + "step": 34974 + }, + { + "epoch": 95.29972752043597, + "grad_norm": 2.86478328704834, + "learning_rate": 1.1564676583828982e-07, + "loss": 0.0642, + "step": 34975 + }, + { + "epoch": 95.3024523160763, + "grad_norm": 3.3024609088897705, + "learning_rate": 1.1551298015909373e-07, + "loss": 0.0735, + "step": 34976 + }, + { + "epoch": 95.30517711171662, + "grad_norm": 2.7386791706085205, + "learning_rate": 1.1537927145996441e-07, + "loss": 0.0259, + "step": 34977 + }, + { + "epoch": 95.30790190735695, + "grad_norm": 2.7702622413635254, + "learning_rate": 1.1524563974194325e-07, + "loss": 0.0774, + "step": 34978 + }, + { + "epoch": 95.31062670299727, + "grad_norm": 2.326133966445923, + "learning_rate": 1.1511208500607163e-07, + "loss": 0.0227, + "step": 34979 + }, + { + "epoch": 95.3133514986376, + "grad_norm": 6.5108723640441895, + "learning_rate": 1.1497860725338872e-07, + "loss": 0.0345, + "step": 34980 + }, + { + "epoch": 95.31607629427793, + "grad_norm": 3.1286725997924805, + "learning_rate": 1.148452064849337e-07, + "loss": 0.0433, + "step": 34981 + }, + { + "epoch": 95.31880108991825, + "grad_norm": 1.9681954383850098, + "learning_rate": 1.1471188270174571e-07, + "loss": 0.0226, + "step": 34982 + }, + { + "epoch": 95.32152588555859, + "grad_norm": 2.716500997543335, + "learning_rate": 1.1457863590486507e-07, + "loss": 0.0421, + "step": 34983 + }, + { + "epoch": 95.3242506811989, + "grad_norm": 2.188465118408203, + "learning_rate": 1.1444546609532648e-07, + "loss": 0.0491, + "step": 34984 + }, + { + "epoch": 95.32697547683924, + "grad_norm": 2.2012417316436768, + "learning_rate": 1.1431237327416911e-07, + "loss": 0.054, + "step": 34985 + }, + { + "epoch": 95.32970027247957, + "grad_norm": 2.2194905281066895, + "learning_rate": 1.1417935744242769e-07, + "loss": 0.1597, + "step": 34986 + }, + { + "epoch": 95.33242506811989, + "grad_norm": 2.5500473976135254, + "learning_rate": 1.140464186011403e-07, + "loss": 0.0604, + "step": 34987 + }, + { + "epoch": 95.33514986376022, + "grad_norm": 2.875729560852051, + "learning_rate": 1.1391355675134164e-07, + "loss": 0.0867, + "step": 34988 + }, + { + "epoch": 95.33787465940054, + "grad_norm": 2.884606122970581, + "learning_rate": 1.1378077189406422e-07, + "loss": 0.0252, + "step": 34989 + }, + { + "epoch": 95.34059945504087, + "grad_norm": 2.349778890609741, + "learning_rate": 1.13648064030345e-07, + "loss": 0.0254, + "step": 34990 + }, + { + "epoch": 95.34332425068119, + "grad_norm": 2.657801628112793, + "learning_rate": 1.135154331612165e-07, + "loss": 0.0343, + "step": 34991 + }, + { + "epoch": 95.34604904632153, + "grad_norm": 3.0789895057678223, + "learning_rate": 1.133828792877123e-07, + "loss": 0.1523, + "step": 34992 + }, + { + "epoch": 95.34877384196186, + "grad_norm": 2.754234790802002, + "learning_rate": 1.1325040241086383e-07, + "loss": 0.0944, + "step": 34993 + }, + { + "epoch": 95.35149863760218, + "grad_norm": 1.4009101390838623, + "learning_rate": 1.1311800253170246e-07, + "loss": 0.017, + "step": 34994 + }, + { + "epoch": 95.35422343324251, + "grad_norm": 2.27170467376709, + "learning_rate": 1.1298567965125962e-07, + "loss": 0.0333, + "step": 34995 + }, + { + "epoch": 95.35694822888283, + "grad_norm": 2.2349345684051514, + "learning_rate": 1.1285343377056668e-07, + "loss": 0.0234, + "step": 34996 + }, + { + "epoch": 95.35967302452316, + "grad_norm": 2.849677562713623, + "learning_rate": 1.1272126489065283e-07, + "loss": 0.0922, + "step": 34997 + }, + { + "epoch": 95.3623978201635, + "grad_norm": 3.9061155319213867, + "learning_rate": 1.1258917301254724e-07, + "loss": 0.0728, + "step": 34998 + }, + { + "epoch": 95.36512261580381, + "grad_norm": 2.703514575958252, + "learning_rate": 1.1245715813727908e-07, + "loss": 0.0204, + "step": 34999 + }, + { + "epoch": 95.36784741144415, + "grad_norm": 4.365962505340576, + "learning_rate": 1.1232522026587755e-07, + "loss": 0.1399, + "step": 35000 + }, + { + "epoch": 95.37057220708446, + "grad_norm": 3.200329065322876, + "learning_rate": 1.1219335939936738e-07, + "loss": 0.1848, + "step": 35001 + }, + { + "epoch": 95.3732970027248, + "grad_norm": 2.2563517093658447, + "learning_rate": 1.1206157553877772e-07, + "loss": 0.0317, + "step": 35002 + }, + { + "epoch": 95.37602179836512, + "grad_norm": 2.1221606731414795, + "learning_rate": 1.1192986868513445e-07, + "loss": 0.0275, + "step": 35003 + }, + { + "epoch": 95.37874659400545, + "grad_norm": 4.090084075927734, + "learning_rate": 1.1179823883946228e-07, + "loss": 0.0462, + "step": 35004 + }, + { + "epoch": 95.38147138964578, + "grad_norm": 3.4763824939727783, + "learning_rate": 1.1166668600278818e-07, + "loss": 0.1238, + "step": 35005 + }, + { + "epoch": 95.3841961852861, + "grad_norm": 1.9323807954788208, + "learning_rate": 1.1153521017613467e-07, + "loss": 0.0498, + "step": 35006 + }, + { + "epoch": 95.38692098092643, + "grad_norm": 3.275866985321045, + "learning_rate": 1.1140381136052758e-07, + "loss": 0.0597, + "step": 35007 + }, + { + "epoch": 95.38964577656675, + "grad_norm": 2.1088693141937256, + "learning_rate": 1.1127248955698833e-07, + "loss": 0.0225, + "step": 35008 + }, + { + "epoch": 95.39237057220708, + "grad_norm": 3.1419129371643066, + "learning_rate": 1.1114124476654164e-07, + "loss": 0.0229, + "step": 35009 + }, + { + "epoch": 95.39509536784742, + "grad_norm": 2.0916402339935303, + "learning_rate": 1.1101007699020782e-07, + "loss": 0.0295, + "step": 35010 + }, + { + "epoch": 95.39782016348774, + "grad_norm": 2.159738779067993, + "learning_rate": 1.108789862290105e-07, + "loss": 0.0459, + "step": 35011 + }, + { + "epoch": 95.40054495912807, + "grad_norm": 1.6449337005615234, + "learning_rate": 1.1074797248396884e-07, + "loss": 0.0187, + "step": 35012 + }, + { + "epoch": 95.40326975476839, + "grad_norm": 2.5766232013702393, + "learning_rate": 1.1061703575610316e-07, + "loss": 0.0264, + "step": 35013 + }, + { + "epoch": 95.40599455040872, + "grad_norm": 2.9680097103118896, + "learning_rate": 1.1048617604643374e-07, + "loss": 0.0848, + "step": 35014 + }, + { + "epoch": 95.40871934604904, + "grad_norm": 2.2628979682922363, + "learning_rate": 1.1035539335598089e-07, + "loss": 0.0191, + "step": 35015 + }, + { + "epoch": 95.41144414168937, + "grad_norm": 2.8828155994415283, + "learning_rate": 1.1022468768576044e-07, + "loss": 0.0382, + "step": 35016 + }, + { + "epoch": 95.4141689373297, + "grad_norm": 3.371868133544922, + "learning_rate": 1.1009405903679271e-07, + "loss": 0.0622, + "step": 35017 + }, + { + "epoch": 95.41689373297002, + "grad_norm": 2.551166296005249, + "learning_rate": 1.0996350741009355e-07, + "loss": 0.0514, + "step": 35018 + }, + { + "epoch": 95.41961852861036, + "grad_norm": 2.7263717651367188, + "learning_rate": 1.0983303280668101e-07, + "loss": 0.0601, + "step": 35019 + }, + { + "epoch": 95.42234332425068, + "grad_norm": 3.4563968181610107, + "learning_rate": 1.0970263522756985e-07, + "loss": 0.0473, + "step": 35020 + }, + { + "epoch": 95.42506811989101, + "grad_norm": 2.899994373321533, + "learning_rate": 1.0957231467377704e-07, + "loss": 0.0742, + "step": 35021 + }, + { + "epoch": 95.42779291553134, + "grad_norm": 2.167938709259033, + "learning_rate": 1.0944207114631622e-07, + "loss": 0.0417, + "step": 35022 + }, + { + "epoch": 95.43051771117166, + "grad_norm": 1.9148547649383545, + "learning_rate": 1.09311904646201e-07, + "loss": 0.0265, + "step": 35023 + }, + { + "epoch": 95.433242506812, + "grad_norm": 2.099299669265747, + "learning_rate": 1.0918181517444836e-07, + "loss": 0.0368, + "step": 35024 + }, + { + "epoch": 95.43596730245231, + "grad_norm": 2.237480401992798, + "learning_rate": 1.0905180273206862e-07, + "loss": 0.0728, + "step": 35025 + }, + { + "epoch": 95.43869209809264, + "grad_norm": 10.043222427368164, + "learning_rate": 1.0892186732007538e-07, + "loss": 0.2052, + "step": 35026 + }, + { + "epoch": 95.44141689373296, + "grad_norm": 2.3342204093933105, + "learning_rate": 1.0879200893947895e-07, + "loss": 0.0426, + "step": 35027 + }, + { + "epoch": 95.4441416893733, + "grad_norm": 2.1813864707946777, + "learning_rate": 1.0866222759129296e-07, + "loss": 0.0953, + "step": 35028 + }, + { + "epoch": 95.44686648501363, + "grad_norm": 2.487837553024292, + "learning_rate": 1.0853252327652775e-07, + "loss": 0.0555, + "step": 35029 + }, + { + "epoch": 95.44959128065395, + "grad_norm": 2.4842350482940674, + "learning_rate": 1.0840289599619247e-07, + "loss": 0.0201, + "step": 35030 + }, + { + "epoch": 95.45231607629428, + "grad_norm": 7.030800819396973, + "learning_rate": 1.0827334575129633e-07, + "loss": 0.0904, + "step": 35031 + }, + { + "epoch": 95.4550408719346, + "grad_norm": 3.4436264038085938, + "learning_rate": 1.0814387254284964e-07, + "loss": 0.0826, + "step": 35032 + }, + { + "epoch": 95.45776566757493, + "grad_norm": 4.5369086265563965, + "learning_rate": 1.0801447637186047e-07, + "loss": 0.033, + "step": 35033 + }, + { + "epoch": 95.46049046321527, + "grad_norm": 2.9388928413391113, + "learning_rate": 1.0788515723933579e-07, + "loss": 0.0466, + "step": 35034 + }, + { + "epoch": 95.46321525885558, + "grad_norm": 9.000701904296875, + "learning_rate": 1.077559151462837e-07, + "loss": 0.1025, + "step": 35035 + }, + { + "epoch": 95.46594005449592, + "grad_norm": 1.9095757007598877, + "learning_rate": 1.0762675009370893e-07, + "loss": 0.0186, + "step": 35036 + }, + { + "epoch": 95.46866485013624, + "grad_norm": 2.6702628135681152, + "learning_rate": 1.0749766208261959e-07, + "loss": 0.0462, + "step": 35037 + }, + { + "epoch": 95.47138964577657, + "grad_norm": 2.052314519882202, + "learning_rate": 1.073686511140204e-07, + "loss": 0.0338, + "step": 35038 + }, + { + "epoch": 95.47411444141689, + "grad_norm": 3.0173497200012207, + "learning_rate": 1.0723971718891502e-07, + "loss": 0.0507, + "step": 35039 + }, + { + "epoch": 95.47683923705722, + "grad_norm": 2.7834537029266357, + "learning_rate": 1.071108603083082e-07, + "loss": 0.0232, + "step": 35040 + }, + { + "epoch": 95.47956403269755, + "grad_norm": 3.012296199798584, + "learning_rate": 1.0698208047320358e-07, + "loss": 0.0333, + "step": 35041 + }, + { + "epoch": 95.48228882833787, + "grad_norm": 2.0441133975982666, + "learning_rate": 1.068533776846048e-07, + "loss": 0.1981, + "step": 35042 + }, + { + "epoch": 95.4850136239782, + "grad_norm": 2.503466844558716, + "learning_rate": 1.0672475194351328e-07, + "loss": 0.1128, + "step": 35043 + }, + { + "epoch": 95.48773841961852, + "grad_norm": 3.115562915802002, + "learning_rate": 1.0659620325093045e-07, + "loss": 0.1557, + "step": 35044 + }, + { + "epoch": 95.49046321525886, + "grad_norm": 3.1295604705810547, + "learning_rate": 1.0646773160785884e-07, + "loss": 0.1138, + "step": 35045 + }, + { + "epoch": 95.49318801089919, + "grad_norm": 1.9670004844665527, + "learning_rate": 1.0633933701529764e-07, + "loss": 0.0264, + "step": 35046 + }, + { + "epoch": 95.49591280653951, + "grad_norm": 2.5413930416107178, + "learning_rate": 1.0621101947424717e-07, + "loss": 0.0849, + "step": 35047 + }, + { + "epoch": 95.49863760217984, + "grad_norm": 4.066226482391357, + "learning_rate": 1.0608277898570663e-07, + "loss": 0.1332, + "step": 35048 + }, + { + "epoch": 95.50136239782016, + "grad_norm": 2.419011354446411, + "learning_rate": 1.0595461555067521e-07, + "loss": 0.0991, + "step": 35049 + }, + { + "epoch": 95.50408719346049, + "grad_norm": 2.352062702178955, + "learning_rate": 1.0582652917015101e-07, + "loss": 0.02, + "step": 35050 + }, + { + "epoch": 95.50681198910081, + "grad_norm": 4.402019023895264, + "learning_rate": 1.0569851984513102e-07, + "loss": 0.0727, + "step": 35051 + }, + { + "epoch": 95.50953678474114, + "grad_norm": 2.710862398147583, + "learning_rate": 1.0557058757661331e-07, + "loss": 0.0717, + "step": 35052 + }, + { + "epoch": 95.51226158038148, + "grad_norm": 3.1294167041778564, + "learning_rate": 1.0544273236559266e-07, + "loss": 0.0402, + "step": 35053 + }, + { + "epoch": 95.5149863760218, + "grad_norm": 2.3434746265411377, + "learning_rate": 1.0531495421306492e-07, + "loss": 0.0988, + "step": 35054 + }, + { + "epoch": 95.51771117166213, + "grad_norm": 7.592291831970215, + "learning_rate": 1.0518725312002709e-07, + "loss": 0.0843, + "step": 35055 + }, + { + "epoch": 95.52043596730245, + "grad_norm": 3.7560784816741943, + "learning_rate": 1.0505962908747281e-07, + "loss": 0.051, + "step": 35056 + }, + { + "epoch": 95.52316076294278, + "grad_norm": 2.4683263301849365, + "learning_rate": 1.0493208211639349e-07, + "loss": 0.0423, + "step": 35057 + }, + { + "epoch": 95.52588555858311, + "grad_norm": 2.3147597312927246, + "learning_rate": 1.0480461220778725e-07, + "loss": 0.0788, + "step": 35058 + }, + { + "epoch": 95.52861035422343, + "grad_norm": 1.7609657049179077, + "learning_rate": 1.0467721936264219e-07, + "loss": 0.0219, + "step": 35059 + }, + { + "epoch": 95.53133514986376, + "grad_norm": 1.9314008951187134, + "learning_rate": 1.0454990358195305e-07, + "loss": 0.0304, + "step": 35060 + }, + { + "epoch": 95.53405994550408, + "grad_norm": 2.434859037399292, + "learning_rate": 1.0442266486671126e-07, + "loss": 0.0556, + "step": 35061 + }, + { + "epoch": 95.53678474114442, + "grad_norm": 2.1970648765563965, + "learning_rate": 1.0429550321790716e-07, + "loss": 0.0566, + "step": 35062 + }, + { + "epoch": 95.53950953678473, + "grad_norm": 3.4781670570373535, + "learning_rate": 1.0416841863653105e-07, + "loss": 0.04, + "step": 35063 + }, + { + "epoch": 95.54223433242507, + "grad_norm": 2.1384620666503906, + "learning_rate": 1.0404141112357325e-07, + "loss": 0.0196, + "step": 35064 + }, + { + "epoch": 95.5449591280654, + "grad_norm": 1.8867310285568237, + "learning_rate": 1.0391448068002185e-07, + "loss": 0.0286, + "step": 35065 + }, + { + "epoch": 95.54768392370572, + "grad_norm": 2.1695098876953125, + "learning_rate": 1.0378762730686609e-07, + "loss": 0.0344, + "step": 35066 + }, + { + "epoch": 95.55040871934605, + "grad_norm": 2.2543327808380127, + "learning_rate": 1.0366085100509405e-07, + "loss": 0.0485, + "step": 35067 + }, + { + "epoch": 95.55313351498637, + "grad_norm": 2.3990397453308105, + "learning_rate": 1.0353415177569271e-07, + "loss": 0.024, + "step": 35068 + }, + { + "epoch": 95.5558583106267, + "grad_norm": 4.668440818786621, + "learning_rate": 1.0340752961964795e-07, + "loss": 0.1383, + "step": 35069 + }, + { + "epoch": 95.55858310626704, + "grad_norm": 3.2616732120513916, + "learning_rate": 1.0328098453794788e-07, + "loss": 0.1184, + "step": 35070 + }, + { + "epoch": 95.56130790190736, + "grad_norm": 2.650279998779297, + "learning_rate": 1.0315451653157615e-07, + "loss": 0.0627, + "step": 35071 + }, + { + "epoch": 95.56403269754769, + "grad_norm": 3.5118069648742676, + "learning_rate": 1.0302812560151976e-07, + "loss": 0.084, + "step": 35072 + }, + { + "epoch": 95.566757493188, + "grad_norm": 2.4976346492767334, + "learning_rate": 1.0290181174876124e-07, + "loss": 0.1904, + "step": 35073 + }, + { + "epoch": 95.56948228882834, + "grad_norm": 2.72570538520813, + "learning_rate": 1.0277557497428536e-07, + "loss": 0.0304, + "step": 35074 + }, + { + "epoch": 95.57220708446866, + "grad_norm": 4.170415878295898, + "learning_rate": 1.0264941527907247e-07, + "loss": 0.1321, + "step": 35075 + }, + { + "epoch": 95.57493188010899, + "grad_norm": 4.140685081481934, + "learning_rate": 1.0252333266410952e-07, + "loss": 0.0586, + "step": 35076 + }, + { + "epoch": 95.57765667574932, + "grad_norm": 2.057738780975342, + "learning_rate": 1.0239732713037576e-07, + "loss": 0.0273, + "step": 35077 + }, + { + "epoch": 95.58038147138964, + "grad_norm": 1.8662406206130981, + "learning_rate": 1.0227139867885371e-07, + "loss": 0.059, + "step": 35078 + }, + { + "epoch": 95.58310626702998, + "grad_norm": 2.9774651527404785, + "learning_rate": 1.0214554731052261e-07, + "loss": 0.0301, + "step": 35079 + }, + { + "epoch": 95.5858310626703, + "grad_norm": 1.653913974761963, + "learning_rate": 1.020197730263639e-07, + "loss": 0.0138, + "step": 35080 + }, + { + "epoch": 95.58855585831063, + "grad_norm": 1.8388270139694214, + "learning_rate": 1.0189407582735566e-07, + "loss": 0.0581, + "step": 35081 + }, + { + "epoch": 95.59128065395096, + "grad_norm": 3.453791379928589, + "learning_rate": 1.0176845571447936e-07, + "loss": 0.0999, + "step": 35082 + }, + { + "epoch": 95.59400544959128, + "grad_norm": 3.2059035301208496, + "learning_rate": 1.0164291268870974e-07, + "loss": 0.0825, + "step": 35083 + }, + { + "epoch": 95.59673024523161, + "grad_norm": 1.9955600500106812, + "learning_rate": 1.0151744675102826e-07, + "loss": 0.0237, + "step": 35084 + }, + { + "epoch": 95.59945504087193, + "grad_norm": 2.2362756729125977, + "learning_rate": 1.0139205790240969e-07, + "loss": 0.0336, + "step": 35085 + }, + { + "epoch": 95.60217983651226, + "grad_norm": 2.192676067352295, + "learning_rate": 1.0126674614383214e-07, + "loss": 0.1018, + "step": 35086 + }, + { + "epoch": 95.60490463215258, + "grad_norm": 3.1578562259674072, + "learning_rate": 1.0114151147626927e-07, + "loss": 0.1314, + "step": 35087 + }, + { + "epoch": 95.60762942779292, + "grad_norm": 2.281991958618164, + "learning_rate": 1.0101635390069809e-07, + "loss": 0.032, + "step": 35088 + }, + { + "epoch": 95.61035422343325, + "grad_norm": 1.8152971267700195, + "learning_rate": 1.0089127341809336e-07, + "loss": 0.0204, + "step": 35089 + }, + { + "epoch": 95.61307901907357, + "grad_norm": 2.4973959922790527, + "learning_rate": 1.0076627002942873e-07, + "loss": 0.0382, + "step": 35090 + }, + { + "epoch": 95.6158038147139, + "grad_norm": 2.242245674133301, + "learning_rate": 1.006413437356768e-07, + "loss": 0.0788, + "step": 35091 + }, + { + "epoch": 95.61852861035422, + "grad_norm": 3.0806093215942383, + "learning_rate": 1.0051649453781231e-07, + "loss": 0.0406, + "step": 35092 + }, + { + "epoch": 95.62125340599455, + "grad_norm": 2.292752265930176, + "learning_rate": 1.0039172243680673e-07, + "loss": 0.0349, + "step": 35093 + }, + { + "epoch": 95.62397820163488, + "grad_norm": 3.0341873168945312, + "learning_rate": 1.0026702743363148e-07, + "loss": 0.0481, + "step": 35094 + }, + { + "epoch": 95.6267029972752, + "grad_norm": 2.9238197803497314, + "learning_rate": 1.0014240952925803e-07, + "loss": 0.0355, + "step": 35095 + }, + { + "epoch": 95.62942779291554, + "grad_norm": 3.0007381439208984, + "learning_rate": 1.000178687246578e-07, + "loss": 0.1112, + "step": 35096 + }, + { + "epoch": 95.63215258855585, + "grad_norm": 2.056663990020752, + "learning_rate": 9.989340502079891e-08, + "loss": 0.0726, + "step": 35097 + }, + { + "epoch": 95.63487738419619, + "grad_norm": 2.571248769760132, + "learning_rate": 9.976901841865172e-08, + "loss": 0.0842, + "step": 35098 + }, + { + "epoch": 95.6376021798365, + "grad_norm": 3.0214622020721436, + "learning_rate": 9.964470891918431e-08, + "loss": 0.1119, + "step": 35099 + }, + { + "epoch": 95.64032697547684, + "grad_norm": 2.4208412170410156, + "learning_rate": 9.952047652336594e-08, + "loss": 0.0899, + "step": 35100 + }, + { + "epoch": 95.64305177111717, + "grad_norm": 4.0630974769592285, + "learning_rate": 9.939632123216359e-08, + "loss": 0.1332, + "step": 35101 + }, + { + "epoch": 95.64577656675749, + "grad_norm": 2.8814077377319336, + "learning_rate": 9.927224304654315e-08, + "loss": 0.1247, + "step": 35102 + }, + { + "epoch": 95.64850136239782, + "grad_norm": 1.5603978633880615, + "learning_rate": 9.914824196747274e-08, + "loss": 0.0197, + "step": 35103 + }, + { + "epoch": 95.65122615803814, + "grad_norm": 3.7697665691375732, + "learning_rate": 9.902431799591605e-08, + "loss": 0.0686, + "step": 35104 + }, + { + "epoch": 95.65395095367847, + "grad_norm": 1.7513145208358765, + "learning_rate": 9.890047113284118e-08, + "loss": 0.0263, + "step": 35105 + }, + { + "epoch": 95.65667574931881, + "grad_norm": 2.5381932258605957, + "learning_rate": 9.877670137920958e-08, + "loss": 0.1025, + "step": 35106 + }, + { + "epoch": 95.65940054495913, + "grad_norm": 2.0419929027557373, + "learning_rate": 9.865300873598605e-08, + "loss": 0.0169, + "step": 35107 + }, + { + "epoch": 95.66212534059946, + "grad_norm": 2.7394063472747803, + "learning_rate": 9.852939320413424e-08, + "loss": 0.0265, + "step": 35108 + }, + { + "epoch": 95.66485013623978, + "grad_norm": 2.241105079650879, + "learning_rate": 9.840585478461673e-08, + "loss": 0.0373, + "step": 35109 + }, + { + "epoch": 95.66757493188011, + "grad_norm": 3.284921646118164, + "learning_rate": 9.828239347839607e-08, + "loss": 0.0297, + "step": 35110 + }, + { + "epoch": 95.67029972752043, + "grad_norm": 2.441310167312622, + "learning_rate": 9.815900928643374e-08, + "loss": 0.055, + "step": 35111 + }, + { + "epoch": 95.67302452316076, + "grad_norm": 2.2745747566223145, + "learning_rate": 9.803570220969006e-08, + "loss": 0.0336, + "step": 35112 + }, + { + "epoch": 95.6757493188011, + "grad_norm": 2.1112680435180664, + "learning_rate": 9.791247224912647e-08, + "loss": 0.0533, + "step": 35113 + }, + { + "epoch": 95.67847411444141, + "grad_norm": 2.212068796157837, + "learning_rate": 9.778931940570113e-08, + "loss": 0.0273, + "step": 35114 + }, + { + "epoch": 95.68119891008175, + "grad_norm": 1.7880301475524902, + "learning_rate": 9.766624368037436e-08, + "loss": 0.0239, + "step": 35115 + }, + { + "epoch": 95.68392370572207, + "grad_norm": 2.708158254623413, + "learning_rate": 9.754324507410317e-08, + "loss": 0.0559, + "step": 35116 + }, + { + "epoch": 95.6866485013624, + "grad_norm": 2.7598323822021484, + "learning_rate": 9.742032358784681e-08, + "loss": 0.0802, + "step": 35117 + }, + { + "epoch": 95.68937329700273, + "grad_norm": 1.3291863203048706, + "learning_rate": 9.729747922256228e-08, + "loss": 0.1452, + "step": 35118 + }, + { + "epoch": 95.69209809264305, + "grad_norm": 2.062356472015381, + "learning_rate": 9.717471197920658e-08, + "loss": 0.0476, + "step": 35119 + }, + { + "epoch": 95.69482288828338, + "grad_norm": 3.2122371196746826, + "learning_rate": 9.705202185873563e-08, + "loss": 0.0231, + "step": 35120 + }, + { + "epoch": 95.6975476839237, + "grad_norm": 1.874733328819275, + "learning_rate": 9.692940886210422e-08, + "loss": 0.0655, + "step": 35121 + }, + { + "epoch": 95.70027247956403, + "grad_norm": 2.1043713092803955, + "learning_rate": 9.680687299026826e-08, + "loss": 0.0402, + "step": 35122 + }, + { + "epoch": 95.70299727520435, + "grad_norm": 2.0644664764404297, + "learning_rate": 9.66844142441814e-08, + "loss": 0.0464, + "step": 35123 + }, + { + "epoch": 95.70572207084469, + "grad_norm": 2.392665147781372, + "learning_rate": 9.656203262479735e-08, + "loss": 0.031, + "step": 35124 + }, + { + "epoch": 95.70844686648502, + "grad_norm": 2.3267199993133545, + "learning_rate": 9.64397281330709e-08, + "loss": 0.0273, + "step": 35125 + }, + { + "epoch": 95.71117166212534, + "grad_norm": 2.2901506423950195, + "learning_rate": 9.631750076995128e-08, + "loss": 0.0514, + "step": 35126 + }, + { + "epoch": 95.71389645776567, + "grad_norm": 1.840728521347046, + "learning_rate": 9.619535053639328e-08, + "loss": 0.0261, + "step": 35127 + }, + { + "epoch": 95.71662125340599, + "grad_norm": 2.655202627182007, + "learning_rate": 9.607327743334616e-08, + "loss": 0.0269, + "step": 35128 + }, + { + "epoch": 95.71934604904632, + "grad_norm": 2.934680223464966, + "learning_rate": 9.595128146176247e-08, + "loss": 0.1405, + "step": 35129 + }, + { + "epoch": 95.72207084468666, + "grad_norm": 1.86601722240448, + "learning_rate": 9.582936262259146e-08, + "loss": 0.0825, + "step": 35130 + }, + { + "epoch": 95.72479564032697, + "grad_norm": 3.856334686279297, + "learning_rate": 9.570752091678237e-08, + "loss": 0.1767, + "step": 35131 + }, + { + "epoch": 95.7275204359673, + "grad_norm": 1.8248963356018066, + "learning_rate": 9.558575634528444e-08, + "loss": 0.0625, + "step": 35132 + }, + { + "epoch": 95.73024523160763, + "grad_norm": 2.632397174835205, + "learning_rate": 9.54640689090458e-08, + "loss": 0.0634, + "step": 35133 + }, + { + "epoch": 95.73297002724796, + "grad_norm": 2.9107959270477295, + "learning_rate": 9.534245860901347e-08, + "loss": 0.0526, + "step": 35134 + }, + { + "epoch": 95.73569482288828, + "grad_norm": 2.6701486110687256, + "learning_rate": 9.522092544613671e-08, + "loss": 0.0803, + "step": 35135 + }, + { + "epoch": 95.73841961852861, + "grad_norm": 2.162994623184204, + "learning_rate": 9.509946942135916e-08, + "loss": 0.0482, + "step": 35136 + }, + { + "epoch": 95.74114441416894, + "grad_norm": 3.5007174015045166, + "learning_rate": 9.497809053562901e-08, + "loss": 0.219, + "step": 35137 + }, + { + "epoch": 95.74386920980926, + "grad_norm": 2.6569952964782715, + "learning_rate": 9.485678878989102e-08, + "loss": 0.0795, + "step": 35138 + }, + { + "epoch": 95.7465940054496, + "grad_norm": 2.499392032623291, + "learning_rate": 9.473556418508889e-08, + "loss": 0.0744, + "step": 35139 + }, + { + "epoch": 95.74931880108991, + "grad_norm": 2.9137237071990967, + "learning_rate": 9.461441672216743e-08, + "loss": 0.0993, + "step": 35140 + }, + { + "epoch": 95.75204359673025, + "grad_norm": 1.7527599334716797, + "learning_rate": 9.449334640207031e-08, + "loss": 0.018, + "step": 35141 + }, + { + "epoch": 95.75476839237058, + "grad_norm": 2.412987470626831, + "learning_rate": 9.437235322574123e-08, + "loss": 0.0639, + "step": 35142 + }, + { + "epoch": 95.7574931880109, + "grad_norm": 2.5925357341766357, + "learning_rate": 9.425143719411945e-08, + "loss": 0.034, + "step": 35143 + }, + { + "epoch": 95.76021798365123, + "grad_norm": 2.732663154602051, + "learning_rate": 9.413059830814975e-08, + "loss": 0.0427, + "step": 35144 + }, + { + "epoch": 95.76294277929155, + "grad_norm": 3.209555149078369, + "learning_rate": 9.400983656877138e-08, + "loss": 0.0641, + "step": 35145 + }, + { + "epoch": 95.76566757493188, + "grad_norm": 1.7188575267791748, + "learning_rate": 9.388915197692694e-08, + "loss": 0.0236, + "step": 35146 + }, + { + "epoch": 95.7683923705722, + "grad_norm": 2.841384172439575, + "learning_rate": 9.376854453355455e-08, + "loss": 0.0549, + "step": 35147 + }, + { + "epoch": 95.77111716621253, + "grad_norm": 3.503021717071533, + "learning_rate": 9.364801423959235e-08, + "loss": 0.0352, + "step": 35148 + }, + { + "epoch": 95.77384196185287, + "grad_norm": 2.6008212566375732, + "learning_rate": 9.352756109598183e-08, + "loss": 0.0562, + "step": 35149 + }, + { + "epoch": 95.77656675749319, + "grad_norm": 2.5199153423309326, + "learning_rate": 9.340718510365998e-08, + "loss": 0.0309, + "step": 35150 + }, + { + "epoch": 95.77929155313352, + "grad_norm": 1.8979390859603882, + "learning_rate": 9.328688626356497e-08, + "loss": 0.0221, + "step": 35151 + }, + { + "epoch": 95.78201634877384, + "grad_norm": 6.1602983474731445, + "learning_rate": 9.316666457663048e-08, + "loss": 0.1581, + "step": 35152 + }, + { + "epoch": 95.78474114441417, + "grad_norm": 2.225799083709717, + "learning_rate": 9.304652004379689e-08, + "loss": 0.1517, + "step": 35153 + }, + { + "epoch": 95.7874659400545, + "grad_norm": 1.7097855806350708, + "learning_rate": 9.292645266599787e-08, + "loss": 0.0147, + "step": 35154 + }, + { + "epoch": 95.79019073569482, + "grad_norm": 2.0193722248077393, + "learning_rate": 9.280646244416936e-08, + "loss": 0.0239, + "step": 35155 + }, + { + "epoch": 95.79291553133515, + "grad_norm": 1.4210405349731445, + "learning_rate": 9.268654937924393e-08, + "loss": 0.0171, + "step": 35156 + }, + { + "epoch": 95.79564032697547, + "grad_norm": 1.6739972829818726, + "learning_rate": 9.256671347215751e-08, + "loss": 0.0285, + "step": 35157 + }, + { + "epoch": 95.7983651226158, + "grad_norm": 3.580216884613037, + "learning_rate": 9.244695472384268e-08, + "loss": 0.1765, + "step": 35158 + }, + { + "epoch": 95.80108991825612, + "grad_norm": 3.1134626865386963, + "learning_rate": 9.232727313523204e-08, + "loss": 0.0541, + "step": 35159 + }, + { + "epoch": 95.80381471389646, + "grad_norm": 2.7235796451568604, + "learning_rate": 9.220766870725705e-08, + "loss": 0.0528, + "step": 35160 + }, + { + "epoch": 95.80653950953679, + "grad_norm": 2.136178970336914, + "learning_rate": 9.208814144085032e-08, + "loss": 0.0256, + "step": 35161 + }, + { + "epoch": 95.80926430517711, + "grad_norm": 2.6942789554595947, + "learning_rate": 9.19686913369422e-08, + "loss": 0.0469, + "step": 35162 + }, + { + "epoch": 95.81198910081744, + "grad_norm": 2.219843626022339, + "learning_rate": 9.184931839646417e-08, + "loss": 0.1022, + "step": 35163 + }, + { + "epoch": 95.81471389645776, + "grad_norm": 2.1608901023864746, + "learning_rate": 9.173002262034326e-08, + "loss": 0.0179, + "step": 35164 + }, + { + "epoch": 95.8174386920981, + "grad_norm": 1.7062442302703857, + "learning_rate": 9.161080400951095e-08, + "loss": 0.0196, + "step": 35165 + }, + { + "epoch": 95.82016348773843, + "grad_norm": 2.1895999908447266, + "learning_rate": 9.149166256489428e-08, + "loss": 0.0239, + "step": 35166 + }, + { + "epoch": 95.82288828337875, + "grad_norm": 2.4063527584075928, + "learning_rate": 9.13725982874214e-08, + "loss": 0.0263, + "step": 35167 + }, + { + "epoch": 95.82561307901908, + "grad_norm": 2.45184326171875, + "learning_rate": 9.125361117802045e-08, + "loss": 0.0287, + "step": 35168 + }, + { + "epoch": 95.8283378746594, + "grad_norm": 2.480238437652588, + "learning_rate": 9.113470123761736e-08, + "loss": 0.1217, + "step": 35169 + }, + { + "epoch": 95.83106267029973, + "grad_norm": 1.7759056091308594, + "learning_rate": 9.101586846713806e-08, + "loss": 0.0375, + "step": 35170 + }, + { + "epoch": 95.83378746594005, + "grad_norm": 3.341256856918335, + "learning_rate": 9.089711286750847e-08, + "loss": 0.0796, + "step": 35171 + }, + { + "epoch": 95.83651226158038, + "grad_norm": 2.291745185852051, + "learning_rate": 9.077843443965229e-08, + "loss": 0.0355, + "step": 35172 + }, + { + "epoch": 95.83923705722071, + "grad_norm": 2.4249584674835205, + "learning_rate": 9.065983318449656e-08, + "loss": 0.0615, + "step": 35173 + }, + { + "epoch": 95.84196185286103, + "grad_norm": 1.8145699501037598, + "learning_rate": 9.054130910296166e-08, + "loss": 0.043, + "step": 35174 + }, + { + "epoch": 95.84468664850137, + "grad_norm": 3.3663463592529297, + "learning_rate": 9.042286219597352e-08, + "loss": 0.0606, + "step": 35175 + }, + { + "epoch": 95.84741144414168, + "grad_norm": 2.636873722076416, + "learning_rate": 9.030449246445139e-08, + "loss": 0.0606, + "step": 35176 + }, + { + "epoch": 95.85013623978202, + "grad_norm": 4.4239959716796875, + "learning_rate": 9.018619990932009e-08, + "loss": 0.0872, + "step": 35177 + }, + { + "epoch": 95.85286103542235, + "grad_norm": 3.954174757003784, + "learning_rate": 9.00679845314989e-08, + "loss": 0.0411, + "step": 35178 + }, + { + "epoch": 95.85558583106267, + "grad_norm": 2.208061933517456, + "learning_rate": 8.99498463319104e-08, + "loss": 0.0258, + "step": 35179 + }, + { + "epoch": 95.858310626703, + "grad_norm": 2.1602532863616943, + "learning_rate": 8.983178531147274e-08, + "loss": 0.0322, + "step": 35180 + }, + { + "epoch": 95.86103542234332, + "grad_norm": 2.9143776893615723, + "learning_rate": 8.971380147110632e-08, + "loss": 0.0405, + "step": 35181 + }, + { + "epoch": 95.86376021798365, + "grad_norm": 1.969183325767517, + "learning_rate": 8.959589481172925e-08, + "loss": 0.0227, + "step": 35182 + }, + { + "epoch": 95.86648501362397, + "grad_norm": 3.16774320602417, + "learning_rate": 8.947806533426195e-08, + "loss": 0.0354, + "step": 35183 + }, + { + "epoch": 95.8692098092643, + "grad_norm": 1.8806781768798828, + "learning_rate": 8.936031303961922e-08, + "loss": 0.0323, + "step": 35184 + }, + { + "epoch": 95.87193460490464, + "grad_norm": 3.9964778423309326, + "learning_rate": 8.924263792872035e-08, + "loss": 0.066, + "step": 35185 + }, + { + "epoch": 95.87465940054496, + "grad_norm": 1.8949394226074219, + "learning_rate": 8.912504000248012e-08, + "loss": 0.0278, + "step": 35186 + }, + { + "epoch": 95.87738419618529, + "grad_norm": 2.26131010055542, + "learning_rate": 8.900751926181561e-08, + "loss": 0.0507, + "step": 35187 + }, + { + "epoch": 95.88010899182561, + "grad_norm": 3.028347969055176, + "learning_rate": 8.889007570764052e-08, + "loss": 0.0646, + "step": 35188 + }, + { + "epoch": 95.88283378746594, + "grad_norm": 2.306881904602051, + "learning_rate": 8.87727093408708e-08, + "loss": 0.0378, + "step": 35189 + }, + { + "epoch": 95.88555858310627, + "grad_norm": 1.7207473516464233, + "learning_rate": 8.865542016242124e-08, + "loss": 0.0357, + "step": 35190 + }, + { + "epoch": 95.88828337874659, + "grad_norm": 2.7475287914276123, + "learning_rate": 8.853820817320447e-08, + "loss": 0.13, + "step": 35191 + }, + { + "epoch": 95.89100817438693, + "grad_norm": 1.9305124282836914, + "learning_rate": 8.842107337413197e-08, + "loss": 0.0186, + "step": 35192 + }, + { + "epoch": 95.89373297002724, + "grad_norm": 3.2990758419036865, + "learning_rate": 8.830401576611747e-08, + "loss": 0.0805, + "step": 35193 + }, + { + "epoch": 95.89645776566758, + "grad_norm": 2.719024658203125, + "learning_rate": 8.818703535007245e-08, + "loss": 0.029, + "step": 35194 + }, + { + "epoch": 95.8991825613079, + "grad_norm": 2.380613327026367, + "learning_rate": 8.807013212690729e-08, + "loss": 0.0452, + "step": 35195 + }, + { + "epoch": 95.90190735694823, + "grad_norm": 2.605151653289795, + "learning_rate": 8.795330609753349e-08, + "loss": 0.088, + "step": 35196 + }, + { + "epoch": 95.90463215258856, + "grad_norm": 2.2973361015319824, + "learning_rate": 8.783655726285922e-08, + "loss": 0.0336, + "step": 35197 + }, + { + "epoch": 95.90735694822888, + "grad_norm": 1.9996578693389893, + "learning_rate": 8.771988562379596e-08, + "loss": 0.0179, + "step": 35198 + }, + { + "epoch": 95.91008174386921, + "grad_norm": 3.072854518890381, + "learning_rate": 8.760329118125189e-08, + "loss": 0.0742, + "step": 35199 + }, + { + "epoch": 95.91280653950953, + "grad_norm": 2.327976703643799, + "learning_rate": 8.748677393613292e-08, + "loss": 0.0356, + "step": 35200 + }, + { + "epoch": 95.91553133514986, + "grad_norm": 2.217430591583252, + "learning_rate": 8.737033388934834e-08, + "loss": 0.0746, + "step": 35201 + }, + { + "epoch": 95.9182561307902, + "grad_norm": 2.879448413848877, + "learning_rate": 8.725397104180521e-08, + "loss": 0.0832, + "step": 35202 + }, + { + "epoch": 95.92098092643052, + "grad_norm": 1.991579294204712, + "learning_rate": 8.713768539440836e-08, + "loss": 0.0212, + "step": 35203 + }, + { + "epoch": 95.92370572207085, + "grad_norm": 3.104318380355835, + "learning_rate": 8.702147694806484e-08, + "loss": 0.0521, + "step": 35204 + }, + { + "epoch": 95.92643051771117, + "grad_norm": 6.036311149597168, + "learning_rate": 8.690534570367837e-08, + "loss": 0.0264, + "step": 35205 + }, + { + "epoch": 95.9291553133515, + "grad_norm": 2.8335986137390137, + "learning_rate": 8.678929166215377e-08, + "loss": 0.03, + "step": 35206 + }, + { + "epoch": 95.93188010899182, + "grad_norm": 2.896843910217285, + "learning_rate": 8.66733148243959e-08, + "loss": 0.0449, + "step": 35207 + }, + { + "epoch": 95.93460490463215, + "grad_norm": 2.7111401557922363, + "learning_rate": 8.655741519130622e-08, + "loss": 0.0224, + "step": 35208 + }, + { + "epoch": 95.93732970027249, + "grad_norm": 2.886784315109253, + "learning_rate": 8.644159276378961e-08, + "loss": 0.0323, + "step": 35209 + }, + { + "epoch": 95.9400544959128, + "grad_norm": 2.641713857650757, + "learning_rate": 8.632584754274642e-08, + "loss": 0.0948, + "step": 35210 + }, + { + "epoch": 95.94277929155314, + "grad_norm": 9.331111907958984, + "learning_rate": 8.621017952907817e-08, + "loss": 0.112, + "step": 35211 + }, + { + "epoch": 95.94550408719346, + "grad_norm": 2.2131526470184326, + "learning_rate": 8.609458872368526e-08, + "loss": 0.0623, + "step": 35212 + }, + { + "epoch": 95.94822888283379, + "grad_norm": 13.232500076293945, + "learning_rate": 8.597907512746917e-08, + "loss": 0.0298, + "step": 35213 + }, + { + "epoch": 95.95095367847412, + "grad_norm": 2.437865734100342, + "learning_rate": 8.58636387413292e-08, + "loss": 0.0221, + "step": 35214 + }, + { + "epoch": 95.95367847411444, + "grad_norm": 2.714003324508667, + "learning_rate": 8.57482795661646e-08, + "loss": 0.0283, + "step": 35215 + }, + { + "epoch": 95.95640326975477, + "grad_norm": 2.802816867828369, + "learning_rate": 8.563299760287358e-08, + "loss": 0.2306, + "step": 35216 + }, + { + "epoch": 95.95912806539509, + "grad_norm": 2.068948268890381, + "learning_rate": 8.551779285235206e-08, + "loss": 0.0736, + "step": 35217 + }, + { + "epoch": 95.96185286103542, + "grad_norm": 2.125474452972412, + "learning_rate": 8.540266531549934e-08, + "loss": 0.0278, + "step": 35218 + }, + { + "epoch": 95.96457765667574, + "grad_norm": 2.1596126556396484, + "learning_rate": 8.528761499321247e-08, + "loss": 0.1153, + "step": 35219 + }, + { + "epoch": 95.96730245231608, + "grad_norm": 3.537027597427368, + "learning_rate": 8.51726418863863e-08, + "loss": 0.0246, + "step": 35220 + }, + { + "epoch": 95.97002724795641, + "grad_norm": 2.5084664821624756, + "learning_rate": 8.505774599591566e-08, + "loss": 0.0961, + "step": 35221 + }, + { + "epoch": 95.97275204359673, + "grad_norm": 3.3551576137542725, + "learning_rate": 8.49429273226976e-08, + "loss": 0.0367, + "step": 35222 + }, + { + "epoch": 95.97547683923706, + "grad_norm": 1.8011064529418945, + "learning_rate": 8.482818586762365e-08, + "loss": 0.085, + "step": 35223 + }, + { + "epoch": 95.97820163487738, + "grad_norm": 3.4674816131591797, + "learning_rate": 8.471352163158974e-08, + "loss": 0.0311, + "step": 35224 + }, + { + "epoch": 95.98092643051771, + "grad_norm": 4.035762310028076, + "learning_rate": 8.45989346154863e-08, + "loss": 0.0504, + "step": 35225 + }, + { + "epoch": 95.98365122615803, + "grad_norm": 2.319643020629883, + "learning_rate": 8.448442482020814e-08, + "loss": 0.0291, + "step": 35226 + }, + { + "epoch": 95.98637602179836, + "grad_norm": 2.304887533187866, + "learning_rate": 8.436999224664677e-08, + "loss": 0.1227, + "step": 35227 + }, + { + "epoch": 95.9891008174387, + "grad_norm": 3.8282926082611084, + "learning_rate": 8.42556368956915e-08, + "loss": 0.03, + "step": 35228 + }, + { + "epoch": 95.99182561307902, + "grad_norm": 1.3371766805648804, + "learning_rate": 8.414135876823382e-08, + "loss": 0.0232, + "step": 35229 + }, + { + "epoch": 95.99455040871935, + "grad_norm": 2.040874719619751, + "learning_rate": 8.402715786516524e-08, + "loss": 0.0617, + "step": 35230 + }, + { + "epoch": 95.99727520435967, + "grad_norm": 3.1709978580474854, + "learning_rate": 8.391303418737395e-08, + "loss": 0.1659, + "step": 35231 + }, + { + "epoch": 96.0, + "grad_norm": 2.1919538974761963, + "learning_rate": 8.379898773574924e-08, + "loss": 0.0646, + "step": 35232 + }, + { + "epoch": 96.00272479564033, + "grad_norm": 2.3267288208007812, + "learning_rate": 8.368501851117816e-08, + "loss": 0.0264, + "step": 35233 + }, + { + "epoch": 96.00544959128065, + "grad_norm": 2.963054656982422, + "learning_rate": 8.357112651454891e-08, + "loss": 0.0735, + "step": 35234 + }, + { + "epoch": 96.00817438692098, + "grad_norm": 2.328134298324585, + "learning_rate": 8.345731174674854e-08, + "loss": 0.06, + "step": 35235 + }, + { + "epoch": 96.0108991825613, + "grad_norm": 2.6362593173980713, + "learning_rate": 8.334357420866413e-08, + "loss": 0.0876, + "step": 35236 + }, + { + "epoch": 96.01362397820164, + "grad_norm": 2.74820876121521, + "learning_rate": 8.322991390117941e-08, + "loss": 0.072, + "step": 35237 + }, + { + "epoch": 96.01634877384195, + "grad_norm": 3.324258804321289, + "learning_rate": 8.311633082518256e-08, + "loss": 0.0661, + "step": 35238 + }, + { + "epoch": 96.01907356948229, + "grad_norm": 1.7469960451126099, + "learning_rate": 8.300282498155621e-08, + "loss": 0.0268, + "step": 35239 + }, + { + "epoch": 96.02179836512262, + "grad_norm": 3.1011860370635986, + "learning_rate": 8.28893963711841e-08, + "loss": 0.0396, + "step": 35240 + }, + { + "epoch": 96.02452316076294, + "grad_norm": 4.629014492034912, + "learning_rate": 8.277604499494995e-08, + "loss": 0.0416, + "step": 35241 + }, + { + "epoch": 96.02724795640327, + "grad_norm": 4.329613208770752, + "learning_rate": 8.266277085373753e-08, + "loss": 0.0248, + "step": 35242 + }, + { + "epoch": 96.02997275204359, + "grad_norm": 1.7718288898468018, + "learning_rate": 8.254957394842833e-08, + "loss": 0.0278, + "step": 35243 + }, + { + "epoch": 96.03269754768392, + "grad_norm": 3.014353036880493, + "learning_rate": 8.243645427990388e-08, + "loss": 0.0374, + "step": 35244 + }, + { + "epoch": 96.03542234332426, + "grad_norm": 2.291088104248047, + "learning_rate": 8.232341184904458e-08, + "loss": 0.0224, + "step": 35245 + }, + { + "epoch": 96.03814713896458, + "grad_norm": 3.4260973930358887, + "learning_rate": 8.221044665673194e-08, + "loss": 0.0697, + "step": 35246 + }, + { + "epoch": 96.04087193460491, + "grad_norm": 4.077487468719482, + "learning_rate": 8.209755870384417e-08, + "loss": 0.2125, + "step": 35247 + }, + { + "epoch": 96.04359673024523, + "grad_norm": 2.3869411945343018, + "learning_rate": 8.198474799126167e-08, + "loss": 0.0244, + "step": 35248 + }, + { + "epoch": 96.04632152588556, + "grad_norm": 4.090585231781006, + "learning_rate": 8.18720145198626e-08, + "loss": 0.0387, + "step": 35249 + }, + { + "epoch": 96.04904632152588, + "grad_norm": 2.4099318981170654, + "learning_rate": 8.175935829052628e-08, + "loss": 0.0259, + "step": 35250 + }, + { + "epoch": 96.05177111716621, + "grad_norm": 4.118835926055908, + "learning_rate": 8.164677930412867e-08, + "loss": 0.058, + "step": 35251 + }, + { + "epoch": 96.05449591280654, + "grad_norm": 3.0008699893951416, + "learning_rate": 8.153427756154575e-08, + "loss": 0.0624, + "step": 35252 + }, + { + "epoch": 96.05722070844686, + "grad_norm": 3.927640914916992, + "learning_rate": 8.142185306365457e-08, + "loss": 0.1975, + "step": 35253 + }, + { + "epoch": 96.0599455040872, + "grad_norm": 3.217844247817993, + "learning_rate": 8.130950581133113e-08, + "loss": 0.0537, + "step": 35254 + }, + { + "epoch": 96.06267029972751, + "grad_norm": 2.599726915359497, + "learning_rate": 8.119723580545136e-08, + "loss": 0.0254, + "step": 35255 + }, + { + "epoch": 96.06539509536785, + "grad_norm": 2.5743327140808105, + "learning_rate": 8.10850430468868e-08, + "loss": 0.1085, + "step": 35256 + }, + { + "epoch": 96.06811989100818, + "grad_norm": 1.2380759716033936, + "learning_rate": 8.097292753651232e-08, + "loss": 0.0119, + "step": 35257 + }, + { + "epoch": 96.0708446866485, + "grad_norm": 1.8359806537628174, + "learning_rate": 8.086088927520274e-08, + "loss": 0.0208, + "step": 35258 + }, + { + "epoch": 96.07356948228883, + "grad_norm": 2.276522159576416, + "learning_rate": 8.074892826382852e-08, + "loss": 0.1583, + "step": 35259 + }, + { + "epoch": 96.07629427792915, + "grad_norm": 2.629805564880371, + "learning_rate": 8.063704450326227e-08, + "loss": 0.044, + "step": 35260 + }, + { + "epoch": 96.07901907356948, + "grad_norm": 2.550387144088745, + "learning_rate": 8.052523799437551e-08, + "loss": 0.0405, + "step": 35261 + }, + { + "epoch": 96.0817438692098, + "grad_norm": 2.132642984390259, + "learning_rate": 8.041350873803978e-08, + "loss": 0.1068, + "step": 35262 + }, + { + "epoch": 96.08446866485014, + "grad_norm": 2.0799076557159424, + "learning_rate": 8.030185673512325e-08, + "loss": 0.036, + "step": 35263 + }, + { + "epoch": 96.08719346049047, + "grad_norm": 2.644192934036255, + "learning_rate": 8.019028198649747e-08, + "loss": 0.0634, + "step": 35264 + }, + { + "epoch": 96.08991825613079, + "grad_norm": 1.6757255792617798, + "learning_rate": 8.007878449303064e-08, + "loss": 0.021, + "step": 35265 + }, + { + "epoch": 96.09264305177112, + "grad_norm": 2.489243745803833, + "learning_rate": 7.996736425558982e-08, + "loss": 0.0435, + "step": 35266 + }, + { + "epoch": 96.09536784741144, + "grad_norm": 2.456620216369629, + "learning_rate": 7.985602127504432e-08, + "loss": 0.0319, + "step": 35267 + }, + { + "epoch": 96.09809264305177, + "grad_norm": 2.1677346229553223, + "learning_rate": 7.974475555226125e-08, + "loss": 0.0727, + "step": 35268 + }, + { + "epoch": 96.1008174386921, + "grad_norm": 2.95621395111084, + "learning_rate": 7.963356708810654e-08, + "loss": 0.0398, + "step": 35269 + }, + { + "epoch": 96.10354223433242, + "grad_norm": 2.322218894958496, + "learning_rate": 7.95224558834462e-08, + "loss": 0.0707, + "step": 35270 + }, + { + "epoch": 96.10626702997276, + "grad_norm": 2.460341215133667, + "learning_rate": 7.941142193914619e-08, + "loss": 0.079, + "step": 35271 + }, + { + "epoch": 96.10899182561307, + "grad_norm": 2.0585649013519287, + "learning_rate": 7.930046525607027e-08, + "loss": 0.0339, + "step": 35272 + }, + { + "epoch": 96.11171662125341, + "grad_norm": 3.2247707843780518, + "learning_rate": 7.91895858350833e-08, + "loss": 0.0878, + "step": 35273 + }, + { + "epoch": 96.11444141689373, + "grad_norm": 4.812054634094238, + "learning_rate": 7.907878367704791e-08, + "loss": 0.0203, + "step": 35274 + }, + { + "epoch": 96.11716621253406, + "grad_norm": 2.8286547660827637, + "learning_rate": 7.896805878282898e-08, + "loss": 0.1109, + "step": 35275 + }, + { + "epoch": 96.11989100817439, + "grad_norm": 2.2864203453063965, + "learning_rate": 7.885741115328583e-08, + "loss": 0.1572, + "step": 35276 + }, + { + "epoch": 96.12261580381471, + "grad_norm": 2.099889039993286, + "learning_rate": 7.87468407892833e-08, + "loss": 0.0327, + "step": 35277 + }, + { + "epoch": 96.12534059945504, + "grad_norm": 4.798058986663818, + "learning_rate": 7.86363476916796e-08, + "loss": 0.0607, + "step": 35278 + }, + { + "epoch": 96.12806539509536, + "grad_norm": 2.89988374710083, + "learning_rate": 7.85259318613385e-08, + "loss": 0.0352, + "step": 35279 + }, + { + "epoch": 96.1307901907357, + "grad_norm": 2.715339422225952, + "learning_rate": 7.841559329911707e-08, + "loss": 0.1212, + "step": 35280 + }, + { + "epoch": 96.13351498637603, + "grad_norm": 4.634676456451416, + "learning_rate": 7.830533200587576e-08, + "loss": 0.0354, + "step": 35281 + }, + { + "epoch": 96.13623978201635, + "grad_norm": 4.271185874938965, + "learning_rate": 7.819514798247274e-08, + "loss": 0.2337, + "step": 35282 + }, + { + "epoch": 96.13896457765668, + "grad_norm": 1.6097041368484497, + "learning_rate": 7.808504122976624e-08, + "loss": 0.0233, + "step": 35283 + }, + { + "epoch": 96.141689373297, + "grad_norm": 4.050378799438477, + "learning_rate": 7.797501174861555e-08, + "loss": 0.1224, + "step": 35284 + }, + { + "epoch": 96.14441416893733, + "grad_norm": 2.521028518676758, + "learning_rate": 7.786505953987555e-08, + "loss": 0.056, + "step": 35285 + }, + { + "epoch": 96.14713896457765, + "grad_norm": 25.072004318237305, + "learning_rate": 7.775518460440223e-08, + "loss": 0.0674, + "step": 35286 + }, + { + "epoch": 96.14986376021798, + "grad_norm": 2.9250643253326416, + "learning_rate": 7.76453869430538e-08, + "loss": 0.0462, + "step": 35287 + }, + { + "epoch": 96.15258855585832, + "grad_norm": 2.3465731143951416, + "learning_rate": 7.753566655668287e-08, + "loss": 0.0944, + "step": 35288 + }, + { + "epoch": 96.15531335149863, + "grad_norm": 1.7991676330566406, + "learning_rate": 7.742602344614547e-08, + "loss": 0.0267, + "step": 35289 + }, + { + "epoch": 96.15803814713897, + "grad_norm": 3.252142906188965, + "learning_rate": 7.731645761229311e-08, + "loss": 0.0387, + "step": 35290 + }, + { + "epoch": 96.16076294277929, + "grad_norm": 2.0888664722442627, + "learning_rate": 7.72069690559829e-08, + "loss": 0.0694, + "step": 35291 + }, + { + "epoch": 96.16348773841962, + "grad_norm": 2.0460405349731445, + "learning_rate": 7.709755777806416e-08, + "loss": 0.0224, + "step": 35292 + }, + { + "epoch": 96.16621253405995, + "grad_norm": 3.1798970699310303, + "learning_rate": 7.698822377939063e-08, + "loss": 0.0712, + "step": 35293 + }, + { + "epoch": 96.16893732970027, + "grad_norm": 1.9900087118148804, + "learning_rate": 7.687896706081388e-08, + "loss": 0.0159, + "step": 35294 + }, + { + "epoch": 96.1716621253406, + "grad_norm": 1.9430514574050903, + "learning_rate": 7.676978762318321e-08, + "loss": 0.0301, + "step": 35295 + }, + { + "epoch": 96.17438692098092, + "grad_norm": 2.5412027835845947, + "learning_rate": 7.666068546735129e-08, + "loss": 0.0431, + "step": 35296 + }, + { + "epoch": 96.17711171662125, + "grad_norm": 2.8897788524627686, + "learning_rate": 7.655166059416519e-08, + "loss": 0.065, + "step": 35297 + }, + { + "epoch": 96.17983651226157, + "grad_norm": 2.243454694747925, + "learning_rate": 7.644271300447647e-08, + "loss": 0.0358, + "step": 35298 + }, + { + "epoch": 96.1825613079019, + "grad_norm": 2.231678009033203, + "learning_rate": 7.633384269913224e-08, + "loss": 0.034, + "step": 35299 + }, + { + "epoch": 96.18528610354224, + "grad_norm": 3.5967888832092285, + "learning_rate": 7.62250496789807e-08, + "loss": 0.1114, + "step": 35300 + }, + { + "epoch": 96.18801089918256, + "grad_norm": 2.564082384109497, + "learning_rate": 7.611633394487005e-08, + "loss": 0.1345, + "step": 35301 + }, + { + "epoch": 96.19073569482289, + "grad_norm": 2.419724941253662, + "learning_rate": 7.600769549764408e-08, + "loss": 0.0257, + "step": 35302 + }, + { + "epoch": 96.19346049046321, + "grad_norm": 2.611628770828247, + "learning_rate": 7.58991343381521e-08, + "loss": 0.028, + "step": 35303 + }, + { + "epoch": 96.19618528610354, + "grad_norm": 2.4860422611236572, + "learning_rate": 7.579065046723789e-08, + "loss": 0.0453, + "step": 35304 + }, + { + "epoch": 96.19891008174388, + "grad_norm": 2.565809965133667, + "learning_rate": 7.56822438857463e-08, + "loss": 0.102, + "step": 35305 + }, + { + "epoch": 96.2016348773842, + "grad_norm": 1.5890276432037354, + "learning_rate": 7.557391459452224e-08, + "loss": 0.0161, + "step": 35306 + }, + { + "epoch": 96.20435967302453, + "grad_norm": 4.1379923820495605, + "learning_rate": 7.546566259440946e-08, + "loss": 0.0432, + "step": 35307 + }, + { + "epoch": 96.20708446866485, + "grad_norm": 4.850417137145996, + "learning_rate": 7.535748788625064e-08, + "loss": 0.0348, + "step": 35308 + }, + { + "epoch": 96.20980926430518, + "grad_norm": 2.616990327835083, + "learning_rate": 7.524939047088842e-08, + "loss": 0.0663, + "step": 35309 + }, + { + "epoch": 96.2125340599455, + "grad_norm": 2.0257766246795654, + "learning_rate": 7.514137034916325e-08, + "loss": 0.1266, + "step": 35310 + }, + { + "epoch": 96.21525885558583, + "grad_norm": 2.8868000507354736, + "learning_rate": 7.503342752191889e-08, + "loss": 0.0744, + "step": 35311 + }, + { + "epoch": 96.21798365122616, + "grad_norm": 2.598789691925049, + "learning_rate": 7.492556198999468e-08, + "loss": 0.0324, + "step": 35312 + }, + { + "epoch": 96.22070844686648, + "grad_norm": 2.572842836380005, + "learning_rate": 7.481777375423105e-08, + "loss": 0.0398, + "step": 35313 + }, + { + "epoch": 96.22343324250681, + "grad_norm": 1.9657859802246094, + "learning_rate": 7.471006281546622e-08, + "loss": 0.0192, + "step": 35314 + }, + { + "epoch": 96.22615803814713, + "grad_norm": 2.165194034576416, + "learning_rate": 7.460242917453952e-08, + "loss": 0.0241, + "step": 35315 + }, + { + "epoch": 96.22888283378747, + "grad_norm": 3.8123340606689453, + "learning_rate": 7.44948728322914e-08, + "loss": 0.0253, + "step": 35316 + }, + { + "epoch": 96.2316076294278, + "grad_norm": 1.8331133127212524, + "learning_rate": 7.438739378955673e-08, + "loss": 0.0222, + "step": 35317 + }, + { + "epoch": 96.23433242506812, + "grad_norm": 3.504307508468628, + "learning_rate": 7.427999204717374e-08, + "loss": 0.1221, + "step": 35318 + }, + { + "epoch": 96.23705722070845, + "grad_norm": 4.067674160003662, + "learning_rate": 7.417266760597842e-08, + "loss": 0.0374, + "step": 35319 + }, + { + "epoch": 96.23978201634877, + "grad_norm": 2.9613125324249268, + "learning_rate": 7.406542046680787e-08, + "loss": 0.0277, + "step": 35320 + }, + { + "epoch": 96.2425068119891, + "grad_norm": 2.0485403537750244, + "learning_rate": 7.395825063049588e-08, + "loss": 0.0232, + "step": 35321 + }, + { + "epoch": 96.24523160762942, + "grad_norm": 2.219895124435425, + "learning_rate": 7.385115809787624e-08, + "loss": 0.0524, + "step": 35322 + }, + { + "epoch": 96.24795640326975, + "grad_norm": 4.913880825042725, + "learning_rate": 7.374414286978604e-08, + "loss": 0.0499, + "step": 35323 + }, + { + "epoch": 96.25068119891009, + "grad_norm": 3.1046810150146484, + "learning_rate": 7.363720494705684e-08, + "loss": 0.1162, + "step": 35324 + }, + { + "epoch": 96.2534059945504, + "grad_norm": 5.151793003082275, + "learning_rate": 7.353034433052131e-08, + "loss": 0.0428, + "step": 35325 + }, + { + "epoch": 96.25613079019074, + "grad_norm": 2.6411540508270264, + "learning_rate": 7.3423561021011e-08, + "loss": 0.1316, + "step": 35326 + }, + { + "epoch": 96.25885558583106, + "grad_norm": 3.530471086502075, + "learning_rate": 7.33168550193597e-08, + "loss": 0.0793, + "step": 35327 + }, + { + "epoch": 96.26158038147139, + "grad_norm": 2.105945110321045, + "learning_rate": 7.321022632639674e-08, + "loss": 0.0338, + "step": 35328 + }, + { + "epoch": 96.26430517711172, + "grad_norm": 2.030118465423584, + "learning_rate": 7.310367494295367e-08, + "loss": 0.037, + "step": 35329 + }, + { + "epoch": 96.26702997275204, + "grad_norm": 2.513051748275757, + "learning_rate": 7.299720086985872e-08, + "loss": 0.0529, + "step": 35330 + }, + { + "epoch": 96.26975476839237, + "grad_norm": 3.9353020191192627, + "learning_rate": 7.289080410794236e-08, + "loss": 0.0363, + "step": 35331 + }, + { + "epoch": 96.2724795640327, + "grad_norm": 2.9553170204162598, + "learning_rate": 7.27844846580339e-08, + "loss": 0.0526, + "step": 35332 + }, + { + "epoch": 96.27520435967303, + "grad_norm": 2.5372941493988037, + "learning_rate": 7.267824252095823e-08, + "loss": 0.0749, + "step": 35333 + }, + { + "epoch": 96.27792915531334, + "grad_norm": 3.0864951610565186, + "learning_rate": 7.257207769754693e-08, + "loss": 0.058, + "step": 35334 + }, + { + "epoch": 96.28065395095368, + "grad_norm": 2.306518077850342, + "learning_rate": 7.246599018862377e-08, + "loss": 0.1582, + "step": 35335 + }, + { + "epoch": 96.28337874659401, + "grad_norm": 2.6885318756103516, + "learning_rate": 7.235997999501587e-08, + "loss": 0.0749, + "step": 35336 + }, + { + "epoch": 96.28610354223433, + "grad_norm": 1.9896204471588135, + "learning_rate": 7.225404711755035e-08, + "loss": 0.0355, + "step": 35337 + }, + { + "epoch": 96.28882833787466, + "grad_norm": 2.0738072395324707, + "learning_rate": 7.214819155704878e-08, + "loss": 0.1249, + "step": 35338 + }, + { + "epoch": 96.29155313351498, + "grad_norm": 2.042652130126953, + "learning_rate": 7.204241331433936e-08, + "loss": 0.0216, + "step": 35339 + }, + { + "epoch": 96.29427792915531, + "grad_norm": 2.8200011253356934, + "learning_rate": 7.193671239024258e-08, + "loss": 0.0403, + "step": 35340 + }, + { + "epoch": 96.29700272479565, + "grad_norm": 1.7782176733016968, + "learning_rate": 7.183108878558443e-08, + "loss": 0.0862, + "step": 35341 + }, + { + "epoch": 96.29972752043597, + "grad_norm": 4.042399883270264, + "learning_rate": 7.172554250118535e-08, + "loss": 0.0868, + "step": 35342 + }, + { + "epoch": 96.3024523160763, + "grad_norm": 2.733473300933838, + "learning_rate": 7.162007353786915e-08, + "loss": 0.0798, + "step": 35343 + }, + { + "epoch": 96.30517711171662, + "grad_norm": 1.9620474576950073, + "learning_rate": 7.151468189645516e-08, + "loss": 0.0238, + "step": 35344 + }, + { + "epoch": 96.30790190735695, + "grad_norm": 3.0320639610290527, + "learning_rate": 7.140936757776607e-08, + "loss": 0.0498, + "step": 35345 + }, + { + "epoch": 96.31062670299727, + "grad_norm": 2.256063938140869, + "learning_rate": 7.13041305826201e-08, + "loss": 0.0794, + "step": 35346 + }, + { + "epoch": 96.3133514986376, + "grad_norm": 1.9673376083374023, + "learning_rate": 7.119897091183991e-08, + "loss": 0.0254, + "step": 35347 + }, + { + "epoch": 96.31607629427793, + "grad_norm": 3.04085373878479, + "learning_rate": 7.109388856624156e-08, + "loss": 0.0749, + "step": 35348 + }, + { + "epoch": 96.31880108991825, + "grad_norm": 2.1095919609069824, + "learning_rate": 7.098888354664435e-08, + "loss": 0.0812, + "step": 35349 + }, + { + "epoch": 96.32152588555859, + "grad_norm": 1.6618585586547852, + "learning_rate": 7.088395585386543e-08, + "loss": 0.0288, + "step": 35350 + }, + { + "epoch": 96.3242506811989, + "grad_norm": 3.0538253784179688, + "learning_rate": 7.077910548872303e-08, + "loss": 0.1133, + "step": 35351 + }, + { + "epoch": 96.32697547683924, + "grad_norm": 3.3978896141052246, + "learning_rate": 7.067433245203426e-08, + "loss": 0.0589, + "step": 35352 + }, + { + "epoch": 96.32970027247957, + "grad_norm": 4.375565528869629, + "learning_rate": 7.056963674461403e-08, + "loss": 0.0765, + "step": 35353 + }, + { + "epoch": 96.33242506811989, + "grad_norm": 5.209430694580078, + "learning_rate": 7.046501836727837e-08, + "loss": 0.0795, + "step": 35354 + }, + { + "epoch": 96.33514986376022, + "grad_norm": 2.466344118118286, + "learning_rate": 7.036047732083995e-08, + "loss": 0.0344, + "step": 35355 + }, + { + "epoch": 96.33787465940054, + "grad_norm": 2.28086519241333, + "learning_rate": 7.025601360611589e-08, + "loss": 0.0393, + "step": 35356 + }, + { + "epoch": 96.34059945504087, + "grad_norm": 1.84520423412323, + "learning_rate": 7.015162722391777e-08, + "loss": 0.0205, + "step": 35357 + }, + { + "epoch": 96.34332425068119, + "grad_norm": 2.9149668216705322, + "learning_rate": 7.004731817505939e-08, + "loss": 0.0349, + "step": 35358 + }, + { + "epoch": 96.34604904632153, + "grad_norm": 2.657827854156494, + "learning_rate": 6.994308646035342e-08, + "loss": 0.0487, + "step": 35359 + }, + { + "epoch": 96.34877384196186, + "grad_norm": 2.733856678009033, + "learning_rate": 6.983893208061032e-08, + "loss": 0.0278, + "step": 35360 + }, + { + "epoch": 96.35149863760218, + "grad_norm": 4.0479631423950195, + "learning_rate": 6.973485503664279e-08, + "loss": 0.1143, + "step": 35361 + }, + { + "epoch": 96.35422343324251, + "grad_norm": 1.9658021926879883, + "learning_rate": 6.963085532925906e-08, + "loss": 0.0263, + "step": 35362 + }, + { + "epoch": 96.35694822888283, + "grad_norm": 3.4346835613250732, + "learning_rate": 6.952693295927182e-08, + "loss": 0.0487, + "step": 35363 + }, + { + "epoch": 96.35967302452316, + "grad_norm": 2.051133394241333, + "learning_rate": 6.942308792748931e-08, + "loss": 0.0518, + "step": 35364 + }, + { + "epoch": 96.3623978201635, + "grad_norm": 2.170633316040039, + "learning_rate": 6.931932023471976e-08, + "loss": 0.0521, + "step": 35365 + }, + { + "epoch": 96.36512261580381, + "grad_norm": 2.4649534225463867, + "learning_rate": 6.921562988177144e-08, + "loss": 0.183, + "step": 35366 + }, + { + "epoch": 96.36784741144415, + "grad_norm": 2.149437427520752, + "learning_rate": 6.911201686945257e-08, + "loss": 0.0513, + "step": 35367 + }, + { + "epoch": 96.37057220708446, + "grad_norm": 2.6818723678588867, + "learning_rate": 6.90084811985703e-08, + "loss": 0.1554, + "step": 35368 + }, + { + "epoch": 96.3732970027248, + "grad_norm": 3.1670899391174316, + "learning_rate": 6.89050228699295e-08, + "loss": 0.0385, + "step": 35369 + }, + { + "epoch": 96.37602179836512, + "grad_norm": 2.5463054180145264, + "learning_rate": 6.880164188433735e-08, + "loss": 0.0399, + "step": 35370 + }, + { + "epoch": 96.37874659400545, + "grad_norm": 2.164754867553711, + "learning_rate": 6.869833824259764e-08, + "loss": 0.0319, + "step": 35371 + }, + { + "epoch": 96.38147138964578, + "grad_norm": 5.0746073722839355, + "learning_rate": 6.859511194551637e-08, + "loss": 0.2198, + "step": 35372 + }, + { + "epoch": 96.3841961852861, + "grad_norm": 3.267862319946289, + "learning_rate": 6.849196299389627e-08, + "loss": 0.024, + "step": 35373 + }, + { + "epoch": 96.38692098092643, + "grad_norm": 6.8015265464782715, + "learning_rate": 6.838889138854221e-08, + "loss": 0.0558, + "step": 35374 + }, + { + "epoch": 96.38964577656675, + "grad_norm": 2.5740325450897217, + "learning_rate": 6.828589713025358e-08, + "loss": 0.0218, + "step": 35375 + }, + { + "epoch": 96.39237057220708, + "grad_norm": 1.7000741958618164, + "learning_rate": 6.818298021983638e-08, + "loss": 0.0205, + "step": 35376 + }, + { + "epoch": 96.39509536784742, + "grad_norm": 2.4573564529418945, + "learning_rate": 6.808014065808998e-08, + "loss": 0.0443, + "step": 35377 + }, + { + "epoch": 96.39782016348774, + "grad_norm": 2.234182834625244, + "learning_rate": 6.797737844581709e-08, + "loss": 0.0831, + "step": 35378 + }, + { + "epoch": 96.40054495912807, + "grad_norm": 4.208703994750977, + "learning_rate": 6.787469358381483e-08, + "loss": 0.0444, + "step": 35379 + }, + { + "epoch": 96.40326975476839, + "grad_norm": 2.4536097049713135, + "learning_rate": 6.777208607288588e-08, + "loss": 0.0255, + "step": 35380 + }, + { + "epoch": 96.40599455040872, + "grad_norm": 2.6513986587524414, + "learning_rate": 6.76695559138274e-08, + "loss": 0.0863, + "step": 35381 + }, + { + "epoch": 96.40871934604904, + "grad_norm": 2.6731977462768555, + "learning_rate": 6.756710310743875e-08, + "loss": 0.0499, + "step": 35382 + }, + { + "epoch": 96.41144414168937, + "grad_norm": 2.5571868419647217, + "learning_rate": 6.746472765451928e-08, + "loss": 0.0251, + "step": 35383 + }, + { + "epoch": 96.4141689373297, + "grad_norm": 3.7371065616607666, + "learning_rate": 6.73624295558628e-08, + "loss": 0.0735, + "step": 35384 + }, + { + "epoch": 96.41689373297002, + "grad_norm": 1.3535984754562378, + "learning_rate": 6.72602088122698e-08, + "loss": 0.0155, + "step": 35385 + }, + { + "epoch": 96.41961852861036, + "grad_norm": 2.044111490249634, + "learning_rate": 6.715806542453407e-08, + "loss": 0.1439, + "step": 35386 + }, + { + "epoch": 96.42234332425068, + "grad_norm": 3.4099745750427246, + "learning_rate": 6.705599939345053e-08, + "loss": 0.0619, + "step": 35387 + }, + { + "epoch": 96.42506811989101, + "grad_norm": 2.2722225189208984, + "learning_rate": 6.695401071981633e-08, + "loss": 0.0918, + "step": 35388 + }, + { + "epoch": 96.42779291553134, + "grad_norm": 2.1422479152679443, + "learning_rate": 6.685209940442527e-08, + "loss": 0.0219, + "step": 35389 + }, + { + "epoch": 96.43051771117166, + "grad_norm": 2.9350244998931885, + "learning_rate": 6.675026544806895e-08, + "loss": 0.0816, + "step": 35390 + }, + { + "epoch": 96.433242506812, + "grad_norm": 2.466939926147461, + "learning_rate": 6.664850885154228e-08, + "loss": 0.0415, + "step": 35391 + }, + { + "epoch": 96.43596730245231, + "grad_norm": 3.0898635387420654, + "learning_rate": 6.654682961563797e-08, + "loss": 0.0723, + "step": 35392 + }, + { + "epoch": 96.43869209809264, + "grad_norm": 3.9820556640625, + "learning_rate": 6.644522774114648e-08, + "loss": 0.0964, + "step": 35393 + }, + { + "epoch": 96.44141689373296, + "grad_norm": 2.8883168697357178, + "learning_rate": 6.634370322886052e-08, + "loss": 0.04, + "step": 35394 + }, + { + "epoch": 96.4441416893733, + "grad_norm": 1.9567556381225586, + "learning_rate": 6.624225607956946e-08, + "loss": 0.0275, + "step": 35395 + }, + { + "epoch": 96.44686648501363, + "grad_norm": 1.7626467943191528, + "learning_rate": 6.614088629406379e-08, + "loss": 0.057, + "step": 35396 + }, + { + "epoch": 96.44959128065395, + "grad_norm": 1.9004507064819336, + "learning_rate": 6.603959387313397e-08, + "loss": 0.019, + "step": 35397 + }, + { + "epoch": 96.45231607629428, + "grad_norm": 2.021732807159424, + "learning_rate": 6.593837881756826e-08, + "loss": 0.0312, + "step": 35398 + }, + { + "epoch": 96.4550408719346, + "grad_norm": 2.7149088382720947, + "learning_rate": 6.583724112815382e-08, + "loss": 0.0346, + "step": 35399 + }, + { + "epoch": 96.45776566757493, + "grad_norm": 2.1930859088897705, + "learning_rate": 6.57361808056789e-08, + "loss": 0.034, + "step": 35400 + }, + { + "epoch": 96.46049046321527, + "grad_norm": 2.3776214122772217, + "learning_rate": 6.563519785093175e-08, + "loss": 0.0262, + "step": 35401 + }, + { + "epoch": 96.46321525885558, + "grad_norm": 3.6150803565979004, + "learning_rate": 6.553429226469732e-08, + "loss": 0.1215, + "step": 35402 + }, + { + "epoch": 96.46594005449592, + "grad_norm": 2.461015462875366, + "learning_rate": 6.543346404776274e-08, + "loss": 0.113, + "step": 35403 + }, + { + "epoch": 96.46866485013624, + "grad_norm": 2.3507983684539795, + "learning_rate": 6.533271320091183e-08, + "loss": 0.1221, + "step": 35404 + }, + { + "epoch": 96.47138964577657, + "grad_norm": 1.8498133420944214, + "learning_rate": 6.523203972493064e-08, + "loss": 0.0516, + "step": 35405 + }, + { + "epoch": 96.47411444141689, + "grad_norm": 5.818890571594238, + "learning_rate": 6.513144362060297e-08, + "loss": 0.0639, + "step": 35406 + }, + { + "epoch": 96.47683923705722, + "grad_norm": 1.764113426208496, + "learning_rate": 6.503092488871043e-08, + "loss": 0.0298, + "step": 35407 + }, + { + "epoch": 96.47956403269755, + "grad_norm": 3.480236053466797, + "learning_rate": 6.493048353003905e-08, + "loss": 0.0312, + "step": 35408 + }, + { + "epoch": 96.48228882833787, + "grad_norm": 3.6187903881073, + "learning_rate": 6.483011954536823e-08, + "loss": 0.0556, + "step": 35409 + }, + { + "epoch": 96.4850136239782, + "grad_norm": 2.8983848094940186, + "learning_rate": 6.472983293548063e-08, + "loss": 0.1239, + "step": 35410 + }, + { + "epoch": 96.48773841961852, + "grad_norm": 3.3406033515930176, + "learning_rate": 6.462962370115789e-08, + "loss": 0.0551, + "step": 35411 + }, + { + "epoch": 96.49046321525886, + "grad_norm": 2.954235315322876, + "learning_rate": 6.452949184317936e-08, + "loss": 0.0333, + "step": 35412 + }, + { + "epoch": 96.49318801089919, + "grad_norm": 3.331435203552246, + "learning_rate": 6.442943736232554e-08, + "loss": 0.0497, + "step": 35413 + }, + { + "epoch": 96.49591280653951, + "grad_norm": 2.757610559463501, + "learning_rate": 6.43294602593758e-08, + "loss": 0.0432, + "step": 35414 + }, + { + "epoch": 96.49863760217984, + "grad_norm": 1.955291748046875, + "learning_rate": 6.422956053510842e-08, + "loss": 0.0197, + "step": 35415 + }, + { + "epoch": 96.50136239782016, + "grad_norm": 2.445478916168213, + "learning_rate": 6.412973819030054e-08, + "loss": 0.0226, + "step": 35416 + }, + { + "epoch": 96.50408719346049, + "grad_norm": 1.7992150783538818, + "learning_rate": 6.402999322573155e-08, + "loss": 0.0188, + "step": 35417 + }, + { + "epoch": 96.50681198910081, + "grad_norm": 3.279829978942871, + "learning_rate": 6.393032564217749e-08, + "loss": 0.1837, + "step": 35418 + }, + { + "epoch": 96.50953678474114, + "grad_norm": 2.0962960720062256, + "learning_rate": 6.383073544041329e-08, + "loss": 0.0301, + "step": 35419 + }, + { + "epoch": 96.51226158038148, + "grad_norm": 3.2004408836364746, + "learning_rate": 6.373122262121501e-08, + "loss": 0.0788, + "step": 35420 + }, + { + "epoch": 96.5149863760218, + "grad_norm": 2.7900593280792236, + "learning_rate": 6.363178718535867e-08, + "loss": 0.0304, + "step": 35421 + }, + { + "epoch": 96.51771117166213, + "grad_norm": 2.743136405944824, + "learning_rate": 6.353242913361923e-08, + "loss": 0.0356, + "step": 35422 + }, + { + "epoch": 96.52043596730245, + "grad_norm": 2.221099376678467, + "learning_rate": 6.34331484667683e-08, + "loss": 0.0544, + "step": 35423 + }, + { + "epoch": 96.52316076294278, + "grad_norm": 2.3044931888580322, + "learning_rate": 6.333394518558078e-08, + "loss": 0.0294, + "step": 35424 + }, + { + "epoch": 96.52588555858311, + "grad_norm": 1.9390853643417358, + "learning_rate": 6.323481929082831e-08, + "loss": 0.0161, + "step": 35425 + }, + { + "epoch": 96.52861035422343, + "grad_norm": 2.6898579597473145, + "learning_rate": 6.313577078328358e-08, + "loss": 0.0737, + "step": 35426 + }, + { + "epoch": 96.53133514986376, + "grad_norm": 2.4154839515686035, + "learning_rate": 6.303679966371712e-08, + "loss": 0.0497, + "step": 35427 + }, + { + "epoch": 96.53405994550408, + "grad_norm": 2.372375249862671, + "learning_rate": 6.29379059329005e-08, + "loss": 0.0916, + "step": 35428 + }, + { + "epoch": 96.53678474114442, + "grad_norm": 1.3991450071334839, + "learning_rate": 6.283908959160424e-08, + "loss": 0.1319, + "step": 35429 + }, + { + "epoch": 96.53950953678473, + "grad_norm": 2.4112188816070557, + "learning_rate": 6.274035064059658e-08, + "loss": 0.0329, + "step": 35430 + }, + { + "epoch": 96.54223433242507, + "grad_norm": 2.5971317291259766, + "learning_rate": 6.264168908064694e-08, + "loss": 0.1263, + "step": 35431 + }, + { + "epoch": 96.5449591280654, + "grad_norm": 2.3224124908447266, + "learning_rate": 6.254310491252469e-08, + "loss": 0.0701, + "step": 35432 + }, + { + "epoch": 96.54768392370572, + "grad_norm": 1.5080344676971436, + "learning_rate": 6.244459813699699e-08, + "loss": 0.0801, + "step": 35433 + }, + { + "epoch": 96.55040871934605, + "grad_norm": 2.822840452194214, + "learning_rate": 6.234616875483101e-08, + "loss": 0.0414, + "step": 35434 + }, + { + "epoch": 96.55313351498637, + "grad_norm": 3.74899959564209, + "learning_rate": 6.224781676679281e-08, + "loss": 0.0468, + "step": 35435 + }, + { + "epoch": 96.5558583106267, + "grad_norm": 3.728947162628174, + "learning_rate": 6.214954217364844e-08, + "loss": 0.1173, + "step": 35436 + }, + { + "epoch": 96.55858310626704, + "grad_norm": 2.3255670070648193, + "learning_rate": 6.205134497616394e-08, + "loss": 0.0326, + "step": 35437 + }, + { + "epoch": 96.56130790190736, + "grad_norm": 3.693643808364868, + "learning_rate": 6.195322517510427e-08, + "loss": 0.0522, + "step": 35438 + }, + { + "epoch": 96.56403269754769, + "grad_norm": 2.8127853870391846, + "learning_rate": 6.185518277123215e-08, + "loss": 0.0293, + "step": 35439 + }, + { + "epoch": 96.566757493188, + "grad_norm": 2.7797751426696777, + "learning_rate": 6.175721776531251e-08, + "loss": 0.0236, + "step": 35440 + }, + { + "epoch": 96.56948228882834, + "grad_norm": 2.783245325088501, + "learning_rate": 6.16593301581081e-08, + "loss": 0.1711, + "step": 35441 + }, + { + "epoch": 96.57220708446866, + "grad_norm": 3.790992021560669, + "learning_rate": 6.156151995038052e-08, + "loss": 0.0772, + "step": 35442 + }, + { + "epoch": 96.57493188010899, + "grad_norm": 2.600486993789673, + "learning_rate": 6.146378714289136e-08, + "loss": 0.2184, + "step": 35443 + }, + { + "epoch": 96.57765667574932, + "grad_norm": 3.12739634513855, + "learning_rate": 6.136613173640338e-08, + "loss": 0.0754, + "step": 35444 + }, + { + "epoch": 96.58038147138964, + "grad_norm": 2.153390645980835, + "learning_rate": 6.126855373167595e-08, + "loss": 0.0289, + "step": 35445 + }, + { + "epoch": 96.58310626702998, + "grad_norm": 3.036858320236206, + "learning_rate": 6.117105312946848e-08, + "loss": 0.0783, + "step": 35446 + }, + { + "epoch": 96.5858310626703, + "grad_norm": 2.371133804321289, + "learning_rate": 6.107362993054145e-08, + "loss": 0.0245, + "step": 35447 + }, + { + "epoch": 96.58855585831063, + "grad_norm": 3.0209193229675293, + "learning_rate": 6.097628413565315e-08, + "loss": 0.1349, + "step": 35448 + }, + { + "epoch": 96.59128065395096, + "grad_norm": 2.7885658740997314, + "learning_rate": 6.087901574556188e-08, + "loss": 0.022, + "step": 35449 + }, + { + "epoch": 96.59400544959128, + "grad_norm": 2.07749342918396, + "learning_rate": 6.078182476102479e-08, + "loss": 0.0191, + "step": 35450 + }, + { + "epoch": 96.59673024523161, + "grad_norm": 2.2811388969421387, + "learning_rate": 6.068471118279796e-08, + "loss": 0.0646, + "step": 35451 + }, + { + "epoch": 96.59945504087193, + "grad_norm": 2.1365513801574707, + "learning_rate": 6.058767501163965e-08, + "loss": 0.0244, + "step": 35452 + }, + { + "epoch": 96.60217983651226, + "grad_norm": 2.067659616470337, + "learning_rate": 6.049071624830371e-08, + "loss": 0.1074, + "step": 35453 + }, + { + "epoch": 96.60490463215258, + "grad_norm": 2.351426601409912, + "learning_rate": 6.039383489354734e-08, + "loss": 0.0185, + "step": 35454 + }, + { + "epoch": 96.60762942779292, + "grad_norm": 2.4213521480560303, + "learning_rate": 6.029703094812433e-08, + "loss": 0.0826, + "step": 35455 + }, + { + "epoch": 96.61035422343325, + "grad_norm": 2.7885429859161377, + "learning_rate": 6.020030441278635e-08, + "loss": 0.1608, + "step": 35456 + }, + { + "epoch": 96.61307901907357, + "grad_norm": 2.439114570617676, + "learning_rate": 6.010365528828944e-08, + "loss": 0.0383, + "step": 35457 + }, + { + "epoch": 96.6158038147139, + "grad_norm": 2.6008098125457764, + "learning_rate": 6.00070835753852e-08, + "loss": 0.0593, + "step": 35458 + }, + { + "epoch": 96.61852861035422, + "grad_norm": 1.9538836479187012, + "learning_rate": 5.991058927482641e-08, + "loss": 0.0721, + "step": 35459 + }, + { + "epoch": 96.62125340599455, + "grad_norm": 2.3058667182922363, + "learning_rate": 5.981417238736353e-08, + "loss": 0.0708, + "step": 35460 + }, + { + "epoch": 96.62397820163488, + "grad_norm": 3.0144667625427246, + "learning_rate": 5.971783291374822e-08, + "loss": 0.0875, + "step": 35461 + }, + { + "epoch": 96.6267029972752, + "grad_norm": 1.9830503463745117, + "learning_rate": 5.962157085473097e-08, + "loss": 0.0986, + "step": 35462 + }, + { + "epoch": 96.62942779291554, + "grad_norm": 4.235957622528076, + "learning_rate": 5.952538621106008e-08, + "loss": 0.1544, + "step": 35463 + }, + { + "epoch": 96.63215258855585, + "grad_norm": 2.2204272747039795, + "learning_rate": 5.942927898348494e-08, + "loss": 0.0731, + "step": 35464 + }, + { + "epoch": 96.63487738419619, + "grad_norm": 2.223872184753418, + "learning_rate": 5.933324917275607e-08, + "loss": 0.0343, + "step": 35465 + }, + { + "epoch": 96.6376021798365, + "grad_norm": 2.088108539581299, + "learning_rate": 5.923729677961954e-08, + "loss": 0.0281, + "step": 35466 + }, + { + "epoch": 96.64032697547684, + "grad_norm": 2.085111141204834, + "learning_rate": 5.914142180482252e-08, + "loss": 0.0408, + "step": 35467 + }, + { + "epoch": 96.64305177111717, + "grad_norm": 3.047095775604248, + "learning_rate": 5.90456242491122e-08, + "loss": 0.0477, + "step": 35468 + }, + { + "epoch": 96.64577656675749, + "grad_norm": 2.2496964931488037, + "learning_rate": 5.8949904113235756e-08, + "loss": 0.0954, + "step": 35469 + }, + { + "epoch": 96.64850136239782, + "grad_norm": 3.0736424922943115, + "learning_rate": 5.885426139793593e-08, + "loss": 0.1502, + "step": 35470 + }, + { + "epoch": 96.65122615803814, + "grad_norm": 8.928645133972168, + "learning_rate": 5.87586961039599e-08, + "loss": 0.1033, + "step": 35471 + }, + { + "epoch": 96.65395095367847, + "grad_norm": 1.8662821054458618, + "learning_rate": 5.866320823205152e-08, + "loss": 0.0277, + "step": 35472 + }, + { + "epoch": 96.65667574931881, + "grad_norm": 3.231903553009033, + "learning_rate": 5.856779778295352e-08, + "loss": 0.0707, + "step": 35473 + }, + { + "epoch": 96.65940054495913, + "grad_norm": 2.469789505004883, + "learning_rate": 5.847246475740975e-08, + "loss": 0.0566, + "step": 35474 + }, + { + "epoch": 96.66212534059946, + "grad_norm": 2.4956843852996826, + "learning_rate": 5.837720915616296e-08, + "loss": 0.0863, + "step": 35475 + }, + { + "epoch": 96.66485013623978, + "grad_norm": 3.3892629146575928, + "learning_rate": 5.828203097995366e-08, + "loss": 0.1029, + "step": 35476 + }, + { + "epoch": 96.66757493188011, + "grad_norm": 3.15836501121521, + "learning_rate": 5.8186930229524595e-08, + "loss": 0.1668, + "step": 35477 + }, + { + "epoch": 96.67029972752043, + "grad_norm": 4.306105136871338, + "learning_rate": 5.809190690561517e-08, + "loss": 0.0819, + "step": 35478 + }, + { + "epoch": 96.67302452316076, + "grad_norm": 2.091834306716919, + "learning_rate": 5.799696100896701e-08, + "loss": 0.0386, + "step": 35479 + }, + { + "epoch": 96.6757493188011, + "grad_norm": 1.1044886112213135, + "learning_rate": 5.790209254031731e-08, + "loss": 0.0143, + "step": 35480 + }, + { + "epoch": 96.67847411444141, + "grad_norm": 2.554041862487793, + "learning_rate": 5.780730150040659e-08, + "loss": 0.1086, + "step": 35481 + }, + { + "epoch": 96.68119891008175, + "grad_norm": 6.993478298187256, + "learning_rate": 5.7712587889973136e-08, + "loss": 0.1051, + "step": 35482 + }, + { + "epoch": 96.68392370572207, + "grad_norm": 2.266606569290161, + "learning_rate": 5.761795170975304e-08, + "loss": 0.0423, + "step": 35483 + }, + { + "epoch": 96.6866485013624, + "grad_norm": 2.4315783977508545, + "learning_rate": 5.752339296048459e-08, + "loss": 0.0336, + "step": 35484 + }, + { + "epoch": 96.68937329700273, + "grad_norm": 1.8120712041854858, + "learning_rate": 5.742891164290498e-08, + "loss": 0.0333, + "step": 35485 + }, + { + "epoch": 96.69209809264305, + "grad_norm": 1.5353174209594727, + "learning_rate": 5.733450775774807e-08, + "loss": 0.0256, + "step": 35486 + }, + { + "epoch": 96.69482288828338, + "grad_norm": 2.4484543800354004, + "learning_rate": 5.724018130574993e-08, + "loss": 0.0365, + "step": 35487 + }, + { + "epoch": 96.6975476839237, + "grad_norm": 4.073673725128174, + "learning_rate": 5.714593228764553e-08, + "loss": 0.0515, + "step": 35488 + }, + { + "epoch": 96.70027247956403, + "grad_norm": 2.161654472351074, + "learning_rate": 5.7051760704168734e-08, + "loss": 0.0338, + "step": 35489 + }, + { + "epoch": 96.70299727520435, + "grad_norm": 2.069058895111084, + "learning_rate": 5.695766655605228e-08, + "loss": 0.0229, + "step": 35490 + }, + { + "epoch": 96.70572207084469, + "grad_norm": 4.5033769607543945, + "learning_rate": 5.686364984403003e-08, + "loss": 0.0317, + "step": 35491 + }, + { + "epoch": 96.70844686648502, + "grad_norm": 1.8857495784759521, + "learning_rate": 5.676971056883362e-08, + "loss": 0.1158, + "step": 35492 + }, + { + "epoch": 96.71117166212534, + "grad_norm": 2.522603988647461, + "learning_rate": 5.6675848731194695e-08, + "loss": 0.0276, + "step": 35493 + }, + { + "epoch": 96.71389645776567, + "grad_norm": 3.187896251678467, + "learning_rate": 5.658206433184377e-08, + "loss": 0.03, + "step": 35494 + }, + { + "epoch": 96.71662125340599, + "grad_norm": 2.375319242477417, + "learning_rate": 5.648835737151248e-08, + "loss": 0.0637, + "step": 35495 + }, + { + "epoch": 96.71934604904632, + "grad_norm": 2.4035370349884033, + "learning_rate": 5.6394727850929145e-08, + "loss": 0.0502, + "step": 35496 + }, + { + "epoch": 96.72207084468666, + "grad_norm": 2.127671957015991, + "learning_rate": 5.6301175770824277e-08, + "loss": 0.0391, + "step": 35497 + }, + { + "epoch": 96.72479564032697, + "grad_norm": 2.6739914417266846, + "learning_rate": 5.620770113192509e-08, + "loss": 0.0335, + "step": 35498 + }, + { + "epoch": 96.7275204359673, + "grad_norm": 2.37778902053833, + "learning_rate": 5.611430393496098e-08, + "loss": 0.0531, + "step": 35499 + }, + { + "epoch": 96.73024523160763, + "grad_norm": 2.3967061042785645, + "learning_rate": 5.602098418065804e-08, + "loss": 0.0332, + "step": 35500 + }, + { + "epoch": 96.73297002724796, + "grad_norm": 2.5274176597595215, + "learning_rate": 5.592774186974348e-08, + "loss": 0.0214, + "step": 35501 + }, + { + "epoch": 96.73569482288828, + "grad_norm": 2.33677077293396, + "learning_rate": 5.5834577002944476e-08, + "loss": 0.0479, + "step": 35502 + }, + { + "epoch": 96.73841961852861, + "grad_norm": 1.8418856859207153, + "learning_rate": 5.574148958098491e-08, + "loss": 0.1129, + "step": 35503 + }, + { + "epoch": 96.74114441416894, + "grad_norm": 2.4903202056884766, + "learning_rate": 5.5648479604590856e-08, + "loss": 0.0392, + "step": 35504 + }, + { + "epoch": 96.74386920980926, + "grad_norm": 1.9814727306365967, + "learning_rate": 5.555554707448618e-08, + "loss": 0.0682, + "step": 35505 + }, + { + "epoch": 96.7465940054496, + "grad_norm": 1.7760999202728271, + "learning_rate": 5.5462691991395865e-08, + "loss": 0.0482, + "step": 35506 + }, + { + "epoch": 96.74931880108991, + "grad_norm": 2.503962516784668, + "learning_rate": 5.5369914356041556e-08, + "loss": 0.0947, + "step": 35507 + }, + { + "epoch": 96.75204359673025, + "grad_norm": 5.7593674659729, + "learning_rate": 5.527721416914489e-08, + "loss": 0.0524, + "step": 35508 + }, + { + "epoch": 96.75476839237058, + "grad_norm": 2.3444464206695557, + "learning_rate": 5.5184591431430845e-08, + "loss": 0.0279, + "step": 35509 + }, + { + "epoch": 96.7574931880109, + "grad_norm": 4.473971366882324, + "learning_rate": 5.5092046143618846e-08, + "loss": 0.1204, + "step": 35510 + }, + { + "epoch": 96.76021798365123, + "grad_norm": 2.6154189109802246, + "learning_rate": 5.4999578306429436e-08, + "loss": 0.0326, + "step": 35511 + }, + { + "epoch": 96.76294277929155, + "grad_norm": 2.3137433528900146, + "learning_rate": 5.490718792058314e-08, + "loss": 0.1018, + "step": 35512 + }, + { + "epoch": 96.76566757493188, + "grad_norm": 1.6487475633621216, + "learning_rate": 5.4814874986800495e-08, + "loss": 0.0256, + "step": 35513 + }, + { + "epoch": 96.7683923705722, + "grad_norm": 2.6181390285491943, + "learning_rate": 5.4722639505798704e-08, + "loss": 0.0454, + "step": 35514 + }, + { + "epoch": 96.77111716621253, + "grad_norm": 2.4293861389160156, + "learning_rate": 5.4630481478297196e-08, + "loss": 0.0397, + "step": 35515 + }, + { + "epoch": 96.77384196185287, + "grad_norm": 2.441007375717163, + "learning_rate": 5.453840090501317e-08, + "loss": 0.0512, + "step": 35516 + }, + { + "epoch": 96.77656675749319, + "grad_norm": 1.941656470298767, + "learning_rate": 5.4446397786664936e-08, + "loss": 0.1108, + "step": 35517 + }, + { + "epoch": 96.77929155313352, + "grad_norm": 3.0584681034088135, + "learning_rate": 5.43544721239675e-08, + "loss": 0.111, + "step": 35518 + }, + { + "epoch": 96.78201634877384, + "grad_norm": 2.185162305831909, + "learning_rate": 5.4262623917636925e-08, + "loss": 0.0354, + "step": 35519 + }, + { + "epoch": 96.78474114441417, + "grad_norm": 2.0862855911254883, + "learning_rate": 5.417085316838933e-08, + "loss": 0.0433, + "step": 35520 + }, + { + "epoch": 96.7874659400545, + "grad_norm": 2.384084463119507, + "learning_rate": 5.407915987693857e-08, + "loss": 0.0238, + "step": 35521 + }, + { + "epoch": 96.79019073569482, + "grad_norm": 2.707002639770508, + "learning_rate": 5.398754404399964e-08, + "loss": 0.0484, + "step": 35522 + }, + { + "epoch": 96.79291553133515, + "grad_norm": 2.577698230743408, + "learning_rate": 5.38960056702853e-08, + "loss": 0.101, + "step": 35523 + }, + { + "epoch": 96.79564032697547, + "grad_norm": 2.1527206897735596, + "learning_rate": 5.380454475650942e-08, + "loss": 0.0341, + "step": 35524 + }, + { + "epoch": 96.7983651226158, + "grad_norm": 2.3384931087493896, + "learning_rate": 5.371316130338255e-08, + "loss": 0.0854, + "step": 35525 + }, + { + "epoch": 96.80108991825612, + "grad_norm": 1.8126362562179565, + "learning_rate": 5.362185531161746e-08, + "loss": 0.0747, + "step": 35526 + }, + { + "epoch": 96.80381471389646, + "grad_norm": 2.0274250507354736, + "learning_rate": 5.353062678192689e-08, + "loss": 0.0655, + "step": 35527 + }, + { + "epoch": 96.80653950953679, + "grad_norm": 2.397373914718628, + "learning_rate": 5.343947571501806e-08, + "loss": 0.0363, + "step": 35528 + }, + { + "epoch": 96.80926430517711, + "grad_norm": 7.551501274108887, + "learning_rate": 5.334840211160264e-08, + "loss": 0.0401, + "step": 35529 + }, + { + "epoch": 96.81198910081744, + "grad_norm": 1.9004566669464111, + "learning_rate": 5.3257405972390043e-08, + "loss": 0.0318, + "step": 35530 + }, + { + "epoch": 96.81471389645776, + "grad_norm": 2.246920108795166, + "learning_rate": 5.316648729808971e-08, + "loss": 0.0643, + "step": 35531 + }, + { + "epoch": 96.8174386920981, + "grad_norm": 2.6450071334838867, + "learning_rate": 5.307564608940663e-08, + "loss": 0.0537, + "step": 35532 + }, + { + "epoch": 96.82016348773843, + "grad_norm": 1.4076768159866333, + "learning_rate": 5.2984882347051345e-08, + "loss": 0.0177, + "step": 35533 + }, + { + "epoch": 96.82288828337875, + "grad_norm": 2.5664820671081543, + "learning_rate": 5.2894196071729966e-08, + "loss": 0.0418, + "step": 35534 + }, + { + "epoch": 96.82561307901908, + "grad_norm": 2.4444258213043213, + "learning_rate": 5.280358726414858e-08, + "loss": 0.0339, + "step": 35535 + }, + { + "epoch": 96.8283378746594, + "grad_norm": 2.2147350311279297, + "learning_rate": 5.271305592501108e-08, + "loss": 0.0499, + "step": 35536 + }, + { + "epoch": 96.83106267029973, + "grad_norm": 2.550987958908081, + "learning_rate": 5.262260205502578e-08, + "loss": 0.0985, + "step": 35537 + }, + { + "epoch": 96.83378746594005, + "grad_norm": 2.4605648517608643, + "learning_rate": 5.253222565489546e-08, + "loss": 0.0767, + "step": 35538 + }, + { + "epoch": 96.83651226158038, + "grad_norm": 4.611190319061279, + "learning_rate": 5.244192672532289e-08, + "loss": 0.2291, + "step": 35539 + }, + { + "epoch": 96.83923705722071, + "grad_norm": 1.9465532302856445, + "learning_rate": 5.2351705267013055e-08, + "loss": 0.0579, + "step": 35540 + }, + { + "epoch": 96.84196185286103, + "grad_norm": 4.9753594398498535, + "learning_rate": 5.2261561280667614e-08, + "loss": 0.1049, + "step": 35541 + }, + { + "epoch": 96.84468664850137, + "grad_norm": 2.467731475830078, + "learning_rate": 5.217149476698935e-08, + "loss": 0.0849, + "step": 35542 + }, + { + "epoch": 96.84741144414168, + "grad_norm": 2.3039093017578125, + "learning_rate": 5.2081505726679916e-08, + "loss": 0.0316, + "step": 35543 + }, + { + "epoch": 96.85013623978202, + "grad_norm": 3.5640945434570312, + "learning_rate": 5.199159416043875e-08, + "loss": 0.0335, + "step": 35544 + }, + { + "epoch": 96.85286103542235, + "grad_norm": 2.324336290359497, + "learning_rate": 5.190176006896641e-08, + "loss": 0.0506, + "step": 35545 + }, + { + "epoch": 96.85558583106267, + "grad_norm": 2.183614492416382, + "learning_rate": 5.181200345296455e-08, + "loss": 0.0506, + "step": 35546 + }, + { + "epoch": 96.858310626703, + "grad_norm": 3.2237741947174072, + "learning_rate": 5.172232431312929e-08, + "loss": 0.03, + "step": 35547 + }, + { + "epoch": 96.86103542234332, + "grad_norm": 2.060969591140747, + "learning_rate": 5.163272265016117e-08, + "loss": 0.0541, + "step": 35548 + }, + { + "epoch": 96.86376021798365, + "grad_norm": 2.4621293544769287, + "learning_rate": 5.154319846475631e-08, + "loss": 0.023, + "step": 35549 + }, + { + "epoch": 96.86648501362397, + "grad_norm": 2.451321840286255, + "learning_rate": 5.1453751757614136e-08, + "loss": 0.0316, + "step": 35550 + }, + { + "epoch": 96.8692098092643, + "grad_norm": 1.8460115194320679, + "learning_rate": 5.1364382529428545e-08, + "loss": 0.0167, + "step": 35551 + }, + { + "epoch": 96.87193460490464, + "grad_norm": 3.7541723251342773, + "learning_rate": 5.1275090780897875e-08, + "loss": 0.0663, + "step": 35552 + }, + { + "epoch": 96.87465940054496, + "grad_norm": 2.6491284370422363, + "learning_rate": 5.1185876512716004e-08, + "loss": 0.0263, + "step": 35553 + }, + { + "epoch": 96.87738419618529, + "grad_norm": 2.2321131229400635, + "learning_rate": 5.109673972557905e-08, + "loss": 0.0197, + "step": 35554 + }, + { + "epoch": 96.88010899182561, + "grad_norm": 7.176581382751465, + "learning_rate": 5.1007680420179786e-08, + "loss": 0.0547, + "step": 35555 + }, + { + "epoch": 96.88283378746594, + "grad_norm": 2.114020586013794, + "learning_rate": 5.0918698597212104e-08, + "loss": 0.1361, + "step": 35556 + }, + { + "epoch": 96.88555858310627, + "grad_norm": 1.994983434677124, + "learning_rate": 5.082979425736989e-08, + "loss": 0.0905, + "step": 35557 + }, + { + "epoch": 96.88828337874659, + "grad_norm": 1.936752438545227, + "learning_rate": 5.074096740134593e-08, + "loss": 0.0306, + "step": 35558 + }, + { + "epoch": 96.89100817438693, + "grad_norm": 2.5228633880615234, + "learning_rate": 5.065221802983078e-08, + "loss": 0.0741, + "step": 35559 + }, + { + "epoch": 96.89373297002724, + "grad_norm": 1.7915103435516357, + "learning_rate": 5.0563546143515e-08, + "loss": 0.1433, + "step": 35560 + }, + { + "epoch": 96.89645776566758, + "grad_norm": 2.609074115753174, + "learning_rate": 5.047495174309025e-08, + "loss": 0.0458, + "step": 35561 + }, + { + "epoch": 96.8991825613079, + "grad_norm": 2.0458016395568848, + "learning_rate": 5.03864348292471e-08, + "loss": 0.022, + "step": 35562 + }, + { + "epoch": 96.90190735694823, + "grad_norm": 2.0826382637023926, + "learning_rate": 5.0297995402673884e-08, + "loss": 0.0388, + "step": 35563 + }, + { + "epoch": 96.90463215258856, + "grad_norm": 1.929991364479065, + "learning_rate": 5.0209633464060046e-08, + "loss": 0.0183, + "step": 35564 + }, + { + "epoch": 96.90735694822888, + "grad_norm": 2.0320088863372803, + "learning_rate": 5.0121349014091715e-08, + "loss": 0.1049, + "step": 35565 + }, + { + "epoch": 96.91008174386921, + "grad_norm": 16.922584533691406, + "learning_rate": 5.003314205345944e-08, + "loss": 0.0905, + "step": 35566 + }, + { + "epoch": 96.91280653950953, + "grad_norm": 2.336092710494995, + "learning_rate": 4.994501258284934e-08, + "loss": 0.1259, + "step": 35567 + }, + { + "epoch": 96.91553133514986, + "grad_norm": 1.9293670654296875, + "learning_rate": 4.985696060294642e-08, + "loss": 0.0248, + "step": 35568 + }, + { + "epoch": 96.9182561307902, + "grad_norm": 4.455367088317871, + "learning_rate": 4.9768986114436814e-08, + "loss": 0.1014, + "step": 35569 + }, + { + "epoch": 96.92098092643052, + "grad_norm": 3.27518630027771, + "learning_rate": 4.968108911800662e-08, + "loss": 0.0501, + "step": 35570 + }, + { + "epoch": 96.92370572207085, + "grad_norm": 3.5886731147766113, + "learning_rate": 4.9593269614339744e-08, + "loss": 0.0365, + "step": 35571 + }, + { + "epoch": 96.92643051771117, + "grad_norm": 2.05401611328125, + "learning_rate": 4.9505527604121194e-08, + "loss": 0.0264, + "step": 35572 + }, + { + "epoch": 96.9291553133515, + "grad_norm": 2.369694948196411, + "learning_rate": 4.941786308803154e-08, + "loss": 0.1041, + "step": 35573 + }, + { + "epoch": 96.93188010899182, + "grad_norm": 2.589430093765259, + "learning_rate": 4.933027606675689e-08, + "loss": 0.0654, + "step": 35574 + }, + { + "epoch": 96.93460490463215, + "grad_norm": 3.099961757659912, + "learning_rate": 4.924276654097671e-08, + "loss": 0.0288, + "step": 35575 + }, + { + "epoch": 96.93732970027249, + "grad_norm": 2.487401008605957, + "learning_rate": 4.9155334511373775e-08, + "loss": 0.1365, + "step": 35576 + }, + { + "epoch": 96.9400544959128, + "grad_norm": 3.020406723022461, + "learning_rate": 4.9067979978629776e-08, + "loss": 0.1856, + "step": 35577 + }, + { + "epoch": 96.94277929155314, + "grad_norm": 2.2442588806152344, + "learning_rate": 4.898070294342305e-08, + "loss": 0.0309, + "step": 35578 + }, + { + "epoch": 96.94550408719346, + "grad_norm": 3.3606913089752197, + "learning_rate": 4.8893503406435285e-08, + "loss": 0.046, + "step": 35579 + }, + { + "epoch": 96.94822888283379, + "grad_norm": 2.7061917781829834, + "learning_rate": 4.8806381368343705e-08, + "loss": 0.0324, + "step": 35580 + }, + { + "epoch": 96.95095367847412, + "grad_norm": 2.671208620071411, + "learning_rate": 4.8719336829827765e-08, + "loss": 0.0912, + "step": 35581 + }, + { + "epoch": 96.95367847411444, + "grad_norm": 2.5573370456695557, + "learning_rate": 4.8632369791565825e-08, + "loss": 0.0715, + "step": 35582 + }, + { + "epoch": 96.95640326975477, + "grad_norm": 2.2591705322265625, + "learning_rate": 4.854548025423511e-08, + "loss": 0.0418, + "step": 35583 + }, + { + "epoch": 96.95912806539509, + "grad_norm": 2.5224218368530273, + "learning_rate": 4.845866821851064e-08, + "loss": 0.0834, + "step": 35584 + }, + { + "epoch": 96.96185286103542, + "grad_norm": 3.1266067028045654, + "learning_rate": 4.837193368507076e-08, + "loss": 0.0334, + "step": 35585 + }, + { + "epoch": 96.96457765667574, + "grad_norm": 2.3245010375976562, + "learning_rate": 4.828527665458937e-08, + "loss": 0.0253, + "step": 35586 + }, + { + "epoch": 96.96730245231608, + "grad_norm": 23.660011291503906, + "learning_rate": 4.8198697127742613e-08, + "loss": 0.0601, + "step": 35587 + }, + { + "epoch": 96.97002724795641, + "grad_norm": 4.185683250427246, + "learning_rate": 4.811219510520437e-08, + "loss": 0.0262, + "step": 35588 + }, + { + "epoch": 96.97275204359673, + "grad_norm": 2.4813575744628906, + "learning_rate": 4.802577058764635e-08, + "loss": 0.0236, + "step": 35589 + }, + { + "epoch": 96.97547683923706, + "grad_norm": 2.5231006145477295, + "learning_rate": 4.793942357574466e-08, + "loss": 0.0427, + "step": 35590 + }, + { + "epoch": 96.97820163487738, + "grad_norm": 2.479731559753418, + "learning_rate": 4.7853154070169885e-08, + "loss": 0.0423, + "step": 35591 + }, + { + "epoch": 96.98092643051771, + "grad_norm": 2.662405014038086, + "learning_rate": 4.776696207159481e-08, + "loss": 0.0286, + "step": 35592 + }, + { + "epoch": 96.98365122615803, + "grad_norm": 2.94612979888916, + "learning_rate": 4.7680847580691136e-08, + "loss": 0.1132, + "step": 35593 + }, + { + "epoch": 96.98637602179836, + "grad_norm": 2.1367650032043457, + "learning_rate": 4.75948105981272e-08, + "loss": 0.0974, + "step": 35594 + }, + { + "epoch": 96.9891008174387, + "grad_norm": 4.904690742492676, + "learning_rate": 4.7508851124574705e-08, + "loss": 0.0674, + "step": 35595 + }, + { + "epoch": 96.99182561307902, + "grad_norm": 1.8304905891418457, + "learning_rate": 4.742296916070421e-08, + "loss": 0.0768, + "step": 35596 + }, + { + "epoch": 96.99455040871935, + "grad_norm": 2.413317918777466, + "learning_rate": 4.733716470718186e-08, + "loss": 0.0181, + "step": 35597 + }, + { + "epoch": 96.99727520435967, + "grad_norm": 2.6462340354919434, + "learning_rate": 4.725143776467822e-08, + "loss": 0.0844, + "step": 35598 + }, + { + "epoch": 97.0, + "grad_norm": 1.5588715076446533, + "learning_rate": 4.716578833386054e-08, + "loss": 0.0205, + "step": 35599 + }, + { + "epoch": 97.00272479564033, + "grad_norm": 2.9802091121673584, + "learning_rate": 4.7080216415394954e-08, + "loss": 0.063, + "step": 35600 + }, + { + "epoch": 97.00544959128065, + "grad_norm": 2.9426045417785645, + "learning_rate": 4.699472200994759e-08, + "loss": 0.0283, + "step": 35601 + }, + { + "epoch": 97.00817438692098, + "grad_norm": 1.8756449222564697, + "learning_rate": 4.69093051181857e-08, + "loss": 0.0593, + "step": 35602 + }, + { + "epoch": 97.0108991825613, + "grad_norm": 3.53544545173645, + "learning_rate": 4.682396574077319e-08, + "loss": 0.0279, + "step": 35603 + }, + { + "epoch": 97.01362397820164, + "grad_norm": 2.3807857036590576, + "learning_rate": 4.6738703878376204e-08, + "loss": 0.0459, + "step": 35604 + }, + { + "epoch": 97.01634877384195, + "grad_norm": 2.192631721496582, + "learning_rate": 4.665351953165642e-08, + "loss": 0.0422, + "step": 35605 + }, + { + "epoch": 97.01907356948229, + "grad_norm": 3.610191822052002, + "learning_rate": 4.656841270127999e-08, + "loss": 0.1389, + "step": 35606 + }, + { + "epoch": 97.02179836512262, + "grad_norm": 2.798900604248047, + "learning_rate": 4.6483383387908585e-08, + "loss": 0.0817, + "step": 35607 + }, + { + "epoch": 97.02452316076294, + "grad_norm": 4.655253887176514, + "learning_rate": 4.6398431592202805e-08, + "loss": 0.0451, + "step": 35608 + }, + { + "epoch": 97.02724795640327, + "grad_norm": 2.315178155899048, + "learning_rate": 4.6313557314826564e-08, + "loss": 0.0496, + "step": 35609 + }, + { + "epoch": 97.02997275204359, + "grad_norm": 1.9423848390579224, + "learning_rate": 4.622876055643932e-08, + "loss": 0.0274, + "step": 35610 + }, + { + "epoch": 97.03269754768392, + "grad_norm": 2.0493133068084717, + "learning_rate": 4.614404131770389e-08, + "loss": 0.0243, + "step": 35611 + }, + { + "epoch": 97.03542234332426, + "grad_norm": 3.3066389560699463, + "learning_rate": 4.605939959927641e-08, + "loss": 0.0523, + "step": 35612 + }, + { + "epoch": 97.03814713896458, + "grad_norm": 4.777273654937744, + "learning_rate": 4.597483540181968e-08, + "loss": 0.0293, + "step": 35613 + }, + { + "epoch": 97.04087193460491, + "grad_norm": 2.330043315887451, + "learning_rate": 4.5890348725988744e-08, + "loss": 0.0261, + "step": 35614 + }, + { + "epoch": 97.04359673024523, + "grad_norm": 3.9469618797302246, + "learning_rate": 4.5805939572444166e-08, + "loss": 0.0224, + "step": 35615 + }, + { + "epoch": 97.04632152588556, + "grad_norm": 2.940596342086792, + "learning_rate": 4.572160794184322e-08, + "loss": 0.0392, + "step": 35616 + }, + { + "epoch": 97.04904632152588, + "grad_norm": 2.8023288249969482, + "learning_rate": 4.563735383484091e-08, + "loss": 0.0338, + "step": 35617 + }, + { + "epoch": 97.05177111716621, + "grad_norm": 2.739731788635254, + "learning_rate": 4.5553177252095624e-08, + "loss": 0.0534, + "step": 35618 + }, + { + "epoch": 97.05449591280654, + "grad_norm": 2.1139893531799316, + "learning_rate": 4.5469078194261276e-08, + "loss": 0.0328, + "step": 35619 + }, + { + "epoch": 97.05722070844686, + "grad_norm": 2.6700010299682617, + "learning_rate": 4.5385056661992886e-08, + "loss": 0.0255, + "step": 35620 + }, + { + "epoch": 97.0599455040872, + "grad_norm": 2.1723580360412598, + "learning_rate": 4.53011126559455e-08, + "loss": 0.0158, + "step": 35621 + }, + { + "epoch": 97.06267029972751, + "grad_norm": 1.5713322162628174, + "learning_rate": 4.5217246176773036e-08, + "loss": 0.0194, + "step": 35622 + }, + { + "epoch": 97.06539509536785, + "grad_norm": 2.799923896789551, + "learning_rate": 4.5133457225128296e-08, + "loss": 0.0423, + "step": 35623 + }, + { + "epoch": 97.06811989100818, + "grad_norm": 2.719472646713257, + "learning_rate": 4.50497458016641e-08, + "loss": 0.0711, + "step": 35624 + }, + { + "epoch": 97.0708446866485, + "grad_norm": 17.930240631103516, + "learning_rate": 4.496611190703104e-08, + "loss": 0.0529, + "step": 35625 + }, + { + "epoch": 97.07356948228883, + "grad_norm": 1.8039621114730835, + "learning_rate": 4.488255554188192e-08, + "loss": 0.1001, + "step": 35626 + }, + { + "epoch": 97.07629427792915, + "grad_norm": 1.8604620695114136, + "learning_rate": 4.479907670686734e-08, + "loss": 0.0262, + "step": 35627 + }, + { + "epoch": 97.07901907356948, + "grad_norm": 2.324397087097168, + "learning_rate": 4.4715675402636774e-08, + "loss": 0.0389, + "step": 35628 + }, + { + "epoch": 97.0817438692098, + "grad_norm": 3.6882824897766113, + "learning_rate": 4.463235162984081e-08, + "loss": 0.0382, + "step": 35629 + }, + { + "epoch": 97.08446866485014, + "grad_norm": 2.095919370651245, + "learning_rate": 4.454910538912671e-08, + "loss": 0.0237, + "step": 35630 + }, + { + "epoch": 97.08719346049047, + "grad_norm": 3.908423900604248, + "learning_rate": 4.446593668114396e-08, + "loss": 0.08, + "step": 35631 + }, + { + "epoch": 97.08991825613079, + "grad_norm": 2.1432840824127197, + "learning_rate": 4.438284550654093e-08, + "loss": 0.0335, + "step": 35632 + }, + { + "epoch": 97.09264305177112, + "grad_norm": 2.915332794189453, + "learning_rate": 4.4299831865962653e-08, + "loss": 0.1137, + "step": 35633 + }, + { + "epoch": 97.09536784741144, + "grad_norm": 3.781524658203125, + "learning_rate": 4.42168957600575e-08, + "loss": 0.1042, + "step": 35634 + }, + { + "epoch": 97.09809264305177, + "grad_norm": 2.3162896633148193, + "learning_rate": 4.413403718947162e-08, + "loss": 0.051, + "step": 35635 + }, + { + "epoch": 97.1008174386921, + "grad_norm": 2.087754011154175, + "learning_rate": 4.4051256154847844e-08, + "loss": 0.022, + "step": 35636 + }, + { + "epoch": 97.10354223433242, + "grad_norm": 2.776384115219116, + "learning_rate": 4.396855265683342e-08, + "loss": 0.0267, + "step": 35637 + }, + { + "epoch": 97.10626702997276, + "grad_norm": 2.3792355060577393, + "learning_rate": 4.388592669607117e-08, + "loss": 0.0267, + "step": 35638 + }, + { + "epoch": 97.10899182561307, + "grad_norm": 1.4954745769500732, + "learning_rate": 4.3803378273205024e-08, + "loss": 0.0215, + "step": 35639 + }, + { + "epoch": 97.11171662125341, + "grad_norm": 3.321103096008301, + "learning_rate": 4.37209073888778e-08, + "loss": 0.1687, + "step": 35640 + }, + { + "epoch": 97.11444141689373, + "grad_norm": 2.249972343444824, + "learning_rate": 4.363851404373121e-08, + "loss": 0.0383, + "step": 35641 + }, + { + "epoch": 97.11716621253406, + "grad_norm": 2.076660394668579, + "learning_rate": 4.3556198238408064e-08, + "loss": 0.0691, + "step": 35642 + }, + { + "epoch": 97.11989100817439, + "grad_norm": 3.3433871269226074, + "learning_rate": 4.3473959973547866e-08, + "loss": 0.0686, + "step": 35643 + }, + { + "epoch": 97.12261580381471, + "grad_norm": 3.1689705848693848, + "learning_rate": 4.339179924979342e-08, + "loss": 0.1157, + "step": 35644 + }, + { + "epoch": 97.12534059945504, + "grad_norm": 2.73633074760437, + "learning_rate": 4.3309716067782e-08, + "loss": 0.1455, + "step": 35645 + }, + { + "epoch": 97.12806539509536, + "grad_norm": 2.4419350624084473, + "learning_rate": 4.322771042815421e-08, + "loss": 0.0266, + "step": 35646 + }, + { + "epoch": 97.1307901907357, + "grad_norm": 2.533695697784424, + "learning_rate": 4.314578233154953e-08, + "loss": 0.0257, + "step": 35647 + }, + { + "epoch": 97.13351498637603, + "grad_norm": 3.47039532661438, + "learning_rate": 4.306393177860413e-08, + "loss": 0.0442, + "step": 35648 + }, + { + "epoch": 97.13623978201635, + "grad_norm": 7.448739051818848, + "learning_rate": 4.2982158769956375e-08, + "loss": 0.1653, + "step": 35649 + }, + { + "epoch": 97.13896457765668, + "grad_norm": 3.205759286880493, + "learning_rate": 4.290046330624354e-08, + "loss": 0.0518, + "step": 35650 + }, + { + "epoch": 97.141689373297, + "grad_norm": 2.101719617843628, + "learning_rate": 4.281884538810066e-08, + "loss": 0.0657, + "step": 35651 + }, + { + "epoch": 97.14441416893733, + "grad_norm": 1.5737000703811646, + "learning_rate": 4.2737305016165024e-08, + "loss": 0.0178, + "step": 35652 + }, + { + "epoch": 97.14713896457765, + "grad_norm": 2.535308599472046, + "learning_rate": 4.265584219107055e-08, + "loss": 0.0216, + "step": 35653 + }, + { + "epoch": 97.14986376021798, + "grad_norm": 1.0927975177764893, + "learning_rate": 4.25744569134523e-08, + "loss": 0.0164, + "step": 35654 + }, + { + "epoch": 97.15258855585832, + "grad_norm": 1.8163610696792603, + "learning_rate": 4.24931491839431e-08, + "loss": 0.0257, + "step": 35655 + }, + { + "epoch": 97.15531335149863, + "grad_norm": 2.726227283477783, + "learning_rate": 4.241191900317687e-08, + "loss": 0.0664, + "step": 35656 + }, + { + "epoch": 97.15803814713897, + "grad_norm": 5.813877105712891, + "learning_rate": 4.233076637178646e-08, + "loss": 0.0466, + "step": 35657 + }, + { + "epoch": 97.16076294277929, + "grad_norm": 2.5090365409851074, + "learning_rate": 4.224969129040246e-08, + "loss": 0.0704, + "step": 35658 + }, + { + "epoch": 97.16348773841962, + "grad_norm": 1.8353524208068848, + "learning_rate": 4.2168693759658815e-08, + "loss": 0.0668, + "step": 35659 + }, + { + "epoch": 97.16621253405995, + "grad_norm": 4.932413578033447, + "learning_rate": 4.208777378018392e-08, + "loss": 0.0461, + "step": 35660 + }, + { + "epoch": 97.16893732970027, + "grad_norm": 3.0826075077056885, + "learning_rate": 4.200693135260836e-08, + "loss": 0.0729, + "step": 35661 + }, + { + "epoch": 97.1716621253406, + "grad_norm": 2.846266269683838, + "learning_rate": 4.192616647756387e-08, + "loss": 0.06, + "step": 35662 + }, + { + "epoch": 97.17438692098092, + "grad_norm": 1.3967534303665161, + "learning_rate": 4.184547915567661e-08, + "loss": 0.0163, + "step": 35663 + }, + { + "epoch": 97.17711171662125, + "grad_norm": 2.4666824340820312, + "learning_rate": 4.1764869387577175e-08, + "loss": 0.0367, + "step": 35664 + }, + { + "epoch": 97.17983651226157, + "grad_norm": 2.026526927947998, + "learning_rate": 4.168433717389286e-08, + "loss": 0.0255, + "step": 35665 + }, + { + "epoch": 97.1825613079019, + "grad_norm": 4.576807498931885, + "learning_rate": 4.1603882515248714e-08, + "loss": 0.0392, + "step": 35666 + }, + { + "epoch": 97.18528610354224, + "grad_norm": 5.354944229125977, + "learning_rate": 4.1523505412274235e-08, + "loss": 0.0359, + "step": 35667 + }, + { + "epoch": 97.18801089918256, + "grad_norm": 4.240804195404053, + "learning_rate": 4.144320586559447e-08, + "loss": 0.0708, + "step": 35668 + }, + { + "epoch": 97.19073569482289, + "grad_norm": 1.174184799194336, + "learning_rate": 4.1362983875833373e-08, + "loss": 0.0165, + "step": 35669 + }, + { + "epoch": 97.19346049046321, + "grad_norm": 2.881422758102417, + "learning_rate": 4.1282839443617106e-08, + "loss": 0.1455, + "step": 35670 + }, + { + "epoch": 97.19618528610354, + "grad_norm": 2.0956594944000244, + "learning_rate": 4.1202772569570724e-08, + "loss": 0.0755, + "step": 35671 + }, + { + "epoch": 97.19891008174388, + "grad_norm": 5.350720405578613, + "learning_rate": 4.1122783254315955e-08, + "loss": 0.0434, + "step": 35672 + }, + { + "epoch": 97.2016348773842, + "grad_norm": 2.869659185409546, + "learning_rate": 4.1042871498476746e-08, + "loss": 0.0341, + "step": 35673 + }, + { + "epoch": 97.20435967302453, + "grad_norm": 2.8423678874969482, + "learning_rate": 4.09630373026737e-08, + "loss": 0.0985, + "step": 35674 + }, + { + "epoch": 97.20708446866485, + "grad_norm": 1.7651212215423584, + "learning_rate": 4.088328066753078e-08, + "loss": 0.1022, + "step": 35675 + }, + { + "epoch": 97.20980926430518, + "grad_norm": 2.8172552585601807, + "learning_rate": 4.0803601593668586e-08, + "loss": 0.0491, + "step": 35676 + }, + { + "epoch": 97.2125340599455, + "grad_norm": 2.1117210388183594, + "learning_rate": 4.072400008170774e-08, + "loss": 0.0731, + "step": 35677 + }, + { + "epoch": 97.21525885558583, + "grad_norm": 5.589637756347656, + "learning_rate": 4.064447613226774e-08, + "loss": 0.0485, + "step": 35678 + }, + { + "epoch": 97.21798365122616, + "grad_norm": 1.5005141496658325, + "learning_rate": 4.0565029745966987e-08, + "loss": 0.0166, + "step": 35679 + }, + { + "epoch": 97.22070844686648, + "grad_norm": 1.5149348974227905, + "learning_rate": 4.0485660923426095e-08, + "loss": 0.0207, + "step": 35680 + }, + { + "epoch": 97.22343324250681, + "grad_norm": 2.9435641765594482, + "learning_rate": 4.0406369665262343e-08, + "loss": 0.0499, + "step": 35681 + }, + { + "epoch": 97.22615803814713, + "grad_norm": 2.9011828899383545, + "learning_rate": 4.032715597209302e-08, + "loss": 0.0581, + "step": 35682 + }, + { + "epoch": 97.22888283378747, + "grad_norm": 3.445481300354004, + "learning_rate": 4.024801984453541e-08, + "loss": 0.0699, + "step": 35683 + }, + { + "epoch": 97.2316076294278, + "grad_norm": 1.88826584815979, + "learning_rate": 4.016896128320569e-08, + "loss": 0.0194, + "step": 35684 + }, + { + "epoch": 97.23433242506812, + "grad_norm": 2.2753238677978516, + "learning_rate": 4.008998028872002e-08, + "loss": 0.0678, + "step": 35685 + }, + { + "epoch": 97.23705722070845, + "grad_norm": 2.4716103076934814, + "learning_rate": 4.0011076861691254e-08, + "loss": 0.0948, + "step": 35686 + }, + { + "epoch": 97.23978201634877, + "grad_norm": 4.816853046417236, + "learning_rate": 3.993225100273779e-08, + "loss": 0.1862, + "step": 35687 + }, + { + "epoch": 97.2425068119891, + "grad_norm": 2.6293253898620605, + "learning_rate": 3.985350271247024e-08, + "loss": 0.0963, + "step": 35688 + }, + { + "epoch": 97.24523160762942, + "grad_norm": 2.2298426628112793, + "learning_rate": 3.9774831991503674e-08, + "loss": 0.0421, + "step": 35689 + }, + { + "epoch": 97.24795640326975, + "grad_norm": 2.217453956604004, + "learning_rate": 3.9696238840448705e-08, + "loss": 0.0459, + "step": 35690 + }, + { + "epoch": 97.25068119891009, + "grad_norm": 2.6928329467773438, + "learning_rate": 3.9617723259920417e-08, + "loss": 0.0229, + "step": 35691 + }, + { + "epoch": 97.2534059945504, + "grad_norm": 2.535069704055786, + "learning_rate": 3.95392852505283e-08, + "loss": 0.0789, + "step": 35692 + }, + { + "epoch": 97.25613079019074, + "grad_norm": 3.881356716156006, + "learning_rate": 3.9460924812884107e-08, + "loss": 0.0964, + "step": 35693 + }, + { + "epoch": 97.25885558583106, + "grad_norm": 2.926912307739258, + "learning_rate": 3.938264194759622e-08, + "loss": 0.1163, + "step": 35694 + }, + { + "epoch": 97.26158038147139, + "grad_norm": 3.2584853172302246, + "learning_rate": 3.9304436655276393e-08, + "loss": 0.0648, + "step": 35695 + }, + { + "epoch": 97.26430517711172, + "grad_norm": 1.52204430103302, + "learning_rate": 3.922630893653301e-08, + "loss": 0.0248, + "step": 35696 + }, + { + "epoch": 97.26702997275204, + "grad_norm": 2.9916036128997803, + "learning_rate": 3.914825879197559e-08, + "loss": 0.1678, + "step": 35697 + }, + { + "epoch": 97.26975476839237, + "grad_norm": 2.6528549194335938, + "learning_rate": 3.9070286222210316e-08, + "loss": 0.068, + "step": 35698 + }, + { + "epoch": 97.2724795640327, + "grad_norm": 2.157846689224243, + "learning_rate": 3.899239122784448e-08, + "loss": 0.0598, + "step": 35699 + }, + { + "epoch": 97.27520435967303, + "grad_norm": 2.51202654838562, + "learning_rate": 3.891457380948538e-08, + "loss": 0.0414, + "step": 35700 + }, + { + "epoch": 97.27792915531334, + "grad_norm": 2.394866943359375, + "learning_rate": 3.883683396773919e-08, + "loss": 0.0283, + "step": 35701 + }, + { + "epoch": 97.28065395095368, + "grad_norm": 3.044130325317383, + "learning_rate": 3.875917170321208e-08, + "loss": 0.1344, + "step": 35702 + }, + { + "epoch": 97.28337874659401, + "grad_norm": 3.3202123641967773, + "learning_rate": 3.8681587016506924e-08, + "loss": 0.0472, + "step": 35703 + }, + { + "epoch": 97.28610354223433, + "grad_norm": 2.31563401222229, + "learning_rate": 3.860407990822879e-08, + "loss": 0.0421, + "step": 35704 + }, + { + "epoch": 97.28882833787466, + "grad_norm": 2.1818692684173584, + "learning_rate": 3.8526650378982736e-08, + "loss": 0.0593, + "step": 35705 + }, + { + "epoch": 97.29155313351498, + "grad_norm": 5.058921813964844, + "learning_rate": 3.8449298429369397e-08, + "loss": 0.0681, + "step": 35706 + }, + { + "epoch": 97.29427792915531, + "grad_norm": 1.8164100646972656, + "learning_rate": 3.8372024059991633e-08, + "loss": 0.0241, + "step": 35707 + }, + { + "epoch": 97.29700272479565, + "grad_norm": 2.463520050048828, + "learning_rate": 3.8294827271453394e-08, + "loss": 0.0571, + "step": 35708 + }, + { + "epoch": 97.29972752043597, + "grad_norm": 3.147904634475708, + "learning_rate": 3.8217708064354206e-08, + "loss": 0.0868, + "step": 35709 + }, + { + "epoch": 97.3024523160763, + "grad_norm": 3.002943515777588, + "learning_rate": 3.81406664392936e-08, + "loss": 0.0569, + "step": 35710 + }, + { + "epoch": 97.30517711171662, + "grad_norm": 1.6419553756713867, + "learning_rate": 3.80637023968744e-08, + "loss": 0.0228, + "step": 35711 + }, + { + "epoch": 97.30790190735695, + "grad_norm": 2.226773738861084, + "learning_rate": 3.798681593769393e-08, + "loss": 0.0746, + "step": 35712 + }, + { + "epoch": 97.31062670299727, + "grad_norm": 4.040128707885742, + "learning_rate": 3.791000706235171e-08, + "loss": 0.0671, + "step": 35713 + }, + { + "epoch": 97.3133514986376, + "grad_norm": 2.2122244834899902, + "learning_rate": 3.783327577144502e-08, + "loss": 0.0241, + "step": 35714 + }, + { + "epoch": 97.31607629427793, + "grad_norm": 1.792174220085144, + "learning_rate": 3.775662206557229e-08, + "loss": 0.0505, + "step": 35715 + }, + { + "epoch": 97.31880108991825, + "grad_norm": 2.6207172870635986, + "learning_rate": 3.768004594533081e-08, + "loss": 0.027, + "step": 35716 + }, + { + "epoch": 97.32152588555859, + "grad_norm": 2.3851215839385986, + "learning_rate": 3.760354741131678e-08, + "loss": 0.0258, + "step": 35717 + }, + { + "epoch": 97.3242506811989, + "grad_norm": 2.7815468311309814, + "learning_rate": 3.752712646412526e-08, + "loss": 0.1268, + "step": 35718 + }, + { + "epoch": 97.32697547683924, + "grad_norm": 2.303602933883667, + "learning_rate": 3.745078310435135e-08, + "loss": 0.0569, + "step": 35719 + }, + { + "epoch": 97.32970027247957, + "grad_norm": 2.026928663253784, + "learning_rate": 3.737451733259123e-08, + "loss": 0.0544, + "step": 35720 + }, + { + "epoch": 97.33242506811989, + "grad_norm": 2.396444797515869, + "learning_rate": 3.729832914943665e-08, + "loss": 0.1104, + "step": 35721 + }, + { + "epoch": 97.33514986376022, + "grad_norm": 2.3454558849334717, + "learning_rate": 3.722221855548269e-08, + "loss": 0.0254, + "step": 35722 + }, + { + "epoch": 97.33787465940054, + "grad_norm": 2.012298822402954, + "learning_rate": 3.71461855513211e-08, + "loss": 0.0865, + "step": 35723 + }, + { + "epoch": 97.34059945504087, + "grad_norm": 2.7653141021728516, + "learning_rate": 3.707023013754474e-08, + "loss": 0.0291, + "step": 35724 + }, + { + "epoch": 97.34332425068119, + "grad_norm": 2.1480188369750977, + "learning_rate": 3.699435231474424e-08, + "loss": 0.0236, + "step": 35725 + }, + { + "epoch": 97.34604904632153, + "grad_norm": 2.642390251159668, + "learning_rate": 3.691855208351136e-08, + "loss": 0.135, + "step": 35726 + }, + { + "epoch": 97.34877384196186, + "grad_norm": 2.243866205215454, + "learning_rate": 3.6842829444436734e-08, + "loss": 0.0227, + "step": 35727 + }, + { + "epoch": 97.35149863760218, + "grad_norm": 2.7783806324005127, + "learning_rate": 3.676718439810767e-08, + "loss": 0.0499, + "step": 35728 + }, + { + "epoch": 97.35422343324251, + "grad_norm": 2.030147075653076, + "learning_rate": 3.6691616945117025e-08, + "loss": 0.0541, + "step": 35729 + }, + { + "epoch": 97.35694822888283, + "grad_norm": 2.5146689414978027, + "learning_rate": 3.6616127086051e-08, + "loss": 0.0337, + "step": 35730 + }, + { + "epoch": 97.35967302452316, + "grad_norm": 4.058608055114746, + "learning_rate": 3.65407148214969e-08, + "loss": 0.0359, + "step": 35731 + }, + { + "epoch": 97.3623978201635, + "grad_norm": 2.2269248962402344, + "learning_rate": 3.646538015204426e-08, + "loss": 0.0251, + "step": 35732 + }, + { + "epoch": 97.36512261580381, + "grad_norm": 3.1376373767852783, + "learning_rate": 3.639012307827816e-08, + "loss": 0.1518, + "step": 35733 + }, + { + "epoch": 97.36784741144415, + "grad_norm": 2.2508909702301025, + "learning_rate": 3.63149436007848e-08, + "loss": 0.1153, + "step": 35734 + }, + { + "epoch": 97.37057220708446, + "grad_norm": 3.2898099422454834, + "learning_rate": 3.623984172015038e-08, + "loss": 0.0883, + "step": 35735 + }, + { + "epoch": 97.3732970027248, + "grad_norm": 2.400824546813965, + "learning_rate": 3.616481743695888e-08, + "loss": 0.0312, + "step": 35736 + }, + { + "epoch": 97.37602179836512, + "grad_norm": 6.968176364898682, + "learning_rate": 3.6089870751795374e-08, + "loss": 0.0395, + "step": 35737 + }, + { + "epoch": 97.37874659400545, + "grad_norm": 3.3455638885498047, + "learning_rate": 3.6015001665243853e-08, + "loss": 0.1089, + "step": 35738 + }, + { + "epoch": 97.38147138964578, + "grad_norm": 1.6406556367874146, + "learning_rate": 3.594021017788607e-08, + "loss": 0.0189, + "step": 35739 + }, + { + "epoch": 97.3841961852861, + "grad_norm": 1.971541404724121, + "learning_rate": 3.586549629030489e-08, + "loss": 0.0838, + "step": 35740 + }, + { + "epoch": 97.38692098092643, + "grad_norm": 2.65551495552063, + "learning_rate": 3.579086000308318e-08, + "loss": 0.0356, + "step": 35741 + }, + { + "epoch": 97.38964577656675, + "grad_norm": 4.395047664642334, + "learning_rate": 3.571630131680159e-08, + "loss": 0.0538, + "step": 35742 + }, + { + "epoch": 97.39237057220708, + "grad_norm": 2.4963653087615967, + "learning_rate": 3.564182023204077e-08, + "loss": 0.0576, + "step": 35743 + }, + { + "epoch": 97.39509536784742, + "grad_norm": 2.5708718299865723, + "learning_rate": 3.556741674938024e-08, + "loss": 0.0657, + "step": 35744 + }, + { + "epoch": 97.39782016348774, + "grad_norm": 1.9411816596984863, + "learning_rate": 3.549309086940067e-08, + "loss": 0.0205, + "step": 35745 + }, + { + "epoch": 97.40054495912807, + "grad_norm": 1.9105851650238037, + "learning_rate": 3.541884259267936e-08, + "loss": 0.0222, + "step": 35746 + }, + { + "epoch": 97.40326975476839, + "grad_norm": 2.73858380317688, + "learning_rate": 3.5344671919795844e-08, + "loss": 0.0624, + "step": 35747 + }, + { + "epoch": 97.40599455040872, + "grad_norm": 2.018718957901001, + "learning_rate": 3.5270578851327454e-08, + "loss": 0.0198, + "step": 35748 + }, + { + "epoch": 97.40871934604904, + "grad_norm": 1.703837275505066, + "learning_rate": 3.519656338785038e-08, + "loss": 0.0571, + "step": 35749 + }, + { + "epoch": 97.41144414168937, + "grad_norm": 2.6347010135650635, + "learning_rate": 3.512262552994305e-08, + "loss": 0.0382, + "step": 35750 + }, + { + "epoch": 97.4141689373297, + "grad_norm": 1.892220377922058, + "learning_rate": 3.504876527817946e-08, + "loss": 0.0325, + "step": 35751 + }, + { + "epoch": 97.41689373297002, + "grad_norm": 2.6764485836029053, + "learning_rate": 3.49749826331347e-08, + "loss": 0.1365, + "step": 35752 + }, + { + "epoch": 97.41961852861036, + "grad_norm": 2.0000882148742676, + "learning_rate": 3.490127759538497e-08, + "loss": 0.0597, + "step": 35753 + }, + { + "epoch": 97.42234332425068, + "grad_norm": 4.685260772705078, + "learning_rate": 3.482765016550316e-08, + "loss": 0.083, + "step": 35754 + }, + { + "epoch": 97.42506811989101, + "grad_norm": 1.8418105840682983, + "learning_rate": 3.475410034406212e-08, + "loss": 0.023, + "step": 35755 + }, + { + "epoch": 97.42779291553134, + "grad_norm": 1.4824579954147339, + "learning_rate": 3.468062813163586e-08, + "loss": 0.0142, + "step": 35756 + }, + { + "epoch": 97.43051771117166, + "grad_norm": 2.7751262187957764, + "learning_rate": 3.4607233528796136e-08, + "loss": 0.0158, + "step": 35757 + }, + { + "epoch": 97.433242506812, + "grad_norm": 4.138879776000977, + "learning_rate": 3.453391653611471e-08, + "loss": 0.1413, + "step": 35758 + }, + { + "epoch": 97.43596730245231, + "grad_norm": 2.429327964782715, + "learning_rate": 3.446067715416224e-08, + "loss": 0.0659, + "step": 35759 + }, + { + "epoch": 97.43869209809264, + "grad_norm": 2.288085699081421, + "learning_rate": 3.438751538350937e-08, + "loss": 0.0298, + "step": 35760 + }, + { + "epoch": 97.44141689373296, + "grad_norm": 3.082080602645874, + "learning_rate": 3.431443122472566e-08, + "loss": 0.0767, + "step": 35761 + }, + { + "epoch": 97.4441416893733, + "grad_norm": 1.9701496362686157, + "learning_rate": 3.424142467838065e-08, + "loss": 0.1448, + "step": 35762 + }, + { + "epoch": 97.44686648501363, + "grad_norm": 2.3054821491241455, + "learning_rate": 3.4168495745042776e-08, + "loss": 0.0486, + "step": 35763 + }, + { + "epoch": 97.44959128065395, + "grad_norm": 2.489908456802368, + "learning_rate": 3.409564442527935e-08, + "loss": 0.0973, + "step": 35764 + }, + { + "epoch": 97.45231607629428, + "grad_norm": 2.0973353385925293, + "learning_rate": 3.402287071965882e-08, + "loss": 0.0333, + "step": 35765 + }, + { + "epoch": 97.4550408719346, + "grad_norm": 2.7435762882232666, + "learning_rate": 3.395017462874739e-08, + "loss": 0.0508, + "step": 35766 + }, + { + "epoch": 97.45776566757493, + "grad_norm": 2.5076231956481934, + "learning_rate": 3.387755615311128e-08, + "loss": 0.0292, + "step": 35767 + }, + { + "epoch": 97.46049046321527, + "grad_norm": 2.5052192211151123, + "learning_rate": 3.380501529331559e-08, + "loss": 0.0485, + "step": 35768 + }, + { + "epoch": 97.46321525885558, + "grad_norm": 7.725629806518555, + "learning_rate": 3.3732552049925423e-08, + "loss": 0.1641, + "step": 35769 + }, + { + "epoch": 97.46594005449592, + "grad_norm": 3.0218212604522705, + "learning_rate": 3.366016642350589e-08, + "loss": 0.0307, + "step": 35770 + }, + { + "epoch": 97.46866485013624, + "grad_norm": 2.0976974964141846, + "learning_rate": 3.358785841462098e-08, + "loss": 0.0806, + "step": 35771 + }, + { + "epoch": 97.47138964577657, + "grad_norm": 7.243982315063477, + "learning_rate": 3.3515628023831346e-08, + "loss": 0.041, + "step": 35772 + }, + { + "epoch": 97.47411444141689, + "grad_norm": 1.8728142976760864, + "learning_rate": 3.344347525170322e-08, + "loss": 0.1892, + "step": 35773 + }, + { + "epoch": 97.47683923705722, + "grad_norm": 2.4406001567840576, + "learning_rate": 3.337140009879503e-08, + "loss": 0.0193, + "step": 35774 + }, + { + "epoch": 97.47956403269755, + "grad_norm": 2.5310189723968506, + "learning_rate": 3.329940256566966e-08, + "loss": 0.0227, + "step": 35775 + }, + { + "epoch": 97.48228882833787, + "grad_norm": 3.100160598754883, + "learning_rate": 3.3227482652888885e-08, + "loss": 0.0585, + "step": 35776 + }, + { + "epoch": 97.4850136239782, + "grad_norm": 2.3535513877868652, + "learning_rate": 3.315564036101115e-08, + "loss": 0.0286, + "step": 35777 + }, + { + "epoch": 97.48773841961852, + "grad_norm": 2.1238162517547607, + "learning_rate": 3.308387569059601e-08, + "loss": 0.1461, + "step": 35778 + }, + { + "epoch": 97.49046321525886, + "grad_norm": 2.19785475730896, + "learning_rate": 3.3012188642203015e-08, + "loss": 0.031, + "step": 35779 + }, + { + "epoch": 97.49318801089919, + "grad_norm": 5.525651454925537, + "learning_rate": 3.29405792163906e-08, + "loss": 0.0845, + "step": 35780 + }, + { + "epoch": 97.49591280653951, + "grad_norm": 3.4149084091186523, + "learning_rate": 3.2869047413716104e-08, + "loss": 0.0955, + "step": 35781 + }, + { + "epoch": 97.49863760217984, + "grad_norm": 3.5434200763702393, + "learning_rate": 3.2797593234735745e-08, + "loss": 0.035, + "step": 35782 + }, + { + "epoch": 97.50136239782016, + "grad_norm": 4.449948310852051, + "learning_rate": 3.272621668000797e-08, + "loss": 0.0667, + "step": 35783 + }, + { + "epoch": 97.50408719346049, + "grad_norm": 2.3025572299957275, + "learning_rate": 3.265491775008789e-08, + "loss": 0.0849, + "step": 35784 + }, + { + "epoch": 97.50681198910081, + "grad_norm": 2.930227041244507, + "learning_rate": 3.25836964455295e-08, + "loss": 0.1944, + "step": 35785 + }, + { + "epoch": 97.50953678474114, + "grad_norm": 2.109895706176758, + "learning_rate": 3.251255276688903e-08, + "loss": 0.024, + "step": 35786 + }, + { + "epoch": 97.51226158038148, + "grad_norm": 2.6566219329833984, + "learning_rate": 3.2441486714720474e-08, + "loss": 0.2145, + "step": 35787 + }, + { + "epoch": 97.5149863760218, + "grad_norm": 4.1831512451171875, + "learning_rate": 3.2370498289576727e-08, + "loss": 0.0332, + "step": 35788 + }, + { + "epoch": 97.51771117166213, + "grad_norm": 1.8247441053390503, + "learning_rate": 3.2299587492009565e-08, + "loss": 0.0231, + "step": 35789 + }, + { + "epoch": 97.52043596730245, + "grad_norm": 2.600660800933838, + "learning_rate": 3.2228754322574106e-08, + "loss": 0.08, + "step": 35790 + }, + { + "epoch": 97.52316076294278, + "grad_norm": 1.1747342348098755, + "learning_rate": 3.21579987818188e-08, + "loss": 0.0146, + "step": 35791 + }, + { + "epoch": 97.52588555858311, + "grad_norm": 1.9240552186965942, + "learning_rate": 3.208732087029653e-08, + "loss": 0.0535, + "step": 35792 + }, + { + "epoch": 97.52861035422343, + "grad_norm": 1.777369737625122, + "learning_rate": 3.201672058855798e-08, + "loss": 0.0808, + "step": 35793 + }, + { + "epoch": 97.53133514986376, + "grad_norm": 1.862227201461792, + "learning_rate": 3.19461979371527e-08, + "loss": 0.0446, + "step": 35794 + }, + { + "epoch": 97.53405994550408, + "grad_norm": 1.7047882080078125, + "learning_rate": 3.1875752916628034e-08, + "loss": 0.0421, + "step": 35795 + }, + { + "epoch": 97.53678474114442, + "grad_norm": 2.558957576751709, + "learning_rate": 3.180538552753576e-08, + "loss": 0.1248, + "step": 35796 + }, + { + "epoch": 97.53950953678473, + "grad_norm": 1.5976080894470215, + "learning_rate": 3.1735095770421e-08, + "loss": 0.0167, + "step": 35797 + }, + { + "epoch": 97.54223433242507, + "grad_norm": 2.2887840270996094, + "learning_rate": 3.166488364583331e-08, + "loss": 0.055, + "step": 35798 + }, + { + "epoch": 97.5449591280654, + "grad_norm": 2.419386863708496, + "learning_rate": 3.159474915431893e-08, + "loss": 0.0276, + "step": 35799 + }, + { + "epoch": 97.54768392370572, + "grad_norm": 2.284625768661499, + "learning_rate": 3.1524692296422966e-08, + "loss": 0.0894, + "step": 35800 + }, + { + "epoch": 97.55040871934605, + "grad_norm": 2.5056934356689453, + "learning_rate": 3.145471307269277e-08, + "loss": 0.1508, + "step": 35801 + }, + { + "epoch": 97.55313351498637, + "grad_norm": 2.7053492069244385, + "learning_rate": 3.138481148367123e-08, + "loss": 0.0803, + "step": 35802 + }, + { + "epoch": 97.5558583106267, + "grad_norm": 2.577946662902832, + "learning_rate": 3.1314987529905696e-08, + "loss": 0.0287, + "step": 35803 + }, + { + "epoch": 97.55858310626704, + "grad_norm": 4.119221210479736, + "learning_rate": 3.124524121193684e-08, + "loss": 0.1726, + "step": 35804 + }, + { + "epoch": 97.56130790190736, + "grad_norm": 2.4762916564941406, + "learning_rate": 3.117557253030978e-08, + "loss": 0.277, + "step": 35805 + }, + { + "epoch": 97.56403269754769, + "grad_norm": 2.0731794834136963, + "learning_rate": 3.1105981485566314e-08, + "loss": 0.0502, + "step": 35806 + }, + { + "epoch": 97.566757493188, + "grad_norm": 5.1868109703063965, + "learning_rate": 3.1036468078248226e-08, + "loss": 0.0834, + "step": 35807 + }, + { + "epoch": 97.56948228882834, + "grad_norm": 10.438080787658691, + "learning_rate": 3.0967032308897304e-08, + "loss": 0.0165, + "step": 35808 + }, + { + "epoch": 97.57220708446866, + "grad_norm": 2.423152446746826, + "learning_rate": 3.089767417805534e-08, + "loss": 0.0232, + "step": 35809 + }, + { + "epoch": 97.57493188010899, + "grad_norm": 2.390340805053711, + "learning_rate": 3.082839368626078e-08, + "loss": 0.147, + "step": 35810 + }, + { + "epoch": 97.57765667574932, + "grad_norm": 2.715242624282837, + "learning_rate": 3.075919083405321e-08, + "loss": 0.0534, + "step": 35811 + }, + { + "epoch": 97.58038147138964, + "grad_norm": 2.4230451583862305, + "learning_rate": 3.06900656219733e-08, + "loss": 0.0555, + "step": 35812 + }, + { + "epoch": 97.58310626702998, + "grad_norm": 2.556752920150757, + "learning_rate": 3.0621018050557285e-08, + "loss": 0.0471, + "step": 35813 + }, + { + "epoch": 97.5858310626703, + "grad_norm": 2.55846905708313, + "learning_rate": 3.0552048120343625e-08, + "loss": 0.0276, + "step": 35814 + }, + { + "epoch": 97.58855585831063, + "grad_norm": 2.751675605773926, + "learning_rate": 3.048315583187078e-08, + "loss": 0.0822, + "step": 35815 + }, + { + "epoch": 97.59128065395096, + "grad_norm": 2.4820244312286377, + "learning_rate": 3.041434118567388e-08, + "loss": 0.0377, + "step": 35816 + }, + { + "epoch": 97.59400544959128, + "grad_norm": 1.261082649230957, + "learning_rate": 3.034560418228916e-08, + "loss": 0.0173, + "step": 35817 + }, + { + "epoch": 97.59673024523161, + "grad_norm": 3.7353408336639404, + "learning_rate": 3.027694482225285e-08, + "loss": 0.1013, + "step": 35818 + }, + { + "epoch": 97.59945504087193, + "grad_norm": 2.633507251739502, + "learning_rate": 3.020836310609787e-08, + "loss": 0.0305, + "step": 35819 + }, + { + "epoch": 97.60217983651226, + "grad_norm": 2.2586116790771484, + "learning_rate": 3.0139859034359344e-08, + "loss": 0.0249, + "step": 35820 + }, + { + "epoch": 97.60490463215258, + "grad_norm": 2.453795909881592, + "learning_rate": 3.0071432607571284e-08, + "loss": 0.0449, + "step": 35821 + }, + { + "epoch": 97.60762942779292, + "grad_norm": 1.8358465433120728, + "learning_rate": 3.000308382626549e-08, + "loss": 0.0244, + "step": 35822 + }, + { + "epoch": 97.61035422343325, + "grad_norm": 2.564528703689575, + "learning_rate": 2.9934812690974865e-08, + "loss": 0.0816, + "step": 35823 + }, + { + "epoch": 97.61307901907357, + "grad_norm": 2.7338919639587402, + "learning_rate": 2.986661920223122e-08, + "loss": 0.0786, + "step": 35824 + }, + { + "epoch": 97.6158038147139, + "grad_norm": 3.4388840198516846, + "learning_rate": 2.9798503360565225e-08, + "loss": 0.1104, + "step": 35825 + }, + { + "epoch": 97.61852861035422, + "grad_norm": 3.998267412185669, + "learning_rate": 2.9730465166508683e-08, + "loss": 0.1049, + "step": 35826 + }, + { + "epoch": 97.62125340599455, + "grad_norm": 2.5960872173309326, + "learning_rate": 2.966250462058895e-08, + "loss": 0.0555, + "step": 35827 + }, + { + "epoch": 97.62397820163488, + "grad_norm": 3.861147880554199, + "learning_rate": 2.9594621723336715e-08, + "loss": 0.1128, + "step": 35828 + }, + { + "epoch": 97.6267029972752, + "grad_norm": 2.300067663192749, + "learning_rate": 2.952681647528155e-08, + "loss": 0.0264, + "step": 35829 + }, + { + "epoch": 97.62942779291554, + "grad_norm": 2.9510819911956787, + "learning_rate": 2.9459088876950814e-08, + "loss": 0.0454, + "step": 35830 + }, + { + "epoch": 97.63215258855585, + "grad_norm": 2.6466665267944336, + "learning_rate": 2.939143892887075e-08, + "loss": 0.0342, + "step": 35831 + }, + { + "epoch": 97.63487738419619, + "grad_norm": 2.8660361766815186, + "learning_rate": 2.932386663156983e-08, + "loss": 0.0273, + "step": 35832 + }, + { + "epoch": 97.6376021798365, + "grad_norm": 2.7252252101898193, + "learning_rate": 2.9256371985573183e-08, + "loss": 0.0471, + "step": 35833 + }, + { + "epoch": 97.64032697547684, + "grad_norm": 1.7736456394195557, + "learning_rate": 2.918895499140817e-08, + "loss": 0.025, + "step": 35834 + }, + { + "epoch": 97.64305177111717, + "grad_norm": 3.138150691986084, + "learning_rate": 2.91216156495977e-08, + "loss": 0.0954, + "step": 35835 + }, + { + "epoch": 97.64577656675749, + "grad_norm": 2.4309849739074707, + "learning_rate": 2.9054353960666914e-08, + "loss": 0.038, + "step": 35836 + }, + { + "epoch": 97.64850136239782, + "grad_norm": 2.0006468296051025, + "learning_rate": 2.8987169925140947e-08, + "loss": 0.0347, + "step": 35837 + }, + { + "epoch": 97.65122615803814, + "grad_norm": 1.5603562593460083, + "learning_rate": 2.89200635435416e-08, + "loss": 0.0622, + "step": 35838 + }, + { + "epoch": 97.65395095367847, + "grad_norm": 2.112581491470337, + "learning_rate": 2.885303481639179e-08, + "loss": 0.0379, + "step": 35839 + }, + { + "epoch": 97.65667574931881, + "grad_norm": 1.983702540397644, + "learning_rate": 2.8786083744213322e-08, + "loss": 0.0239, + "step": 35840 + }, + { + "epoch": 97.65940054495913, + "grad_norm": 2.877119541168213, + "learning_rate": 2.8719210327528e-08, + "loss": 0.097, + "step": 35841 + }, + { + "epoch": 97.66212534059946, + "grad_norm": 1.8336174488067627, + "learning_rate": 2.8652414566857633e-08, + "loss": 0.0228, + "step": 35842 + }, + { + "epoch": 97.66485013623978, + "grad_norm": 1.8584233522415161, + "learning_rate": 2.858569646272069e-08, + "loss": 0.0318, + "step": 35843 + }, + { + "epoch": 97.66757493188011, + "grad_norm": 4.630131721496582, + "learning_rate": 2.8519056015636758e-08, + "loss": 0.2295, + "step": 35844 + }, + { + "epoch": 97.67029972752043, + "grad_norm": 6.461533069610596, + "learning_rate": 2.845249322612542e-08, + "loss": 0.0283, + "step": 35845 + }, + { + "epoch": 97.67302452316076, + "grad_norm": 2.585191488265991, + "learning_rate": 2.8386008094706264e-08, + "loss": 0.0307, + "step": 35846 + }, + { + "epoch": 97.6757493188011, + "grad_norm": 2.753736972808838, + "learning_rate": 2.8319600621895537e-08, + "loss": 0.0288, + "step": 35847 + }, + { + "epoch": 97.67847411444141, + "grad_norm": 1.8776227235794067, + "learning_rate": 2.8253270808209498e-08, + "loss": 0.0481, + "step": 35848 + }, + { + "epoch": 97.68119891008175, + "grad_norm": 2.0777225494384766, + "learning_rate": 2.818701865416773e-08, + "loss": 0.0196, + "step": 35849 + }, + { + "epoch": 97.68392370572207, + "grad_norm": 3.543302059173584, + "learning_rate": 2.8120844160283155e-08, + "loss": 0.0319, + "step": 35850 + }, + { + "epoch": 97.6866485013624, + "grad_norm": 2.379166841506958, + "learning_rate": 2.805474732707425e-08, + "loss": 0.0935, + "step": 35851 + }, + { + "epoch": 97.68937329700273, + "grad_norm": 1.4063812494277954, + "learning_rate": 2.7988728155052825e-08, + "loss": 0.0199, + "step": 35852 + }, + { + "epoch": 97.69209809264305, + "grad_norm": 2.5580313205718994, + "learning_rate": 2.7922786644734023e-08, + "loss": 0.0546, + "step": 35853 + }, + { + "epoch": 97.69482288828338, + "grad_norm": 4.716394424438477, + "learning_rate": 2.785692279663188e-08, + "loss": 0.0518, + "step": 35854 + }, + { + "epoch": 97.6975476839237, + "grad_norm": 12.530521392822266, + "learning_rate": 2.779113661125932e-08, + "loss": 0.0395, + "step": 35855 + }, + { + "epoch": 97.70027247956403, + "grad_norm": 2.3398494720458984, + "learning_rate": 2.7725428089128148e-08, + "loss": 0.0687, + "step": 35856 + }, + { + "epoch": 97.70299727520435, + "grad_norm": 2.703486680984497, + "learning_rate": 2.7659797230751295e-08, + "loss": 0.1221, + "step": 35857 + }, + { + "epoch": 97.70572207084469, + "grad_norm": 2.562216281890869, + "learning_rate": 2.759424403663835e-08, + "loss": 0.1106, + "step": 35858 + }, + { + "epoch": 97.70844686648502, + "grad_norm": 2.428530693054199, + "learning_rate": 2.752876850730002e-08, + "loss": 0.0369, + "step": 35859 + }, + { + "epoch": 97.71117166212534, + "grad_norm": 2.3940417766571045, + "learning_rate": 2.7463370643247e-08, + "loss": 0.0773, + "step": 35860 + }, + { + "epoch": 97.71389645776567, + "grad_norm": 3.7675716876983643, + "learning_rate": 2.7398050444987777e-08, + "loss": 0.0825, + "step": 35861 + }, + { + "epoch": 97.71662125340599, + "grad_norm": 2.7979650497436523, + "learning_rate": 2.7332807913033055e-08, + "loss": 0.1596, + "step": 35862 + }, + { + "epoch": 97.71934604904632, + "grad_norm": 3.132063150405884, + "learning_rate": 2.7267643047887982e-08, + "loss": 0.06, + "step": 35863 + }, + { + "epoch": 97.72207084468666, + "grad_norm": 3.481983184814453, + "learning_rate": 2.720255585006215e-08, + "loss": 0.0613, + "step": 35864 + }, + { + "epoch": 97.72479564032697, + "grad_norm": 2.4922659397125244, + "learning_rate": 2.7137546320061824e-08, + "loss": 0.0716, + "step": 35865 + }, + { + "epoch": 97.7275204359673, + "grad_norm": 4.750972270965576, + "learning_rate": 2.7072614458393263e-08, + "loss": 0.0408, + "step": 35866 + }, + { + "epoch": 97.73024523160763, + "grad_norm": 2.241948127746582, + "learning_rate": 2.7007760265561623e-08, + "loss": 0.0278, + "step": 35867 + }, + { + "epoch": 97.73297002724796, + "grad_norm": 2.3033273220062256, + "learning_rate": 2.694298374207316e-08, + "loss": 0.0254, + "step": 35868 + }, + { + "epoch": 97.73569482288828, + "grad_norm": 3.9879684448242188, + "learning_rate": 2.6878284888431916e-08, + "loss": 0.0698, + "step": 35869 + }, + { + "epoch": 97.73841961852861, + "grad_norm": 2.7510740756988525, + "learning_rate": 2.6813663705141935e-08, + "loss": 0.109, + "step": 35870 + }, + { + "epoch": 97.74114441416894, + "grad_norm": 3.931377410888672, + "learning_rate": 2.6749120192705037e-08, + "loss": 0.1352, + "step": 35871 + }, + { + "epoch": 97.74386920980926, + "grad_norm": 2.564488172531128, + "learning_rate": 2.668465435162637e-08, + "loss": 0.1061, + "step": 35872 + }, + { + "epoch": 97.7465940054496, + "grad_norm": 4.47464656829834, + "learning_rate": 2.6620266182405542e-08, + "loss": 0.233, + "step": 35873 + }, + { + "epoch": 97.74931880108991, + "grad_norm": 1.857589602470398, + "learning_rate": 2.6555955685545476e-08, + "loss": 0.0255, + "step": 35874 + }, + { + "epoch": 97.75204359673025, + "grad_norm": 2.577150583267212, + "learning_rate": 2.6491722861546887e-08, + "loss": 0.0413, + "step": 35875 + }, + { + "epoch": 97.75476839237058, + "grad_norm": 3.132887601852417, + "learning_rate": 2.6427567710909374e-08, + "loss": 0.0273, + "step": 35876 + }, + { + "epoch": 97.7574931880109, + "grad_norm": 1.9996192455291748, + "learning_rate": 2.636349023413254e-08, + "loss": 0.0997, + "step": 35877 + }, + { + "epoch": 97.76021798365123, + "grad_norm": 2.1004786491394043, + "learning_rate": 2.629949043171709e-08, + "loss": 0.0346, + "step": 35878 + }, + { + "epoch": 97.76294277929155, + "grad_norm": 1.7419300079345703, + "learning_rate": 2.62355683041593e-08, + "loss": 0.0293, + "step": 35879 + }, + { + "epoch": 97.76566757493188, + "grad_norm": 2.583218812942505, + "learning_rate": 2.6171723851957652e-08, + "loss": 0.0338, + "step": 35880 + }, + { + "epoch": 97.7683923705722, + "grad_norm": 1.9477218389511108, + "learning_rate": 2.6107957075609537e-08, + "loss": 0.029, + "step": 35881 + }, + { + "epoch": 97.77111716621253, + "grad_norm": 1.9340739250183105, + "learning_rate": 2.6044267975612324e-08, + "loss": 0.0298, + "step": 35882 + }, + { + "epoch": 97.77384196185287, + "grad_norm": 2.064065933227539, + "learning_rate": 2.5980656552461182e-08, + "loss": 0.1699, + "step": 35883 + }, + { + "epoch": 97.77656675749319, + "grad_norm": 2.660323143005371, + "learning_rate": 2.5917122806652374e-08, + "loss": 0.1159, + "step": 35884 + }, + { + "epoch": 97.77929155313352, + "grad_norm": 2.3571033477783203, + "learning_rate": 2.585366673867884e-08, + "loss": 0.1284, + "step": 35885 + }, + { + "epoch": 97.78201634877384, + "grad_norm": 2.6144180297851562, + "learning_rate": 2.5790288349035742e-08, + "loss": 0.1057, + "step": 35886 + }, + { + "epoch": 97.78474114441417, + "grad_norm": 2.8029589653015137, + "learning_rate": 2.5726987638218238e-08, + "loss": 0.0518, + "step": 35887 + }, + { + "epoch": 97.7874659400545, + "grad_norm": 2.6526236534118652, + "learning_rate": 2.5663764606717046e-08, + "loss": 0.0926, + "step": 35888 + }, + { + "epoch": 97.79019073569482, + "grad_norm": 3.7425220012664795, + "learning_rate": 2.5600619255025106e-08, + "loss": 0.1374, + "step": 35889 + }, + { + "epoch": 97.79291553133515, + "grad_norm": 2.5686843395233154, + "learning_rate": 2.5537551583635356e-08, + "loss": 0.0217, + "step": 35890 + }, + { + "epoch": 97.79564032697547, + "grad_norm": 1.8298101425170898, + "learning_rate": 2.5474561593037406e-08, + "loss": 0.0203, + "step": 35891 + }, + { + "epoch": 97.7983651226158, + "grad_norm": 3.1686811447143555, + "learning_rate": 2.5411649283723083e-08, + "loss": 0.0518, + "step": 35892 + }, + { + "epoch": 97.80108991825612, + "grad_norm": 2.802241325378418, + "learning_rate": 2.5348814656181996e-08, + "loss": 0.0389, + "step": 35893 + }, + { + "epoch": 97.80381471389646, + "grad_norm": 2.4015142917633057, + "learning_rate": 2.5286057710902647e-08, + "loss": 0.134, + "step": 35894 + }, + { + "epoch": 97.80653950953679, + "grad_norm": 2.5389842987060547, + "learning_rate": 2.5223378448374636e-08, + "loss": 0.108, + "step": 35895 + }, + { + "epoch": 97.80926430517711, + "grad_norm": 2.8739893436431885, + "learning_rate": 2.5160776869086467e-08, + "loss": 0.1641, + "step": 35896 + }, + { + "epoch": 97.81198910081744, + "grad_norm": 1.6186907291412354, + "learning_rate": 2.509825297352442e-08, + "loss": 0.0279, + "step": 35897 + }, + { + "epoch": 97.81471389645776, + "grad_norm": 2.8059005737304688, + "learning_rate": 2.5035806762175874e-08, + "loss": 0.0389, + "step": 35898 + }, + { + "epoch": 97.8174386920981, + "grad_norm": 2.3546082973480225, + "learning_rate": 2.4973438235528223e-08, + "loss": 0.0934, + "step": 35899 + }, + { + "epoch": 97.82016348773843, + "grad_norm": 1.5940228700637817, + "learning_rate": 2.4911147394065526e-08, + "loss": 0.0817, + "step": 35900 + }, + { + "epoch": 97.82288828337875, + "grad_norm": 2.4367599487304688, + "learning_rate": 2.484893423827406e-08, + "loss": 0.0494, + "step": 35901 + }, + { + "epoch": 97.82561307901908, + "grad_norm": 3.33247447013855, + "learning_rate": 2.4786798768638987e-08, + "loss": 0.0252, + "step": 35902 + }, + { + "epoch": 97.8283378746594, + "grad_norm": 1.9521251916885376, + "learning_rate": 2.4724740985642148e-08, + "loss": 0.0405, + "step": 35903 + }, + { + "epoch": 97.83106267029973, + "grad_norm": 2.5466678142547607, + "learning_rate": 2.466276088976871e-08, + "loss": 0.0296, + "step": 35904 + }, + { + "epoch": 97.83378746594005, + "grad_norm": 1.8345268964767456, + "learning_rate": 2.4600858481500512e-08, + "loss": 0.0286, + "step": 35905 + }, + { + "epoch": 97.83651226158038, + "grad_norm": 1.7329964637756348, + "learning_rate": 2.4539033761319387e-08, + "loss": 0.0206, + "step": 35906 + }, + { + "epoch": 97.83923705722071, + "grad_norm": 4.210390090942383, + "learning_rate": 2.447728672970717e-08, + "loss": 0.0614, + "step": 35907 + }, + { + "epoch": 97.84196185286103, + "grad_norm": 1.8690903186798096, + "learning_rate": 2.4415617387145708e-08, + "loss": 0.0619, + "step": 35908 + }, + { + "epoch": 97.84468664850137, + "grad_norm": 2.3672852516174316, + "learning_rate": 2.4354025734113495e-08, + "loss": 0.0262, + "step": 35909 + }, + { + "epoch": 97.84741144414168, + "grad_norm": 3.118413209915161, + "learning_rate": 2.4292511771091266e-08, + "loss": 0.0801, + "step": 35910 + }, + { + "epoch": 97.85013623978202, + "grad_norm": 1.7585015296936035, + "learning_rate": 2.4231075498557522e-08, + "loss": 0.0294, + "step": 35911 + }, + { + "epoch": 97.85286103542235, + "grad_norm": 1.6392691135406494, + "learning_rate": 2.416971691699188e-08, + "loss": 0.0683, + "step": 35912 + }, + { + "epoch": 97.85558583106267, + "grad_norm": 4.103469371795654, + "learning_rate": 2.410843602687063e-08, + "loss": 0.0183, + "step": 35913 + }, + { + "epoch": 97.858310626703, + "grad_norm": 3.2853872776031494, + "learning_rate": 2.4047232828672272e-08, + "loss": 0.0936, + "step": 35914 + }, + { + "epoch": 97.86103542234332, + "grad_norm": 2.474257469177246, + "learning_rate": 2.39861073228731e-08, + "loss": 0.0541, + "step": 35915 + }, + { + "epoch": 97.86376021798365, + "grad_norm": 2.428039073944092, + "learning_rate": 2.392505950994939e-08, + "loss": 0.0708, + "step": 35916 + }, + { + "epoch": 97.86648501362397, + "grad_norm": 1.4760277271270752, + "learning_rate": 2.386408939037521e-08, + "loss": 0.0934, + "step": 35917 + }, + { + "epoch": 97.8692098092643, + "grad_norm": 3.3375816345214844, + "learning_rate": 2.380319696462685e-08, + "loss": 0.0295, + "step": 35918 + }, + { + "epoch": 97.87193460490464, + "grad_norm": 2.3691625595092773, + "learning_rate": 2.3742382233178374e-08, + "loss": 0.0826, + "step": 35919 + }, + { + "epoch": 97.87465940054496, + "grad_norm": 2.846940517425537, + "learning_rate": 2.3681645196502733e-08, + "loss": 0.0383, + "step": 35920 + }, + { + "epoch": 97.87738419618529, + "grad_norm": 1.978087067604065, + "learning_rate": 2.3620985855072887e-08, + "loss": 0.0409, + "step": 35921 + }, + { + "epoch": 97.88010899182561, + "grad_norm": 2.6109161376953125, + "learning_rate": 2.3560404209362897e-08, + "loss": 0.1963, + "step": 35922 + }, + { + "epoch": 97.88283378746594, + "grad_norm": 2.762831687927246, + "learning_rate": 2.349990025984239e-08, + "loss": 0.0846, + "step": 35923 + }, + { + "epoch": 97.88555858310627, + "grad_norm": 2.228059768676758, + "learning_rate": 2.343947400698432e-08, + "loss": 0.0227, + "step": 35924 + }, + { + "epoch": 97.88828337874659, + "grad_norm": 2.9268105030059814, + "learning_rate": 2.3379125451258312e-08, + "loss": 0.1677, + "step": 35925 + }, + { + "epoch": 97.89100817438693, + "grad_norm": 2.174006938934326, + "learning_rate": 2.3318854593135098e-08, + "loss": 0.0294, + "step": 35926 + }, + { + "epoch": 97.89373297002724, + "grad_norm": 1.953399896621704, + "learning_rate": 2.3258661433082087e-08, + "loss": 0.0776, + "step": 35927 + }, + { + "epoch": 97.89645776566758, + "grad_norm": 3.0561678409576416, + "learning_rate": 2.3198545971571118e-08, + "loss": 0.0314, + "step": 35928 + }, + { + "epoch": 97.8991825613079, + "grad_norm": 2.6855521202087402, + "learning_rate": 2.3138508209067377e-08, + "loss": 0.0363, + "step": 35929 + }, + { + "epoch": 97.90190735694823, + "grad_norm": 2.544351577758789, + "learning_rate": 2.307854814604049e-08, + "loss": 0.0203, + "step": 35930 + }, + { + "epoch": 97.90463215258856, + "grad_norm": 2.0955066680908203, + "learning_rate": 2.301866578295675e-08, + "loss": 0.0602, + "step": 35931 + }, + { + "epoch": 97.90735694822888, + "grad_norm": 2.097294569015503, + "learning_rate": 2.2958861120283558e-08, + "loss": 0.0217, + "step": 35932 + }, + { + "epoch": 97.91008174386921, + "grad_norm": 2.20684814453125, + "learning_rate": 2.2899134158483883e-08, + "loss": 0.1108, + "step": 35933 + }, + { + "epoch": 97.91280653950953, + "grad_norm": 2.080538749694824, + "learning_rate": 2.283948489802512e-08, + "loss": 0.0271, + "step": 35934 + }, + { + "epoch": 97.91553133514986, + "grad_norm": 2.9684462547302246, + "learning_rate": 2.2779913339371352e-08, + "loss": 0.0647, + "step": 35935 + }, + { + "epoch": 97.9182561307902, + "grad_norm": 3.363239049911499, + "learning_rate": 2.2720419482987754e-08, + "loss": 0.0244, + "step": 35936 + }, + { + "epoch": 97.92098092643052, + "grad_norm": 4.937668800354004, + "learning_rate": 2.2661003329335073e-08, + "loss": 0.0565, + "step": 35937 + }, + { + "epoch": 97.92370572207085, + "grad_norm": 2.4344513416290283, + "learning_rate": 2.2601664878877384e-08, + "loss": 0.0365, + "step": 35938 + }, + { + "epoch": 97.92643051771117, + "grad_norm": 2.5451300144195557, + "learning_rate": 2.2542404132077643e-08, + "loss": 0.1251, + "step": 35939 + }, + { + "epoch": 97.9291553133515, + "grad_norm": 1.9203739166259766, + "learning_rate": 2.248322108939549e-08, + "loss": 0.0661, + "step": 35940 + }, + { + "epoch": 97.93188010899182, + "grad_norm": 2.2082369327545166, + "learning_rate": 2.2424115751293885e-08, + "loss": 0.0472, + "step": 35941 + }, + { + "epoch": 97.93460490463215, + "grad_norm": 2.3483364582061768, + "learning_rate": 2.2365088118231347e-08, + "loss": 0.0504, + "step": 35942 + }, + { + "epoch": 97.93732970027249, + "grad_norm": 2.3083558082580566, + "learning_rate": 2.2306138190668624e-08, + "loss": 0.0269, + "step": 35943 + }, + { + "epoch": 97.9400544959128, + "grad_norm": 2.189378261566162, + "learning_rate": 2.2247265969065347e-08, + "loss": 0.0314, + "step": 35944 + }, + { + "epoch": 97.94277929155314, + "grad_norm": 2.719431161880493, + "learning_rate": 2.2188471453877815e-08, + "loss": 0.0557, + "step": 35945 + }, + { + "epoch": 97.94550408719346, + "grad_norm": 2.964179754257202, + "learning_rate": 2.212975464556677e-08, + "loss": 0.0734, + "step": 35946 + }, + { + "epoch": 97.94822888283379, + "grad_norm": 1.7924069166183472, + "learning_rate": 2.2071115544587406e-08, + "loss": 0.0266, + "step": 35947 + }, + { + "epoch": 97.95095367847412, + "grad_norm": 2.598353862762451, + "learning_rate": 2.2012554151397137e-08, + "loss": 0.0391, + "step": 35948 + }, + { + "epoch": 97.95367847411444, + "grad_norm": 1.3391518592834473, + "learning_rate": 2.195407046645115e-08, + "loss": 0.019, + "step": 35949 + }, + { + "epoch": 97.95640326975477, + "grad_norm": 1.5363374948501587, + "learning_rate": 2.1895664490206857e-08, + "loss": 0.0279, + "step": 35950 + }, + { + "epoch": 97.95912806539509, + "grad_norm": 3.2424540519714355, + "learning_rate": 2.1837336223117233e-08, + "loss": 0.0335, + "step": 35951 + }, + { + "epoch": 97.96185286103542, + "grad_norm": 2.925813674926758, + "learning_rate": 2.1779085665637467e-08, + "loss": 0.0579, + "step": 35952 + }, + { + "epoch": 97.96457765667574, + "grad_norm": 2.4966001510620117, + "learning_rate": 2.172091281822164e-08, + "loss": 0.0526, + "step": 35953 + }, + { + "epoch": 97.96730245231608, + "grad_norm": 2.0699377059936523, + "learning_rate": 2.1662817681321613e-08, + "loss": 0.0637, + "step": 35954 + }, + { + "epoch": 97.97002724795641, + "grad_norm": 2.216644525527954, + "learning_rate": 2.1604800255390356e-08, + "loss": 0.0928, + "step": 35955 + }, + { + "epoch": 97.97275204359673, + "grad_norm": 3.448300361633301, + "learning_rate": 2.1546860540879734e-08, + "loss": 0.0463, + "step": 35956 + }, + { + "epoch": 97.97547683923706, + "grad_norm": 3.955340623855591, + "learning_rate": 2.14889985382416e-08, + "loss": 0.0295, + "step": 35957 + }, + { + "epoch": 97.97820163487738, + "grad_norm": 4.31251335144043, + "learning_rate": 2.14312142479256e-08, + "loss": 0.1193, + "step": 35958 + }, + { + "epoch": 97.98092643051771, + "grad_norm": 4.111076354980469, + "learning_rate": 2.1373507670381376e-08, + "loss": 0.0726, + "step": 35959 + }, + { + "epoch": 97.98365122615803, + "grad_norm": 3.263672351837158, + "learning_rate": 2.1315878806060787e-08, + "loss": 0.0558, + "step": 35960 + }, + { + "epoch": 97.98637602179836, + "grad_norm": 2.007985830307007, + "learning_rate": 2.125832765541014e-08, + "loss": 0.027, + "step": 35961 + }, + { + "epoch": 97.9891008174387, + "grad_norm": 2.3174593448638916, + "learning_rate": 2.1200854218877964e-08, + "loss": 0.0367, + "step": 35962 + }, + { + "epoch": 97.99182561307902, + "grad_norm": 1.442603349685669, + "learning_rate": 2.1143458496912795e-08, + "loss": 0.0162, + "step": 35963 + }, + { + "epoch": 97.99455040871935, + "grad_norm": 4.202771186828613, + "learning_rate": 2.1086140489960937e-08, + "loss": 0.0444, + "step": 35964 + }, + { + "epoch": 97.99727520435967, + "grad_norm": 2.63293194770813, + "learning_rate": 2.1028900198468704e-08, + "loss": 0.0247, + "step": 35965 + }, + { + "epoch": 98.0, + "grad_norm": 2.4509873390197754, + "learning_rate": 2.0971737622883515e-08, + "loss": 0.0524, + "step": 35966 + }, + { + "epoch": 98.00272479564033, + "grad_norm": 1.954356074333191, + "learning_rate": 2.0914652763648348e-08, + "loss": 0.0263, + "step": 35967 + }, + { + "epoch": 98.00544959128065, + "grad_norm": 2.8290443420410156, + "learning_rate": 2.085764562120951e-08, + "loss": 0.0574, + "step": 35968 + }, + { + "epoch": 98.00817438692098, + "grad_norm": 2.316638231277466, + "learning_rate": 2.0800716196008874e-08, + "loss": 0.0668, + "step": 35969 + }, + { + "epoch": 98.0108991825613, + "grad_norm": 4.08411979675293, + "learning_rate": 2.074386448849164e-08, + "loss": 0.0718, + "step": 35970 + }, + { + "epoch": 98.01362397820164, + "grad_norm": 2.340932846069336, + "learning_rate": 2.068709049910078e-08, + "loss": 0.0681, + "step": 35971 + }, + { + "epoch": 98.01634877384195, + "grad_norm": 2.5804271697998047, + "learning_rate": 2.0630394228277063e-08, + "loss": 0.0828, + "step": 35972 + }, + { + "epoch": 98.01907356948229, + "grad_norm": 2.2683908939361572, + "learning_rate": 2.057377567646235e-08, + "loss": 0.0313, + "step": 35973 + }, + { + "epoch": 98.02179836512262, + "grad_norm": 2.1464920043945312, + "learning_rate": 2.05172348440974e-08, + "loss": 0.0302, + "step": 35974 + }, + { + "epoch": 98.02452316076294, + "grad_norm": 2.4043939113616943, + "learning_rate": 2.0460771731624086e-08, + "loss": 0.0261, + "step": 35975 + }, + { + "epoch": 98.02724795640327, + "grad_norm": 2.5983052253723145, + "learning_rate": 2.040438633948094e-08, + "loss": 0.1276, + "step": 35976 + }, + { + "epoch": 98.02997275204359, + "grad_norm": 2.8535356521606445, + "learning_rate": 2.034807866810762e-08, + "loss": 0.1196, + "step": 35977 + }, + { + "epoch": 98.03269754768392, + "grad_norm": 2.621011972427368, + "learning_rate": 2.029184871794154e-08, + "loss": 0.177, + "step": 35978 + }, + { + "epoch": 98.03542234332426, + "grad_norm": 3.7379093170166016, + "learning_rate": 2.0235696489421254e-08, + "loss": 0.2048, + "step": 35979 + }, + { + "epoch": 98.03814713896458, + "grad_norm": 2.3887557983398438, + "learning_rate": 2.0179621982984178e-08, + "loss": 0.1078, + "step": 35980 + }, + { + "epoch": 98.04087193460491, + "grad_norm": 7.204305171966553, + "learning_rate": 2.0123625199067743e-08, + "loss": 0.093, + "step": 35981 + }, + { + "epoch": 98.04359673024523, + "grad_norm": 2.4790451526641846, + "learning_rate": 2.0067706138107157e-08, + "loss": 0.0773, + "step": 35982 + }, + { + "epoch": 98.04632152588556, + "grad_norm": 2.852440595626831, + "learning_rate": 2.001186480053763e-08, + "loss": 0.1036, + "step": 35983 + }, + { + "epoch": 98.04904632152588, + "grad_norm": 1.650865077972412, + "learning_rate": 1.9956101186794362e-08, + "loss": 0.0369, + "step": 35984 + }, + { + "epoch": 98.05177111716621, + "grad_norm": 2.4738357067108154, + "learning_rate": 1.990041529731257e-08, + "loss": 0.0237, + "step": 35985 + }, + { + "epoch": 98.05449591280654, + "grad_norm": 2.4581356048583984, + "learning_rate": 1.9844807132524123e-08, + "loss": 0.0202, + "step": 35986 + }, + { + "epoch": 98.05722070844686, + "grad_norm": 2.1589486598968506, + "learning_rate": 1.9789276692863125e-08, + "loss": 0.0362, + "step": 35987 + }, + { + "epoch": 98.0599455040872, + "grad_norm": 3.0614559650421143, + "learning_rate": 1.9733823978762555e-08, + "loss": 0.0566, + "step": 35988 + }, + { + "epoch": 98.06267029972751, + "grad_norm": 1.0813218355178833, + "learning_rate": 1.96784489906543e-08, + "loss": 0.0123, + "step": 35989 + }, + { + "epoch": 98.06539509536785, + "grad_norm": 3.7860329151153564, + "learning_rate": 1.9623151728968004e-08, + "loss": 0.0522, + "step": 35990 + }, + { + "epoch": 98.06811989100818, + "grad_norm": 5.7503204345703125, + "learning_rate": 1.9567932194135553e-08, + "loss": 0.0411, + "step": 35991 + }, + { + "epoch": 98.0708446866485, + "grad_norm": 1.8334646224975586, + "learning_rate": 1.951279038658771e-08, + "loss": 0.0239, + "step": 35992 + }, + { + "epoch": 98.07356948228883, + "grad_norm": 3.1036291122436523, + "learning_rate": 1.9457726306751913e-08, + "loss": 0.1188, + "step": 35993 + }, + { + "epoch": 98.07629427792915, + "grad_norm": 1.93489670753479, + "learning_rate": 1.9402739955058925e-08, + "loss": 0.028, + "step": 35994 + }, + { + "epoch": 98.07901907356948, + "grad_norm": 2.9652209281921387, + "learning_rate": 1.9347831331936186e-08, + "loss": 0.2568, + "step": 35995 + }, + { + "epoch": 98.0817438692098, + "grad_norm": 2.488975763320923, + "learning_rate": 1.9293000437811127e-08, + "loss": 0.0921, + "step": 35996 + }, + { + "epoch": 98.08446866485014, + "grad_norm": 2.527630567550659, + "learning_rate": 1.9238247273110077e-08, + "loss": 0.0303, + "step": 35997 + }, + { + "epoch": 98.08719346049047, + "grad_norm": 1.9312889575958252, + "learning_rate": 1.9183571838261584e-08, + "loss": 0.0268, + "step": 35998 + }, + { + "epoch": 98.08991825613079, + "grad_norm": 2.61395001411438, + "learning_rate": 1.9128974133689748e-08, + "loss": 0.0212, + "step": 35999 + }, + { + "epoch": 98.09264305177112, + "grad_norm": 1.9238824844360352, + "learning_rate": 1.907445415981979e-08, + "loss": 0.0285, + "step": 36000 + }, + { + "epoch": 98.09536784741144, + "grad_norm": 1.5434598922729492, + "learning_rate": 1.902001191707803e-08, + "loss": 0.0334, + "step": 36001 + }, + { + "epoch": 98.09809264305177, + "grad_norm": 1.6021926403045654, + "learning_rate": 1.8965647405885247e-08, + "loss": 0.0423, + "step": 36002 + }, + { + "epoch": 98.1008174386921, + "grad_norm": 2.5341289043426514, + "learning_rate": 1.8911360626668874e-08, + "loss": 0.0345, + "step": 36003 + }, + { + "epoch": 98.10354223433242, + "grad_norm": 1.9662022590637207, + "learning_rate": 1.8857151579847465e-08, + "loss": 0.1571, + "step": 36004 + }, + { + "epoch": 98.10626702997276, + "grad_norm": 1.6988203525543213, + "learning_rate": 1.8803020265847348e-08, + "loss": 0.023, + "step": 36005 + }, + { + "epoch": 98.10899182561307, + "grad_norm": 2.856804609298706, + "learning_rate": 1.874896668508597e-08, + "loss": 0.2222, + "step": 36006 + }, + { + "epoch": 98.11171662125341, + "grad_norm": 2.2739062309265137, + "learning_rate": 1.8694990837988534e-08, + "loss": 0.0209, + "step": 36007 + }, + { + "epoch": 98.11444141689373, + "grad_norm": 2.8482143878936768, + "learning_rate": 1.8641092724971388e-08, + "loss": 0.2362, + "step": 36008 + }, + { + "epoch": 98.11716621253406, + "grad_norm": 2.5867767333984375, + "learning_rate": 1.858727234645752e-08, + "loss": 0.0294, + "step": 36009 + }, + { + "epoch": 98.11989100817439, + "grad_norm": 3.1094701290130615, + "learning_rate": 1.8533529702864374e-08, + "loss": 0.0288, + "step": 36010 + }, + { + "epoch": 98.12261580381471, + "grad_norm": 2.174095869064331, + "learning_rate": 1.8479864794610502e-08, + "loss": 0.0357, + "step": 36011 + }, + { + "epoch": 98.12534059945504, + "grad_norm": 3.00639271736145, + "learning_rate": 1.8426277622114463e-08, + "loss": 0.0362, + "step": 36012 + }, + { + "epoch": 98.12806539509536, + "grad_norm": 1.8950481414794922, + "learning_rate": 1.83727681857937e-08, + "loss": 0.0212, + "step": 36013 + }, + { + "epoch": 98.1307901907357, + "grad_norm": 1.8707834482192993, + "learning_rate": 1.8319336486063433e-08, + "loss": 0.0267, + "step": 36014 + }, + { + "epoch": 98.13351498637603, + "grad_norm": 2.5346744060516357, + "learning_rate": 1.826598252334222e-08, + "loss": 0.092, + "step": 36015 + }, + { + "epoch": 98.13623978201635, + "grad_norm": 1.6178852319717407, + "learning_rate": 1.821270629804306e-08, + "loss": 0.0297, + "step": 36016 + }, + { + "epoch": 98.13896457765668, + "grad_norm": 1.6849186420440674, + "learning_rate": 1.81595078105834e-08, + "loss": 0.0295, + "step": 36017 + }, + { + "epoch": 98.141689373297, + "grad_norm": 2.2350454330444336, + "learning_rate": 1.810638706137513e-08, + "loss": 0.1013, + "step": 36018 + }, + { + "epoch": 98.14441416893733, + "grad_norm": 2.8852832317352295, + "learning_rate": 1.8053344050833478e-08, + "loss": 0.041, + "step": 36019 + }, + { + "epoch": 98.14713896457765, + "grad_norm": 3.075474262237549, + "learning_rate": 1.800037877937144e-08, + "loss": 0.0758, + "step": 36020 + }, + { + "epoch": 98.14986376021798, + "grad_norm": 2.540247917175293, + "learning_rate": 1.7947491247399808e-08, + "loss": 0.0815, + "step": 36021 + }, + { + "epoch": 98.15258855585832, + "grad_norm": 2.0208468437194824, + "learning_rate": 1.7894681455333794e-08, + "loss": 0.0339, + "step": 36022 + }, + { + "epoch": 98.15531335149863, + "grad_norm": 3.4823648929595947, + "learning_rate": 1.784194940358086e-08, + "loss": 0.0955, + "step": 36023 + }, + { + "epoch": 98.15803814713897, + "grad_norm": 2.4442057609558105, + "learning_rate": 1.7789295092555114e-08, + "loss": 0.054, + "step": 36024 + }, + { + "epoch": 98.16076294277929, + "grad_norm": 3.0584557056427, + "learning_rate": 1.773671852266401e-08, + "loss": 0.0513, + "step": 36025 + }, + { + "epoch": 98.16348773841962, + "grad_norm": 2.1580777168273926, + "learning_rate": 1.7684219694318328e-08, + "loss": 0.0257, + "step": 36026 + }, + { + "epoch": 98.16621253405995, + "grad_norm": 2.9333670139312744, + "learning_rate": 1.763179860792663e-08, + "loss": 0.1014, + "step": 36027 + }, + { + "epoch": 98.16893732970027, + "grad_norm": 2.2418465614318848, + "learning_rate": 1.7579455263897483e-08, + "loss": 0.0561, + "step": 36028 + }, + { + "epoch": 98.1716621253406, + "grad_norm": 6.723508358001709, + "learning_rate": 1.7527189662638334e-08, + "loss": 0.0727, + "step": 36029 + }, + { + "epoch": 98.17438692098092, + "grad_norm": 1.9667026996612549, + "learning_rate": 1.7475001804555525e-08, + "loss": 0.0346, + "step": 36030 + }, + { + "epoch": 98.17711171662125, + "grad_norm": 2.2690699100494385, + "learning_rate": 1.7422891690056508e-08, + "loss": 0.0321, + "step": 36031 + }, + { + "epoch": 98.17983651226157, + "grad_norm": 5.59989070892334, + "learning_rate": 1.7370859319547628e-08, + "loss": 0.0415, + "step": 36032 + }, + { + "epoch": 98.1825613079019, + "grad_norm": 2.4863879680633545, + "learning_rate": 1.7318904693431894e-08, + "loss": 0.0548, + "step": 36033 + }, + { + "epoch": 98.18528610354224, + "grad_norm": 3.2599329948425293, + "learning_rate": 1.7267027812115646e-08, + "loss": 0.1327, + "step": 36034 + }, + { + "epoch": 98.18801089918256, + "grad_norm": 2.4539096355438232, + "learning_rate": 1.7215228676003005e-08, + "loss": 0.176, + "step": 36035 + }, + { + "epoch": 98.19073569482289, + "grad_norm": 1.724025845527649, + "learning_rate": 1.7163507285495872e-08, + "loss": 0.0297, + "step": 36036 + }, + { + "epoch": 98.19346049046321, + "grad_norm": 1.5585377216339111, + "learning_rate": 1.7111863640999483e-08, + "loss": 0.1148, + "step": 36037 + }, + { + "epoch": 98.19618528610354, + "grad_norm": 1.6620516777038574, + "learning_rate": 1.706029774291351e-08, + "loss": 0.0213, + "step": 36038 + }, + { + "epoch": 98.19891008174388, + "grad_norm": 2.1538443565368652, + "learning_rate": 1.7008809591639863e-08, + "loss": 0.0811, + "step": 36039 + }, + { + "epoch": 98.2016348773842, + "grad_norm": 2.7999744415283203, + "learning_rate": 1.6957399187581547e-08, + "loss": 0.1881, + "step": 36040 + }, + { + "epoch": 98.20435967302453, + "grad_norm": 3.429708242416382, + "learning_rate": 1.6906066531137132e-08, + "loss": 0.0264, + "step": 36041 + }, + { + "epoch": 98.20708446866485, + "grad_norm": 2.7518060207366943, + "learning_rate": 1.6854811622707412e-08, + "loss": 0.0634, + "step": 36042 + }, + { + "epoch": 98.20980926430518, + "grad_norm": 3.1121954917907715, + "learning_rate": 1.6803634462690955e-08, + "loss": 0.0921, + "step": 36043 + }, + { + "epoch": 98.2125340599455, + "grad_norm": 3.7017569541931152, + "learning_rate": 1.675253505148633e-08, + "loss": 0.0453, + "step": 36044 + }, + { + "epoch": 98.21525885558583, + "grad_norm": 2.11387038230896, + "learning_rate": 1.6701513389492106e-08, + "loss": 0.0447, + "step": 36045 + }, + { + "epoch": 98.21798365122616, + "grad_norm": 1.6125013828277588, + "learning_rate": 1.6650569477104638e-08, + "loss": 0.0201, + "step": 36046 + }, + { + "epoch": 98.22070844686648, + "grad_norm": 2.024996042251587, + "learning_rate": 1.6599703314721382e-08, + "loss": 0.0343, + "step": 36047 + }, + { + "epoch": 98.22343324250681, + "grad_norm": 1.7762742042541504, + "learning_rate": 1.6548914902738688e-08, + "loss": 0.0184, + "step": 36048 + }, + { + "epoch": 98.22615803814713, + "grad_norm": 2.6843836307525635, + "learning_rate": 1.6498204241551796e-08, + "loss": 0.0272, + "step": 36049 + }, + { + "epoch": 98.22888283378747, + "grad_norm": 2.516796112060547, + "learning_rate": 1.6447571331554836e-08, + "loss": 0.1096, + "step": 36050 + }, + { + "epoch": 98.2316076294278, + "grad_norm": 1.8902513980865479, + "learning_rate": 1.6397016173143043e-08, + "loss": 0.0189, + "step": 36051 + }, + { + "epoch": 98.23433242506812, + "grad_norm": 2.1218597888946533, + "learning_rate": 1.6346538766710552e-08, + "loss": 0.0863, + "step": 36052 + }, + { + "epoch": 98.23705722070845, + "grad_norm": 3.2340712547302246, + "learning_rate": 1.6296139112649268e-08, + "loss": 0.0603, + "step": 36053 + }, + { + "epoch": 98.23978201634877, + "grad_norm": 3.202751398086548, + "learning_rate": 1.6245817211353322e-08, + "loss": 0.099, + "step": 36054 + }, + { + "epoch": 98.2425068119891, + "grad_norm": 2.7101292610168457, + "learning_rate": 1.61955730632124e-08, + "loss": 0.0193, + "step": 36055 + }, + { + "epoch": 98.24523160762942, + "grad_norm": 1.6028387546539307, + "learning_rate": 1.6145406668619523e-08, + "loss": 0.028, + "step": 36056 + }, + { + "epoch": 98.24795640326975, + "grad_norm": 3.7268786430358887, + "learning_rate": 1.609531802796549e-08, + "loss": 0.0414, + "step": 36057 + }, + { + "epoch": 98.25068119891009, + "grad_norm": 2.2488632202148438, + "learning_rate": 1.604530714163888e-08, + "loss": 0.0246, + "step": 36058 + }, + { + "epoch": 98.2534059945504, + "grad_norm": 2.7443923950195312, + "learning_rate": 1.5995374010030483e-08, + "loss": 0.1881, + "step": 36059 + }, + { + "epoch": 98.25613079019074, + "grad_norm": 4.7676682472229, + "learning_rate": 1.594551863352889e-08, + "loss": 0.0768, + "step": 36060 + }, + { + "epoch": 98.25885558583106, + "grad_norm": 2.9786148071289062, + "learning_rate": 1.5895741012521558e-08, + "loss": 0.0934, + "step": 36061 + }, + { + "epoch": 98.26158038147139, + "grad_norm": 3.0991547107696533, + "learning_rate": 1.5846041147397072e-08, + "loss": 0.044, + "step": 36062 + }, + { + "epoch": 98.26430517711172, + "grad_norm": 1.976578950881958, + "learning_rate": 1.5796419038542897e-08, + "loss": 0.0169, + "step": 36063 + }, + { + "epoch": 98.26702997275204, + "grad_norm": 2.9477286338806152, + "learning_rate": 1.5746874686344284e-08, + "loss": 0.0365, + "step": 36064 + }, + { + "epoch": 98.26975476839237, + "grad_norm": 1.9412206411361694, + "learning_rate": 1.5697408091188694e-08, + "loss": 0.0223, + "step": 36065 + }, + { + "epoch": 98.2724795640327, + "grad_norm": 2.5030250549316406, + "learning_rate": 1.5648019253459156e-08, + "loss": 0.096, + "step": 36066 + }, + { + "epoch": 98.27520435967303, + "grad_norm": 1.2808163166046143, + "learning_rate": 1.5598708173542032e-08, + "loss": 0.0171, + "step": 36067 + }, + { + "epoch": 98.27792915531334, + "grad_norm": 2.0064923763275146, + "learning_rate": 1.5549474851820346e-08, + "loss": 0.0263, + "step": 36068 + }, + { + "epoch": 98.28065395095368, + "grad_norm": 2.899421215057373, + "learning_rate": 1.5500319288678234e-08, + "loss": 0.0847, + "step": 36069 + }, + { + "epoch": 98.28337874659401, + "grad_norm": 3.2286341190338135, + "learning_rate": 1.5451241484498724e-08, + "loss": 0.0996, + "step": 36070 + }, + { + "epoch": 98.28610354223433, + "grad_norm": 2.4577603340148926, + "learning_rate": 1.5402241439663736e-08, + "loss": 0.0692, + "step": 36071 + }, + { + "epoch": 98.28882833787466, + "grad_norm": 2.7878971099853516, + "learning_rate": 1.535331915455407e-08, + "loss": 0.0471, + "step": 36072 + }, + { + "epoch": 98.29155313351498, + "grad_norm": 2.434969186782837, + "learning_rate": 1.5304474629551648e-08, + "loss": 0.0244, + "step": 36073 + }, + { + "epoch": 98.29427792915531, + "grad_norm": 2.7359986305236816, + "learning_rate": 1.5255707865036163e-08, + "loss": 0.0523, + "step": 36074 + }, + { + "epoch": 98.29700272479565, + "grad_norm": 1.842993140220642, + "learning_rate": 1.5207018861388423e-08, + "loss": 0.0415, + "step": 36075 + }, + { + "epoch": 98.29972752043597, + "grad_norm": 3.4313676357269287, + "learning_rate": 1.5158407618987014e-08, + "loss": 0.0666, + "step": 36076 + }, + { + "epoch": 98.3024523160763, + "grad_norm": 1.4521300792694092, + "learning_rate": 1.5109874138210522e-08, + "loss": 0.0185, + "step": 36077 + }, + { + "epoch": 98.30517711171662, + "grad_norm": 2.410409688949585, + "learning_rate": 1.5061418419437536e-08, + "loss": 0.0668, + "step": 36078 + }, + { + "epoch": 98.30790190735695, + "grad_norm": 1.9829622507095337, + "learning_rate": 1.5013040463043305e-08, + "loss": 0.0319, + "step": 36079 + }, + { + "epoch": 98.31062670299727, + "grad_norm": 2.0669567584991455, + "learning_rate": 1.496474026940753e-08, + "loss": 0.0344, + "step": 36080 + }, + { + "epoch": 98.3133514986376, + "grad_norm": 2.6750333309173584, + "learning_rate": 1.4916517838904355e-08, + "loss": 0.037, + "step": 36081 + }, + { + "epoch": 98.31607629427793, + "grad_norm": 1.5951213836669922, + "learning_rate": 1.4868373171910144e-08, + "loss": 0.027, + "step": 36082 + }, + { + "epoch": 98.31880108991825, + "grad_norm": 1.3873144388198853, + "learning_rate": 1.4820306268800155e-08, + "loss": 0.0157, + "step": 36083 + }, + { + "epoch": 98.32152588555859, + "grad_norm": 1.8574143648147583, + "learning_rate": 1.4772317129947422e-08, + "loss": 0.0481, + "step": 36084 + }, + { + "epoch": 98.3242506811989, + "grad_norm": 3.45485782623291, + "learning_rate": 1.47244057557272e-08, + "loss": 0.1301, + "step": 36085 + }, + { + "epoch": 98.32697547683924, + "grad_norm": 2.714715003967285, + "learning_rate": 1.4676572146511414e-08, + "loss": 0.1108, + "step": 36086 + }, + { + "epoch": 98.32970027247957, + "grad_norm": 2.4655139446258545, + "learning_rate": 1.46288163026731e-08, + "loss": 0.0625, + "step": 36087 + }, + { + "epoch": 98.33242506811989, + "grad_norm": 5.965032577514648, + "learning_rate": 1.458113822458529e-08, + "loss": 0.0718, + "step": 36088 + }, + { + "epoch": 98.33514986376022, + "grad_norm": 1.9181727170944214, + "learning_rate": 1.453353791261658e-08, + "loss": 0.0481, + "step": 36089 + }, + { + "epoch": 98.33787465940054, + "grad_norm": 2.015746593475342, + "learning_rate": 1.4486015367140005e-08, + "loss": 0.093, + "step": 36090 + }, + { + "epoch": 98.34059945504087, + "grad_norm": 2.7315802574157715, + "learning_rate": 1.443857058852527e-08, + "loss": 0.0274, + "step": 36091 + }, + { + "epoch": 98.34332425068119, + "grad_norm": 2.158799171447754, + "learning_rate": 1.4391203577140966e-08, + "loss": 0.0705, + "step": 36092 + }, + { + "epoch": 98.34604904632153, + "grad_norm": 3.0152547359466553, + "learning_rate": 1.4343914333356801e-08, + "loss": 0.1108, + "step": 36093 + }, + { + "epoch": 98.34877384196186, + "grad_norm": 2.108616352081299, + "learning_rate": 1.4296702857541367e-08, + "loss": 0.0309, + "step": 36094 + }, + { + "epoch": 98.35149863760218, + "grad_norm": 2.5189340114593506, + "learning_rate": 1.4249569150061037e-08, + "loss": 0.0299, + "step": 36095 + }, + { + "epoch": 98.35422343324251, + "grad_norm": 2.253386974334717, + "learning_rate": 1.4202513211284408e-08, + "loss": 0.1952, + "step": 36096 + }, + { + "epoch": 98.35694822888283, + "grad_norm": 1.5023448467254639, + "learning_rate": 1.415553504157674e-08, + "loss": 0.0541, + "step": 36097 + }, + { + "epoch": 98.35967302452316, + "grad_norm": 1.9690170288085938, + "learning_rate": 1.4108634641304409e-08, + "loss": 0.0254, + "step": 36098 + }, + { + "epoch": 98.3623978201635, + "grad_norm": 2.67514967918396, + "learning_rate": 1.4061812010832676e-08, + "loss": 0.0541, + "step": 36099 + }, + { + "epoch": 98.36512261580381, + "grad_norm": 2.0228111743927, + "learning_rate": 1.4015067150525696e-08, + "loss": 0.0244, + "step": 36100 + }, + { + "epoch": 98.36784741144415, + "grad_norm": 3.1129562854766846, + "learning_rate": 1.3968400060748733e-08, + "loss": 0.0341, + "step": 36101 + }, + { + "epoch": 98.37057220708446, + "grad_norm": 2.7543745040893555, + "learning_rate": 1.3921810741864828e-08, + "loss": 0.0343, + "step": 36102 + }, + { + "epoch": 98.3732970027248, + "grad_norm": 4.894028186798096, + "learning_rate": 1.3875299194235914e-08, + "loss": 0.0757, + "step": 36103 + }, + { + "epoch": 98.37602179836512, + "grad_norm": 2.0562045574188232, + "learning_rate": 1.3828865418223925e-08, + "loss": 0.0341, + "step": 36104 + }, + { + "epoch": 98.37874659400545, + "grad_norm": 5.251753330230713, + "learning_rate": 1.3782509414191902e-08, + "loss": 0.0528, + "step": 36105 + }, + { + "epoch": 98.38147138964578, + "grad_norm": 4.380325794219971, + "learning_rate": 1.373623118250067e-08, + "loss": 0.0289, + "step": 36106 + }, + { + "epoch": 98.3841961852861, + "grad_norm": 3.9425055980682373, + "learning_rate": 1.3690030723509939e-08, + "loss": 0.075, + "step": 36107 + }, + { + "epoch": 98.38692098092643, + "grad_norm": 3.0681300163269043, + "learning_rate": 1.3643908037580533e-08, + "loss": 0.184, + "step": 36108 + }, + { + "epoch": 98.38964577656675, + "grad_norm": 2.5093634128570557, + "learning_rate": 1.3597863125069943e-08, + "loss": 0.0444, + "step": 36109 + }, + { + "epoch": 98.39237057220708, + "grad_norm": 2.9992306232452393, + "learning_rate": 1.3551895986338993e-08, + "loss": 0.1239, + "step": 36110 + }, + { + "epoch": 98.39509536784742, + "grad_norm": 2.3570594787597656, + "learning_rate": 1.3506006621742951e-08, + "loss": 0.0403, + "step": 36111 + }, + { + "epoch": 98.39782016348774, + "grad_norm": 2.0751588344573975, + "learning_rate": 1.3460195031641532e-08, + "loss": 0.1548, + "step": 36112 + }, + { + "epoch": 98.40054495912807, + "grad_norm": 3.247391939163208, + "learning_rate": 1.3414461216391117e-08, + "loss": 0.0984, + "step": 36113 + }, + { + "epoch": 98.40326975476839, + "grad_norm": 1.9408838748931885, + "learning_rate": 1.3368805176346977e-08, + "loss": 0.0262, + "step": 36114 + }, + { + "epoch": 98.40599455040872, + "grad_norm": 3.2725577354431152, + "learning_rate": 1.3323226911864385e-08, + "loss": 0.123, + "step": 36115 + }, + { + "epoch": 98.40871934604904, + "grad_norm": 2.6939446926116943, + "learning_rate": 1.327772642330083e-08, + "loss": 0.0371, + "step": 36116 + }, + { + "epoch": 98.41144414168937, + "grad_norm": 2.5777392387390137, + "learning_rate": 1.3232303711007143e-08, + "loss": 0.0715, + "step": 36117 + }, + { + "epoch": 98.4141689373297, + "grad_norm": 2.5360629558563232, + "learning_rate": 1.3186958775339709e-08, + "loss": 0.0458, + "step": 36118 + }, + { + "epoch": 98.41689373297002, + "grad_norm": 2.9892444610595703, + "learning_rate": 1.3141691616651575e-08, + "loss": 0.1276, + "step": 36119 + }, + { + "epoch": 98.41961852861036, + "grad_norm": 3.8520965576171875, + "learning_rate": 1.3096502235293573e-08, + "loss": 0.1467, + "step": 36120 + }, + { + "epoch": 98.42234332425068, + "grad_norm": 1.4537595510482788, + "learning_rate": 1.3051390631618755e-08, + "loss": 0.0925, + "step": 36121 + }, + { + "epoch": 98.42506811989101, + "grad_norm": 3.732198715209961, + "learning_rate": 1.3006356805977949e-08, + "loss": 0.1491, + "step": 36122 + }, + { + "epoch": 98.42779291553134, + "grad_norm": 2.4978554248809814, + "learning_rate": 1.2961400758721987e-08, + "loss": 0.0511, + "step": 36123 + }, + { + "epoch": 98.43051771117166, + "grad_norm": 4.112996578216553, + "learning_rate": 1.2916522490201699e-08, + "loss": 0.0407, + "step": 36124 + }, + { + "epoch": 98.433242506812, + "grad_norm": 1.5079231262207031, + "learning_rate": 1.2871722000766806e-08, + "loss": 0.0155, + "step": 36125 + }, + { + "epoch": 98.43596730245231, + "grad_norm": 2.5488126277923584, + "learning_rate": 1.2826999290764807e-08, + "loss": 0.0576, + "step": 36126 + }, + { + "epoch": 98.43869209809264, + "grad_norm": 3.4591064453125, + "learning_rate": 1.2782354360544314e-08, + "loss": 0.0393, + "step": 36127 + }, + { + "epoch": 98.44141689373296, + "grad_norm": 2.671058416366577, + "learning_rate": 1.2737787210453933e-08, + "loss": 0.0665, + "step": 36128 + }, + { + "epoch": 98.4441416893733, + "grad_norm": 3.291278123855591, + "learning_rate": 1.2693297840840058e-08, + "loss": 0.0498, + "step": 36129 + }, + { + "epoch": 98.44686648501363, + "grad_norm": 3.0969431400299072, + "learning_rate": 1.2648886252050186e-08, + "loss": 0.068, + "step": 36130 + }, + { + "epoch": 98.44959128065395, + "grad_norm": 2.8539137840270996, + "learning_rate": 1.2604552444428487e-08, + "loss": 0.0499, + "step": 36131 + }, + { + "epoch": 98.45231607629428, + "grad_norm": 2.5560038089752197, + "learning_rate": 1.2560296418320239e-08, + "loss": 0.0398, + "step": 36132 + }, + { + "epoch": 98.4550408719346, + "grad_norm": 2.3815579414367676, + "learning_rate": 1.2516118174071834e-08, + "loss": 0.026, + "step": 36133 + }, + { + "epoch": 98.45776566757493, + "grad_norm": 1.9051722288131714, + "learning_rate": 1.2472017712027439e-08, + "loss": 0.0295, + "step": 36134 + }, + { + "epoch": 98.46049046321527, + "grad_norm": 2.047534704208374, + "learning_rate": 1.2427995032527895e-08, + "loss": 0.0307, + "step": 36135 + }, + { + "epoch": 98.46321525885558, + "grad_norm": 1.9832487106323242, + "learning_rate": 1.238405013591848e-08, + "loss": 0.056, + "step": 36136 + }, + { + "epoch": 98.46594005449592, + "grad_norm": 2.251464605331421, + "learning_rate": 1.2340183022541142e-08, + "loss": 0.0343, + "step": 36137 + }, + { + "epoch": 98.46866485013624, + "grad_norm": 1.642418622970581, + "learning_rate": 1.2296393692735608e-08, + "loss": 0.0187, + "step": 36138 + }, + { + "epoch": 98.47138964577657, + "grad_norm": 2.1609480381011963, + "learning_rate": 1.225268214684494e-08, + "loss": 0.0845, + "step": 36139 + }, + { + "epoch": 98.47411444141689, + "grad_norm": 2.5468668937683105, + "learning_rate": 1.2209048385209977e-08, + "loss": 0.1115, + "step": 36140 + }, + { + "epoch": 98.47683923705722, + "grad_norm": 3.6908071041107178, + "learning_rate": 1.2165492408168223e-08, + "loss": 0.046, + "step": 36141 + }, + { + "epoch": 98.47956403269755, + "grad_norm": 3.202972173690796, + "learning_rate": 1.2122014216060518e-08, + "loss": 0.1119, + "step": 36142 + }, + { + "epoch": 98.48228882833787, + "grad_norm": 3.602304458618164, + "learning_rate": 1.2078613809225482e-08, + "loss": 0.0756, + "step": 36143 + }, + { + "epoch": 98.4850136239782, + "grad_norm": 3.881646156311035, + "learning_rate": 1.2035291187999509e-08, + "loss": 0.0448, + "step": 36144 + }, + { + "epoch": 98.48773841961852, + "grad_norm": 1.424583911895752, + "learning_rate": 1.199204635272233e-08, + "loss": 0.013, + "step": 36145 + }, + { + "epoch": 98.49046321525886, + "grad_norm": 1.6723031997680664, + "learning_rate": 1.1948879303729233e-08, + "loss": 0.0118, + "step": 36146 + }, + { + "epoch": 98.49318801089919, + "grad_norm": 3.3834898471832275, + "learning_rate": 1.1905790041357724e-08, + "loss": 0.028, + "step": 36147 + }, + { + "epoch": 98.49591280653951, + "grad_norm": 1.136795997619629, + "learning_rate": 1.1862778565940869e-08, + "loss": 0.0156, + "step": 36148 + }, + { + "epoch": 98.49863760217984, + "grad_norm": 2.5485243797302246, + "learning_rate": 1.1819844877816178e-08, + "loss": 0.0458, + "step": 36149 + }, + { + "epoch": 98.50136239782016, + "grad_norm": 2.5030970573425293, + "learning_rate": 1.1776988977316717e-08, + "loss": 0.061, + "step": 36150 + }, + { + "epoch": 98.50408719346049, + "grad_norm": 4.324421405792236, + "learning_rate": 1.1734210864777773e-08, + "loss": 0.1569, + "step": 36151 + }, + { + "epoch": 98.50681198910081, + "grad_norm": 2.1284096240997314, + "learning_rate": 1.1691510540530193e-08, + "loss": 0.0599, + "step": 36152 + }, + { + "epoch": 98.50953678474114, + "grad_norm": 1.4949356317520142, + "learning_rate": 1.1648888004907043e-08, + "loss": 0.0183, + "step": 36153 + }, + { + "epoch": 98.51226158038148, + "grad_norm": 2.3864893913269043, + "learning_rate": 1.1606343258242503e-08, + "loss": 0.1269, + "step": 36154 + }, + { + "epoch": 98.5149863760218, + "grad_norm": 1.6330173015594482, + "learning_rate": 1.1563876300865195e-08, + "loss": 0.0367, + "step": 36155 + }, + { + "epoch": 98.51771117166213, + "grad_norm": 3.575246810913086, + "learning_rate": 1.152148713310708e-08, + "loss": 0.0872, + "step": 36156 + }, + { + "epoch": 98.52043596730245, + "grad_norm": 2.4141902923583984, + "learning_rate": 1.1479175755297889e-08, + "loss": 0.0862, + "step": 36157 + }, + { + "epoch": 98.52316076294278, + "grad_norm": 1.7315680980682373, + "learning_rate": 1.1436942167768472e-08, + "loss": 0.0661, + "step": 36158 + }, + { + "epoch": 98.52588555858311, + "grad_norm": 2.7438507080078125, + "learning_rate": 1.1394786370845234e-08, + "loss": 0.1063, + "step": 36159 + }, + { + "epoch": 98.52861035422343, + "grad_norm": 2.2468864917755127, + "learning_rate": 1.1352708364859022e-08, + "loss": 0.0189, + "step": 36160 + }, + { + "epoch": 98.53133514986376, + "grad_norm": 2.3657684326171875, + "learning_rate": 1.131070815013624e-08, + "loss": 0.0293, + "step": 36161 + }, + { + "epoch": 98.53405994550408, + "grad_norm": 3.182272434234619, + "learning_rate": 1.1268785727004406e-08, + "loss": 0.1786, + "step": 36162 + }, + { + "epoch": 98.53678474114442, + "grad_norm": 3.479954242706299, + "learning_rate": 1.1226941095788813e-08, + "loss": 0.051, + "step": 36163 + }, + { + "epoch": 98.53950953678473, + "grad_norm": 2.0503923892974854, + "learning_rate": 1.1185174256816978e-08, + "loss": 0.0247, + "step": 36164 + }, + { + "epoch": 98.54223433242507, + "grad_norm": 2.055842399597168, + "learning_rate": 1.1143485210413086e-08, + "loss": 0.0238, + "step": 36165 + }, + { + "epoch": 98.5449591280654, + "grad_norm": 3.5154647827148438, + "learning_rate": 1.1101873956902431e-08, + "loss": 0.0838, + "step": 36166 + }, + { + "epoch": 98.54768392370572, + "grad_norm": 9.433673858642578, + "learning_rate": 1.10603404966092e-08, + "loss": 0.0289, + "step": 36167 + }, + { + "epoch": 98.55040871934605, + "grad_norm": 4.547787189483643, + "learning_rate": 1.101888482985647e-08, + "loss": 0.0366, + "step": 36168 + }, + { + "epoch": 98.55313351498637, + "grad_norm": 2.169792652130127, + "learning_rate": 1.0977506956967309e-08, + "loss": 0.0235, + "step": 36169 + }, + { + "epoch": 98.5558583106267, + "grad_norm": 5.074012756347656, + "learning_rate": 1.093620687826369e-08, + "loss": 0.0531, + "step": 36170 + }, + { + "epoch": 98.55858310626704, + "grad_norm": 2.4713664054870605, + "learning_rate": 1.0894984594067571e-08, + "loss": 0.0533, + "step": 36171 + }, + { + "epoch": 98.56130790190736, + "grad_norm": 1.9822112321853638, + "learning_rate": 1.0853840104698698e-08, + "loss": 0.0322, + "step": 36172 + }, + { + "epoch": 98.56403269754769, + "grad_norm": 4.8559136390686035, + "learning_rate": 1.0812773410480148e-08, + "loss": 0.0784, + "step": 36173 + }, + { + "epoch": 98.566757493188, + "grad_norm": 3.35929012298584, + "learning_rate": 1.0771784511729444e-08, + "loss": 0.11, + "step": 36174 + }, + { + "epoch": 98.56948228882834, + "grad_norm": 1.8584080934524536, + "learning_rate": 1.0730873408766329e-08, + "loss": 0.0279, + "step": 36175 + }, + { + "epoch": 98.57220708446866, + "grad_norm": 3.7485361099243164, + "learning_rate": 1.0690040101910549e-08, + "loss": 0.0979, + "step": 36176 + }, + { + "epoch": 98.57493188010899, + "grad_norm": 2.447479248046875, + "learning_rate": 1.0649284591478514e-08, + "loss": 0.0633, + "step": 36177 + }, + { + "epoch": 98.57765667574932, + "grad_norm": 1.4438681602478027, + "learning_rate": 1.0608606877788863e-08, + "loss": 0.0764, + "step": 36178 + }, + { + "epoch": 98.58038147138964, + "grad_norm": 3.983067274093628, + "learning_rate": 1.0568006961156895e-08, + "loss": 0.0306, + "step": 36179 + }, + { + "epoch": 98.58310626702998, + "grad_norm": 1.738135576248169, + "learning_rate": 1.0527484841900137e-08, + "loss": 0.0292, + "step": 36180 + }, + { + "epoch": 98.5858310626703, + "grad_norm": 2.455057382583618, + "learning_rate": 1.0487040520335e-08, + "loss": 0.0323, + "step": 36181 + }, + { + "epoch": 98.58855585831063, + "grad_norm": 1.8972069025039673, + "learning_rate": 1.044667399677457e-08, + "loss": 0.0241, + "step": 36182 + }, + { + "epoch": 98.59128065395096, + "grad_norm": 2.701190710067749, + "learning_rate": 1.0406385271533037e-08, + "loss": 0.0959, + "step": 36183 + }, + { + "epoch": 98.59400544959128, + "grad_norm": 3.047895908355713, + "learning_rate": 1.0366174344925705e-08, + "loss": 0.0672, + "step": 36184 + }, + { + "epoch": 98.59673024523161, + "grad_norm": 2.033413887023926, + "learning_rate": 1.0326041217265659e-08, + "loss": 0.1726, + "step": 36185 + }, + { + "epoch": 98.59945504087193, + "grad_norm": 2.644911527633667, + "learning_rate": 1.0285985888863759e-08, + "loss": 0.0378, + "step": 36186 + }, + { + "epoch": 98.60217983651226, + "grad_norm": 2.7324492931365967, + "learning_rate": 1.0246008360034199e-08, + "loss": 0.0484, + "step": 36187 + }, + { + "epoch": 98.60490463215258, + "grad_norm": 2.0621514320373535, + "learning_rate": 1.020610863108673e-08, + "loss": 0.0755, + "step": 36188 + }, + { + "epoch": 98.60762942779292, + "grad_norm": 2.5982513427734375, + "learning_rate": 1.0166286702332218e-08, + "loss": 0.0341, + "step": 36189 + }, + { + "epoch": 98.61035422343325, + "grad_norm": 2.2652432918548584, + "learning_rate": 1.0126542574081521e-08, + "loss": 0.0354, + "step": 36190 + }, + { + "epoch": 98.61307901907357, + "grad_norm": 2.6030406951904297, + "learning_rate": 1.0086876246644395e-08, + "loss": 0.0826, + "step": 36191 + }, + { + "epoch": 98.6158038147139, + "grad_norm": 2.524291515350342, + "learning_rate": 1.0047287720328369e-08, + "loss": 0.0447, + "step": 36192 + }, + { + "epoch": 98.61852861035422, + "grad_norm": 1.7350260019302368, + "learning_rate": 1.0007776995442087e-08, + "loss": 0.0363, + "step": 36193 + }, + { + "epoch": 98.62125340599455, + "grad_norm": 2.4189505577087402, + "learning_rate": 9.96834407229419e-09, + "loss": 0.0332, + "step": 36194 + }, + { + "epoch": 98.62397820163488, + "grad_norm": 2.639000415802002, + "learning_rate": 9.928988951192209e-09, + "loss": 0.0343, + "step": 36195 + }, + { + "epoch": 98.6267029972752, + "grad_norm": 2.462409019470215, + "learning_rate": 9.889711632440346e-09, + "loss": 0.0336, + "step": 36196 + }, + { + "epoch": 98.62942779291554, + "grad_norm": 2.373863458633423, + "learning_rate": 9.850512116347245e-09, + "loss": 0.1455, + "step": 36197 + }, + { + "epoch": 98.63215258855585, + "grad_norm": 2.109741449356079, + "learning_rate": 9.811390403215992e-09, + "loss": 0.0429, + "step": 36198 + }, + { + "epoch": 98.63487738419619, + "grad_norm": 2.0638701915740967, + "learning_rate": 9.772346493351902e-09, + "loss": 0.0302, + "step": 36199 + }, + { + "epoch": 98.6376021798365, + "grad_norm": 3.05644154548645, + "learning_rate": 9.733380387059177e-09, + "loss": 0.2133, + "step": 36200 + }, + { + "epoch": 98.64032697547684, + "grad_norm": 3.4912054538726807, + "learning_rate": 9.694492084642016e-09, + "loss": 0.0805, + "step": 36201 + }, + { + "epoch": 98.64305177111717, + "grad_norm": 2.714277744293213, + "learning_rate": 9.6556815864024e-09, + "loss": 0.0427, + "step": 36202 + }, + { + "epoch": 98.64577656675749, + "grad_norm": 2.102691411972046, + "learning_rate": 9.616948892642307e-09, + "loss": 0.1589, + "step": 36203 + }, + { + "epoch": 98.64850136239782, + "grad_norm": 2.0056819915771484, + "learning_rate": 9.578294003664835e-09, + "loss": 0.0388, + "step": 36204 + }, + { + "epoch": 98.65122615803814, + "grad_norm": 3.3613219261169434, + "learning_rate": 9.539716919768626e-09, + "loss": 0.1596, + "step": 36205 + }, + { + "epoch": 98.65395095367847, + "grad_norm": 3.162074089050293, + "learning_rate": 9.501217641256776e-09, + "loss": 0.0988, + "step": 36206 + }, + { + "epoch": 98.65667574931881, + "grad_norm": 3.202958822250366, + "learning_rate": 9.462796168427935e-09, + "loss": 0.0974, + "step": 36207 + }, + { + "epoch": 98.65940054495913, + "grad_norm": 1.555505633354187, + "learning_rate": 9.42445250158075e-09, + "loss": 0.02, + "step": 36208 + }, + { + "epoch": 98.66212534059946, + "grad_norm": 5.151355266571045, + "learning_rate": 9.386186641013872e-09, + "loss": 0.0285, + "step": 36209 + }, + { + "epoch": 98.66485013623978, + "grad_norm": 2.0583536624908447, + "learning_rate": 9.347998587027063e-09, + "loss": 0.024, + "step": 36210 + }, + { + "epoch": 98.66757493188011, + "grad_norm": 2.2810378074645996, + "learning_rate": 9.30988833991564e-09, + "loss": 0.0576, + "step": 36211 + }, + { + "epoch": 98.67029972752043, + "grad_norm": 2.646106004714966, + "learning_rate": 9.271855899977144e-09, + "loss": 0.0264, + "step": 36212 + }, + { + "epoch": 98.67302452316076, + "grad_norm": 2.243086338043213, + "learning_rate": 9.233901267509115e-09, + "loss": 0.0927, + "step": 36213 + }, + { + "epoch": 98.6757493188011, + "grad_norm": 1.8522670269012451, + "learning_rate": 9.196024442804652e-09, + "loss": 0.0445, + "step": 36214 + }, + { + "epoch": 98.67847411444141, + "grad_norm": 2.2108867168426514, + "learning_rate": 9.158225426160183e-09, + "loss": 0.0687, + "step": 36215 + }, + { + "epoch": 98.68119891008175, + "grad_norm": 2.378458261489868, + "learning_rate": 9.120504217871029e-09, + "loss": 0.1945, + "step": 36216 + }, + { + "epoch": 98.68392370572207, + "grad_norm": 2.6821839809417725, + "learning_rate": 9.082860818228068e-09, + "loss": 0.1039, + "step": 36217 + }, + { + "epoch": 98.6866485013624, + "grad_norm": 2.8306756019592285, + "learning_rate": 9.045295227527728e-09, + "loss": 0.0531, + "step": 36218 + }, + { + "epoch": 98.68937329700273, + "grad_norm": 2.138756036758423, + "learning_rate": 9.007807446059779e-09, + "loss": 0.1238, + "step": 36219 + }, + { + "epoch": 98.69209809264305, + "grad_norm": 2.8362069129943848, + "learning_rate": 8.970397474118431e-09, + "loss": 0.0756, + "step": 36220 + }, + { + "epoch": 98.69482288828338, + "grad_norm": 1.5811744928359985, + "learning_rate": 8.93306531199345e-09, + "loss": 0.0255, + "step": 36221 + }, + { + "epoch": 98.6975476839237, + "grad_norm": 2.259927988052368, + "learning_rate": 8.895810959976825e-09, + "loss": 0.0324, + "step": 36222 + }, + { + "epoch": 98.70027247956403, + "grad_norm": 2.612879991531372, + "learning_rate": 8.858634418358325e-09, + "loss": 0.0418, + "step": 36223 + }, + { + "epoch": 98.70299727520435, + "grad_norm": 2.5344955921173096, + "learning_rate": 8.821535687426609e-09, + "loss": 0.029, + "step": 36224 + }, + { + "epoch": 98.70572207084469, + "grad_norm": 13.622929573059082, + "learning_rate": 8.784514767470331e-09, + "loss": 0.0871, + "step": 36225 + }, + { + "epoch": 98.70844686648502, + "grad_norm": 1.8633819818496704, + "learning_rate": 8.747571658780373e-09, + "loss": 0.0222, + "step": 36226 + }, + { + "epoch": 98.71117166212534, + "grad_norm": 2.615386486053467, + "learning_rate": 8.710706361642063e-09, + "loss": 0.0578, + "step": 36227 + }, + { + "epoch": 98.71389645776567, + "grad_norm": 2.52996563911438, + "learning_rate": 8.673918876342947e-09, + "loss": 0.0966, + "step": 36228 + }, + { + "epoch": 98.71662125340599, + "grad_norm": 1.7542939186096191, + "learning_rate": 8.63720920316946e-09, + "loss": 0.0367, + "step": 36229 + }, + { + "epoch": 98.71934604904632, + "grad_norm": 2.614475727081299, + "learning_rate": 8.600577342408046e-09, + "loss": 0.0735, + "step": 36230 + }, + { + "epoch": 98.72207084468666, + "grad_norm": 4.2264814376831055, + "learning_rate": 8.564023294344026e-09, + "loss": 0.0692, + "step": 36231 + }, + { + "epoch": 98.72479564032697, + "grad_norm": 1.6859139204025269, + "learning_rate": 8.527547059262731e-09, + "loss": 0.1277, + "step": 36232 + }, + { + "epoch": 98.7275204359673, + "grad_norm": 2.428453207015991, + "learning_rate": 8.491148637446156e-09, + "loss": 0.0275, + "step": 36233 + }, + { + "epoch": 98.73024523160763, + "grad_norm": 4.541210651397705, + "learning_rate": 8.454828029178518e-09, + "loss": 0.0867, + "step": 36234 + }, + { + "epoch": 98.73297002724796, + "grad_norm": 2.7328550815582275, + "learning_rate": 8.418585234744037e-09, + "loss": 0.1257, + "step": 36235 + }, + { + "epoch": 98.73569482288828, + "grad_norm": 1.9844528436660767, + "learning_rate": 8.382420254424706e-09, + "loss": 0.0273, + "step": 36236 + }, + { + "epoch": 98.73841961852861, + "grad_norm": 2.834373950958252, + "learning_rate": 8.346333088500303e-09, + "loss": 0.0505, + "step": 36237 + }, + { + "epoch": 98.74114441416894, + "grad_norm": 2.5058889389038086, + "learning_rate": 8.310323737252824e-09, + "loss": 0.0267, + "step": 36238 + }, + { + "epoch": 98.74386920980926, + "grad_norm": 2.4641990661621094, + "learning_rate": 8.274392200964265e-09, + "loss": 0.0387, + "step": 36239 + }, + { + "epoch": 98.7465940054496, + "grad_norm": 4.683347702026367, + "learning_rate": 8.238538479912184e-09, + "loss": 0.1611, + "step": 36240 + }, + { + "epoch": 98.74931880108991, + "grad_norm": 2.662602186203003, + "learning_rate": 8.202762574376355e-09, + "loss": 0.0271, + "step": 36241 + }, + { + "epoch": 98.75204359673025, + "grad_norm": 2.5227410793304443, + "learning_rate": 8.167064484636555e-09, + "loss": 0.069, + "step": 36242 + }, + { + "epoch": 98.75476839237058, + "grad_norm": 3.3482046127319336, + "learning_rate": 8.13144421097034e-09, + "loss": 0.0352, + "step": 36243 + }, + { + "epoch": 98.7574931880109, + "grad_norm": 2.558753728866577, + "learning_rate": 8.095901753654156e-09, + "loss": 0.0271, + "step": 36244 + }, + { + "epoch": 98.76021798365123, + "grad_norm": 2.3655343055725098, + "learning_rate": 8.060437112965558e-09, + "loss": 0.0602, + "step": 36245 + }, + { + "epoch": 98.76294277929155, + "grad_norm": 2.8100643157958984, + "learning_rate": 8.02505028918099e-09, + "loss": 0.0667, + "step": 36246 + }, + { + "epoch": 98.76566757493188, + "grad_norm": 1.8988646268844604, + "learning_rate": 7.989741282575792e-09, + "loss": 0.077, + "step": 36247 + }, + { + "epoch": 98.7683923705722, + "grad_norm": 2.5409767627716064, + "learning_rate": 7.954510093425294e-09, + "loss": 0.095, + "step": 36248 + }, + { + "epoch": 98.77111716621253, + "grad_norm": 2.4074063301086426, + "learning_rate": 7.919356722002613e-09, + "loss": 0.0317, + "step": 36249 + }, + { + "epoch": 98.77384196185287, + "grad_norm": 1.1986193656921387, + "learning_rate": 7.884281168583086e-09, + "loss": 0.0141, + "step": 36250 + }, + { + "epoch": 98.77656675749319, + "grad_norm": 5.700056552886963, + "learning_rate": 7.849283433438714e-09, + "loss": 0.0583, + "step": 36251 + }, + { + "epoch": 98.77929155313352, + "grad_norm": 3.0358242988586426, + "learning_rate": 7.814363516842616e-09, + "loss": 0.0546, + "step": 36252 + }, + { + "epoch": 98.78201634877384, + "grad_norm": 1.692973256111145, + "learning_rate": 7.779521419066793e-09, + "loss": 0.0178, + "step": 36253 + }, + { + "epoch": 98.78474114441417, + "grad_norm": 4.116315841674805, + "learning_rate": 7.744757140382141e-09, + "loss": 0.0465, + "step": 36254 + }, + { + "epoch": 98.7874659400545, + "grad_norm": 1.8948396444320679, + "learning_rate": 7.710070681060666e-09, + "loss": 0.0192, + "step": 36255 + }, + { + "epoch": 98.79019073569482, + "grad_norm": 1.9507626295089722, + "learning_rate": 7.67546204137104e-09, + "loss": 0.0448, + "step": 36256 + }, + { + "epoch": 98.79291553133515, + "grad_norm": 3.586582660675049, + "learning_rate": 7.640931221583048e-09, + "loss": 0.0426, + "step": 36257 + }, + { + "epoch": 98.79564032697547, + "grad_norm": 3.2128372192382812, + "learning_rate": 7.606478221965363e-09, + "loss": 0.0405, + "step": 36258 + }, + { + "epoch": 98.7983651226158, + "grad_norm": 2.8067307472229004, + "learning_rate": 7.572103042787771e-09, + "loss": 0.0772, + "step": 36259 + }, + { + "epoch": 98.80108991825612, + "grad_norm": 2.903602361679077, + "learning_rate": 7.537805684316724e-09, + "loss": 0.0514, + "step": 36260 + }, + { + "epoch": 98.80381471389646, + "grad_norm": 2.3150784969329834, + "learning_rate": 7.503586146819785e-09, + "loss": 0.0279, + "step": 36261 + }, + { + "epoch": 98.80653950953679, + "grad_norm": 2.790849208831787, + "learning_rate": 7.4694444305623e-09, + "loss": 0.0524, + "step": 36262 + }, + { + "epoch": 98.80926430517711, + "grad_norm": 2.5214614868164062, + "learning_rate": 7.4353805358129416e-09, + "loss": 0.1017, + "step": 36263 + }, + { + "epoch": 98.81198910081744, + "grad_norm": 2.7264602184295654, + "learning_rate": 7.401394462833722e-09, + "loss": 0.0297, + "step": 36264 + }, + { + "epoch": 98.81471389645776, + "grad_norm": 2.5907976627349854, + "learning_rate": 7.3674862118922055e-09, + "loss": 0.0599, + "step": 36265 + }, + { + "epoch": 98.8174386920981, + "grad_norm": 3.868417263031006, + "learning_rate": 7.333655783249294e-09, + "loss": 0.0575, + "step": 36266 + }, + { + "epoch": 98.82016348773843, + "grad_norm": 2.3906784057617188, + "learning_rate": 7.299903177171441e-09, + "loss": 0.082, + "step": 36267 + }, + { + "epoch": 98.82288828337875, + "grad_norm": 7.075655460357666, + "learning_rate": 7.2662283939206604e-09, + "loss": 0.025, + "step": 36268 + }, + { + "epoch": 98.82561307901908, + "grad_norm": 3.075913906097412, + "learning_rate": 7.232631433757853e-09, + "loss": 0.0504, + "step": 36269 + }, + { + "epoch": 98.8283378746594, + "grad_norm": 2.7215065956115723, + "learning_rate": 7.1991122969461425e-09, + "loss": 0.0616, + "step": 36270 + }, + { + "epoch": 98.83106267029973, + "grad_norm": 2.9382898807525635, + "learning_rate": 7.165670983746431e-09, + "loss": 0.053, + "step": 36271 + }, + { + "epoch": 98.83378746594005, + "grad_norm": 3.1600341796875, + "learning_rate": 7.132307494418511e-09, + "loss": 0.0317, + "step": 36272 + }, + { + "epoch": 98.83651226158038, + "grad_norm": 2.2423198223114014, + "learning_rate": 7.099021829223285e-09, + "loss": 0.0593, + "step": 36273 + }, + { + "epoch": 98.83923705722071, + "grad_norm": 2.4246907234191895, + "learning_rate": 7.065813988418324e-09, + "loss": 0.0484, + "step": 36274 + }, + { + "epoch": 98.84196185286103, + "grad_norm": 2.9497811794281006, + "learning_rate": 7.032683972263421e-09, + "loss": 0.0344, + "step": 36275 + }, + { + "epoch": 98.84468664850137, + "grad_norm": 1.5730886459350586, + "learning_rate": 6.999631781017258e-09, + "loss": 0.0173, + "step": 36276 + }, + { + "epoch": 98.84741144414168, + "grad_norm": 2.204084634780884, + "learning_rate": 6.966657414935185e-09, + "loss": 0.0454, + "step": 36277 + }, + { + "epoch": 98.85013623978202, + "grad_norm": 2.1484272480010986, + "learning_rate": 6.933760874274775e-09, + "loss": 0.0466, + "step": 36278 + }, + { + "epoch": 98.85286103542235, + "grad_norm": 2.359956741333008, + "learning_rate": 6.9009421592936e-09, + "loss": 0.0305, + "step": 36279 + }, + { + "epoch": 98.85558583106267, + "grad_norm": 3.301863670349121, + "learning_rate": 6.8682012702459e-09, + "loss": 0.085, + "step": 36280 + }, + { + "epoch": 98.858310626703, + "grad_norm": 1.8629157543182373, + "learning_rate": 6.835538207387027e-09, + "loss": 0.0227, + "step": 36281 + }, + { + "epoch": 98.86103542234332, + "grad_norm": 1.7687841653823853, + "learning_rate": 6.802952970971222e-09, + "loss": 0.0311, + "step": 36282 + }, + { + "epoch": 98.86376021798365, + "grad_norm": 2.2203309535980225, + "learning_rate": 6.770445561252725e-09, + "loss": 0.0374, + "step": 36283 + }, + { + "epoch": 98.86648501362397, + "grad_norm": 3.330214023590088, + "learning_rate": 6.738015978484669e-09, + "loss": 0.0371, + "step": 36284 + }, + { + "epoch": 98.8692098092643, + "grad_norm": 2.2659683227539062, + "learning_rate": 6.705664222919072e-09, + "loss": 0.0565, + "step": 36285 + }, + { + "epoch": 98.87193460490464, + "grad_norm": 2.4965755939483643, + "learning_rate": 6.673390294807958e-09, + "loss": 0.0605, + "step": 36286 + }, + { + "epoch": 98.87465940054496, + "grad_norm": 2.2927823066711426, + "learning_rate": 6.641194194402234e-09, + "loss": 0.0253, + "step": 36287 + }, + { + "epoch": 98.87738419618529, + "grad_norm": 2.6198787689208984, + "learning_rate": 6.609075921953923e-09, + "loss": 0.0968, + "step": 36288 + }, + { + "epoch": 98.88010899182561, + "grad_norm": 2.3675615787506104, + "learning_rate": 6.577035477712823e-09, + "loss": 0.0383, + "step": 36289 + }, + { + "epoch": 98.88283378746594, + "grad_norm": 3.417741298675537, + "learning_rate": 6.545072861927626e-09, + "loss": 0.097, + "step": 36290 + }, + { + "epoch": 98.88555858310627, + "grad_norm": 1.915927529335022, + "learning_rate": 6.5131880748481314e-09, + "loss": 0.0749, + "step": 36291 + }, + { + "epoch": 98.88828337874659, + "grad_norm": 2.6985626220703125, + "learning_rate": 6.481381116721919e-09, + "loss": 0.0901, + "step": 36292 + }, + { + "epoch": 98.89100817438693, + "grad_norm": 3.038095235824585, + "learning_rate": 6.449651987797678e-09, + "loss": 0.0373, + "step": 36293 + }, + { + "epoch": 98.89373297002724, + "grad_norm": 2.512392520904541, + "learning_rate": 6.418000688320769e-09, + "loss": 0.0248, + "step": 36294 + }, + { + "epoch": 98.89645776566758, + "grad_norm": 1.378581166267395, + "learning_rate": 6.386427218539881e-09, + "loss": 0.0157, + "step": 36295 + }, + { + "epoch": 98.8991825613079, + "grad_norm": 1.49094557762146, + "learning_rate": 6.354931578699264e-09, + "loss": 0.0318, + "step": 36296 + }, + { + "epoch": 98.90190735694823, + "grad_norm": 2.465254545211792, + "learning_rate": 6.323513769045386e-09, + "loss": 0.0295, + "step": 36297 + }, + { + "epoch": 98.90463215258856, + "grad_norm": 2.6463098526000977, + "learning_rate": 6.292173789821387e-09, + "loss": 0.0393, + "step": 36298 + }, + { + "epoch": 98.90735694822888, + "grad_norm": 2.901310920715332, + "learning_rate": 6.260911641272626e-09, + "loss": 0.0693, + "step": 36299 + }, + { + "epoch": 98.91008174386921, + "grad_norm": 2.0929248332977295, + "learning_rate": 6.229727323643353e-09, + "loss": 0.1131, + "step": 36300 + }, + { + "epoch": 98.91280653950953, + "grad_norm": 2.5953946113586426, + "learning_rate": 6.198620837174485e-09, + "loss": 0.0463, + "step": 36301 + }, + { + "epoch": 98.91553133514986, + "grad_norm": 2.3402748107910156, + "learning_rate": 6.167592182108051e-09, + "loss": 0.0297, + "step": 36302 + }, + { + "epoch": 98.9182561307902, + "grad_norm": 2.9301769733428955, + "learning_rate": 6.1366413586883e-09, + "loss": 0.1096, + "step": 36303 + }, + { + "epoch": 98.92098092643052, + "grad_norm": 3.1592493057250977, + "learning_rate": 6.10576836715393e-09, + "loss": 0.0623, + "step": 36304 + }, + { + "epoch": 98.92370572207085, + "grad_norm": 2.4974987506866455, + "learning_rate": 6.07497320774697e-09, + "loss": 0.0535, + "step": 36305 + }, + { + "epoch": 98.92643051771117, + "grad_norm": 1.8690325021743774, + "learning_rate": 6.044255880705008e-09, + "loss": 0.1418, + "step": 36306 + }, + { + "epoch": 98.9291553133515, + "grad_norm": 2.1339619159698486, + "learning_rate": 6.013616386270071e-09, + "loss": 0.018, + "step": 36307 + }, + { + "epoch": 98.93188010899182, + "grad_norm": 1.7211685180664062, + "learning_rate": 5.983054724679749e-09, + "loss": 0.0186, + "step": 36308 + }, + { + "epoch": 98.93460490463215, + "grad_norm": 2.7866098880767822, + "learning_rate": 5.952570896170518e-09, + "loss": 0.0359, + "step": 36309 + }, + { + "epoch": 98.93732970027249, + "grad_norm": 3.0363857746124268, + "learning_rate": 5.9221649009810756e-09, + "loss": 0.0381, + "step": 36310 + }, + { + "epoch": 98.9400544959128, + "grad_norm": 6.504725456237793, + "learning_rate": 5.891836739349011e-09, + "loss": 0.0466, + "step": 36311 + }, + { + "epoch": 98.94277929155314, + "grad_norm": 2.009805679321289, + "learning_rate": 5.86158641150969e-09, + "loss": 0.0238, + "step": 36312 + }, + { + "epoch": 98.94550408719346, + "grad_norm": 3.1905014514923096, + "learning_rate": 5.83141391769737e-09, + "loss": 0.0407, + "step": 36313 + }, + { + "epoch": 98.94822888283379, + "grad_norm": 2.685636520385742, + "learning_rate": 5.80131925814964e-09, + "loss": 0.0229, + "step": 36314 + }, + { + "epoch": 98.95095367847412, + "grad_norm": 2.8348448276519775, + "learning_rate": 5.771302433098536e-09, + "loss": 0.0467, + "step": 36315 + }, + { + "epoch": 98.95367847411444, + "grad_norm": 3.036760091781616, + "learning_rate": 5.741363442779424e-09, + "loss": 0.0544, + "step": 36316 + }, + { + "epoch": 98.95640326975477, + "grad_norm": 2.766896963119507, + "learning_rate": 5.711502287425452e-09, + "loss": 0.0347, + "step": 36317 + }, + { + "epoch": 98.95912806539509, + "grad_norm": 1.3856438398361206, + "learning_rate": 5.6817189672675464e-09, + "loss": 0.0166, + "step": 36318 + }, + { + "epoch": 98.96185286103542, + "grad_norm": 2.2274909019470215, + "learning_rate": 5.652013482539964e-09, + "loss": 0.1188, + "step": 36319 + }, + { + "epoch": 98.96457765667574, + "grad_norm": 1.9218724966049194, + "learning_rate": 5.6223858334725215e-09, + "loss": 0.0305, + "step": 36320 + }, + { + "epoch": 98.96730245231608, + "grad_norm": 2.904686689376831, + "learning_rate": 5.592836020295034e-09, + "loss": 0.0803, + "step": 36321 + }, + { + "epoch": 98.97002724795641, + "grad_norm": 1.8116261959075928, + "learning_rate": 5.563364043240649e-09, + "loss": 0.0276, + "step": 36322 + }, + { + "epoch": 98.97275204359673, + "grad_norm": 2.1489503383636475, + "learning_rate": 5.533969902535852e-09, + "loss": 0.1026, + "step": 36323 + }, + { + "epoch": 98.97547683923706, + "grad_norm": 2.3643507957458496, + "learning_rate": 5.504653598411569e-09, + "loss": 0.0418, + "step": 36324 + }, + { + "epoch": 98.97820163487738, + "grad_norm": 1.8588837385177612, + "learning_rate": 5.475415131094286e-09, + "loss": 0.0258, + "step": 36325 + }, + { + "epoch": 98.98092643051771, + "grad_norm": 3.1523587703704834, + "learning_rate": 5.446254500813819e-09, + "loss": 0.1419, + "step": 36326 + }, + { + "epoch": 98.98365122615803, + "grad_norm": 3.467860221862793, + "learning_rate": 5.417171707795544e-09, + "loss": 0.0603, + "step": 36327 + }, + { + "epoch": 98.98637602179836, + "grad_norm": 2.8103842735290527, + "learning_rate": 5.388166752267054e-09, + "loss": 0.0376, + "step": 36328 + }, + { + "epoch": 98.9891008174387, + "grad_norm": 2.1515791416168213, + "learning_rate": 5.359239634454838e-09, + "loss": 0.0339, + "step": 36329 + }, + { + "epoch": 98.99182561307902, + "grad_norm": 3.5862340927124023, + "learning_rate": 5.330390354582049e-09, + "loss": 0.1131, + "step": 36330 + }, + { + "epoch": 98.99455040871935, + "grad_norm": 4.1147685050964355, + "learning_rate": 5.301618912874062e-09, + "loss": 0.1015, + "step": 36331 + }, + { + "epoch": 98.99727520435967, + "grad_norm": 4.5505781173706055, + "learning_rate": 5.2729253095562535e-09, + "loss": 0.1679, + "step": 36332 + }, + { + "epoch": 99.0, + "grad_norm": 2.0763278007507324, + "learning_rate": 5.2443095448506674e-09, + "loss": 0.039, + "step": 36333 + }, + { + "epoch": 99.00272479564033, + "grad_norm": 2.160623073577881, + "learning_rate": 5.2157716189815685e-09, + "loss": 0.0228, + "step": 36334 + }, + { + "epoch": 99.00544959128065, + "grad_norm": 2.648790121078491, + "learning_rate": 5.1873115321698916e-09, + "loss": 0.0254, + "step": 36335 + }, + { + "epoch": 99.00817438692098, + "grad_norm": 1.4263352155685425, + "learning_rate": 5.158929284637682e-09, + "loss": 0.0121, + "step": 36336 + }, + { + "epoch": 99.0108991825613, + "grad_norm": 2.350101947784424, + "learning_rate": 5.130624876605872e-09, + "loss": 0.083, + "step": 36337 + }, + { + "epoch": 99.01362397820164, + "grad_norm": 1.9578046798706055, + "learning_rate": 5.102398308295398e-09, + "loss": 0.0771, + "step": 36338 + }, + { + "epoch": 99.01634877384195, + "grad_norm": 2.8038489818573, + "learning_rate": 5.074249579924972e-09, + "loss": 0.0727, + "step": 36339 + }, + { + "epoch": 99.01907356948229, + "grad_norm": 2.09999418258667, + "learning_rate": 5.046178691715531e-09, + "loss": 0.0247, + "step": 36340 + }, + { + "epoch": 99.02179836512262, + "grad_norm": 2.1430397033691406, + "learning_rate": 5.018185643884676e-09, + "loss": 0.0304, + "step": 36341 + }, + { + "epoch": 99.02452316076294, + "grad_norm": 1.720141053199768, + "learning_rate": 4.9902704366500135e-09, + "loss": 0.0254, + "step": 36342 + }, + { + "epoch": 99.02724795640327, + "grad_norm": 1.895276665687561, + "learning_rate": 4.9624330702302544e-09, + "loss": 0.0384, + "step": 36343 + }, + { + "epoch": 99.02997275204359, + "grad_norm": 3.258413076400757, + "learning_rate": 4.9346735448407845e-09, + "loss": 0.0641, + "step": 36344 + }, + { + "epoch": 99.03269754768392, + "grad_norm": 1.620366096496582, + "learning_rate": 4.906991860698096e-09, + "loss": 0.0307, + "step": 36345 + }, + { + "epoch": 99.03542234332426, + "grad_norm": 2.048008680343628, + "learning_rate": 4.879388018018683e-09, + "loss": 0.0226, + "step": 36346 + }, + { + "epoch": 99.03814713896458, + "grad_norm": 2.050539255142212, + "learning_rate": 4.8518620170168175e-09, + "loss": 0.0248, + "step": 36347 + }, + { + "epoch": 99.04087193460491, + "grad_norm": 3.3020405769348145, + "learning_rate": 4.824413857906773e-09, + "loss": 0.1052, + "step": 36348 + }, + { + "epoch": 99.04359673024523, + "grad_norm": 3.141381025314331, + "learning_rate": 4.7970435409017136e-09, + "loss": 0.0554, + "step": 36349 + }, + { + "epoch": 99.04632152588556, + "grad_norm": 14.986294746398926, + "learning_rate": 4.769751066217021e-09, + "loss": 0.0382, + "step": 36350 + }, + { + "epoch": 99.04904632152588, + "grad_norm": 2.1716835498809814, + "learning_rate": 4.742536434062528e-09, + "loss": 0.0511, + "step": 36351 + }, + { + "epoch": 99.05177111716621, + "grad_norm": 2.3615550994873047, + "learning_rate": 4.715399644652508e-09, + "loss": 0.0452, + "step": 36352 + }, + { + "epoch": 99.05449591280654, + "grad_norm": 2.8376779556274414, + "learning_rate": 4.6883406981967915e-09, + "loss": 0.0363, + "step": 36353 + }, + { + "epoch": 99.05722070844686, + "grad_norm": 1.998656153678894, + "learning_rate": 4.661359594906323e-09, + "loss": 0.0817, + "step": 36354 + }, + { + "epoch": 99.0599455040872, + "grad_norm": 2.0303032398223877, + "learning_rate": 4.634456334992044e-09, + "loss": 0.0369, + "step": 36355 + }, + { + "epoch": 99.06267029972751, + "grad_norm": 1.6783592700958252, + "learning_rate": 4.607630918662676e-09, + "loss": 0.0582, + "step": 36356 + }, + { + "epoch": 99.06539509536785, + "grad_norm": 4.393839359283447, + "learning_rate": 4.580883346128051e-09, + "loss": 0.0314, + "step": 36357 + }, + { + "epoch": 99.06811989100818, + "grad_norm": 2.3626253604888916, + "learning_rate": 4.554213617594672e-09, + "loss": 0.0389, + "step": 36358 + }, + { + "epoch": 99.0708446866485, + "grad_norm": 3.6280767917633057, + "learning_rate": 4.527621733271259e-09, + "loss": 0.1319, + "step": 36359 + }, + { + "epoch": 99.07356948228883, + "grad_norm": 2.038217067718506, + "learning_rate": 4.5011076933665356e-09, + "loss": 0.0224, + "step": 36360 + }, + { + "epoch": 99.07629427792915, + "grad_norm": 3.5371341705322266, + "learning_rate": 4.474671498083671e-09, + "loss": 0.0534, + "step": 36361 + }, + { + "epoch": 99.07901907356948, + "grad_norm": 2.664658546447754, + "learning_rate": 4.448313147631389e-09, + "loss": 0.0848, + "step": 36362 + }, + { + "epoch": 99.0817438692098, + "grad_norm": 3.05959153175354, + "learning_rate": 4.422032642213969e-09, + "loss": 0.037, + "step": 36363 + }, + { + "epoch": 99.08446866485014, + "grad_norm": 1.676727294921875, + "learning_rate": 4.395829982035693e-09, + "loss": 0.0487, + "step": 36364 + }, + { + "epoch": 99.08719346049047, + "grad_norm": 2.3347127437591553, + "learning_rate": 4.369705167301952e-09, + "loss": 0.1061, + "step": 36365 + }, + { + "epoch": 99.08991825613079, + "grad_norm": 2.571681261062622, + "learning_rate": 4.343658198213696e-09, + "loss": 0.0478, + "step": 36366 + }, + { + "epoch": 99.09264305177112, + "grad_norm": 1.9872663021087646, + "learning_rate": 4.317689074976317e-09, + "loss": 0.0279, + "step": 36367 + }, + { + "epoch": 99.09536784741144, + "grad_norm": 4.219489574432373, + "learning_rate": 4.291797797790764e-09, + "loss": 0.0283, + "step": 36368 + }, + { + "epoch": 99.09809264305177, + "grad_norm": 3.7424395084381104, + "learning_rate": 4.2659843668591e-09, + "loss": 0.1513, + "step": 36369 + }, + { + "epoch": 99.1008174386921, + "grad_norm": 3.471322536468506, + "learning_rate": 4.240248782382272e-09, + "loss": 0.0839, + "step": 36370 + }, + { + "epoch": 99.10354223433242, + "grad_norm": 2.9463798999786377, + "learning_rate": 4.214591044560123e-09, + "loss": 0.041, + "step": 36371 + }, + { + "epoch": 99.10626702997276, + "grad_norm": 2.3431172370910645, + "learning_rate": 4.189011153593603e-09, + "loss": 0.0612, + "step": 36372 + }, + { + "epoch": 99.10899182561307, + "grad_norm": 1.8754887580871582, + "learning_rate": 4.163509109681441e-09, + "loss": 0.0209, + "step": 36373 + }, + { + "epoch": 99.11171662125341, + "grad_norm": 4.4420366287231445, + "learning_rate": 4.1380849130223666e-09, + "loss": 0.0855, + "step": 36374 + }, + { + "epoch": 99.11444141689373, + "grad_norm": 2.1189613342285156, + "learning_rate": 4.112738563814e-09, + "loss": 0.1157, + "step": 36375 + }, + { + "epoch": 99.11716621253406, + "grad_norm": 3.5993266105651855, + "learning_rate": 4.087470062252852e-09, + "loss": 0.0905, + "step": 36376 + }, + { + "epoch": 99.11989100817439, + "grad_norm": 3.2593681812286377, + "learning_rate": 4.06227940853765e-09, + "loss": 0.0729, + "step": 36377 + }, + { + "epoch": 99.12261580381471, + "grad_norm": 4.9808454513549805, + "learning_rate": 4.0371666028637954e-09, + "loss": 0.1191, + "step": 36378 + }, + { + "epoch": 99.12534059945504, + "grad_norm": 2.3980395793914795, + "learning_rate": 4.012131645426687e-09, + "loss": 0.0205, + "step": 36379 + }, + { + "epoch": 99.12806539509536, + "grad_norm": 2.978144645690918, + "learning_rate": 3.987174536421723e-09, + "loss": 0.0345, + "step": 36380 + }, + { + "epoch": 99.1307901907357, + "grad_norm": 2.6568796634674072, + "learning_rate": 3.962295276042083e-09, + "loss": 0.0539, + "step": 36381 + }, + { + "epoch": 99.13351498637603, + "grad_norm": 2.537956476211548, + "learning_rate": 3.937493864483166e-09, + "loss": 0.0359, + "step": 36382 + }, + { + "epoch": 99.13623978201635, + "grad_norm": 5.514376640319824, + "learning_rate": 3.912770301937041e-09, + "loss": 0.0443, + "step": 36383 + }, + { + "epoch": 99.13896457765668, + "grad_norm": 1.956241250038147, + "learning_rate": 3.8881245885957765e-09, + "loss": 0.0261, + "step": 36384 + }, + { + "epoch": 99.141689373297, + "grad_norm": 1.6229876279830933, + "learning_rate": 3.863556724652551e-09, + "loss": 0.0154, + "step": 36385 + }, + { + "epoch": 99.14441416893733, + "grad_norm": 2.845139741897583, + "learning_rate": 3.839066710298323e-09, + "loss": 0.0728, + "step": 36386 + }, + { + "epoch": 99.14713896457765, + "grad_norm": 3.711958646774292, + "learning_rate": 3.81465454572405e-09, + "loss": 0.0603, + "step": 36387 + }, + { + "epoch": 99.14986376021798, + "grad_norm": 3.5983099937438965, + "learning_rate": 3.790320231119582e-09, + "loss": 0.0526, + "step": 36388 + }, + { + "epoch": 99.15258855585832, + "grad_norm": 4.311792373657227, + "learning_rate": 3.766063766673656e-09, + "loss": 0.0487, + "step": 36389 + }, + { + "epoch": 99.15531335149863, + "grad_norm": 1.893627405166626, + "learning_rate": 3.7418851525772296e-09, + "loss": 0.0151, + "step": 36390 + }, + { + "epoch": 99.15803814713897, + "grad_norm": 1.9946928024291992, + "learning_rate": 3.7177843890157108e-09, + "loss": 0.0323, + "step": 36391 + }, + { + "epoch": 99.16076294277929, + "grad_norm": 3.0589988231658936, + "learning_rate": 3.6937614761789474e-09, + "loss": 0.0219, + "step": 36392 + }, + { + "epoch": 99.16348773841962, + "grad_norm": 1.6643747091293335, + "learning_rate": 3.6698164142534574e-09, + "loss": 0.0478, + "step": 36393 + }, + { + "epoch": 99.16621253405995, + "grad_norm": 2.7943308353424072, + "learning_rate": 3.645949203425758e-09, + "loss": 0.0319, + "step": 36394 + }, + { + "epoch": 99.16893732970027, + "grad_norm": 2.1140692234039307, + "learning_rate": 3.6221598438812567e-09, + "loss": 0.017, + "step": 36395 + }, + { + "epoch": 99.1716621253406, + "grad_norm": 3.405674457550049, + "learning_rate": 3.5984483358064703e-09, + "loss": 0.0269, + "step": 36396 + }, + { + "epoch": 99.17438692098092, + "grad_norm": 1.7860310077667236, + "learning_rate": 3.574814679384586e-09, + "loss": 0.0224, + "step": 36397 + }, + { + "epoch": 99.17711171662125, + "grad_norm": 3.141554832458496, + "learning_rate": 3.5512588748010114e-09, + "loss": 0.1446, + "step": 36398 + }, + { + "epoch": 99.17983651226157, + "grad_norm": 2.2735395431518555, + "learning_rate": 3.527780922237822e-09, + "loss": 0.0572, + "step": 36399 + }, + { + "epoch": 99.1825613079019, + "grad_norm": 2.2199854850769043, + "learning_rate": 3.504380821878206e-09, + "loss": 0.0327, + "step": 36400 + }, + { + "epoch": 99.18528610354224, + "grad_norm": 3.187570810317993, + "learning_rate": 3.4810585739053492e-09, + "loss": 0.0714, + "step": 36401 + }, + { + "epoch": 99.18801089918256, + "grad_norm": 2.511786460876465, + "learning_rate": 3.4578141785002182e-09, + "loss": 0.0505, + "step": 36402 + }, + { + "epoch": 99.19073569482289, + "grad_norm": 1.9665066003799438, + "learning_rate": 3.43464763584378e-09, + "loss": 0.0881, + "step": 36403 + }, + { + "epoch": 99.19346049046321, + "grad_norm": 5.338626384735107, + "learning_rate": 3.4115589461169994e-09, + "loss": 0.0701, + "step": 36404 + }, + { + "epoch": 99.19618528610354, + "grad_norm": 1.8583027124404907, + "learning_rate": 3.388548109498624e-09, + "loss": 0.0685, + "step": 36405 + }, + { + "epoch": 99.19891008174388, + "grad_norm": 2.840616464614868, + "learning_rate": 3.3656151261696192e-09, + "loss": 0.2491, + "step": 36406 + }, + { + "epoch": 99.2016348773842, + "grad_norm": 2.7709131240844727, + "learning_rate": 3.3427599963065105e-09, + "loss": 0.0333, + "step": 36407 + }, + { + "epoch": 99.20435967302453, + "grad_norm": 3.268580436706543, + "learning_rate": 3.319982720088044e-09, + "loss": 0.0473, + "step": 36408 + }, + { + "epoch": 99.20708446866485, + "grad_norm": 3.149470806121826, + "learning_rate": 3.2972832976918557e-09, + "loss": 0.0759, + "step": 36409 + }, + { + "epoch": 99.20980926430518, + "grad_norm": 2.2788093090057373, + "learning_rate": 3.274661729295581e-09, + "loss": 0.0873, + "step": 36410 + }, + { + "epoch": 99.2125340599455, + "grad_norm": 1.9153056144714355, + "learning_rate": 3.2521180150735244e-09, + "loss": 0.0249, + "step": 36411 + }, + { + "epoch": 99.21525885558583, + "grad_norm": 2.340096950531006, + "learning_rate": 3.2296521552033223e-09, + "loss": 0.1278, + "step": 36412 + }, + { + "epoch": 99.21798365122616, + "grad_norm": 2.90765643119812, + "learning_rate": 3.207264149857059e-09, + "loss": 0.0468, + "step": 36413 + }, + { + "epoch": 99.22070844686648, + "grad_norm": 2.310850143432617, + "learning_rate": 3.18495399921237e-09, + "loss": 0.0321, + "step": 36414 + }, + { + "epoch": 99.22343324250681, + "grad_norm": 3.482832193374634, + "learning_rate": 3.1627217034413403e-09, + "loss": 0.0328, + "step": 36415 + }, + { + "epoch": 99.22615803814713, + "grad_norm": 2.7978789806365967, + "learning_rate": 3.1405672627171645e-09, + "loss": 0.0276, + "step": 36416 + }, + { + "epoch": 99.22888283378747, + "grad_norm": 3.4980978965759277, + "learning_rate": 3.118490677211927e-09, + "loss": 0.0471, + "step": 36417 + }, + { + "epoch": 99.2316076294278, + "grad_norm": 1.6601653099060059, + "learning_rate": 3.096491947098823e-09, + "loss": 0.0757, + "step": 36418 + }, + { + "epoch": 99.23433242506812, + "grad_norm": 6.678323268890381, + "learning_rate": 3.0745710725477164e-09, + "loss": 0.0646, + "step": 36419 + }, + { + "epoch": 99.23705722070845, + "grad_norm": 1.7206647396087646, + "learning_rate": 3.0527280537306915e-09, + "loss": 0.0308, + "step": 36420 + }, + { + "epoch": 99.23978201634877, + "grad_norm": 1.7365213632583618, + "learning_rate": 3.0309628908176125e-09, + "loss": 0.0235, + "step": 36421 + }, + { + "epoch": 99.2425068119891, + "grad_norm": 1.6074193716049194, + "learning_rate": 3.0092755839772336e-09, + "loss": 0.0174, + "step": 36422 + }, + { + "epoch": 99.24523160762942, + "grad_norm": 2.532968282699585, + "learning_rate": 2.9876661333783084e-09, + "loss": 0.0624, + "step": 36423 + }, + { + "epoch": 99.24795640326975, + "grad_norm": 2.9972033500671387, + "learning_rate": 2.9661345391907013e-09, + "loss": 0.2823, + "step": 36424 + }, + { + "epoch": 99.25068119891009, + "grad_norm": 2.2182281017303467, + "learning_rate": 2.9446808015809457e-09, + "loss": 0.0871, + "step": 36425 + }, + { + "epoch": 99.2534059945504, + "grad_norm": 2.8645570278167725, + "learning_rate": 2.923304920715575e-09, + "loss": 0.0635, + "step": 36426 + }, + { + "epoch": 99.25613079019074, + "grad_norm": 2.3982489109039307, + "learning_rate": 2.902006896762233e-09, + "loss": 0.0265, + "step": 36427 + }, + { + "epoch": 99.25885558583106, + "grad_norm": 4.365675926208496, + "learning_rate": 2.8807867298863425e-09, + "loss": 0.0273, + "step": 36428 + }, + { + "epoch": 99.26158038147139, + "grad_norm": 2.683900833129883, + "learning_rate": 2.8596444202522166e-09, + "loss": 0.1043, + "step": 36429 + }, + { + "epoch": 99.26430517711172, + "grad_norm": 2.0241880416870117, + "learning_rate": 2.8385799680263892e-09, + "loss": 0.1868, + "step": 36430 + }, + { + "epoch": 99.26702997275204, + "grad_norm": 1.9473216533660889, + "learning_rate": 2.817593373372063e-09, + "loss": 0.0326, + "step": 36431 + }, + { + "epoch": 99.26975476839237, + "grad_norm": 3.1982765197753906, + "learning_rate": 2.79668463645244e-09, + "loss": 0.0731, + "step": 36432 + }, + { + "epoch": 99.2724795640327, + "grad_norm": 1.6564440727233887, + "learning_rate": 2.775853757429614e-09, + "loss": 0.0189, + "step": 36433 + }, + { + "epoch": 99.27520435967303, + "grad_norm": 2.0607547760009766, + "learning_rate": 2.755100736467897e-09, + "loss": 0.0985, + "step": 36434 + }, + { + "epoch": 99.27792915531334, + "grad_norm": 2.2081785202026367, + "learning_rate": 2.734425573727162e-09, + "loss": 0.023, + "step": 36435 + }, + { + "epoch": 99.28065395095368, + "grad_norm": 2.806126594543457, + "learning_rate": 2.7138282693683904e-09, + "loss": 0.0649, + "step": 36436 + }, + { + "epoch": 99.28337874659401, + "grad_norm": 3.082141876220703, + "learning_rate": 2.6933088235536752e-09, + "loss": 0.0543, + "step": 36437 + }, + { + "epoch": 99.28610354223433, + "grad_norm": 2.207090139389038, + "learning_rate": 2.672867236440668e-09, + "loss": 0.0247, + "step": 36438 + }, + { + "epoch": 99.28882833787466, + "grad_norm": 1.978706955909729, + "learning_rate": 2.6525035081903516e-09, + "loss": 0.0297, + "step": 36439 + }, + { + "epoch": 99.29155313351498, + "grad_norm": 2.7729930877685547, + "learning_rate": 2.632217638960377e-09, + "loss": 0.0251, + "step": 36440 + }, + { + "epoch": 99.29427792915531, + "grad_norm": 2.5666956901550293, + "learning_rate": 2.6120096289083964e-09, + "loss": 0.0736, + "step": 36441 + }, + { + "epoch": 99.29700272479565, + "grad_norm": 2.3435373306274414, + "learning_rate": 2.5918794781931713e-09, + "loss": 0.1035, + "step": 36442 + }, + { + "epoch": 99.29972752043597, + "grad_norm": 2.143259286880493, + "learning_rate": 2.571827186970133e-09, + "loss": 0.0686, + "step": 36443 + }, + { + "epoch": 99.3024523160763, + "grad_norm": 3.842270612716675, + "learning_rate": 2.551852755395823e-09, + "loss": 0.0896, + "step": 36444 + }, + { + "epoch": 99.30517711171662, + "grad_norm": 1.5671322345733643, + "learning_rate": 2.5319561836267824e-09, + "loss": 0.0204, + "step": 36445 + }, + { + "epoch": 99.30790190735695, + "grad_norm": 2.957319974899292, + "learning_rate": 2.5121374718162228e-09, + "loss": 0.0291, + "step": 36446 + }, + { + "epoch": 99.31062670299727, + "grad_norm": 1.752927541732788, + "learning_rate": 2.4923966201195748e-09, + "loss": 0.0245, + "step": 36447 + }, + { + "epoch": 99.3133514986376, + "grad_norm": 1.822049856185913, + "learning_rate": 2.4727336286900493e-09, + "loss": 0.1189, + "step": 36448 + }, + { + "epoch": 99.31607629427793, + "grad_norm": 1.785093903541565, + "learning_rate": 2.4531484976819677e-09, + "loss": 0.0389, + "step": 36449 + }, + { + "epoch": 99.31880108991825, + "grad_norm": 1.935732364654541, + "learning_rate": 2.4336412272463197e-09, + "loss": 0.0252, + "step": 36450 + }, + { + "epoch": 99.32152588555859, + "grad_norm": 2.195263147354126, + "learning_rate": 2.414211817535206e-09, + "loss": 0.0441, + "step": 36451 + }, + { + "epoch": 99.3242506811989, + "grad_norm": 1.9610813856124878, + "learning_rate": 2.3948602687018375e-09, + "loss": 0.0222, + "step": 36452 + }, + { + "epoch": 99.32697547683924, + "grad_norm": 2.1458311080932617, + "learning_rate": 2.375586580893874e-09, + "loss": 0.0311, + "step": 36453 + }, + { + "epoch": 99.32970027247957, + "grad_norm": 1.9295579195022583, + "learning_rate": 2.3563907542645257e-09, + "loss": 0.1235, + "step": 36454 + }, + { + "epoch": 99.33242506811989, + "grad_norm": 2.887185573577881, + "learning_rate": 2.337272788961453e-09, + "loss": 0.0348, + "step": 36455 + }, + { + "epoch": 99.33514986376022, + "grad_norm": 1.5260833501815796, + "learning_rate": 2.318232685133426e-09, + "loss": 0.0667, + "step": 36456 + }, + { + "epoch": 99.33787465940054, + "grad_norm": 1.5578218698501587, + "learning_rate": 2.2992704429292136e-09, + "loss": 0.024, + "step": 36457 + }, + { + "epoch": 99.34059945504087, + "grad_norm": 1.683821439743042, + "learning_rate": 2.280386062497586e-09, + "loss": 0.0202, + "step": 36458 + }, + { + "epoch": 99.34332425068119, + "grad_norm": 3.2472360134124756, + "learning_rate": 2.2615795439839826e-09, + "loss": 0.0341, + "step": 36459 + }, + { + "epoch": 99.34604904632153, + "grad_norm": 4.313271522521973, + "learning_rate": 2.242850887534953e-09, + "loss": 0.1013, + "step": 36460 + }, + { + "epoch": 99.34877384196186, + "grad_norm": 3.0428760051727295, + "learning_rate": 2.2242000932970464e-09, + "loss": 0.0309, + "step": 36461 + }, + { + "epoch": 99.35149863760218, + "grad_norm": 2.2389774322509766, + "learning_rate": 2.205627161415702e-09, + "loss": 0.0399, + "step": 36462 + }, + { + "epoch": 99.35422343324251, + "grad_norm": 1.8114615678787231, + "learning_rate": 2.187132092034139e-09, + "loss": 0.0216, + "step": 36463 + }, + { + "epoch": 99.35694822888283, + "grad_norm": 3.40175461769104, + "learning_rate": 2.168714885298906e-09, + "loss": 0.0247, + "step": 36464 + }, + { + "epoch": 99.35967302452316, + "grad_norm": 2.9031620025634766, + "learning_rate": 2.150375541351002e-09, + "loss": 0.0329, + "step": 36465 + }, + { + "epoch": 99.3623978201635, + "grad_norm": 3.3373162746429443, + "learning_rate": 2.1321140603336452e-09, + "loss": 0.0241, + "step": 36466 + }, + { + "epoch": 99.36512261580381, + "grad_norm": 1.999098539352417, + "learning_rate": 2.113930442390055e-09, + "loss": 0.021, + "step": 36467 + }, + { + "epoch": 99.36784741144415, + "grad_norm": 2.326115608215332, + "learning_rate": 2.09582468766234e-09, + "loss": 0.0679, + "step": 36468 + }, + { + "epoch": 99.37057220708446, + "grad_norm": 11.089275360107422, + "learning_rate": 2.0777967962892775e-09, + "loss": 0.1068, + "step": 36469 + }, + { + "epoch": 99.3732970027248, + "grad_norm": 3.55578351020813, + "learning_rate": 2.059846768412976e-09, + "loss": 0.0205, + "step": 36470 + }, + { + "epoch": 99.37602179836512, + "grad_norm": 1.9651052951812744, + "learning_rate": 2.0419746041733247e-09, + "loss": 0.0592, + "step": 36471 + }, + { + "epoch": 99.37874659400545, + "grad_norm": 2.7975447177886963, + "learning_rate": 2.0241803037091002e-09, + "loss": 0.0518, + "step": 36472 + }, + { + "epoch": 99.38147138964578, + "grad_norm": 6.04313325881958, + "learning_rate": 2.0064638671579706e-09, + "loss": 0.1152, + "step": 36473 + }, + { + "epoch": 99.3841961852861, + "grad_norm": 2.5856568813323975, + "learning_rate": 1.988825294658714e-09, + "loss": 0.1662, + "step": 36474 + }, + { + "epoch": 99.38692098092643, + "grad_norm": 2.250094175338745, + "learning_rate": 1.9712645863489977e-09, + "loss": 0.07, + "step": 36475 + }, + { + "epoch": 99.38964577656675, + "grad_norm": 2.380284309387207, + "learning_rate": 1.9537817423653794e-09, + "loss": 0.0531, + "step": 36476 + }, + { + "epoch": 99.39237057220708, + "grad_norm": 2.2417728900909424, + "learning_rate": 1.9363767628444164e-09, + "loss": 0.0748, + "step": 36477 + }, + { + "epoch": 99.39509536784742, + "grad_norm": 2.6770682334899902, + "learning_rate": 1.919049647920446e-09, + "loss": 0.05, + "step": 36478 + }, + { + "epoch": 99.39782016348774, + "grad_norm": 3.7568910121917725, + "learning_rate": 1.9018003977289147e-09, + "loss": 0.0294, + "step": 36479 + }, + { + "epoch": 99.40054495912807, + "grad_norm": 2.4807164669036865, + "learning_rate": 1.8846290124052703e-09, + "loss": 0.0256, + "step": 36480 + }, + { + "epoch": 99.40326975476839, + "grad_norm": 4.318384170532227, + "learning_rate": 1.8675354920816293e-09, + "loss": 0.1189, + "step": 36481 + }, + { + "epoch": 99.40599455040872, + "grad_norm": 2.2268853187561035, + "learning_rate": 1.8505198368923282e-09, + "loss": 0.0317, + "step": 36482 + }, + { + "epoch": 99.40871934604904, + "grad_norm": 2.5289037227630615, + "learning_rate": 1.833582046968374e-09, + "loss": 0.0271, + "step": 36483 + }, + { + "epoch": 99.41144414168937, + "grad_norm": 2.2588653564453125, + "learning_rate": 1.8167221224441035e-09, + "loss": 0.0973, + "step": 36484 + }, + { + "epoch": 99.4141689373297, + "grad_norm": 2.657165288925171, + "learning_rate": 1.799940063448302e-09, + "loss": 0.0832, + "step": 36485 + }, + { + "epoch": 99.41689373297002, + "grad_norm": 2.0009355545043945, + "learning_rate": 1.783235870113087e-09, + "loss": 0.0297, + "step": 36486 + }, + { + "epoch": 99.41961852861036, + "grad_norm": 2.1202259063720703, + "learning_rate": 1.7666095425683538e-09, + "loss": 0.0381, + "step": 36487 + }, + { + "epoch": 99.42234332425068, + "grad_norm": 2.0005722045898438, + "learning_rate": 1.7500610809439989e-09, + "loss": 0.0269, + "step": 36488 + }, + { + "epoch": 99.42506811989101, + "grad_norm": 1.8287826776504517, + "learning_rate": 1.7335904853676977e-09, + "loss": 0.023, + "step": 36489 + }, + { + "epoch": 99.42779291553134, + "grad_norm": 2.116440534591675, + "learning_rate": 1.7171977559682363e-09, + "loss": 0.0485, + "step": 36490 + }, + { + "epoch": 99.43051771117166, + "grad_norm": 2.248250722885132, + "learning_rate": 1.70088289287329e-09, + "loss": 0.0537, + "step": 36491 + }, + { + "epoch": 99.433242506812, + "grad_norm": 3.7882604598999023, + "learning_rate": 1.684645896210535e-09, + "loss": 0.0244, + "step": 36492 + }, + { + "epoch": 99.43596730245231, + "grad_norm": 2.1944730281829834, + "learning_rate": 1.6684867661065363e-09, + "loss": 0.0898, + "step": 36493 + }, + { + "epoch": 99.43869209809264, + "grad_norm": 2.940349817276001, + "learning_rate": 1.6524055026856388e-09, + "loss": 0.0978, + "step": 36494 + }, + { + "epoch": 99.44141689373296, + "grad_norm": 2.730057716369629, + "learning_rate": 1.6364021060744084e-09, + "loss": 0.0567, + "step": 36495 + }, + { + "epoch": 99.4441416893733, + "grad_norm": 2.3615787029266357, + "learning_rate": 1.6204765763971897e-09, + "loss": 0.0447, + "step": 36496 + }, + { + "epoch": 99.44686648501363, + "grad_norm": 2.5666565895080566, + "learning_rate": 1.6046289137783277e-09, + "loss": 0.0623, + "step": 36497 + }, + { + "epoch": 99.44959128065395, + "grad_norm": 4.310489654541016, + "learning_rate": 1.5888591183399472e-09, + "loss": 0.1389, + "step": 36498 + }, + { + "epoch": 99.45231607629428, + "grad_norm": 2.57661771774292, + "learning_rate": 1.5731671902063927e-09, + "loss": 0.0811, + "step": 36499 + }, + { + "epoch": 99.4550408719346, + "grad_norm": 2.558673620223999, + "learning_rate": 1.557553129498679e-09, + "loss": 0.0345, + "step": 36500 + }, + { + "epoch": 99.45776566757493, + "grad_norm": 3.643984317779541, + "learning_rate": 1.5420169363389303e-09, + "loss": 0.0345, + "step": 36501 + }, + { + "epoch": 99.46049046321527, + "grad_norm": 2.4214136600494385, + "learning_rate": 1.5265586108481612e-09, + "loss": 0.1484, + "step": 36502 + }, + { + "epoch": 99.46321525885558, + "grad_norm": 2.4700000286102295, + "learning_rate": 1.5111781531473856e-09, + "loss": 0.0313, + "step": 36503 + }, + { + "epoch": 99.46594005449592, + "grad_norm": 2.7732627391815186, + "learning_rate": 1.4958755633542876e-09, + "loss": 0.0269, + "step": 36504 + }, + { + "epoch": 99.46866485013624, + "grad_norm": 2.753965139389038, + "learning_rate": 1.4806508415909914e-09, + "loss": 0.0943, + "step": 36505 + }, + { + "epoch": 99.47138964577657, + "grad_norm": 2.1247220039367676, + "learning_rate": 1.4655039879740706e-09, + "loss": 0.2098, + "step": 36506 + }, + { + "epoch": 99.47411444141689, + "grad_norm": 2.5269577503204346, + "learning_rate": 1.4504350026223192e-09, + "loss": 0.0488, + "step": 36507 + }, + { + "epoch": 99.47683923705722, + "grad_norm": 1.9422529935836792, + "learning_rate": 1.43544388565231e-09, + "loss": 0.0172, + "step": 36508 + }, + { + "epoch": 99.47956403269755, + "grad_norm": 3.2932417392730713, + "learning_rate": 1.4205306371817274e-09, + "loss": 0.0342, + "step": 36509 + }, + { + "epoch": 99.48228882833787, + "grad_norm": 4.437108039855957, + "learning_rate": 1.405695257326034e-09, + "loss": 0.148, + "step": 36510 + }, + { + "epoch": 99.4850136239782, + "grad_norm": 1.8429901599884033, + "learning_rate": 1.3909377462006933e-09, + "loss": 0.145, + "step": 36511 + }, + { + "epoch": 99.48773841961852, + "grad_norm": 2.8696699142456055, + "learning_rate": 1.3762581039211686e-09, + "loss": 0.0878, + "step": 36512 + }, + { + "epoch": 99.49046321525886, + "grad_norm": 3.777517557144165, + "learning_rate": 1.3616563306018126e-09, + "loss": 0.0543, + "step": 36513 + }, + { + "epoch": 99.49318801089919, + "grad_norm": 2.00805401802063, + "learning_rate": 1.3471324263558684e-09, + "loss": 0.0207, + "step": 36514 + }, + { + "epoch": 99.49591280653951, + "grad_norm": 2.38852596282959, + "learning_rate": 1.3326863912965782e-09, + "loss": 0.0959, + "step": 36515 + }, + { + "epoch": 99.49863760217984, + "grad_norm": 2.6656932830810547, + "learning_rate": 1.318318225536075e-09, + "loss": 0.0883, + "step": 36516 + }, + { + "epoch": 99.50136239782016, + "grad_norm": 4.719111919403076, + "learning_rate": 1.3040279291876013e-09, + "loss": 0.071, + "step": 36517 + }, + { + "epoch": 99.50408719346049, + "grad_norm": 2.596975803375244, + "learning_rate": 1.2898155023610692e-09, + "loss": 0.1507, + "step": 36518 + }, + { + "epoch": 99.50681198910081, + "grad_norm": 4.292980194091797, + "learning_rate": 1.2756809451675012e-09, + "loss": 0.0935, + "step": 36519 + }, + { + "epoch": 99.50953678474114, + "grad_norm": 2.4347875118255615, + "learning_rate": 1.2616242577168092e-09, + "loss": 0.0316, + "step": 36520 + }, + { + "epoch": 99.51226158038148, + "grad_norm": 2.349003791809082, + "learning_rate": 1.2476454401200155e-09, + "loss": 0.0832, + "step": 36521 + }, + { + "epoch": 99.5149863760218, + "grad_norm": 1.5870577096939087, + "learning_rate": 1.2337444924837017e-09, + "loss": 0.0706, + "step": 36522 + }, + { + "epoch": 99.51771117166213, + "grad_norm": 2.5609068870544434, + "learning_rate": 1.2199214149177795e-09, + "loss": 0.092, + "step": 36523 + }, + { + "epoch": 99.52043596730245, + "grad_norm": 2.1779537200927734, + "learning_rate": 1.2061762075288307e-09, + "loss": 0.0374, + "step": 36524 + }, + { + "epoch": 99.52316076294278, + "grad_norm": 1.9448508024215698, + "learning_rate": 1.192508870424547e-09, + "loss": 0.0225, + "step": 36525 + }, + { + "epoch": 99.52588555858311, + "grad_norm": 3.0391459465026855, + "learning_rate": 1.1789194037115093e-09, + "loss": 0.1417, + "step": 36526 + }, + { + "epoch": 99.52861035422343, + "grad_norm": 2.4883079528808594, + "learning_rate": 1.1654078074940788e-09, + "loss": 0.0598, + "step": 36527 + }, + { + "epoch": 99.53133514986376, + "grad_norm": 3.8180992603302, + "learning_rate": 1.1519740818799473e-09, + "loss": 0.0397, + "step": 36528 + }, + { + "epoch": 99.53405994550408, + "grad_norm": 2.5799219608306885, + "learning_rate": 1.1386182269723656e-09, + "loss": 0.0308, + "step": 36529 + }, + { + "epoch": 99.53678474114442, + "grad_norm": 2.159740924835205, + "learning_rate": 1.1253402428745841e-09, + "loss": 0.0273, + "step": 36530 + }, + { + "epoch": 99.53950953678473, + "grad_norm": 1.376673698425293, + "learning_rate": 1.1121401296909639e-09, + "loss": 0.0872, + "step": 36531 + }, + { + "epoch": 99.54223433242507, + "grad_norm": 3.0177886486053467, + "learning_rate": 1.099017887524756e-09, + "loss": 0.0326, + "step": 36532 + }, + { + "epoch": 99.5449591280654, + "grad_norm": 2.472672462463379, + "learning_rate": 1.0859735164769903e-09, + "loss": 0.0297, + "step": 36533 + }, + { + "epoch": 99.54768392370572, + "grad_norm": 2.5569729804992676, + "learning_rate": 1.0730070166509177e-09, + "loss": 0.1165, + "step": 36534 + }, + { + "epoch": 99.55040871934605, + "grad_norm": 2.6483771800994873, + "learning_rate": 1.060118388145348e-09, + "loss": 0.0229, + "step": 36535 + }, + { + "epoch": 99.55313351498637, + "grad_norm": 2.695887804031372, + "learning_rate": 1.0473076310624218e-09, + "loss": 0.0465, + "step": 36536 + }, + { + "epoch": 99.5558583106267, + "grad_norm": 2.4064455032348633, + "learning_rate": 1.034574745500949e-09, + "loss": 0.0948, + "step": 36537 + }, + { + "epoch": 99.55858310626704, + "grad_norm": 1.4350569248199463, + "learning_rate": 1.0219197315597396e-09, + "loss": 0.0175, + "step": 36538 + }, + { + "epoch": 99.56130790190736, + "grad_norm": 2.4260857105255127, + "learning_rate": 1.0093425893387133e-09, + "loss": 0.1, + "step": 36539 + }, + { + "epoch": 99.56403269754769, + "grad_norm": 2.115938663482666, + "learning_rate": 9.968433189355697e-10, + "loss": 0.3049, + "step": 36540 + }, + { + "epoch": 99.566757493188, + "grad_norm": 2.5792899131774902, + "learning_rate": 9.844219204468985e-10, + "loss": 0.0392, + "step": 36541 + }, + { + "epoch": 99.56948228882834, + "grad_norm": 2.8147940635681152, + "learning_rate": 9.720783939692891e-10, + "loss": 0.0434, + "step": 36542 + }, + { + "epoch": 99.57220708446866, + "grad_norm": 2.99324107170105, + "learning_rate": 9.598127395993307e-10, + "loss": 0.0319, + "step": 36543 + }, + { + "epoch": 99.57493188010899, + "grad_norm": 2.7439558506011963, + "learning_rate": 9.476249574325026e-10, + "loss": 0.0557, + "step": 36544 + }, + { + "epoch": 99.57765667574932, + "grad_norm": 3.165449857711792, + "learning_rate": 9.355150475642837e-10, + "loss": 0.0294, + "step": 36545 + }, + { + "epoch": 99.58038147138964, + "grad_norm": 2.2052972316741943, + "learning_rate": 9.234830100879333e-10, + "loss": 0.1125, + "step": 36546 + }, + { + "epoch": 99.58310626702998, + "grad_norm": 2.7302558422088623, + "learning_rate": 9.115288450978199e-10, + "loss": 0.1363, + "step": 36547 + }, + { + "epoch": 99.5858310626703, + "grad_norm": 1.9348679780960083, + "learning_rate": 8.996525526872024e-10, + "loss": 0.0199, + "step": 36548 + }, + { + "epoch": 99.58855585831063, + "grad_norm": 3.44775390625, + "learning_rate": 8.878541329482293e-10, + "loss": 0.0242, + "step": 36549 + }, + { + "epoch": 99.59128065395096, + "grad_norm": 2.0738258361816406, + "learning_rate": 8.761335859730491e-10, + "loss": 0.032, + "step": 36550 + }, + { + "epoch": 99.59400544959128, + "grad_norm": 2.6990418434143066, + "learning_rate": 8.644909118515898e-10, + "loss": 0.0329, + "step": 36551 + }, + { + "epoch": 99.59673024523161, + "grad_norm": 2.516026258468628, + "learning_rate": 8.529261106771103e-10, + "loss": 0.0537, + "step": 36552 + }, + { + "epoch": 99.59945504087193, + "grad_norm": 2.832350730895996, + "learning_rate": 8.41439182537318e-10, + "loss": 0.023, + "step": 36553 + }, + { + "epoch": 99.60217983651226, + "grad_norm": 2.176815986633301, + "learning_rate": 8.300301275221412e-10, + "loss": 0.0325, + "step": 36554 + }, + { + "epoch": 99.60490463215258, + "grad_norm": 2.719883918762207, + "learning_rate": 8.186989457215078e-10, + "loss": 0.0668, + "step": 36555 + }, + { + "epoch": 99.60762942779292, + "grad_norm": 2.2102978229522705, + "learning_rate": 8.074456372231254e-10, + "loss": 0.0756, + "step": 36556 + }, + { + "epoch": 99.61035422343325, + "grad_norm": 1.9211902618408203, + "learning_rate": 7.962702021147018e-10, + "loss": 0.0159, + "step": 36557 + }, + { + "epoch": 99.61307901907357, + "grad_norm": 2.3778374195098877, + "learning_rate": 7.851726404828342e-10, + "loss": 0.0706, + "step": 36558 + }, + { + "epoch": 99.6158038147139, + "grad_norm": 2.125946521759033, + "learning_rate": 7.741529524141201e-10, + "loss": 0.037, + "step": 36559 + }, + { + "epoch": 99.61852861035422, + "grad_norm": 7.415036201477051, + "learning_rate": 7.632111379951568e-10, + "loss": 0.0206, + "step": 36560 + }, + { + "epoch": 99.62125340599455, + "grad_norm": 1.5431028604507446, + "learning_rate": 7.523471973092112e-10, + "loss": 0.0199, + "step": 36561 + }, + { + "epoch": 99.62397820163488, + "grad_norm": 2.3266077041625977, + "learning_rate": 7.415611304428805e-10, + "loss": 0.1038, + "step": 36562 + }, + { + "epoch": 99.6267029972752, + "grad_norm": 2.8579304218292236, + "learning_rate": 7.308529374794316e-10, + "loss": 0.0793, + "step": 36563 + }, + { + "epoch": 99.62942779291554, + "grad_norm": 2.9477689266204834, + "learning_rate": 7.20222618502131e-10, + "loss": 0.1182, + "step": 36564 + }, + { + "epoch": 99.63215258855585, + "grad_norm": 1.4284054040908813, + "learning_rate": 7.096701735942457e-10, + "loss": 0.024, + "step": 36565 + }, + { + "epoch": 99.63487738419619, + "grad_norm": 2.898362159729004, + "learning_rate": 6.991956028379321e-10, + "loss": 0.0802, + "step": 36566 + }, + { + "epoch": 99.6376021798365, + "grad_norm": 1.9462116956710815, + "learning_rate": 6.887989063131262e-10, + "loss": 0.0298, + "step": 36567 + }, + { + "epoch": 99.64032697547684, + "grad_norm": 1.887109398841858, + "learning_rate": 6.784800841030948e-10, + "loss": 0.0897, + "step": 36568 + }, + { + "epoch": 99.64305177111717, + "grad_norm": 2.0863425731658936, + "learning_rate": 6.682391362877738e-10, + "loss": 0.0273, + "step": 36569 + }, + { + "epoch": 99.64577656675749, + "grad_norm": 2.1058130264282227, + "learning_rate": 6.58076062944879e-10, + "loss": 0.0211, + "step": 36570 + }, + { + "epoch": 99.64850136239782, + "grad_norm": 2.643380880355835, + "learning_rate": 6.479908641565668e-10, + "loss": 0.0388, + "step": 36571 + }, + { + "epoch": 99.65122615803814, + "grad_norm": 2.3741872310638428, + "learning_rate": 6.379835399983326e-10, + "loss": 0.0278, + "step": 36572 + }, + { + "epoch": 99.65395095367847, + "grad_norm": 2.371957540512085, + "learning_rate": 6.280540905512222e-10, + "loss": 0.0256, + "step": 36573 + }, + { + "epoch": 99.65667574931881, + "grad_norm": 2.2500576972961426, + "learning_rate": 6.18202515889621e-10, + "loss": 0.0271, + "step": 36574 + }, + { + "epoch": 99.65940054495913, + "grad_norm": 1.956206202507019, + "learning_rate": 6.084288160923546e-10, + "loss": 0.0302, + "step": 36575 + }, + { + "epoch": 99.66212534059946, + "grad_norm": 1.9971297979354858, + "learning_rate": 5.987329912349182e-10, + "loss": 0.0211, + "step": 36576 + }, + { + "epoch": 99.66485013623978, + "grad_norm": 2.158386707305908, + "learning_rate": 5.891150413928071e-10, + "loss": 0.0291, + "step": 36577 + }, + { + "epoch": 99.66757493188011, + "grad_norm": 2.6648027896881104, + "learning_rate": 5.795749666404061e-10, + "loss": 0.0976, + "step": 36578 + }, + { + "epoch": 99.67029972752043, + "grad_norm": 2.7986602783203125, + "learning_rate": 5.701127670532103e-10, + "loss": 0.0389, + "step": 36579 + }, + { + "epoch": 99.67302452316076, + "grad_norm": 1.5865932703018188, + "learning_rate": 5.607284427033843e-10, + "loss": 0.0223, + "step": 36580 + }, + { + "epoch": 99.6757493188011, + "grad_norm": 2.294034242630005, + "learning_rate": 5.514219936642029e-10, + "loss": 0.1224, + "step": 36581 + }, + { + "epoch": 99.67847411444141, + "grad_norm": 2.7299232482910156, + "learning_rate": 5.42193420010051e-10, + "loss": 0.1174, + "step": 36582 + }, + { + "epoch": 99.68119891008175, + "grad_norm": 1.9245857000350952, + "learning_rate": 5.330427218108725e-10, + "loss": 0.0274, + "step": 36583 + }, + { + "epoch": 99.68392370572207, + "grad_norm": 1.757200837135315, + "learning_rate": 5.239698991388321e-10, + "loss": 0.0196, + "step": 36584 + }, + { + "epoch": 99.6866485013624, + "grad_norm": 1.994696855545044, + "learning_rate": 5.149749520638736e-10, + "loss": 0.0334, + "step": 36585 + }, + { + "epoch": 99.68937329700273, + "grad_norm": 2.803117036819458, + "learning_rate": 5.060578806559413e-10, + "loss": 0.0774, + "step": 36586 + }, + { + "epoch": 99.69209809264305, + "grad_norm": 4.198057174682617, + "learning_rate": 4.972186849860894e-10, + "loss": 0.0306, + "step": 36587 + }, + { + "epoch": 99.69482288828338, + "grad_norm": 2.314763069152832, + "learning_rate": 4.884573651209313e-10, + "loss": 0.0291, + "step": 36588 + }, + { + "epoch": 99.6975476839237, + "grad_norm": 1.7226258516311646, + "learning_rate": 4.797739211304108e-10, + "loss": 0.0362, + "step": 36589 + }, + { + "epoch": 99.70027247956403, + "grad_norm": 13.523866653442383, + "learning_rate": 4.711683530822519e-10, + "loss": 0.147, + "step": 36590 + }, + { + "epoch": 99.70299727520435, + "grad_norm": 5.580814838409424, + "learning_rate": 4.626406610419576e-10, + "loss": 0.0941, + "step": 36591 + }, + { + "epoch": 99.70572207084469, + "grad_norm": 2.962643623352051, + "learning_rate": 4.5419084507725143e-10, + "loss": 0.1124, + "step": 36592 + }, + { + "epoch": 99.70844686648502, + "grad_norm": 1.9783023595809937, + "learning_rate": 4.458189052536366e-10, + "loss": 0.0363, + "step": 36593 + }, + { + "epoch": 99.71117166212534, + "grad_norm": 1.824733018875122, + "learning_rate": 4.37524841635506e-10, + "loss": 0.0294, + "step": 36594 + }, + { + "epoch": 99.71389645776567, + "grad_norm": 2.0353915691375732, + "learning_rate": 4.2930865428836286e-10, + "loss": 0.0541, + "step": 36595 + }, + { + "epoch": 99.71662125340599, + "grad_norm": 2.389317512512207, + "learning_rate": 4.2117034327548987e-10, + "loss": 0.0439, + "step": 36596 + }, + { + "epoch": 99.71934604904632, + "grad_norm": 2.519260883331299, + "learning_rate": 4.1310990866128e-10, + "loss": 0.0341, + "step": 36597 + }, + { + "epoch": 99.72207084468666, + "grad_norm": 3.8815038204193115, + "learning_rate": 4.0512735050790566e-10, + "loss": 0.0543, + "step": 36598 + }, + { + "epoch": 99.72479564032697, + "grad_norm": 2.7397398948669434, + "learning_rate": 3.9722266887753933e-10, + "loss": 0.1035, + "step": 36599 + }, + { + "epoch": 99.7275204359673, + "grad_norm": 2.6178321838378906, + "learning_rate": 3.893958638312434e-10, + "loss": 0.1109, + "step": 36600 + }, + { + "epoch": 99.73024523160763, + "grad_norm": 2.7417891025543213, + "learning_rate": 3.8164693543119024e-10, + "loss": 0.0287, + "step": 36601 + }, + { + "epoch": 99.73297002724796, + "grad_norm": 2.6343674659729004, + "learning_rate": 3.7397588373733196e-10, + "loss": 0.0488, + "step": 36602 + }, + { + "epoch": 99.73569482288828, + "grad_norm": 6.195209503173828, + "learning_rate": 3.6638270880851034e-10, + "loss": 0.2053, + "step": 36603 + }, + { + "epoch": 99.73841961852861, + "grad_norm": 2.066901922225952, + "learning_rate": 3.588674107035672e-10, + "loss": 0.0271, + "step": 36604 + }, + { + "epoch": 99.74114441416894, + "grad_norm": 2.7348265647888184, + "learning_rate": 3.514299894835649e-10, + "loss": 0.0271, + "step": 36605 + }, + { + "epoch": 99.74386920980926, + "grad_norm": 2.0644443035125732, + "learning_rate": 3.4407044520401443e-10, + "loss": 0.0213, + "step": 36606 + }, + { + "epoch": 99.7465940054496, + "grad_norm": 5.294316291809082, + "learning_rate": 3.3678877792264754e-10, + "loss": 0.0633, + "step": 36607 + }, + { + "epoch": 99.74931880108991, + "grad_norm": 2.1260714530944824, + "learning_rate": 3.295849876971957e-10, + "loss": 0.1096, + "step": 36608 + }, + { + "epoch": 99.75204359673025, + "grad_norm": 2.419437885284424, + "learning_rate": 3.2245907458317015e-10, + "loss": 0.0466, + "step": 36609 + }, + { + "epoch": 99.75476839237058, + "grad_norm": 2.7944250106811523, + "learning_rate": 3.154110386349718e-10, + "loss": 0.0624, + "step": 36610 + }, + { + "epoch": 99.7574931880109, + "grad_norm": 1.9427090883255005, + "learning_rate": 3.08440879909222e-10, + "loss": 0.0261, + "step": 36611 + }, + { + "epoch": 99.76021798365123, + "grad_norm": 2.4367549419403076, + "learning_rate": 3.015485984603217e-10, + "loss": 0.0258, + "step": 36612 + }, + { + "epoch": 99.76294277929155, + "grad_norm": 2.3611412048339844, + "learning_rate": 2.9473419434045136e-10, + "loss": 0.2156, + "step": 36613 + }, + { + "epoch": 99.76566757493188, + "grad_norm": 3.508145809173584, + "learning_rate": 2.879976676029017e-10, + "loss": 0.2697, + "step": 36614 + }, + { + "epoch": 99.7683923705722, + "grad_norm": 1.7755341529846191, + "learning_rate": 2.8133901830096343e-10, + "loss": 0.025, + "step": 36615 + }, + { + "epoch": 99.77111716621253, + "grad_norm": 1.9118646383285522, + "learning_rate": 2.7475824648570683e-10, + "loss": 0.0337, + "step": 36616 + }, + { + "epoch": 99.77384196185287, + "grad_norm": 2.203730821609497, + "learning_rate": 2.6825535220931233e-10, + "loss": 0.034, + "step": 36617 + }, + { + "epoch": 99.77656675749319, + "grad_norm": 4.123830318450928, + "learning_rate": 2.6183033552174e-10, + "loss": 0.0829, + "step": 36618 + }, + { + "epoch": 99.77929155313352, + "grad_norm": 2.0598483085632324, + "learning_rate": 2.554831964729498e-10, + "loss": 0.0234, + "step": 36619 + }, + { + "epoch": 99.78201634877384, + "grad_norm": 2.5967087745666504, + "learning_rate": 2.4921393511290195e-10, + "loss": 0.0279, + "step": 36620 + }, + { + "epoch": 99.78474114441417, + "grad_norm": 2.9723432064056396, + "learning_rate": 2.4302255149044607e-10, + "loss": 0.1216, + "step": 36621 + }, + { + "epoch": 99.7874659400545, + "grad_norm": 2.351841688156128, + "learning_rate": 2.369090456533218e-10, + "loss": 0.0514, + "step": 36622 + }, + { + "epoch": 99.79019073569482, + "grad_norm": 3.7699193954467773, + "learning_rate": 2.3087341764926885e-10, + "loss": 0.071, + "step": 36623 + }, + { + "epoch": 99.79291553133515, + "grad_norm": 3.212890625, + "learning_rate": 2.2491566752491646e-10, + "loss": 0.1577, + "step": 36624 + }, + { + "epoch": 99.79564032697547, + "grad_norm": 1.6444101333618164, + "learning_rate": 2.19035795326894e-10, + "loss": 0.0292, + "step": 36625 + }, + { + "epoch": 99.7983651226158, + "grad_norm": 3.579833984375, + "learning_rate": 2.1323380110183088e-10, + "loss": 0.0244, + "step": 36626 + }, + { + "epoch": 99.80108991825612, + "grad_norm": 3.0298268795013428, + "learning_rate": 2.0750968489413604e-10, + "loss": 0.09, + "step": 36627 + }, + { + "epoch": 99.80381471389646, + "grad_norm": 3.3600499629974365, + "learning_rate": 2.0186344674821834e-10, + "loss": 0.0834, + "step": 36628 + }, + { + "epoch": 99.80653950953679, + "grad_norm": 2.7193455696105957, + "learning_rate": 1.9629508670848674e-10, + "loss": 0.0782, + "step": 36629 + }, + { + "epoch": 99.80926430517711, + "grad_norm": 2.516709566116333, + "learning_rate": 1.9080460481823993e-10, + "loss": 0.0957, + "step": 36630 + }, + { + "epoch": 99.81198910081744, + "grad_norm": 2.8346807956695557, + "learning_rate": 1.853920011207766e-10, + "loss": 0.0436, + "step": 36631 + }, + { + "epoch": 99.81471389645776, + "grad_norm": 5.574287414550781, + "learning_rate": 1.8005727565717502e-10, + "loss": 0.0314, + "step": 36632 + }, + { + "epoch": 99.8174386920981, + "grad_norm": 2.6337056159973145, + "learning_rate": 1.7480042846851341e-10, + "loss": 0.1221, + "step": 36633 + }, + { + "epoch": 99.82016348773843, + "grad_norm": 2.943788766860962, + "learning_rate": 1.696214595980905e-10, + "loss": 0.064, + "step": 36634 + }, + { + "epoch": 99.82288828337875, + "grad_norm": 2.968533754348755, + "learning_rate": 1.6452036908365388e-10, + "loss": 0.106, + "step": 36635 + }, + { + "epoch": 99.82561307901908, + "grad_norm": 2.553696393966675, + "learning_rate": 1.59497156967392e-10, + "loss": 0.0431, + "step": 36636 + }, + { + "epoch": 99.8283378746594, + "grad_norm": 2.3409392833709717, + "learning_rate": 1.545518232859422e-10, + "loss": 0.0949, + "step": 36637 + }, + { + "epoch": 99.83106267029973, + "grad_norm": 2.7663166522979736, + "learning_rate": 1.4968436807927255e-10, + "loss": 0.0405, + "step": 36638 + }, + { + "epoch": 99.83378746594005, + "grad_norm": 2.4775993824005127, + "learning_rate": 1.4489479138513062e-10, + "loss": 0.0363, + "step": 36639 + }, + { + "epoch": 99.83651226158038, + "grad_norm": 3.056490421295166, + "learning_rate": 1.40183093241264e-10, + "loss": 0.1586, + "step": 36640 + }, + { + "epoch": 99.83923705722071, + "grad_norm": 2.3072080612182617, + "learning_rate": 1.3554927368319982e-10, + "loss": 0.0879, + "step": 36641 + }, + { + "epoch": 99.84196185286103, + "grad_norm": 3.618222236633301, + "learning_rate": 1.3099333274757543e-10, + "loss": 0.1427, + "step": 36642 + }, + { + "epoch": 99.84468664850137, + "grad_norm": 3.623671770095825, + "learning_rate": 1.2651527046991796e-10, + "loss": 0.0563, + "step": 36643 + }, + { + "epoch": 99.84741144414168, + "grad_norm": 2.6766088008880615, + "learning_rate": 1.2211508688464434e-10, + "loss": 0.0362, + "step": 36644 + }, + { + "epoch": 99.85013623978202, + "grad_norm": 2.361475944519043, + "learning_rate": 1.1779278202728174e-10, + "loss": 0.0578, + "step": 36645 + }, + { + "epoch": 99.85286103542235, + "grad_norm": 2.4094767570495605, + "learning_rate": 1.1354835593113678e-10, + "loss": 0.0536, + "step": 36646 + }, + { + "epoch": 99.85558583106267, + "grad_norm": 2.4418084621429443, + "learning_rate": 1.0938180862729575e-10, + "loss": 0.0879, + "step": 36647 + }, + { + "epoch": 99.858310626703, + "grad_norm": 2.1416845321655273, + "learning_rate": 1.0529314015128577e-10, + "loss": 0.0344, + "step": 36648 + }, + { + "epoch": 99.86103542234332, + "grad_norm": 1.8528544902801514, + "learning_rate": 1.0128235053308289e-10, + "loss": 0.0177, + "step": 36649 + }, + { + "epoch": 99.86376021798365, + "grad_norm": 3.770249128341675, + "learning_rate": 9.734943980377331e-11, + "loss": 0.0281, + "step": 36650 + }, + { + "epoch": 99.86648501362397, + "grad_norm": 2.6298139095306396, + "learning_rate": 9.349440799444331e-11, + "loss": 0.033, + "step": 36651 + }, + { + "epoch": 99.8692098092643, + "grad_norm": 2.071444034576416, + "learning_rate": 8.97172551350689e-11, + "loss": 0.1597, + "step": 36652 + }, + { + "epoch": 99.87193460490464, + "grad_norm": 1.9126759767532349, + "learning_rate": 8.60179812556261e-11, + "loss": 0.0237, + "step": 36653 + }, + { + "epoch": 99.87465940054496, + "grad_norm": 6.645708084106445, + "learning_rate": 8.23965863838705e-11, + "loss": 0.1461, + "step": 36654 + }, + { + "epoch": 99.87738419618529, + "grad_norm": 8.344696998596191, + "learning_rate": 7.885307054866786e-11, + "loss": 0.0445, + "step": 36655 + }, + { + "epoch": 99.88010899182561, + "grad_norm": 3.1809380054473877, + "learning_rate": 7.53874337777738e-11, + "loss": 0.0333, + "step": 36656 + }, + { + "epoch": 99.88283378746594, + "grad_norm": 2.368344783782959, + "learning_rate": 7.199967609783365e-11, + "loss": 0.0761, + "step": 36657 + }, + { + "epoch": 99.88555858310627, + "grad_norm": 1.8367606401443481, + "learning_rate": 6.868979753549277e-11, + "loss": 0.037, + "step": 36658 + }, + { + "epoch": 99.88828337874659, + "grad_norm": 4.02899694442749, + "learning_rate": 6.545779811628627e-11, + "loss": 0.0289, + "step": 36659 + }, + { + "epoch": 99.89100817438693, + "grad_norm": 2.255337953567505, + "learning_rate": 6.230367786574931e-11, + "loss": 0.0424, + "step": 36660 + }, + { + "epoch": 99.89373297002724, + "grad_norm": 2.3002030849456787, + "learning_rate": 5.922743680719655e-11, + "loss": 0.0206, + "step": 36661 + }, + { + "epoch": 99.89645776566758, + "grad_norm": 1.7847018241882324, + "learning_rate": 5.622907496616314e-11, + "loss": 0.021, + "step": 36662 + }, + { + "epoch": 99.8991825613079, + "grad_norm": 1.4975664615631104, + "learning_rate": 5.330859236596375e-11, + "loss": 0.0918, + "step": 36663 + }, + { + "epoch": 99.90190735694823, + "grad_norm": 2.6824984550476074, + "learning_rate": 5.046598902769262e-11, + "loss": 0.1954, + "step": 36664 + }, + { + "epoch": 99.90463215258856, + "grad_norm": 1.4897246360778809, + "learning_rate": 4.770126497466443e-11, + "loss": 0.0189, + "step": 36665 + }, + { + "epoch": 99.90735694822888, + "grad_norm": 2.1342153549194336, + "learning_rate": 4.5014420229083645e-11, + "loss": 0.0352, + "step": 36666 + }, + { + "epoch": 99.91008174386921, + "grad_norm": 3.451512336730957, + "learning_rate": 4.240545481093428e-11, + "loss": 0.0523, + "step": 36667 + }, + { + "epoch": 99.91280653950953, + "grad_norm": 2.690477132797241, + "learning_rate": 3.987436874020034e-11, + "loss": 0.081, + "step": 36668 + }, + { + "epoch": 99.91553133514986, + "grad_norm": 8.813395500183105, + "learning_rate": 3.7421162036865854e-11, + "loss": 0.1562, + "step": 36669 + }, + { + "epoch": 99.9182561307902, + "grad_norm": 3.088932991027832, + "learning_rate": 3.504583472091483e-11, + "loss": 0.0624, + "step": 36670 + }, + { + "epoch": 99.92098092643052, + "grad_norm": 1.8969745635986328, + "learning_rate": 3.274838681011083e-11, + "loss": 0.1035, + "step": 36671 + }, + { + "epoch": 99.92370572207085, + "grad_norm": 2.33920955657959, + "learning_rate": 3.0528818322217435e-11, + "loss": 0.0569, + "step": 36672 + }, + { + "epoch": 99.92643051771117, + "grad_norm": 2.0795698165893555, + "learning_rate": 2.838712927388798e-11, + "loss": 0.0306, + "step": 36673 + }, + { + "epoch": 99.9291553133515, + "grad_norm": 2.172757625579834, + "learning_rate": 2.6323319683996262e-11, + "loss": 0.0358, + "step": 36674 + }, + { + "epoch": 99.93188010899182, + "grad_norm": 1.9380152225494385, + "learning_rate": 2.4337389565864956e-11, + "loss": 0.1664, + "step": 36675 + }, + { + "epoch": 99.93460490463215, + "grad_norm": 3.505955219268799, + "learning_rate": 2.2429338937257627e-11, + "loss": 0.0264, + "step": 36676 + }, + { + "epoch": 99.93732970027249, + "grad_norm": 2.7528839111328125, + "learning_rate": 2.059916781260718e-11, + "loss": 0.0389, + "step": 36677 + }, + { + "epoch": 99.9400544959128, + "grad_norm": 3.1094865798950195, + "learning_rate": 1.8846876205236287e-11, + "loss": 0.0626, + "step": 36678 + }, + { + "epoch": 99.94277929155314, + "grad_norm": 3.0980677604675293, + "learning_rate": 1.7172464128467626e-11, + "loss": 0.1261, + "step": 36679 + }, + { + "epoch": 99.94550408719346, + "grad_norm": 3.14235520362854, + "learning_rate": 1.5575931596734094e-11, + "loss": 0.0241, + "step": 36680 + }, + { + "epoch": 99.94822888283379, + "grad_norm": 2.5746209621429443, + "learning_rate": 1.4057278622248149e-11, + "loss": 0.0307, + "step": 36681 + }, + { + "epoch": 99.95095367847412, + "grad_norm": 2.559318780899048, + "learning_rate": 1.2616505216112019e-11, + "loss": 0.0321, + "step": 36682 + }, + { + "epoch": 99.95367847411444, + "grad_norm": 3.2531163692474365, + "learning_rate": 1.1253611389427931e-11, + "loss": 0.0735, + "step": 36683 + }, + { + "epoch": 99.95640326975477, + "grad_norm": 3.2968556880950928, + "learning_rate": 9.968597153298121e-12, + "loss": 0.0254, + "step": 36684 + }, + { + "epoch": 99.95912806539509, + "grad_norm": 3.3459370136260986, + "learning_rate": 8.761462518824815e-12, + "loss": 0.1363, + "step": 36685 + }, + { + "epoch": 99.96185286103542, + "grad_norm": 1.863379955291748, + "learning_rate": 7.632207492669353e-12, + "loss": 0.0264, + "step": 36686 + }, + { + "epoch": 99.96457765667574, + "grad_norm": 2.086629629135132, + "learning_rate": 6.580832085933964e-12, + "loss": 0.0252, + "step": 36687 + }, + { + "epoch": 99.96730245231608, + "grad_norm": 3.285036563873291, + "learning_rate": 5.6073363063902094e-12, + "loss": 0.0684, + "step": 36688 + }, + { + "epoch": 99.97002724795641, + "grad_norm": 1.7984572649002075, + "learning_rate": 4.711720160699429e-12, + "loss": 0.0199, + "step": 36689 + }, + { + "epoch": 99.97275204359673, + "grad_norm": 2.189822196960449, + "learning_rate": 3.893983657743405e-12, + "loss": 0.0326, + "step": 36690 + }, + { + "epoch": 99.97547683923706, + "grad_norm": 3.3216190338134766, + "learning_rate": 3.154126800852808e-12, + "loss": 0.0279, + "step": 36691 + }, + { + "epoch": 99.97820163487738, + "grad_norm": 4.278548717498779, + "learning_rate": 2.492149598909421e-12, + "loss": 0.0627, + "step": 36692 + }, + { + "epoch": 99.98092643051771, + "grad_norm": 2.0453996658325195, + "learning_rate": 1.908052055243914e-12, + "loss": 0.0833, + "step": 36693 + }, + { + "epoch": 99.98365122615803, + "grad_norm": 3.478553295135498, + "learning_rate": 1.4018341754074017e-12, + "loss": 0.1105, + "step": 36694 + }, + { + "epoch": 99.98637602179836, + "grad_norm": 2.225618362426758, + "learning_rate": 9.7349596162033e-13, + "loss": 0.0275, + "step": 36695 + }, + { + "epoch": 99.9891008174387, + "grad_norm": 2.206514596939087, + "learning_rate": 6.23037419433814e-13, + "loss": 0.0327, + "step": 36696 + }, + { + "epoch": 99.99182561307902, + "grad_norm": 3.2508068084716797, + "learning_rate": 3.5045854995807705e-13, + "loss": 0.0998, + "step": 36697 + }, + { + "epoch": 99.99455040871935, + "grad_norm": 2.5737099647521973, + "learning_rate": 1.5575935652378804e-13, + "loss": 0.0228, + "step": 36698 + }, + { + "epoch": 99.99727520435967, + "grad_norm": 2.334688663482666, + "learning_rate": 3.893983913094701e-14, + "loss": 0.0414, + "step": 36699 + }, + { + "epoch": 100.0, + "grad_norm": 1.9821799993515015, + "learning_rate": 0.0, + "loss": 0.022, + "step": 36700 + }, + { + "epoch": 100.0, + "step": 36700, + "total_flos": 2.2807420731392e+16, + "train_loss": 0.47043383053927723, + "train_runtime": 11044.2585, + "train_samples_per_second": 106.164, + "train_steps_per_second": 3.323 + } + ], + "logging_steps": 1.0, + "max_steps": 36700, + "num_input_tokens_seen": 0, + "num_train_epochs": 100, + "save_steps": 50000, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": true, + "should_training_stop": true + }, + "attributes": {} + } + }, + "total_flos": 2.2807420731392e+16, + "train_batch_size": 2, + "trial_name": null, + "trial_params": null +} diff --git a/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/vocab.json b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..4ebe4bb3f3114daf2e4cc349f24873a1175a35d7 --- /dev/null +++ b/florence-2-b_vis1024-lang2048_dior-v2_b2x16-100e-slurm-zero2/vocab.json @@ -0,0 +1 @@ +{"":0,"":1,"":2,"":3,".":4,"Ġthe":5,",":6,"Ġto":7,"Ġand":8,"Ġof":9,"Ġa":10,"Ġin":11,"-":12,"Ġfor":13,"Ġthat":14,"Ġon":15,"Ġis":16,"âĢ":17,"'s":18,"Ġwith":19,"ĠThe":20,"Ġwas":21,"Ġ\"":22,"Ġat":23,"Ġit":24,"Ġas":25,"Ġsaid":26,"Ļ":27,"Ġbe":28,"s":29,"Ġby":30,"Ġfrom":31,"Ġare":32,"Ġhave":33,"Ġhas":34,":":35,"Ġ(":36,"Ġhe":37,"ĠI":38,"Ġhis":39,"Ġwill":40,"Ġan":41,"Ġthis":42,")":43,"ĠâĢ":44,"Ġnot":45,"Ŀ":46,"Ġyou":47,"ľ":48,"Ġtheir":49,"Ġor":50,"Ġthey":51,"Ġwe":52,"Ġbut":53,"Ġwho":54,"Ġmore":55,"Ġhad":56,"Ġbeen":57,"Ġwere":58,"Ġabout":59,",\"":60,"Ġwhich":61,"Ġup":62,"Ġits":63,"Ġcan":64,"Ġone":65,"Ġout":66,"Ġalso":67,"Ġ$":68,"Ġher":69,"Ġall":70,"Ġafter":71,".\"":72,"/":73,"Ġwould":74,"'t":75,"Ġyear":76,"Ġwhen":77,"Ġfirst":78,"Ġshe":79,"Ġtwo":80,"Ġover":81,"Ġpeople":82,"ĠA":83,"Ġour":84,"ĠIt":85,"Ġtime":86,"Ġthan":87,"Ġinto":88,"Ġthere":89,"t":90,"ĠHe":91,"Ġnew":92,"ĠâĢĶ":93,"Ġlast":94,"Ġjust":95,"ĠIn":96,"Ġother":97,"Ġso":98,"Ġwhat":99,"I":100,"Ġlike":101,"a":102,"Ġsome":103,"S":104,"ë":105,"Ġthem":106,"Ġyears":107,"'":108,"Ġdo":109,"Ġyour":110,"Ġ-":111,"Ġ1":112,"\"":113,"Ġif":114,"Ġcould":115,"?":116,"Ġno":117,"i":118,"m":119,"Ġget":120,"ĠU":121,"Ġnow":122,"Ġhim":123,"Ġback":124,"ĠBut":125,"ĠâĢĵ":126,"Ġmy":127,"Ġ'":128,"Ġonly":129,"Ġthree":130,";":131,"Ġ2":132,"The":133,"1":134,"Ġpercent":135,"Ġagainst":136,"Ġbefore":137,"Ġcompany":138,"o":139,"ĠTrump":140,"Ġhow":141,"Ġbecause":142,"Ġany":143,"Ġmost":144,"Ġbeing":145,"Ġmake":146,"Ġwhere":147,"Ġduring":148,"Ġthrough":149,"Ġwhile":150,"000":151,"ĠThis":152,"Ġmillion":153,"ing":154,"Ġ3":155,"Ġmade":156,"Ġwell":157,"Ġ10":158,"Ġdown":159,"Ġoff":160,"Ġsays":161,"Ġme":162,"ĠB":163,"Ġgoing":164,"Ġteam":165,"ĠWe":166,"Ġthose":167,"Ġgovernment":168,"Ġway":169,"We":170,"Ġmany":171,"Ġthen":172,"Ġwork":173,"Ġtold":174,"com":175,"2":176,"Ġgame":177,"ĠAnd":178,"in":179,"year":180,"Ġp":181,"Ġvery":182,"Ġday":183,"Ġhome":184,"Ġtake":185,"Ġweek":186,"Ġsince":187,"ĠNew":188,"Ġmay":189,"Ġeven":190,"Ġseason":191,"Ġsee":192,"Ġ2017":193,"Ġstate":194,"Ġ5":195,"ed":196,"Ġshould":197,"Ġaround":198,"Ġ2018":199,"Ġsecond":200,"Ġus":201,"Ġstill":202,"Ġmuch":203,"Ġ4":204,"Ġgood":205,"Ġthink":206,"%":207,"ĠS":208,"Ġthese":209,"Ġmarket":210,"ĠD":211,"th":212,"Ġgo":213,"'re":214,"Ġsuch":215,"Ġknow":216,"Ġincluding":217,"Ġdon":218,"y":219,"Ġnext":220,"ĠP":221,"Ġdid":222,"Ġunder":223,"Ġsay":224,"en":225,"ĠL":226,"Ġbetween":227,"Ġper":228,"ĠK":229,"ĠC":230,"Ġ6":231,"Ġworld":232,"Ġpart":233,"ĠN":234,"Ġright":235,"Ġwant":236,"Ġfour":237,"),":238,"Ġhigh":239,"Ġneed":240,"re":241,"e":242,"It":243,"Ġhelp":244,"5":245,"3":246,"Ġcountry":247,"ĠR":248,"Ġpolice":249,"A":250,"Ġlong":251,"ĠThey":252,"Ġend":253,"er":254,"ĠT":255,"ĠM":256,"u":257,"Ġboth":258,"Ġhere":259,"an":260,"on":261,"Ġ7":262,"Ġde":263,"ĠShe":264,"Ġbusiness":265,"Ġreport":266,"j":267,"ers":268,"Ġreally":269,"ĠPresident":270,"ar":271,"ĠG":272,"ĠFriday":273,"ĠF":274,"Ġbest":275,"Ġsame":276,"Ġanother":277,"Ġset":278,"old":279,"ĠThat":280,"as":281,"n":282,"Ġcome":283,"Ġfamily":284,"Ġpublic":285,"ĠFor":286,"ĠAs":287,"0":288,"ĠH":289,"Ġ8":290,"Ġ20":291,"Ġfive":292,"es":293,"ĠTuesday":294,"Ġn":295,"ĠThursday":296,"Ġquarter":297,"h":298,"Ġtop":299,"Ġgot":300,"Ġlife":301,"ĠMonday":302,"Ġfound":303,"Ġuse":304,"ĠW":305,"4":306,"ĠWednesday":307,"Ġown":308,"Ġaccording":309,"Ġplay":310,"Ġshow":311,"ĠSt":312,"Ġman":313,"Ġleft":314,"ĠUnited":315,"Ġ12":316,"Ġplace":317,"ĠIf":318,"Ġlot":319,"Ġformer":320,"Ġ0":321,").":322,"Ġsupport":323,"ie":324,"Ġbillion":325,"Ġt":326,"Ġshares":327,"!":328,"z":329,"k":330,"ĠState":331,"Ġpoints":332,"Ġgroup":333,"Ġschool":334,"Ġinformation":335,"Ġ2016":336,"al":337,"r":338,"Ġwin":339,"Ġnews":340,"Ġused":341,"Ġput":342,"Ġcity":343,"ĠJ":344,"ĠThere":345,"Ġnumber":346,"C":347,"'ve":348,"Ġeach":349,"Ġtoo":350,"Ġwon":351,"ly":352,"Ġmonth":353,"is":354,"Ġadded":355,"Ġlook":356,"Ġbetter":357,"Ġevery":358,"Ġ&":359,"Ġdays":360,"Ġ9":361,"Ġtook":362,"Ġnight":363,"Ġe":364,"Ġ11":365,"os":366,"Ġfew":367,"or":368,"ĠNorth":369,"ĠYou":370,"Ġthird":371,"Ġgreat":372,"Ġcalled":373,"ĠOn":374,"Ġpast":375,"Ġcame":376,"Ġmonths":377,"ĠSaturday":378,"Ġ15":379,"Ġbig":380,"ĠE":381,"ĠUS":382,"Ġthings":383,"ĠO":384,"Ġd":385,"Ġstart":386,"B":387,"Ġstock":388,"Ġ30":389,"Ġwomen":390,"ĠSouth":391,"ĠMay":392,"Ġnever":393,"Ġpresident":394,"ĠSunday":395,"Ġwithout":396,"man":397,"8":398,"Ġdidn":399,"Ġlocal":400,"6":401,"Ġsomething":402,"Ġcase":403,"ĠAll":404,"it":405,"7":406,"ĠSo":407,"Ġchildren":408,"Ġaway":409,"Ġlittle":410,"Ġsix":411,"ĠCity":412,"ĠCounty":413,"Ġdata":414,"at":415,"Ġalready":416,"d":417,"Ġmoney":418,"Ġearly":419,"Ġacross":420,"Ġexpected":421,"Ġrun":422,"Ġlater":423,"am":424,"Ġprice":425,"Ġgames":426,"ĠMr":427,"b":428,"Ġmight":429,"Ġdifferent":430,"Ġreported":431,"Ġdeal":432,"Ġmedia":433,"Ġgrowth":434,"Ġcommunity":435,"ĠChina":436,"'m":437,"c":438,"Ġwent":439,"ĠNo":440,"Ġable":441,"Ġmaking":442,"Ġarea":443,"Ġfar":444,"Ġstatement":445,"ĠHouse":446,"Ġworking":447,"M":448,"Ġk":449,"Ġseen":450,"Ġcompanies":451,"Ġtoday":452,"Ġmembers":453,"Ġuntil":454,"Ġfull":455,"Ġagain":456,"Ġhalf":457,"Ġshare":458,"le":459,"Ġalways":460,"Ġcourt":461,"l":462,"and":463,"Ġchange":464,"Ġfind":465,"9":466,"Ġsystem":467,"ĠV":468,"ĠYork":469,"ĠAmerican":470,"Ġhead":471,"Ġplayers":472,"Ġdoes":473,"Ġhealth":474,"Ġm":475,"Ġpower":476,"Ġpoint":477,"Ġhit":478,"Ġ.":479,"Ġ--":480,"Ġfree":481,".,":482,"Ġlead":483,"Ġseveral":484,"Ġrecent":485,"Ġcall":486,"N":487,"Ġlaw":488,"Ġkeep":489,"Ġopen":490,"ĠNews":491,"Ġgive":492,"ia":493,"ĠMarch":494,"D":495,"ĠNational":496,"ĠAt":497,"Ġtimes":498,"Ġfuture":499,"R":500,"Ġ14":501,"ĠJune":502,"Ġofficials":503,"Ġ18":504,"Ġimportant":505,"f":506,"Ġfinal":507,"Ġ13":508,"ĠOne":509,"P":510,"Ġfollowing":511,"Ġcar":512,"Ġleast":513,"Ġwater":514,"Ġevent":515,"Ġline":516,"Ġmove":517,"Ġservices":518,"Ġhaving":519,"ĠWhen":520,"Ġstudents":521,"ĠPolice":522,"el":523,"Ġam":524,"ĠZ":525,"Ġside":526,"Ġstory":527,"Ġdue":528,"Ġmeeting":529,"K":530,"Ġmust":531,"ĠStates":532,"Ġlikely":533,"G":534,"Ġcontinue":535,"Ġago":536,"Ġparty":537,"Ġmajor":538,"Ġindustry":539,"Ġless":540,"30":541,"Ġun":542,"Ġhard":543,"Ġservice":544,"Ġ16":545,"Ġlooking":546,"Ġheld":547,"ve":548,"Ġwhether":549,"ĠJuly":550,"Ġtaken":551,"Ġalong":552,"Ġasked":553,"Ġstarted":554,"Ġbecome":555,"Ġforward":556,"Ġresearch":557,"Ġoffice":558,"Ġpolitical":559,"to":560,"Ġtogether":561,"Ġgetting":562,"Ġplan":563,"Ġ25":564,"T":565,"Ġamong":566,"Ġcoming":567,"Ġdecision":568,"Ġvideo":569,"Ġ2015":570,"g":571,"ĠAfter":572,"Ġsecurity":573,"L":574,"Ġcare":575,"Ġgiven":576,"Ġavailable":577,"âĢĶ":578,"Ġs":579,"ĠWest":580,"'ll":581,"Ġpay":582,"Ġnear":583,"Ġsaying":584,"Ġannounced":585,"Ġprogram":586,"ĠApril":587,"Ġreal":588,"ĠUniversity":589,"ĠWith":590,"AP":591,"Ġsocial":592,"Ġclose":593,"et":594,"Ġcurrent":595,"Ġwhy":596,"F":597,"ĠTo":598,"ĠTwitter":599,"Ġthough":600,"Ġ17":601,"Ġtaking":602,"ĠInc":603,"Ġmen":604,"w":605,"Ġcomes":606,"ley":607,"Ġdoing":608,"Ġprocess":609,"ĠJohn":610,"ch":611,"00":612,"Ġfinancial":613,"Ġlow":614,"Ġenough":615,"ĠWhile":616,"Ġfurther":617,"Ġpost":618,"Ġfeel":619,"st":620,"Ġperson":621,"ĠFacebook":622,"ĠWorld":623,"Ġwithin":624,"ad":625,"Ġdone":626,"the":627,"Ġlate":628,"Ġtax":629,"Ġdoesn":630,"Ġthing":631,"Ġnational":632,"Ġjob":633,"Ġusing":634,"ĠHowever":635,"ic":636,"Ġcampaign":637,"Ġrecord":638,"Ġbehind":639,"://":640,"ĠDepartment":641,"p":642,"Ġothers":643,"ĠJanuary":644,"Ġorder":645,"Ġ[":646,"Ġsales":647,"Ġyet":648,"Ä":649,"Ġsmall":650,"Ġseries":651,"Ġface":652,"ĠWhat":653,"Ġ50":654,"Ġever":655,"Ġearlier":656,"Ġlove":657,"up":658,"Ġrights":659,"ĠAn":660,"ist":661,"Ġmorning":662,"ĠWashington":663,"Ġyoung":664,"Ġlatest":665,"ĠIndia":666,"Ġtrying":667,"Ġfire":668,"Ġled":669,"Ġstrong":670,"Ġreturn":671,"Ġlevel":672,"O":673,"Ġaverage":674,"Ġperiod":675,"Ġexperience":676,"ak":677,"Ġpossible":678,"Ġbelieve":679,"Ġinclude":680,"Ġoil":681,"Ġrecently":682,"Ġonce":683,"Ġknown":684,"Ġlost":685,"Ġsure":686,"us":687,"Ġweeks":688,"Ġfood":689,"Ġreports":690,"Ġrating":691,"ĠMinister":692,"Ġwoman":693,"Ġprovide":694,"Ġproject":695,"Ġissue":696,"Ġlive":697,"10":698,"Ġclear":699,"he":700,"Ġcost":701,"Ġplayed":702,"Ġreleased":703,"Ġcoach":704,"v":705,"Ġ24":706,"Ġseven":707,"Ġplans":708,"Ġdevelopment":709,"ur":710,"ĺ":711,"Ġincrease":712,"This":713,"Ġpolicy":714,"Ġcent":715,"Ġbased":716,"E":717,"il":718,"ĠDecember":719,"Ġglobal":720,"Ġtrade":721,"Ġhours":722,"Ġhigher":723,"Ġgoal":724,"H":725,"ĠAl":726,"Ġ100":727,"Ġminutes":728,"Ġelection":729,"ĠAmerica":730,"Ġrate":731,"ĠCh":732,"Ġ21":733,"...":734,"ĠWhite":735,"Ġdirector":736,"Ġposition":737,"Ġshot":738,"Ġlarge":739,"Ġc":740,"Ġb":741,"]":742,"Ġissues":743,"Ġdeath":744,"Ġbuilding":745,"Ġtotal":746,"Ġoften":747,"Ġv":748,"Ġcountries":749,"Ġhistory":750,"Ġoutside":751,"Ġfederal":752,"Ġ19":753,"Ġfact":754,"ĠHigh":755,"Ġcareer":756,"im":757,"Ġinternational":758,"ĠNovember":759,"Ġfront":760,"Ġkind":761,"Ġkey":762,"ra":763,"ĠSan":764,"Ġshort":765,"Ġname":766,"ĠAccording":767,"Ġcourse":768,"Ġre":769,"Ġwanted":770,"W":771,"ĠSeptember":772,"Ġinterest":773,"Ġrole":774,"Ġresults":775,"Ġeconomic":776,"Ġ2014":777,"Ġchance":778,"ĠOctober":779,"Ġspecial":780,"Ġofficial":781,"Ġneeds":782,"um":783,"Ġl":784,"Ġproducts":785,"Ġnon":786,"Ġ@":787,"ĠBank":788,"Ġahead":789,"Ġhouse":790,"U":791,"Ġboard":792,"Ġold":793,"Ġsaw":794,"Ġlower":795,"ĠEuropean":796,"Ġcontrol":797,"ĠRussia":798,"Ġeight":799,"Ġrelease":800,"Ġpotential":801,"Ġthought":802,"Ġinvestigation":803,"Ġonline":804,"based":805,"Ġtechnology":806,"ĠDonald":807,"id":808,"Ġbody":809,"Ġrisk":810,"ian":811,"Ġcapital":812,"Ġstaff":813,"Ġaction":814,"ĠLeague":815,"Ġplaying":816,"Ġmakes":817,"Ġalmost":818,"Ġperformance":819,"Ġ22":820,"Ġg":821,"Ġfilm":822,"Ġnearly":823,"ĠCenter":824,"Ġvisit":825,"ĠGroup":826,"Ġbank":827,"Ġbit":828,"Ġreceived":829,"ĠAugust":830,"Ġmilitary":831,"ĠHis":832,"ine":833,"Ġchief":834,"ĠSchool":835,"Ġbring":836,"ĠCourt":837,"Ġ(@":838,"Ġmeans":839,"ĠSh":840,"Ġfans":841,"Ġse":842,"Ġ40":843,"20":844,"\".":845,"V":846,"Ġcut":847,"Ġkilled":848,"Ġ#":849,"Ġprices":850,"Ġgave":851,"ĠStreet":852,"ir":853,"ĠY":854,"Ġcurrently":855,"Ġf":856,"ay":857,"ne":858,"te":859,"Ġtry":860,"ĠPark":861,"ĥ":862,"J":863,"Ġquestion":864,"Ġhand":865,"Ġeconomy":866,"Ġinvestors":867,"able":868,"Ġplayer":869,"ĠBy":870,"ĠDavid":871,"Ġloss":872,"ab":873,"Ġbelow":874,"Ġwrote":875,"co":876,"ate":877,"Ġrunning":878,"un":879,"Ġbegan":880,"Ġsingle":881,"Ġfield":882,"Ġ23":883,"Ġleader":884,"Ġw":885,"ĠCalifornia":886,"Ġfourth":887,"Ġactually":888,"Ġlist":889,"ll":890,"Ġcouple":891,"Ġstudy":892,"Ġteams":893,"He":894,"ah":895,"ĠCanada":896,"Ġla":897,"Ġresult":898,"Ġaccess":899,"Ġvote":900,"ĠMore":901,"ĠFebruary":902,"Ġrevenue":903,"Ġoffer":904,"Ġlet":905,"ier":906,"Ġbuy":907,"Ġattack":908,"Ġblack":909,"Ġr":910,"Ġareas":911,"Ġstop":912,"Ġimpact":913,"Ġmatch":914,"Ġinvestment":915,"Ġcustomers":916,"Ġleaders":917,"ies":918,"Ġmember":919,"Ġchild":920,"Ġroad":921,"ul":922,"Ġvalue":923,"Ġshows":924,"ĠDr":925,"ĠDe":926,"ant":927,"ĠLondon":928,"Ġroom":929,"Ġmusic":930,"Ġproduction":931,"Ġanything":932,"Ġfirm":933,"Ġbiggest":934,"Ġair":935,"Ġproblem":936,"Ġgeneral":937,"Ġwasn":938,"Ġi":939,"Ġprivate":940,"Ġespecially":941,"Ġadministration":942,"Ġadditional":943,"ĠCo":944,"Ġopportunity":945,"Ġhold":946,"&":947,"Ġmatter":948,"Ġsenior":949,"Ġclub":950,"Ġsomeone":951,"ĠÃ":952,"ĠEast":953,"Ġ2019":954,".'":955,"Ġneeded":956,"ĠJames":957,"time":958,"Ġhowever":959,"Ġeverything":960,"Ġeveryone":961,"Ġdied":962,"Ġinvolved":963,"Ġfriends":964,"Ġisn":965,"Ġworth":966,"ik":967,"ĠCup":968,"Ġshowed":969,"There":970,"Ġ28":971,"Ġmeet":972,"Ġ26":973,"Ġ27":974,"Y":975,"Ġregion":976,"ĠPress":977,"ĠNow":978,"Ġson":979,"Ġspace":980,"Ġleading":981,"Ġstates":982,"Ġweekend":983,"Ġ£":984,"Ġmother":985,"Ġprevious":986,"ĠUK":987,"ĠMichael":988,"Ġleave":989,"est":990,"em":991,"Ġz":992,"ĠSome":993,"ors":994,"out":995,"15":996,"Ġwar":997,"Ġwebsite":998,"Ġstar":999,"X":1000,"ro":1001,"Ġtarget":1002,"Ġhimself":1003,"Ġturn":1004,"ĠEurope":1005,"Ġworked":1006,"Ġenergy":1007,"Ġscored":1008,"Ġ*":1009,"Ġsoon":1010,"Ġball":1011,"ĠTV":1012,"Ġannual":1013,"Ġ2013":1014,"Ġrace":1015,"ĠInternational":1016,"'d":1017,"ĠMarket":1018,"Ġconference":1019,"io":1020,"Ġo":1021,"Ġchanges":1022,"ig":1023,"Ġofficers":1024,"Ġinside":1025,"Ġform":1026,"Ġpublished":1027,"Ġphone":1028,"Ġco":1029,"Ġlegal":1030,"Ġexecutive":1031,"Ġfight":1032,"ings":1033,"Ġhope":1034,"Ġsummer":1035,"Ġofficer":1036,"Ġfootball":1037,"Ġproperty":1038,"@":1039,"Ġbook":1040,"Ġparents":1041,"Ġcosts":1042,"ac":1043,"Ġmanager":1044,"Ġcreate":1045,"Ġage":1046,"Ġemail":1047,"Ġmarkets":1048,"Ġmain":1049,"Ġhuman":1050,"Ġsent":1051,"Ġmanagement":1052,"ĠDay":1053,"ton":1054,"Ġcash":1055,"Ġfocus":1056,"Ġexpect":1057,"Ġtraining":1058,"Ġbecame":1059,"Ġwhose":1060,"Ġevents":1061,"Ġround":1062,"ĠLe":1063,"Ġfell":1064,"Ġabove":1065,"Ġanalysts":1066,"Ġtalk":1067,"Ġsituation":1068,"ri":1069,"ated":1070,"ke":1071,"Ġwants":1072,"ag":1073,"Ġlives":1074,"om":1075,"Ġal":1076,"Ġdemand":1077,"Ġsafety":1078,"Ġrest":1079,"ĠCouncil":1080,"Ġpersonal":1081,"Ġsite":1082,"ĠRussian":1083,"Ġmid":1084,"Ġnothing":1085,"Ġwhole":1086,"Ġbill":1087,"Ġsold":1088,"ĠBritish":1089,"se":1090,"Ġremain":1091,"12":1092,"Ġforeign":1093,"Ġshooting":1094,"Ġstay":1095,"50":1096,"ang":1097,"Ġhospital":1098,"Ġbad":1099,"Ġaddress":1100,"ĠKorea":1101,"Ġhappened":1102,"Ġcharges":1103,"Ġwhite":1104,"Ġ31":1105,"If":1106,"Ġearnings":1107,"Ġbreak":1108,"Ġlight":1109,"Ġterms":1110,"ĠChinese":1111,"ĠSenate":1112,"ana":1113,"Ġidea":1114,"ap":1115,"of":1116,"Ġnine":1117,"Ġcompared":1118,"Ġbuild":1119,"ard":1120,"In":1121,"Ġsimilar":1122,"Ġgas":1123,"Ġvictory":1124,"Ġ2012":1125,"Ġdebt":1126,"ĠMar":1127,"Ġarrested":1128,"Ġcomment":1129,"Ġincreased":1130,"Ġmedical":1131,"Ġ29":1132,"ĠJan":1133,"Ġgroups":1134,"Ġdespite":1135,"Ġfall":1136,"Ġtell":1137,"Ġworkers":1138,"Ġtown":1139,"é":1140,"Ġwife":1141,"Ġquestions":1142,"Ġcontinued":1143,"Ġheart":1144,"Ġmet":1145,"Ġbrought":1146,"Ġhelped":1147,"ĠCongress":1148,"Ġstep":1149,"Ġfather":1150,"Ġmoment":1151,"Ġproduct":1152,"Ġprobably":1153,"Ġlargest":1154,"Ġvehicle":1155,"ĠEngland":1156,"Ġallow":1157,"Ġstarting":1158,"Ġkids":1159,"Ġincident":1160,"Ġnet":1161,"Ġrates":1162,"ĠRead":1163,"Ġpressure":1164,"Ġincluded":1165,"Ġread":1166,"Ġissued":1167,"ol":1168,"Ġeither":1169,"Ġefforts":1170,"Ġincludes":1171,"ĠRepublican":1172,"ish":1173,"â̦":1174,"Ġgoals":1175,"aj":1176,"Ġen":1177,"x":1178,"Ġraised":1179,"au":1180,"Ġlonger":1181,"ut":1182,"Ġwatch":1183,"ĠTexas":1184,"You":1185,"Ġrange":1186,"nd":1187,"Ġfunds":1188,"Ġremains":1189,"ĠMark":1190,"Ġ60":1191,"Ġque":1192,"sh":1193,"Ġinterview":1194,"Ġrather":1195,"Ġresidents":1196,"Ġgrowing":1197,"Ġpre":1198,"Ġpaid":1199,"Ġcases":1200,"ĠReuters":1201,"Ġdifficult":1202,"Ġsign":1203,"ĠGoogle":1204,"Ġhttps":1205,"ĠPaul":1206,"Ġliving":1207,"day":1208,"ĠQ":1209,"iz":1210,"ĠRed":1211,"Ġland":1212,"They":1213,"ĠRoad":1214,"_":1215,"ĠThese":1216,"Ġview":1217,"Ġagency":1218,"Ġreason":1219,"Ġallowed":1220,"ĠAustralia":1221,"az":1222,"ĠRe":1223,"Ġturned":1224,"11":1225,"Ġnation":1226,"Ġready":1227,"Ġpress":1228,"Ġbudget":1229,"Ġdaily":1230,"ĠChief":1231,"Ġfamilies":1232,"Ġsignificant":1233,"ĠFirst":1234,"Ġthemselves":1235,"Ġj":1236,"Ġruns":1237,"Ġaccused":1238,"Ġtakes":1239,"Ġspent":1240,"Ġvia":1241,"ot":1242,"ina":1243,"25":1244,"land":1245,"Ġexample":1246,"Ġauthorities":1247,"Ġdate":1248,"Ġended":1249,"all":1250,"Reuters":1251,"Ġbusinesses":1252,"ans":1253,"Ġdetails":1254,"Ġground":1255,"Ġpretty":1256,"ĠApple":1257,"ation":1258,"ĠSmith":1259,"ĠCompany":1260,"ĠFlorida":1261,"Ġdrug":1262,"Ġresponse":1263,"one":1264,"Ġeducation":1265,"Ġmean":1266,"Ġleague":1267,"Ġanyone":1268,"Ġminister":1269,"Ġtitle":1270,"Ġadding":1271,"Ġproblems":1272,"Ġopening":1273,"Ġconditions":1274,"Ġred":1275,"Ġdecided":1276,"Å":1277,"Ġposted":1278,"term":1279,"Ġamount":1280,"ĠEU":1281,"Ġsuccess":1282,"Ġevidence":1283,"ĠObama":1284,"Ġaddition":1285,"Ġprovided":1286,"ĠLos":1287,"Ġagreement":1288,"Ġstage":1289,"ens":1290,"Ġrelationship":1291,"ĠGeneral":1292,"Ġsector":1293,"Ġstudent":1294,"ating":1295,"Ġtest":1296,"\",":1297,"Ġwinning":1298,"Ġfelt":1299,"Ġsource":1300,"Z":1301,"Ġseems":1302,"Ġcause":1303,"Ġschools":1304,"Ġdrive":1305,"Ġensure":1306,"Ġhuge":1307,"ĠMy":1308,"ĠHealth":1309,"Ġscene":1310,"Ġgiving":1311,"Ġcenter":1312,"Ġpositive":1313,"Ġyards":1314,"Ġjobs":1315,"Ġaccount":1316,"Ġheard":1317,"Ġquality":1318,"Ġways":1319,"Ġimmediately":1320,"Ġemployees":1321,"are":1322,"Ġpass":1323,"ĠCEO":1324,"Ġreceive":1325,"Ġlooks":1326,"ĠAfrica":1327,"Ġthroughout":1328,"led":1329,"Ġrelated":1330,"Ġsell":1331,"ĠUnion":1332,"ĠPhoto":1333,"ter":1334,"Ġquickly":1335,"ĠHow":1336,"Ġvarious":1337,"Ġreach":1338,"Ġpick":1339,"Ġcharged":1340,"Ġquite":1341,"ent":1342,"q":1343,"ins":1344,"Ġphoto":1345,"Ġunderstand":1346,"ĠâĢ¢":1347,"Ġreached":1348,"Ġtrack":1349,"uk":1350,"Ġeffort":1351,"ville":1352,"Ġcentral":1353,"Ġdaughter":1354,"Ġcontract":1355,"Ġinjury":1356,"Ġopened":1357,"Ġ($":1358,"Ġstraight":1359,"17":1360,"Ġcredit":1361,"ĠIndian":1362,"Ġsexual":1363,"Ġworks":1364,"Ġeasy":1365,"18":1366,"Ġclosed":1367,"Ġh":1368,"Ġhappen":1369,"Ġforce":1370,"ler":1371,"Ġhappy":1372,"Ġshared":1373,"Ġoverall":1374,"Ġmoving":1375,"á":1376,"Ġprojects":1377,"ĠBlack":1378,"Ġconcerns":1379,"Ġclass":1380,"Ġtried":1381,"Ġappeared":1382,"Ġcontent":1383,"ĠDistrict":1384,"Ġterm":1385,"Ġinstead":1386,"ĠOffice":1387,"Ġcontinues":1388,"Ġlevels":1389,"Ġafternoon":1390,"Ġfund":1391,"Ġsale":1392,"Ġdriver":1393,"Ġask":1394,"Ġcannot":1395,"ner":1396,"end":1397,"ĠHere":1398,"field":1399,"Ġstore":1400,"www":1401,"Ġcertain":1402,"Ġself":1403,"Ġdollar":1404,"ĠHer":1405,"Ġpopular":1406,"Ġfollow":1407,"Ġspending":1408,"by":1409,"Ġmoved":1410,"Ġgoes":1411,"Ġcreated":1412,"Ġstand":1413,"Ġoperations":1414,"Ġlooked":1415,"Ġtreatment":1416,"ov":1417,"Ġdistrict":1418,"Ġsigned":1419,"Ġhands":1420,"Ġmodel":1421,"ĠAngeles":1422,"Ġy":1423,"Ġborder":1424,"Ġincome":1425,"ĠLast":1426,"Ġcharge":1427,"Ġdriving":1428,"ĠJapan":1429,"Ġrise":1430,"Ġtalks":1431,"Ġfollowed":1432,"Ġpreviously":1433,"Ġusers":1434,"Ġfunding":1435,"ĠJohnson":1436,"Ġ":1437,"ou":1438,"ai":1439,"Ġnamed":1440,"Ġfriend":1441,"ĠNov":1442,"Ġdefense":1443,"ĠBritain":1444,"Ġentire":1445,"Ġtrading":1446,"Ġfailed":1447,"ĠEl":1448,"Ġclaims":1449,"Ġcomments":1450,"Ġbeat":1451,"ib":1452,"Ġbasis":1453,"ĠJones":1454,"Ġpresent":1455,"ĠBe":1456,"Ġdouble":1457,"Ġrose":1458,"ite":1459,"Ġability":1460,"Ġoriginal":1461,"Ġdead":1462,"ĠCommission":1463,"ĠMe":1464,"Ġcompetition":1465,"Ġ2011":1466,"Ġknew":1467,"Ġmaterial":1468,"av":1469,"ĠFrance":1470,"Ġscore":1471,"Ġsense":1472,"Ġserious":1473,"Ġconfirmed":1474,"Ġanti":1475,"Ġviolence":1476,"Ġimprove":1477,"son":1478,"ó":1479,"ĠAP":1480,"Ġsh":1481,"Ġhost":1482,"ĠMike":1483,"Ġpatients":1484,"ĠNFL":1485,"Ġcrisis":1486,"Ġrevealed":1487,"ach":1488,"ĠPrime":1489,"Ġbuilt":1490,"ĠNot":1491,"Ġrules":1492,"Ġelse":1493,"Ġdepartment":1494,"Ġitself":1495,"ise":1496,"500":1497,"Ġcomplete":1498,"ion":1499,"Ġtrial":1500,"ĠBay":1501,"ĠDec":1502,"Ġattention":1503,"Ġtravel":1504,"ĠCentral":1505,"ry":1506,"Ġagreed":1507,"Ġmind":1508,"ĠMc":1509,"Ġ70":1510,"Ġcontact":1511,"ari":1512,"ĠTimes":1513,"Ġspot":1514,"ĠFrench":1515,"Ġgets":1516,"op":1517,"Ġbrand":1518,"Ġcalls":1519,"Ġbanks":1520,"Ġdesign":1521,"Ġsafe":1522,"Ġoffers":1523,"Ġpractice":1524,"ĠOf":1525,"á":1526,"ling":1527,"Ġtrue":1528,"off":1529,"Ġnumbers":1530,"Ġfun":1531,"Ġlearn":1532,"Ġmultiple":1533,"ĠIs":1534,"res":1535,"als":1536,"Ġcommon":1537,"ized":1538,"Ġchallenge":1539,"Ġcommittee":1540,"ĠOur":1541,"Ġbase":1542,"ani":1543,"ĠAssociation":1544,"ung":1545,"Ġnetwork":1546,"ĠBrown":1547,"Ġapproach":1548,"16":1549,"Ġfinished":1550,"Ġreview":1551,"Ġrequired":1552,"Ġapp":1553,"ĠMan":1554,"Ġâ̦":1555,"twitter":1556,"ĠDemocratic":1557,"13":1558,"Ġevening":1559,"ĠTom":1560,"ä":1561,"ĠAssociated":1562,"ĠCanadian":1563,"Ġcollege":1564,"Ġspokesman":1565,"Ġarticle":1566,"Ġtowards":1567,"ĠChicago":1568,"Ġmovie":1569,"14":1570,"ity":1571,"Ġforces":1572,"ĠChris":1573,"ĠDemocrats":1574,"Ġfeatures":1575,"Ġhearing":1576,"ĠX":1577,"ĠAlso":1578,"Ġmessage":1579,"age":1580,"Ġnoted":1581,"ĠSuper":1582,"Ġthousands":1583,"aw":1584,"ĠBill":1585,"ĠAr":1586,"ĠLa":1587,"ip":1588,"Ġ/":1589,"ĠDuring":1590,"Ġnote":1591,".)":1592,"Ġwrong":1593,"if":1594,"Ġpassed":1595,"ĠTwo":1596,"Ġdie":1597,",'":1598,"ĠDon":1599,"ĠGermany":1600,"Ġletter":1601,"Ġdescribed":1602,"ĠIran":1603,"ĠWilliams":1604,"Ġparticularly":1605,"Ġadd":1606,"Ġconversation":1607,"ĠSe":1608,"Ġhighest":1609,"be":1610,"Ġhomes":1611,"Ġsports":1612,"Ġgone":1613,"ĠAd":1614,"Ġel":1615,"Ġopportunities":1616,"Ġwords":1617,"Ġleaving":1618,"ĠChristmas":1619,"As":1620,"ĠGovernment":1621,"Ġsimply":1622,"Ġhusband":1623,"ĠResearch":1624,"ĠMexico":1625,"ates":1626,"ale":1627,"ĠGreen":1628,"$":1629,"od":1630,"ĠHall":1631,"Ġnatural":1632,"Ġoperating":1633,"les":1634,"ations":1635,"ĠKim":1636,"Ġgold":1637,"ok":1638,"Ġprovides":1639,"(":1640,"ell":1641,"Ġbegin":1642,"ĠParty":1643,"back":1644,"ĠAmazon":1645,"19":1646,"Ġmajority":1647,"ĠEven":1648,"Ġcheck":1649,"Ġweather":1650,"Ġorganization":1651,"Ġstories":1652,"ĠCar":1653,"Ġforced":1654,"ĠGeorge":1655,"Ġwalk":1656,"ong":1657,"Ġfiled":1658,"ĠJustice":1659,"Ġlaunched":1660,"Ġoffered":1661,"Ġwww":1662,"Ġconstruction":1663,"ĠBen":1664,"Ġserved":1665,"Ġ...":1666,"Ġparts":1667,"Ġcancer":1668,"Ġguys":1669,"Reporting":1670,"ash":1671,"less":1672,"Ġleadership":1673,"ĠCommittee":1674,"Ġregular":1675,"Ġcouncil":1676,"Ġcars":1677,"ĠDirector":1678,"Ġjudge":1679,"Ġvictims":1680,"ĠDaily":1681,"Ġkept":1682,"Ġeffect":1683,"Ġbeyond":1684,"pm":1685,"Ġtalking":1686,"Ġconsidered":1687,"ore":1688,"ĠAdvertisement":1689,"Ġst":1690,"ED":1691,"Ġmiddle":1692,"Ġraise":1693,"we":1694,"Ġclaimed":1695,"ino":1696,"Ġalleged":1697,"ĠPro":1698,"ĠScott":1699,"ĠOct":1700,"Ġconsider":1701,"ĠShare":1702,"Ġtraffic":1703,"ĠAfrican":1704,"Ġcouldn":1705,"Ġtoward":1706,"Ġsearch":1707,"But":1708,"Ġlaunch":1709,"Ġinjured":1710,"That":1711,"Ġalthough":1712,"Ġactivities":1713,"Ġchanged":1714,"Ġsources":1715,"Ġmissing":1716,"Ġu":1717,"Ġ35":1718,"Ġcover":1719,"ised":1720,"Ġ|":1721,"ow":1722,"ES":1723,"Ġdecades":1724,"ich":1725,"Ġcaused":1726,"Ġelections":1727,"ane":1728,"IS":1729,"Ġfeet":1730,"ĠBar":1731,"Ġversion":1732,"Ġgrow":1733,"Ġvehicles":1734,"Ġoptions":1735,"Ġindividual":1736,"Ġenvironment":1737,"ĠRobert":1738,"ĠValley":1739,"ĠFrom":1740,"per":1741,"ara":1742,"Ġsystems":1743,"Ġprotect":1744,"ĠKing":1745,"Ġinjuries":1746,"Ġfinally":1747,"Ġnuclear":1748,"40":1749,"Ġratio":1750,"Ġgun":1751,"ĠPakistan":1752,"ĠManagement":1753,"ĠAir":1754,"ce":1755,"Ġopposition":1756,"ment":1757,"ick":1758,"Ġpro":1759,"Ġact":1760,"Ġplatform":1761,"Ġlack":1762,"Ġpair":1763,"Ġ500":1764,"Ġcalling":1765,"ary":1766,"Ġprograms":1767,"Ġscheduled":1768,"Ġfast":1769,"Ġjoined":1770,"ĠWar":1771,"ĠEditing":1772,"ĠSince":1773,"ĠRyan":1774,"ĠMac":1775,"ĠBig":1776,"ĠLake":1777,"Ġdigital":1778,"When":1779,"ue":1780,"Ġassets":1781,"Ġseeing":1782,"ĠAct":1783,"Ġpartner":1784,"ĠBoard":1785,"Ġbeginning":1786,"Ġsupply":1787,"Ġmiles":1788,"Ġprison":1789,"ons":1790,"ĠAmericans":1791,"ub":1792,"ĠOr":1793,"me":1794,"Ġbenefits":1795,"Ġbenefit":1796,"Ġmeasures":1797,"Ġhear":1798,"Ġparties":1799,"Ġsuccessful":1800,"ĠJust":1801,"Ġvictim":1802,"Ġblock":1803,"Ġlimited":1804,"Ġtrip":1805,"ĠPeople":1806,"Ġserve":1807,"Ġart":1808,"ism":1809,"Ġwide":1810,"ĠSch":1811,"Ġ80":1812,"ĠThomas":1813,"Ġ90":1814,"Ġstocks":1815,"Ġgirl":1816,"ĠAsia":1817,"Ġseeking":1818,"Ġcertainly":1819,"ĠServices":1820,"ĠCollege":1821,"Ġcommunities":1822,"Ġextra":1823,"Ġ2010":1824,"ness":1825,"Ġholding":1826,"ous":1827,"Ġtough":1828,"ade":1829,"Ġmobile":1830,"Ġowns":1831,"ĠDo":1832,"ĠFire":1833,"Ġspoke":1834,"Ġreturned":1835,"Ġsize":1836,"Ġcriminal":1837,"ĠInstagram":1838,"Ġoffering":1839,"ĠGod":1840,"ĠService":1841,"Ġpage":1842,"her":1843,"Ġdeep":1844,"wood":1845,"Ġcrime":1846,"ĠSports":1847,"ile":1848,"ĠGlobal":1849,"Ġproposed":1850,"ain":1851,"Ġsession":1852,"ĠFederal":1853,"ĠSyria":1854,"Ġch":1855,"Ġthreat":1856,"Ġallegations":1857,"ĠRepublicans":1858,"ĠGerman":1859,"Ġstrategy":1860,"Ġcommercial":1861,"ING":1862,"ĠSecretary":1863,"Q":1864,"Ġreporters":1865,"100":1866,"ĠCapital":1867,"ĠBoth":1868,"ĠPost":1869,"ĠIsrael":1870,"Ġsave":1871,"ts":1872,"ill":1873,"Ġdrop":1874,"Ġreserved":1875,"ĠMany":1876,"Ġavoid":1877,"Ġ200":1878,"iv":1879,"Ġdamage":1880,"Ġcondition":1881,"Ġdropped":1882,"Ġdoor":1883,"Ġplanning":1884,"ire":1885,"Ġcard":1886,"Ġdesigned":1887,"Ġreduce":1888,"AN":1889,"ĠUn":1890,"ford":1891,"ĠThen":1892,"Ġpic":1893,"ĠCopyright":1894,"Ġrain":1895,"ĠMartin":1896,"Ġdomestic":1897,"45":1898,"ge":1899,"Ġmurder":1900,"Ġspeech":1901,"line":1902,"Ġhelping":1903,"Ġplanned":1904,"Ġfeature":1905,"ud":1906,"Ġtype":1907,"ham":1908,"ĠPublic":1909,"ja":1910,"Ġinsurance":1911,"Ġattacks":1912,"ĠCorp":1913,"Ġforecast":1914,"Ġresources":1915,"ma":1916,"?\"":1917,"ĠAm":1918,"ĠSept":1919,"Ġpush":1920,"Ġattorney":1921,"23":1922,"Ġemergency":1923,"Ġwinner":1924,"Ġblood":1925,"Ġnorth":1926,"ĠFeb":1927,"Ġbaby":1928,"Ġfloor":1929,"Ġspend":1930,"Ġex":1931,"Ġdollars":1932,"Ġunit":1933,"ĠHill":1934,"Ġder":1935,"ĠAbout":1936,"Ġalone":1937,"ization":1938,"Ġpresidential":1939,"Ġactivity":1940,"ĠTHE":1941,"ee":1942,"ber":1943,"ĠOther":1944,"Ġowner":1945,"Ġhour":1946,"Ġcities":1947,"Ġanswer":1948,"ide":1949,"Ġfully":1950,"ek":1951,"ists":1952,"Ġcoverage":1953,"Ġvs":1954,"Ġfigure":1955,"Ġpopulation":1956,"org":1957,"Ġsnow":1958,"Ġbecoming":1959,"ĠSam":1960,"ĠCarolina":1961,"Ġjoin":1962,"Ġprofit":1963,"Ġitems":1964,"Ġindex":1965,"Ġanalysis":1966,"Ġtournament":1967,"Ġstake":1968,"Ġperfect":1969,"way":1970,"Ġband":1971,"Ġgirls":1972,"Ġoption":1973,"Ġplays":1974,"oc":1975,"Ġproviding":1976,"ÃŃ":1977,"24":1978,"Ġwouldn":1979,"Ġones":1980,"Ġdeclined":1981,"Ġwritten":1982,"Ġvoters":1983,"Ġcandidate":1984,"Ġsuspect":1985,"Ġpolicies":1986,"Ġpeace":1987,"ast":1988,"Ġparticular":1989,"for":1990,"Ġhopes":1991,"Ġstation":1992,"ĠMost":1993,"Ġspeak":1994,"ĠRiver":1995,"Ġasking":1996,"Ġstatements":1997,"Ġfifth":1998,"ha":1999,"ĠNigeria":2000,"af":2001,"Ġexplained":2002,"Ġbar":2003,"Ġhousing":2004,"ĠSanta":2005,"Ġidentified":2006,"Ġsimple":2007,"Ġcritical":2008,"ĠClub":2009,"ĠSecurity":2010,"ĠLike":2011,"Ġstarts":2012,"art":2013,"Ġstreet":2014,"Ġreality":2015,"Ġheavy":2016,"Ġprogress":2017,"Ġshowing":2018,"Ġchallenges":2019,"Ġban":2020,"Ġcommitted":2021,"35":2022,"»":2023,"Ġdirectly":2024,"Ġaren":2025,"Ġclaim":2026,"ĠWestern":2027,"ind":2028,"Ġgives":2029,"ĠSaudi":2030,"Ġchoice":2031,"ĠTh":2032,"Ġapproved":2033,"Ġlocated":2034,"Ġarrived":2035,"22":2036,"Ġcaught":2037,"Ġprofessional":2038,"Ġmissed":2039,"Ġculture":2040,"ĠYear":2041,"ĠOhio":2042,"ĠLtd":2043,"ĠAnother":2044,"Ġseem":2045,"Ġbelieves":2046,"Ġbelieved":2047,"Ġcharacter":2048,"ĠAug":2049,"red":2050,"Ġfine":2051,"Ġprior":2052,"Ġthinking":2053,"Ġhttp":2054,"Ġ+":2055,"Ġzone":2056,"Ġputting":2057,"Ġcrash":2058,"ĠAustralian":2059,"ĠAb":2060,"Ġfocused":2061,"ĠREUTERS":2062,"ĠFox":2063,"ĠSp":2064,"Ġtraditional":2065,"Ġanalyst":2066,"Ġwait":2067,"IT":2068,"Ġrequest":2069,"ru":2070,"ians":2071,"ize":2072,"Ġfinish":2073,"Ġlaws":2074,"Ġran":2075,"ER":2076,"Ġsouth":2077,"Ġspeed":2078,"Ġmovement":2079,"Ġassault":2080,"Ġexchange":2081,"Ġappear":2082,"ĠSun":2083,"Ġle":2084,"Ġmaybe":2085,"Ġlosing":2086,"Ġsubject":2087,"ive":2088,"mer":2089,"ĠBusiness":2090,"ĠBl":2091,"Ġappears":2092,"Ġadvantage":2093,"ĠLee":2094,"ada":2095,"ĠUnder":2096,"Ġprevent":2097,"Ġrespect":2098,"Ġsex":2099,"Ġcentre":2100,"ĠJoe":2101,"ado":2102,"Ġtable":2103,"Ġequipment":2104,"Ġfair":2105,"Ġtour":2106,"Ġ32":2107,"ĠFinancial":2108,"Ġcounty":2109,"Ġdevices":2110,"Ġcustomer":2111,"Ġinfrastructure":2112,"Ġexpectations":2113,"Ġfacing":2114,"Ġupon":2115,"Ġcross":2116,"ĠOpen":2117,"AL":2118,"Ġquick":2119,"Ġattempt":2120,"Ġcompleted":2121,"Ġfacility":2122,"Ġconfidence":2123,"ĠSupreme":2124,"Ġpiece":2125,"our":2126,"Ġplaces":2127,"Ġsometimes":2128,"Ġpoor":2129,"Ġstorm":2130,"Ġhot":2131,"Ġaffected":2132,"na":2133,"Ġabuse":2134,"ĠMs":2135,"Ġword":2136,"over":2137,"Ġbrother":2138,"Ġnecessary":2139,"Ġeventually":2140,"ĠStar":2141,"Ġsend":2142,"Ġboy":2143,"ĠRs":2144,"Ġremember":2145,"21":2146,"Ġclimate":2147,"Ġcapacity":2148,"Ġresponsible":2149,"ĠMatt":2150,"month":2151,"Ġsuffered":2152,"%.":2153,"og":2154,"ĠPeter":2155,"Ġ,":2156,"Ġfeeling":2157,"ze":2158,"Ġbuying":2159,"oy":2160,"ij":2161,"Ġbought":2162,"Ġactions":2163,"Ġowned":2164,"Ġ___":2165,"Ġphysical":2166,"Ġspecific":2167,"Ġbattle":2168,"ĠEnergy":2169,"Ġpicture":2170,"Ġactive":2171,"Ġindividuals":2172,"Ġguy":2173,"Ġregional":2174,"Ġbond":2175,"ows":2176,"ĠToronto":2177,"Ġrule":2178,"Ġdevelop":2179,"Ġcrowd":2180,"Ġguilty":2181,"Ġfemale":2182,"Ġselling":2183,"ĠFollow":2184,"Ġmyself":2185,"ata":2186,"Ġdevice":2187,"Ġreasons":2188,"Ġrecords":2189,"Ġfighting":2190,"ON":2191,"ities":2192,"ĠHome":2193,"Ġstatus":2194,"Ġplant":2195,"Ġdrugs":2196,"ĠChurch":2197,"Ġcompletely":2198,"Ġdisease":2199,"Ġhighly":2200,"ĠParis":2201,"Ġdecade":2202,"Ġowners":2203,"Ġwall":2204,"Ġcamp":2205,"ĠSteve":2206,"Ġreporting":2207,"Ġearned":2208,"ĠImages":2209,"Ġexisting":2210,"ĠSen":2211,"Ġconcern":2212,"Ġhundreds":2213,"Ġsong":2214,"Ġknows":2215,"Ġunique":2216,"Ġlose":2217,"ĠKh":2218,"Ġapproximately":2219,"Ġhaven":2220,"Ġpark":2221,"Ġindependent":2222,"ĠAlthough":2223,"ĠAndrew":2224,"Ġpaper":2225,"Ġdeveloped":2226,"Ġrising":2227,"Ġdirect":2228,"Ġpurchase":2229,"Ġexactly":2230,"Ġq":2231,"Ġmassive":2232,"Ġbox":2233,"Ġchampion":2234,"ĠClinton":2235,"Ġvoice":2236,"Ġarrest":2237,"ĠKorean":2238,"Ġlearning":2239,"ĠVirginia":2240,"Ġsa":2241,"Ġpar":2242,"Ġchairman":2243,"Ġagencies":2244,"Ġhealthy":2245,"ĠThose":2246,"Ġpowerful":2247,"Ġ45":2248,"Ġdifference":2249,"ĠJackson":2250,"Ġenforcement":2251,"Ġdividend":2252,"qu":2253,"Ġenjoy":2254,"Ġruling":2255,"Ġongoing":2256,"Ġsoftware":2257,"ks":2258,"Ġlocation":2259,"Ġmostly":2260,"Ġcandidates":2261,"men":2262,"Ġbroke":2263,"What":2264,"ĠBr":2265,"Ġ2008":2266,"Ġconsumer":2267,"Ġdiscuss":2268,"Ġdi":2269,"Ġprimary":2270,"ĠEn":2271,"Ġgreen":2272,"Ġconcerned":2273,"Ġimage":2274,"ĠPremier":2275,"ĠMeanwhile":2276,"Ġfired":2277,"ĠBoston":2278,"ann":2279,"Ġcamera":2280,"Ġtraded":2281,"Ġhasn":2282,"Ġexcited":2283,"Ġincreasing":2284,"ĠDespite":2285,"Ġcitizens":2286,"Ġeuro":2287,"Ġreportedly":2288,"Ġminute":2289,"ĠWill":2290,"ĠLLC":2291,"Ġsp":2292,"ĠMichigan":2293,"Ġstopped":2294,"Ġeye":2295,"Ġdenied":2296,"Ġmodern":2297,"ĠWall":2298,"Ġdefinitely":2299,"point":2300,"Ġlines":2301,"Ġpolitics":2302,"Ġhotel":2303,"Ġretail":2304,"Ġstated":2305,"ĠOver":2306,"Ġgrew":2307,"Ġbroadcast":2308,"Ġlegislation":2309,"Ġfresh":2310,"Ġbid":2311,"Ġmanaged":2312,"Ġsociety":2313,"Ġscoring":2314,"ĠGet":2315,"Ġintelligence":2316,"Ġholiday":2317,"Ġgovernor":2318,"Ġestimated":2319,"Ġexperts":2320,"ĠJeff":2321,"Ġstruck":2322,"Ġhits":2323,"Ġcarry":2324,"Ġplaced":2325,"Ġstores":2326,"Ġexpressed":2327,"Ġvalued":2328,"Ġad":2329,"Ġtwice":2330,"ala":2331,"Ġdisplay":2332,"Ġusually":2333,"Ġresponded":2334,"Ġdog":2335,"AS":2336,"ĠFed":2337,"Ġ2009":2338,"Ġdocuments":2339,"Ġnormal":2340,"Ġtrain":2341,"Ġfl":2342,"Ġshown":2343,"ĠEd":2344,"Ġsort":2345,"Ġallegedly":2346,"Ġshots":2347,"ka":2348,"Ġaccounts":2349,"Ġyesterday":2350,"Ġcreating":2351,"Ġchurch":2352,"Ġbus":2353,"Ġaward":2354,"Ġequity":2355,"Ġphotos":2356,"Ġ33":2357,"Ġfiscal":2358,"je":2359,"Ġconsumers":2360,"ĠManchester":2361,"no":2362,"ĠKevin":2363,"Ġgain":2364,"Ġcorporate":2365,"Ġcivil":2366,"ĠMiddle":2367,"ally":2368,"Ġsound":2369,"ĠEnglish":2370,"IC":2371,"Ġwinds":2372,"Ġworst":2373,"ĠGrand":2374,"Ġeffective":2375,"ĠIsland":2376,"Ġdrivers":2377,"Ġfan":2378,"pe":2379,"Ġsides":2380,"ĠGo":2381,"Ġclean":2382,"âĢĵ":2383,"Ġtelevision":2384,"ĠJr":2385,"Ġallows":2386,"My":2387,"Ġgreater":2388,"ance":2389,"Ġdecisions":2390,"Ġrestaurant":2391,"ĠHospital":2392,"ĠTr":2393,"Ġbalance":2394,"Ġmph":2395,"Ġkeeping":2396,"Ġseconds":2397,"Ġweapons":2398,"ert":2399,"Ġpain":2400,"ass":2401,"Ġsteps":2402,"ger":2403,"ĠBrexit":2404,"Ġremaining":2405,"Ġbringing":2406,"ure":2407,"Ġweight":2408,"And":2409,"Ġwriting":2410,"Photo":2411,"ĠChristian":2412,"ob":2413,"Ġsport":2414,"Ġfigures":2415,"Ġtrust":2416,"Ġskills":2417,"Ġseat":2418,"Ġfaces":2419,"ck":2420,"Ġborn":2421,"Ġsuper":2422,"Ġfuel":2423,"Ġdel":2424,"Ġmeant":2425,"ica":2426,"Ġjustice":2427,"Ġspring":2428,"Ġkilling":2429,"Ġnegative":2430,"ĠRichard":2431,"Ġund":2432,"Ġfactors":2433,"Ġsigns":2434,"Ġlearned":2435,"ĠGame":2436,"Ġaudience":2437,"Ġdeliver":2438,"Ġillegal":2439,"Ġblue":2440,"Ġscreen":2441,"Ġremained":2442,"Ġannouncement":2443,"IN":2444,"Ġwaiting":2445,"Ġthanks":2446,"Ġimmigration":2447,"ĠFBI":2448,"Ġwarned":2449,"Ġmeasure":2450,"Ġdraw":2451,"Ġpositions":2452,"Ġdebut":2453,"ĠMedia":2454,"Ġallowing":2455,"air":2456,"hen":2457,"Ġmark":2458,"ys":2459,"Ġprepared":2460,"ĠVegas":2461,"ep":2462,"ice":2463,"2018":2464,"Ġdefensive":2465,"60":2466,"ĠBeach":2467,"Ġpulled":2468,"£":2469,"Ġlawyer":2470,"Ġcast":2471,"Ġsolution":2472,"Ġeyes":2473,"Ġmarketing":2474,"ĠFoundation":2475,"Ġrisks":2476,"ĠToday":2477,"za":2478,"Ġdraft":2479,"Ġice":2480,"26":2481,"ĠHar":2482,"ĠExecutive":2483,"Ġtruck":2484,"ions":2485,"ĠYour":2486,"ĠIreland":2487,"ĠJim":2488,"Ġha":2489,"Ġfear":2490,"Ġ36":2491,"UR":2492,"ĠFord":2493,"Ġwatching":2494,"ien":2495,"Ġstyle":2496,"ĠGood":2497,"Ġwearing":2498,"ĠHouston":2499,"Ġonto":2500,"Ġboost":2501,"Ġapplication":2502,"ĠDan":2503,"Ġspread":2504,"ĠDavis":2505,"Ġstrike":2506,"els":2507,"Ġwind":2508,"Ġinterested":2509,"Ġguard":2510,"Ġmission":2511,"Ġyourself":2512,"Ġoperation":2513,"Ġlarger":2514,"She":2515,"Ġseasons":2516,"28":2517,"27":2518,"Ġrespond":2519,"ci":2520,"ĠCentre":2521,"Our":2522,"Ġnames":2523,"Ġflight":2524,"Ġquarterback":2525,"Ġstandard":2526,"so":2527,"Ġsuggested":2528,"ĠMal":2529,"Ġolder":2530,"ini":2531,"Ġperhaps":2532,"ont":2533,"ĠInstitute":2534,"Ġmillions":2535,"Ġmental":2536,"ÃĤ":2537,"ga":2538,"Ġclients":2539,"Ġplease":2540,"Ġloan":2541,"Ġaware":2542,"ft":2543,"int":2544,"75":2545,"05":2546,"AY":2547,"ĠOut":2548,"Ġhair":2549,"ied":2550,"Ġseemed":2551,"ene":2552,"ty":2553,"NYSE":2554,"Ġoffensive":2555,"Ġtaxes":2556,"Ġinitial":2557,"ren":2558,"Ġseparate":2559,"la":2560,"ĠMiami":2561,"AC":2562,"Ġclearly":2563,"Ġfit":2564,"ĠCoast":2565,"Ġfirms":2566,"Ġpartners":2567,"Ġupcoming":2568,"Ġcold":2569,"Ġproposal":2570,"AT":2571,"Ġshut":2572,"ĠCommunity":2573,"Ġnature":2574,"ĠSal":2575,"Ġbottom":2576,"ting":2577,"ĠClick":2578,"Ġnice":2579,"ets":2580,"Ġhurt":2581,"itt":2582,"ama":2583,"Ġcarried":2584,"ĠCon":2585,"rd":2586,"Ġestate":2587,"ĠLas":2588,"ĠLaw":2589,"ng":2590,"Ġprotection":2591,"Ġproduce":2592,"Ġcurrency":2593,"Ġhappens":2594,"ĠPer":2595,"ney":2596,"ĠLong":2597,"Ġfellow":2598,"Ġcuts":2599,"Ġreading":2600,"ano":2601,"Ġproud":2602,"ost":2603,"ĠUN":2604,"ĠArizona":2605,"AD":2606,"Ġhelps":2607,"Ġwinter":2608,"Ġfinding":2609,"ĠGold":2610,"att":2611,"ĠWhy":2612,"Ġbasketball":2613,"lin":2614,"ĠCan":2615,"ĠBowl":2616,"ial":2617,"ĠAlex":2618,"200":2619,"AM":2620,"Ġpresence":2621,"Ġproduced":2622,"Ġdeveloping":2623,"Ġregarding":2624,"Ġdebate":2625,"Ġvice":2626,"ĠItaly":2627,"Ġsu":2628,"its":2629,"ator":2630,"Ġ34":2631,"Ġcomplex":2632,"Ġpresented":2633,"Ġresearchers":2634,"Ġslow":2635,"ya":2636,"Ġsanctions":2637,"Ġloved":2638,"Ġseek":2639,"Ġresponsibility":2640,"Ġadmitted":2641,"Ġalbum":2642,"Ġsolutions":2643,"Ġfacilities":2644,"ett":2645,"ĠGu":2646,"ĠWell":2647,"Ġlawmakers":2648,"Ġmiss":2649,"ful":2650,"ĠNick":2651,"'.":2652,"Ġfeels":2653,"Ġprime":2654,"Ġknowledge":2655,"Ġdeals":2656,"ĠTaylor":2657,"Ġsurvey":2658,"ĠFrancisco":2659,"Ġjoint":2660,"Ġwhom":2661,"Ġsit":2662,"01":2663,"Ġtr":2664,"Ġorganizations":2665,"ĠAvenue":2666,"ĠTheir":2667,"ĠTim":2668,"Ġrally":2669,"game":2670,"Ġbigger":2671,"Ġlawsuit":2672,"Ġrecorded":2673,"Ġfavorite":2674,"yard":2675,"Ġtransaction":2676,"Ġqu":2677,"oh":2678,"Ġinteresting":2679,"Ġinflation":2680,"ath":2681,"Ġstuff":2682,"Ġindustrial":2683,"ico":2684,"TS":2685,"Ġspeaking":2686,"Ġlosses":2687,"ID":2688,"ĠStadium":2689,"Ġstars":2690,"ĠWomen":2691,"ĠBlue":2692,"Ġwins":2693,"Ġdes":2694,"Ġcompetitive":2695,"ters":2696,"Ġpounds":2697,"Ġdirection":2698,"Ġinnings":2699,"ĠBest":2700,"Ġactor":2701,"Ġdangerous":2702,"Ġrequire":2703,"Ġplus":2704,"Ġsolid":2705,"Ġgeneration":2706,"Ġstrength":2707,"ĠMary":2708,"For":2709,"Ġplenty":2710,"ĠTeam":2711,"Ġinfluence":2712,"Ġfaced":2713,"Ġes":2714,"ĠIslamic":2715,"let":2716,"ĠDevelopment":2717,"Ġpath":2718,"Ġyouth":2719,"Ġcommitment":2720,"Ġbeautiful":2721,"ĠJack":2722,"ort":2723,"Ġten":2724,"Ġattend":2725,"ars":2726,"ón":2727,"Ġviews":2728,"Ġeuros":2729,"Ġauthor":2730,"Ġcore":2731,"Ġsupporters":2732,"ĠiPhone":2733,"Ġfashion":2734,"Ġsmaller":2735,"Ġelected":2736,"Ġuniversity":2737,"Ġpicked":2738,"wa":2739,"Ġordered":2740,"ĠSc":2741,"ĠÅ":2742,"Ġlargely":2743,"+":2744,"ĠAttorney":2745,"Ġpaying":2746,"AR":2747,"Ġconnection":2748,"Ġsetting":2749,"Ġna":2750,"ĠRock":2751,"Ġrecovery":2752,"ew":2753,"Ġserving":2754,"Ġsurprise":2755,"Ġoccurred":2756,"Ġdivision":2757,"Ġtelling":2758,"Ġmargin":2759,"Ġ2020":2760,"Ġsister":2761,"ĠNBA":2762,"Ġvoted":2763,"Ġcon":2764,"By":2765,"Ġ49":2766,"Ġfoot":2767,"ü":2768,"ĠTurkey":2769,"Ġamazing":2770,"Ġcombined":2771,"Ġappearance":2772,"Ġeasily":2773,"DAY":2774,"Ġnotes":2775,"ĠStart":2776,"Ġlanguage":2777,"Ġextremely":2778,"Ġcloudy":2779,"ĠLet":2780,"Ġdelivered":2781,"Ġimproved":2782,"Ġcollection":2783,"ĠPM":2784,"Ġestimates":2785,"Ġboys":2786,"izing":2787,"Ġtext":2788,"Ġcloser":2789,"Ġprotest":2790,"Ġprovince":2791,"Ġshop":2792,"Ġsmart":2793,"de":2794,"ĠSheriff":2795,"EN":2796,"Ġcorner":2797,"Ġpanel":2798,"Ġbooks":2799,"Ġsupported":2800,"Ġmentioned":2801,"ver":2802,"ĠMinistry":2803,"ĠPrince":2804,"ĠUSA":2805,"Ġreceiving":2806,"Ġchoose":2807,"ĠIN":2808,"ĠSpain":2809,"Ġsection":2810,"Ġconsidering":2811,"ĠCor":2812,"Ġwish":2813,"Ġwelcome":2814,"ĠConference":2815,"ere":2816,"ĠOfficer":2817,"Ġhoping":2818,"Ġportfolio":2819,"Ġstandards":2820,"Ġgrand":2821,"ĠReal":2822,"Ġsecure":2823,"ĠCorporation":2824,"ĠRep":2825,"ĠKelly":2826,"Ġstreets":2827,"Ġsitting":2828,"Ġslightly":2829,"ĠInvestment":2830,"99":2831,"ond":2832,"Ġunits":2833,"Ġvotes":2834,"Ġsegment":2835,"Ġchampionship":2836,"Ġsquad":2837,"iting":2838,"ron":2839,"®":2840,"Ġem":2841,"Ġtouch":2842,"Ġ38":2843,"Ġceremony":2844,"Ġdecide":2845,"Ġapproval":2846,"So":2847,"ĠPort":2848,"Ġsub":2849,"Ġsc":2850,"Ġrep":2851,"ĠWeek":2852,"Ġupper":2853,"Ġagree":2854,"ny":2855,"Ġmatches":2856,"ics":2857,"Ġtweeted":2858,"Ġheat":2859,"ĠGreat":2860,"Ġpenalty":2861,"Ġmass":2862,"Ġalongside":2863,"Ġherself":2864,"berg":2865,"Ġscience":2866,"Ġentered":2867,"Ġappeal":2868,"ĠPr":2869,"Ġfile":2870,"che":2871,"ĠReport":2872,"ĠThree":2873,"ĠNorthern":2874,"ĠJordan":2875,"Ġamid":2876,"Ġpace":2877,"Ġjail":2878,"Ġfinance":2879,"ĠYoung":2880,"32":2881,"Ġwilling":2882,"Ġconduct":2883,"ĠPar":2884,"Ġestablished":2885,"Ġreturns":2886,"Ġaid":2887,"Ġinternet":2888,"IA":2889,"29":2890,"Ġmeetings":2891,"Ġwarning":2892,"ĠCl":2893,"Ġcampus":2894,"Most":2895,"ĠFund":2896,"ĠWilliam":2897,"ĠJapanese":2898,"Ġconsensus":2899,"Ġbrain":2900,"!\"":2901,"Ġpoll":2902,"Ġtech":2903,"Ġtrend":2904,"Ġpotentially":2905,"Ġreduced":2906,"ĠShow":2907,"Ġ37":2908,"Ġhappening":2909,"ĠBrazil":2910,"pl":2911,"ĠCal":2912,"Ġcovered":2913,"Ġenter":2914,"TV":2915,"Ġcatch":2916,"foot":2917,"Ġunion":2918,"Ġexpansion":2919,"ĠSingapore":2920,"ĠDetroit":2921,"Ġattended":2922,"ats":2923,"Ġnewspaper":2924,"ĠDivision":2925,"news":2926,"Ġcap":2927,"Ġremoved":2928,"Ġ48":2929,"ĠRoyal":2930,"Ġwindow":2931,"Ġparking":2932,"Ġdark":2933,"Ġstanding":2934,"Ġupdate":2935,"Ġagent":2936,"Ġtransfer":2937,"ĠArmy":2938,"Ġuses":2939,"80":2940,"ĠTe":2941,"Ġintroduced":2942,"Ġmale":2943,"ĠSouthern":2944,"Ġratings":2945,"Ġisland":2946,"ĠMiller":2947,"Ġteachers":2948,"Ġadvice":2949,"Ġfamiliar":2950,"uf":2951,"Ġsought":2952,"Ġpor":2953,"ĠEric":2954,"Ġda":2955,"Ġideas":2956,"uh":2957,"Ġsixth":2958,"Ġtalent":2959,"ĠImage":2960,"ering":2961,"run":2962,"ments":2963,"Ġconducted":2964,"300":2965,"Ġurged":2966,"Ġdiscovered":2967,"Ġpl":2968,"Ġunderstanding":2969,"Ġoffense":2970,"Ġsecretary":2971,"Ġsk":2972,"Ġloans":2973,"ĠGr":2974,"Ġapplications":2975,"Ġcrude":2976,"go":2977,"ĠInstead":2978,"Ġopinion":2979,"Ġdoubt":2980,"ey":2981,"Ġdis":2982,"31":2983,"Ġexperienced":2984,"Ġleg":2985,"ĠCleveland":2986,"ven":2987,"Ġfailure":2988,"market":2989,"ack":2990,"Ġdecline":2991,"Ġchanging":2992,"Ġ300":2993,"Ġdefence":2994,"ĠBrian":2995,"Ġdelivery":2996,"Ġmarried":2997,"Ġdeclared":2998,"Ġpull":2999,"Ġlimit":3000,"ĠMORE":3001,"Ġdefeat":3002,"Ġexpand":3003,"ĠColorado":3004,"ĠRob":3005,"iss":3006,"Ġworse":3007,"Ġperform":3008,"ising":3009,"Ġ2007":3010,"ĠDel":3011,"Ġsurgery":3012,"Ġeasier":3013,"Ġmaintain":3014,"ĠEx":3015,"Ġtied":3016,"Ġeast":3017,"Ġuser":3018,"ola":3019,"Ġprogramme":3020,"Ġmanufacturing":3021,"Ġhitting":3022,"Ġx":3023,"Ġskin":3024,"Ġartist":3025,"Ġtells":3026,"Ġnearby":3027,"ĠDaniel":3028,"ĠPower":3029,"Ġdetermined":3030,"Ġactual":3031,"Ġtreated":3032,"Ġlived":3033,"Ġcomputer":3034,"Ġcool":3035,"oo":3036,"ĠPl":3037,"Ġeffects":3038,"Ġenvironmental":3039,"ĠMorgan":3040,"Ġflow":3041,"Ġachieve":3042,"ĠBell":3043,"Ġtesting":3044,"ĠBob":3045,"Ġwhatever":3046,"ĠBecause":3047,"US":3048,"ĠHollywood":3049,"Ġconflict":3050,"Ġwalking":3051,"ĠJudge":3052,"ĠAlabama":3053,"Ġaircraft":3054,"Ġte":3055,"well":3056,"Ġgoods":3057,"Ġidentify":3058,"Ġassociated":3059,"ĠVer":3060,"ĠEducation":3061,"Ġairport":3062,"IL":3063,"Ġfalling":3064,"Ġgiant":3065,"ĠMa":3066,"ĠMedical":3067,"Ġride":3068,"Ġden":3069,"º":3070,"ĠJose":3071,"Ġwest":3072,"ĠPacific":3073,"Ġvisitors":3074,"ĠWatch":3075,"ĠNations":3076,"Ġgains":3077,"Ġschedule":3078,"34":3079,"ĠExchange":3080,"Ġpayments":3081,"ĠII":3082,"70":3083,"No":3084,"ĠSyrian":3085,"ĠAdam":3086,"Ġne":3087,"Ġpartnership":3088,"Ġbl":3089,"ĠGeorgia":3090,"Ġsites":3091,"Ġmodels":3092,"Ġdegree":3093,"Ġdetermine":3094,"ĠWilson":3095,"Ġcontest":3096,"Ġprofessor":3097,"ĠChelsea":3098,"Ġmeaning":3099,"ĠGames":3100,"ĠTrust":3101,"ĠAsian":3102,"33":3103,"Ġlink":3104,"ĠUp":3105,"Ġholds":3106,"ĠTop":3107,"ĠItalian":3108,"ord":3109,"ĠKansas":3110,"Ġfarmers":3111,"Ġextended":3112,"Ġbirth":3113,"Ġreform":3114,"Ġrelations":3115,"Ġwrite":3116,"Ġsupporting":3117,"55":3118,"ita":3119,"Ġnotice":3120,"ster":3121,"Ġanimals":3122,"ĠJersey":3123,"Ġarm":3124,"ĠForeign":3125,"ĠLife":3126,"Ġtruly":3127,"ĠOnce":3128,"ĠMayor":3129,"ĠFree":3130,"ĠAgency":3131,"ĠWood":3132,"Ġpassing":3133,"DA":3134,"Ġ52":3135,"Ġmoves":3136,"Ġcom":3137,"house":3138,"ĠIts":3139,"Ġmarijuana":3140,"ines":3141,"Ġveteran":3142,"Ġvariety":3143,"ki":3144,"ff":3145,"amb":3146,"Ġlisted":3147,"Ġpushed":3148,"Ġvolume":3149,"Ġincreasingly":3150,"Ġkick":3151,"Ġrock":3152,"ank":3153,"Ġfees":3154,"Ġenable":3155,"Ġimages":3156,"Ġtruth":3157,"Ġministry":3158,"Ġrare":3159,"ĠDallas":3160,"ĠMinnesota":3161,"Ġcontributed":3162,"ĠCharles":3163,"Ġpercentage":3164,"Ġtechnical":3165,"ĠApp":3166,"Ġassistant":3167,"Ġinterests":3168,"Ġimmediate":3169,"38":3170,"ĠTown":3171,"Ġclosing":3172,"ĠAnthony":3173,"Ġsouthern":3174,"ase":3175,"ĠPutin":3176,"ĠForce":3177,"ba":3178,"Ġrefused":3179,"ĠStill":3180,"ix":3181,"ĠCol":3182,"Ġmaterials":3183,"Ġstructure":3184,"Ġdriven":3185,"Ġpatient":3186,"Ġbroken":3187,"Ġradio":3188,"Ġscale":3189,"Ġreplace":3190,"Ġ39":3191,"ĠLand":3192,"Ġdeputy":3193,"und":3194,"Ġcolor":3195,"OS":3196,"Ġroads":3197,"Ġcorruption":3198,"ĠRose":3199,"Ġemployee":3200,"ĠWater":3201,"Ġseats":3202,"Ġwalked":3203,"ec":3204,"Ġcents":3205,"Ġchain":3206,"Ġpayment":3207,"ĠAndroid":3208,"eb":3209,"Ġcommission":3210,"Ġthrow":3211,"Ġcount":3212,"Ġaccident":3213,"Ġexpensive":3214,"ered":3215,"ĠYes":3216,"ĠLouis":3217,"Ġstudies":3218,"Ġinvestigating":3219,"Ġcentury":3220,"Ġdiscussion":3221,"Ġinter":3222,"DAQ":3223,"ĠBefore":3224,"Ġinitially":3225,"*":3226,"Ġinvestments":3227,"Ġmulti":3228,"Ġtight":3229,"Ġconfident":3230,"Ġcounter":3231,"ĠQu":3232,"Ġgovernments":3233,"Ġarmed":3234,"Ġsuit":3235,"Ġrow":3236,"Ġlocations":3237,"Ġepisode":3238,"itch":3239,"Ġyounger":3240,"Ġfestival":3241,"Ġpitch":3242,"ĠOF":3243,"Ġtalked":3244,"ca":3245,"Ġprotests":3246,"Ġtargets":3247,"90":3248,"Ġoriginally":3249,"Ġsinger":3250,"Ġjourney":3251,"ug":3252,"Ġapply":3253,"Ġteacher":3254,"Ġchances":3255,"):":3256,"Ġdeaths":3257,"isation":3258,"ĠStephen":3259,"Ġcode":3260,"ĠChampionship":3261,"ĠJason":3262,"ĠAT":3263,"Ġaccept":3264,"ĠSeries":3265,"Ġvalues":3266,"Ġbed":3267,"ĠHarry":3268,"Ġflat":3269,"Ġtools":3270,"Ġpublicly":3271,"37":3272,"Ġpointed":3273,"ĠGolden":3274,"ps":3275,"Ġunable":3276,"ants":3277,"Ġestimate":3278,"Ġwarm":3279,"Ġbasic":3280,"ern":3281,"Ġraising":3282,"ĠRelated":3283,"Ġultimately":3284,"Ġnorthern":3285,"Ġplane":3286,"ĠVice":3287,"ĠRaj":3288,"ĠJustin":3289,"anc":3290,"Ġbrings":3291,"ĠArt":3292,"OT":3293,"Ġshift":3294,"ĠBBC":3295,"ĠSu":3296,"BS":3297,"Ġbag":3298,"Ġdoctor":3299,"Ġfill":3300,"Ġdowntown":3301,"Ġpossibility":3302,"ĠAg":3303,"Ġest":3304,"44":3305,"Ġstruggling":3306,"Ġlinked":3307,"Ġtickets":3308,"ĠJay":3309,"ĠCall":3310,"Ġstands":3311,"Ġwedding":3312,"Ġresident":3313,"eng":3314,"Ġleads":3315,"Ġadvance":3316,"ĠAtlanta":3317,"Ġtie":3318,"Ġadvanced":3319,"pt":3320,"burg":3321,"ĠEarlier":3322,"ĠSw":3323,"ĠZealand":3324,"Ġexercise":3325,"ĠAM":3326,"Ġaffect":3327,"Ġpossession":3328,"Ġinvolving":3329,"Ġ42":3330,"Ġwriter":3331,"ĠBeijing":3332,"Ġdoctors":3333,"Ġobviously":3334,"Ġer":3335,"ĠOlympic":3336,"Ġ75":3337,"ĠKhan":3338,"ĠFort":3339,"app":3340,"like":3341,"Ġsea":3342,"ock":3343,"Ġmix":3344,"ĠIraq":3345,"ĠMuslim":3346,"ĠFinally":3347,"Ġcontinuing":3348,"Ġpr":3349,"ĠKe":3350,"ĠJoseph":3351,"Ġexpects":3352,"Ġinstitutions":3353,"Ġconservative":3354,"own":3355,"ĠChairman":3356,"Ġreturning":3357,".-":3358,"Ġstood":3359,"Ġvision":3360,"ess":3361,"Ġadults":3362,"Ġyield":3363,"Ġprove":3364,"Ġorders":3365,"Ġdream":3366,"36":3367,"related":3368,"Ġsl":3369,"Ġeverybody":3370,"ui":3371,"Ġrepresents":3372,"Ġdiscussed":3373,"Ġbecomes":3374,"Ġvillage":3375,"CC":3376,"Ġnegotiations":3377,"ĠPhiladelphia":3378,"Ġcelebrate":3379,"Ġfarm":3380,"ç":3381,"Ġregistered":3382,"ĠGovernor":3383,"OL":3384,"ĠMon":3385,"Ġfiling":3386,"04":3387,"SE":3388,"ĠAssembly":3389,"Ġactress":3390,"Ġsi":3391,"Ġthank":3392,"Ġheading":3393,"ĠWho":3394,"Ġfamous":3395,"Ġconsecutive":3396,"Ġmarriage":3397,"ette":3398,"NAS":3399,"acks":3400,"ĠPlease":3401,"ĠDiego":3402,"Ġbaseball":3403,"ĠMoore":3404,"Ġties":3405,"Ġcarrying":3406,"que":3407,"Ġturning":3408,"ĠMcC":3409,"ĠKen":3410,"OR":3411,"ĠStock":3412,"Ġbuildings":3413,"49":3414,"ĠVan":3415,"39":3416,"ĠSeattle":3417,"Ġwild":3418,"Ġcrew":3419,"Ġroute":3420,"ĠTime":3421,"Ġtonight":3422,"Ġmoments":3423,"Ġvideos":3424,"Ġinternal":3425,"ĠLiverpool":3426,"port":3427,"Ġchair":3428,"Ġrival":3429,"ĠScotland":3430,"round":3431,"ith":3432,"Ġbreaking":3433,"Ġvoting":3434,"ically":3435,"Ġproducer":3436,"ĠLove":3437,"Ġremove":3438,"PA":3439,"Ġasset":3440,"Ġrequires":3441,"Ġsigning":3442,"ages":3443,"Ġimpressive":3444,"ĠIrish":3445,"Ġauthority":3446,"Ġruled":3447,"Ġaimed":3448,"Ġcaptain":3449,"AG":3450,"Ġplants":3451,"ĠAnderson":3452,"ĠSpanish":3453,"Ġbanking":3454,"Ġthreats":3455,"Ġsuspended":3456,"Ġtests":3457,"Ġreligious":3458,"Ġelectric":3459,"ĠREAD":3460,"Ġstrategic":3461,"Ġsplit":3462,"ex":3463,"Ġpractices":3464,"ĠIsraeli":3465,"ĠArabia":3466,"ĠMoscow":3467,"Ġfranchise":3468,"Ġcustody":3469,"ĠOld":3470,"Ġrequirements":3471,"Ġquarterly":3472,"Ġcomfortable":3473,"Ġcrimes":3474,"Ġheaded":3475,"Ġnewsletter":3476,"Ġanimal":3477,"Ġregulations":3478,"long":3479,"ĠCNN":3480,"Ġassists":3481,"Ġshopping":3482,"ĠGov":3483,"ĠSecurities":3484,"Ġassistance":3485,"Ġnor":3486,"Ġrelatively":3487,"Ġincreases":3488,"Ġgenerally":3489,"Ġ55":3490,"Ġgained":3491,"Ġ41":3492,"Ġpictures":3493,"gan":3494,"Ġpop":3495,"Ġupdates":3496,"ĠRepublic":3497,"Ġrebounds":3498,"ĠPatrick":3499,"Ġrelief":3500,"Ġacting":3501,"ĠFestival":3502,"Ġ2006":3503,"Ġboss":3504,"Ġtypes":3505,"65":3506,"ĠYet":3507,"Ġpurpose":3508,"ning":3509,"Ġmatters":3510,"Ġcompete":3511,"ball":3512,"ĠRam":3513,"Ġsw":3514,"ĠFollowing":3515,"ĠBush":3516,"Ġtroops":3517,"Ġsupposed":3518,"Ġfreedom":3519,"Ġfeatured":3520,"Ġstorage":3521,"ĠInformation":3522,"ĠHong":3523,"Ġgolf":3524,"Ġagents":3525,"Ġfraud":3526,"Ġminimum":3527,"Ġartists":3528,"Ġeat":3529,"high":3530,"ĠFormer":3531,"ĠKong":3532,"ĠJosh":3533,"ĠDelhi":3534,"Ġshowers":3535,"ĠAcademy":3536,"Ġapartment":3537,"Ġvan":3538,"Ġfish":3539,"oe":3540,"Ġfilms":3541,"ĠBo":3542,"Ġedge":3543,"Ġpossibly":3544,"Ġtweet":3545,"09":3546,"Ġresolution":3547,"jo":3548,"Ġkill":3549,"Ġ44":3550,"Ġcell":3551,"Ġscheme":3552,"Ġth":3553,"Ġbonds":3554,"Ġentry":3555,"Ġsecret":3556,"Ġ43":3557,"Ġending":3558,"Ġweren":3559,"ĠCredit":3560,"ĠLive":3561,"Ġretired":3562,"Ġmachine":3563,"Ġsummit":3564,"Ġsharing":3565,"Ġacquired":3566,"Ġera":3567,"Ġwear":3568,"ical":3569,"07":3570,"Ġexciting":3571,"li":3572,"BC":3573,"ĠSocial":3574,"Ġhistoric":3575,"ĠChe":3576,"ĠLewis":3577,"ira":3578,"Ġstolen":3579,"ĠSpeaking":3580,"Ġsleep":3581,"Ġspokeswoman":3582,"week":3583,"Ġpurchased":3584,"Ġimportance":3585,"EC":3586,"Ġends":3587,"Ġdress":3588,"Ġparliament":3589,"ĠCruz":3590,"Ġcards":3591,"hi":3592,"ĠEmail":3593,"Ġrepresent":3594,"Ġbrands":3595,"ĠSenior":3596,"Ġparticipants":3597,"Ġfly":3598,"Ġidentity":3599,"ĠHam":3600,"ĠSky":3601,"ij":3602,"SA":3603,"Ġpromised":3604,"Ġtrouble":3605,"Ġsuffering":3606,"Ġleaves":3607,"Ġsuggest":3608,"Sh":3609,"Ġbusy":3610,"Ġproperties":3611,"Ġworldwide":3612,"Ġcloud":3613,"ĠSEC":3614,"Ġclosely":3615,"Ġmanage":3616,"Ġnumerous":3617,"Ġbackground":3618,"ĠExpress":3619,"Ġ65":3620,"ĠTony":3621,"ĠMadrid":3622,"ev":3623,"der":3624,"Ġsignificantly":3625,"Ġalternative":3626,"Ġship":3627,"head":3628,"ators":3629,"Ġdinner":3630,"ax":3631,"SC":3632,"Ġcriticism":3633,"ĠMah":3634,"ĠMin":3635,"rie":3636,"ĠTour":3637,"Ġbench":3638,"Ġadds":3639,"Ġseriously":3640,"star":3641,"ĠJournal":3642,"ĠDi":3643,"ali":3644,"Ġsentence":3645,"ĠSeveral":3646,"Ġmayor":3647,"ati":3648,"Ġsuggests":3649,"Ġbehavior":3650,"Ġstronger":3651,"ĠFood":3652,"Ġclient":3653,"not":3654,"ĠPrice":3655,"Ġtargeted":3656,"ĠSingh":3657,"ĠNetwork":3658,"Ġprosecutors":3659,"Ġdirected":3660,"ĠDemocrat":3661,"bl":3662,"ues":3663,"ĠFamily":3664,"Ġconnected":3665,"ĠChampions":3666,"Ġroughly":3667,"Ġabsolutely":3668,"08":3669,"Ġpassengers":3670,"ö":3671,"ĠSpecial":3672,"Ġcoast":3673,"Ġcomplaint":3674,"Ġ400":3675,"ĠEm":3676,"ves":3677,"Ġdogs":3678,"Ġhandle":3679,"Ġotherwise":3680,"Ġsees":3681,"Ġticket":3682,"ĠAward":3683,"All":3684,"Ġtask":3685,"Ġsongs":3686,"ĠAmong":3687,"Ġdedicated":3688,"Ġsteel":3689,"looking":3690,"Ġshortly":3691,"Ġtackle":3692,"ative":3693,"Ġminor":3694,"â":3695,"Ġprovider":3696,"vers":3697,"use":3698,"ives":3699,"Ġtypically":3700,"Ġarms":3701,"ĠAnt":3702,"ĠIS":3703,"Ġjump":3704,"Ġ©":3705,"47":3706,"aff":3707,"Ġmonthly":3708,"ĠMicrosoft":3709,"ĠCBS":3710,"Ġthreatened":3711,"Ġhonor":3712,"ĠMo":3713,"42":3714,"Ġinning":3715,"Ġpool":3716,"Ġhealthcare":3717,"ĠStory":3718,"ĠTennessee":3719,"Ġpromote":3720,"EL":3721,"Ġemotional":3722,"Ġpe":3723,"Ġfactor":3724,"Ġinvestigators":3725,"Ľ":3726,"ĠBack":3727,"ĠProject":3728,"Ġcu":3729,"side":3730,"Ġmessages":3731,"TH":3732,"eg":3733,"Ġexperiences":3734,"Ġcausing":3735,"Ġjoining":3736,"Ġpackage":3737,"Ġbodies":3738,"Ġlots":3739,"ĠHarris":3740,"Ġcl":3741,"ĠInternet":3742,"free":3743,"Ġperformed":3744,"Ġpieces":3745,"buy":3746,"Ġcaption":3747,"Ġweb":3748,"Ġcontracts":3749,"At":3750,"Ġattempted":3751,"Ġunlikely":3752,"Ġclick":3753,"Ġinvest":3754,"IM":3755,"ĠView":3756,"Ġneighborhood":3757,"Ġring":3758,"ĠFour":3759,"ail":3760,"46":3761,"One":3762,"Ġnative":3763,"CH":3764,"OM":3765,"Ġalcohol":3766,"ĠVal":3767,"Ġcharacters":3768,"ĠPat":3769,"Ġpoliticians":3770,"ĠMag":3771,"Ġbegins":3772,"ĠAk":3773,"Ġlos":3774,"Ġpersonnel":3775,"Ġenjoyed":3776,"ĠTechnology":3777,"Ġsun":3778,"ĠIT":3779,"Ġdocument":3780,"Ġdeficit":3781,"Ġcoalition":3782,"Ġmemory":3783,"Ġpushing":3784,"any":3785,"ified":3786,"Ġfounder":3787,"Ġ2000":3788,"2017":3789,"Ġvisited":3790,"ĠThough":3791,"ph":3792,"Ġsoft":3793,"Ġflag":3794,"Ġmom":3795,"inch":3796,"ĠSamsung":3797,"Ġapps":3798,"Ġtouchdown":3799,"ĠCare":3800,"ĠMrs":3801,"Ġredistributed":3802,"Ġencourage":3803,"ched":3804,"Ġtend":3805,"Ġregions":3806,"pp":3807,"IP":3808,"br":3809,"ush":3810,"Ġargued":3811,"Ġjunior":3812,"BA":3813,"Ġsevere":3814,"ĠNIGHT":3815,"Ġdef":3816,"Ġsurrounding":3817,"48":3818,"Ġengine":3819,"Ġfilled":3820,"Ġseventh":3821,"Ġbattery":3822,"ĠAllen":3823,"Ġguidance":3824,"Ġroll":3825,"Ġrural":3826,"Ġexpert":3827,"Ġconvicted":3828,"Ġlikes":3829,"ĠRo":3830,"Ġgrown":3831,"Ġretirement":3832,"Ġintended":3833,"Ġmis":3834,"Ġarmy":3835,"Ġdance":3836,"ĠThank":3837,"Ġent":3838,"Ġoutlook":3839,"Ġpara":3840,"Ġdry":3841,"ĠTO":3842,"era":3843,"Ġwaste":3844,"Ġfaster":3845,"ĠEagles":3846,"TA":3847,"ĠFrank":3848,"Ã":3849,"LE":3850,"ura":3851,"ko":3852,"ao":3853,"Ġdistribution":3854,"Ġimprovement":3855,"Ġplayoff":3856,"Ġacquisition":3857,"ĠCH":3858,"Ġtomorrow":3859,"Ġstruggle":3860,"ĠHuman":3861,"Ġnewly":3862,"oon":3863,"ĠNe":3864,"con":3865,"sc":3866,"Ġunless":3867,"Ġtransition":3868,"ten":3869,"ĠInter":3870,"Ġequal":3871,"Ġrec":3872,"Ġappointed":3873,"Ġwake":3874,"ĠEarth":3875,"ose":3876,"ĠEastern":3877,"Ġsoldiers":3878,"ĠParliament":3879,"Ġsets":3880,"Ġattempts":3881,"ĠIllinois":3882,"Ġrevenues":3883,"ĠWil":3884,"Ġheads":3885,"Ġprepare":3886,"Ġpriority":3887,"PS":3888,"ĠJo":3889,"ĠNBC":3890,"Ġtherefore":3891,"yn":3892,"Ġinitiative":3893,"ct":3894,"Ġcoffee":3895,"ĠFair":3896,"43":3897,"den":3898,"form":3899,"ova":3900,"Ġappropriate":3901,"ĠPlay":3902,"Ġaccepted":3903,"Ġcreative":3904,"Ġfollows":3905,"Ġrescue":3906,"Ġtree":3907,"With":3908,"ĠNetflix":3909,"ĠFootball":3910,"Ġsurprised":3911,"Ġlowest":3912,"800":3913,"amp":3914,"Ġworried":3915,"mar":3916,"ran":3917,"Ġvisiting":3918,"Ġselected":3919,"ĠMusic":3920,"ĠAnn":3921,"Ġexplain":3922,"ging":3923,"Ġwidely":3924,"Ġsquare":3925,"Ġtrends":3926,"Ġimproving":3927,"ĠHead":3928,"ĠQueen":3929,"ĠSociety":3930,"Ġcutting":3931,"ĠGOP":3932,"03":3933,"',":3934,"ET":3935,"ĠDrive":3936,"oll":3937,"ato":3938,"ĠSea":3939,"Ġjury":3940,"ĠRights":3941,"Ġinvestor":3942,"ĠABC":3943,"Ġtool":3944,"ĠAre":3945,"Ġrejected":3946,"Ġemerging":3947,"Ġcounts":3948,"Ġnations":3949,"Ġfalse":3950,"Ġtreat":3951,"va":3952,"Ġweak":3953,"ĠHighway":3954,"down":3955,"Ġstruggled":3956,"ĠMP":3957,"Ġguests":3958,"Ġgender":3959,"Ġhouses":3960,"rit":3961,"ĠWild":3962,"Ġstreak":3963,"uc":3964,"ĠReserve":3965,"ĠRatings":3966,"alt":3967,"Ġgreatest":3968,"Ġlawyers":3969,"Ġreaching":3970,"Ġtemperatures":3971,"To":3972,"Ġoutstanding":3973,"Ġpasses":3974,"Ġfaith":3975,"inc":3976,"Ġcr":3977,"Ġinformed":3978,"oz":3979,"Ġtrees":3980,"Ġsending":3981,"Ġ150":3982,"bo":3983,"Ġwine":3984,"ros":3985,"Ġsuspected":3986,"Ġrepeatedly":3987,"Ġhat":3988,"Ġshape":3989,"ĠWh":3990,"Ġassist":3991,"Ġstress":3992,"Ġfeed":3993,"ark":3994,"ored":3995,"Ġwatched":3996,"Ġincredible":3997,"cl":3998,"nt":3999,"Ġentertainment":4000,"ih":4001,"Ġbeauty":4002,"Ġbi":4003,"ĠLocal":4004,"Ġsat":4005,"41":4006,"Ġbroad":4007,"Ġheavily":4008,"Ġengaged":4009,"Ġspecifically":4010,"ĠMen":4011,"ĠRoss":4012,"Ġ2005":4013,"ST":4014,"95":4015,"Ġdownload":4016,"400":4017,"Ġsentenced":4018,"ĠCatholic":4019,"ĠOklahoma":4020,"Ġthrew":4021,"Ġworry":4022,"Ġimp":4023,"Ġdrove":4024,"Ġcolleagues":4025,"Ġagenda":4026,"64":4027,"ĠEach":4028,"Ġfee":4029,"New":4030,"ium":4031,"Ġspokesperson":4032,"Ġbills":4033,"Ġ47":4034,"ĠAfghanistan":4035,"Ġinvited":4036,"ĠYouTube":4037,"Ġanniversary":4038,"Ġdozen":4039,"ram":4040,"ĠOnly":4041,"Ġemployment":4042,"Getty":4043,"Ġgap":4044,"Ġsweet":4045,"ĠLittle":4046,"Ġinf":4047,"ying":4048,"Ġglass":4049,"Ġclasses":4050,"Ġcoal":4051,"ĠSub":4052,"Ġduty":4053,"CA":4054,"Ġcoaches":4055,"Â":4056,"anna":4057,"ĠSk":4058,"Ġ46":4059,"ison":4060,"ille":4061,"ĠST":4062,"ric":4063,"Ġparticipate":4064,"Ġequ":4065,"Ġrich":4066,"Ġrespectively":4067,"Ġexpenses":4068,"Ġcombination":4069,"right":4070,"Ġshareholders":4071,"Ġturns":4072,"Ġearn":4073,"Ġ51":4074,"ured":4075,"Ġdrink":4076,"ĠKar":4077,"ĠShares":4078,"ĠMid":4079,"ĠGetty":4080,"Ġbridge":4081,"lo":4082,"Ġinspired":4083,"Ġsurface":4084,"Ġgift":4085,"ence":4086,"Ġchallenging":4087,"Ġoffices":4088,"Ġsuspects":4089,"ĠFinance":4090,"Ġab":4091,"bound":4092,"Ġmomentum":4093,"Ġbacked":4094,"Ġparent":4095,"Ġcrucial":4096,"ave":4097,"Ġdealing":4098,"Ġregulatory":4099,"Ġapparently":4100,"ĠMat":4101,"Ġapart":4102,"Ġport":4103,"ole":4104,"Ġbeach":4105,"Ġcultural":4106,"Ġinstitutional":4107,"Ġbeating":4108,"ĠIowa":4109,"ĠAli":4110,"67":4111,"Ġje":4112,"ays":4113,"Ġweekly":4114,"Ġbirthday":4115,"Ġpipeline":4116,"Ġknee":4117,"Ġsolar":4118,"ĠPe":4119,"Ġcategory":4120,"ĠArea":4121,"ky":4122,"ures":4123,"06":4124,"ĠBall":4125,"Ġsemi":4126,"ĠHamilton":4127,"hip":4128,"ĠPh":4129,"ĠNext":4130,"Ġathletes":4131,"ii":4132,"Ġmovies":4133,"han":4134,"net":4135,"Ġplastic":4136,"Ġbehalf":4137,"gen":4138,"Ġfindings":4139,"Ġstretch":4140,"ĠSa":4141,"Ġofficially":4142,"ĠSarah":4143,"Ġprivacy":4144,"ĠMad":4145,"Ġnone":4146,"gh":4147,"On":4148,"Ġdrama":4149,"ĠFl":4150,"ika":4151,"ĠArsenal":4152,"Ġviolent":4153,"UN":4154,"called":4155,"59":4156,"Ġhate":4157,"Ġrelationships":4158,"Ġgranted":4159,"ĠJon":4160,"Ġlisten":4161,"season":4162,"Ġfewer":4163,"GA":4164,"ĠLabour":4165,"Ġremarks":4166,"ĠJonathan":4167,"ĠRos":4168,"sey":4169,"ĠOntario":4170,"ĠThompson":4171,"ĠNight":4172,"Ġranked":4173,"ĠUkraine":4174,"Ġimmigrants":4175,"Ġdegrees":4176,"ĠGe":4177,"Ġlabor":4178,"umb":4179,"ĠYORK":4180,"Ġallies":4181,"sp":4182,"hed":4183,"sw":4184,"Ġtariffs":4185,"SP":4186,"Ġclassic":4187,"Ġawards":4188,"ents":4189,"Ġfix":4190,"Ġsoccer":4191,"Ġconcert":4192,"ust":4193,"Ġadult":4194,"Ġoutput":4195,"Ġmanaging":4196,"02":4197,"Ġpromise":4198,"Ġawareness":4199,"Ġgross":4200,"Ġentering":4201,"Ġpo":4202,"oj":4203,"Ġmetal":4204,"Ġexit":4205,"Ġexcellent":4206,"Ġclubs":4207,"hold":4208,"Ġreplaced":4209,"ĠClass":4210,"Ġscientists":4211,"Ġprimarily":4212,"ĠMer":4213,"ão":4214,"Ġcircumstances":4215,"ades":4216,"Ġsupplies":4217,"aker":4218,"ĠSand":4219,"Ġscandal":4220,"Ġsettlement":4221,"ĠWisconsin":4222,"ĠWarriors":4223,"ĠAustin":4224,"Ġjournalists":4225,"ening":4226,"Ġreflect":4227,"ĠBuy":4228,"ĠAwards":4229,"Ġselection":4230,"ĠBel":4231,"bury":4232,"Ġtechnologies":4233,"%,":4234,"ime":4235,"ĠÄ":4236,"ĠAdministration":4237,"Ġchannel":4238,"Star":4239,"Ġtransport":4240,"Ġawarded":4241,"ena":4242,"Ġmotor":4243,"orn":4244,"kin":4245,"Ġfeaturing":4246,"Ġphones":4247,"ĠAND":4248,"Ġrelevant":4249,"ĠSee":4250,"Ġwinners":4251,"Ġdad":4252,"ĠSource":4253,"ĠCheck":4254,"aut":4255,"ĠFar":4256,"Ġopponents":4257,"Ġoutcome":4258,"Ġdoors":4259,"Ġsuicide":4260,"ima":4261,"Ġjumped":4262,"Ġperspective":4263,"Ġtransportation":4264,"Ġthinks":4265,"ĠMor":4266,"Ġdeadline":4267,"Ġ53":4268,"ĠDeputy":4269,"ery":4270,"Ġdetailed":4271,"uch":4272,"ĠBur":4273,"Ġtrades":4274,"ĠGreg":4275,"Ġzero":4276,"erson":4277,"ĠChildren":4278,"Ġdu":4279,"66":4280,"Ġmixed":4281,"ĠBarack":4282,"54":4283,"Ġterritory":4284,"Ġac":4285,"Ġconcept":4286,"ĠAdd":4287,"Ġourselves":4288,"Ġreaction":4289,"ĠSydney":4290,"ink":4291,"Ġconsistent":4292,"Ġboat":4293,"room":4294,"Ġdozens":4295,"Ġeffectively":4296,"but":4297,"Ġmotion":4298,"Ġalive":4299,"ĠKey":4300,"weight":4301,"Ġexports":4302,"Ġoperate":4303,"Ġregime":4304,"ĠAuthority":4305,"och":4306,"ĠCR":4307,"leg":4308,"Ġforget":4309,"American":4310,"bs":4311,"Ġthoughts":4312,"ĠSign":4313,"ĠPatriots":4314,"Ġbrief":4315,"ĠOregon":4316,"ĠBal":4317,"Ġmine":4318,"Ġciting":4319,"Ġmagazine":4320,"more":4321,"ERS":4322,"ĠBer":4323,"ua":4324,"ox":4325,"ĠMain":4326,"Ġinstance":4327,"tr":4328,"Ġrestaurants":4329,"ora":4330,"Ġharassment":4331,"\",\"":4332,"Ł":4333,"Ġsilver":4334,"ĠMueller":4335,"ĠSenator":4336,"ĠEvery":4337,"Ġfootage":4338,"ms":4339,"Ġopposed":4340,"ĠLink":4341,"Ġver":4342,"Ġpleased":4343,"ame":4344,"ending":4345,"Ġrivals":4346,"ida":4347,"ike":4348,"ta":4349,"ĠCook":4350,"Ġheadquarters":4351,"ear":4352,"Ġaggressive":4353,"Ġcourts":4354,"ĠMuseum":4355,"Ġim":4356,"ĠHoldings":4357,"Ġcommunication":4358,"Ġphase":4359,"yl":4360,"Ġpowers":4361,"Ġproved":4362,"Ġcarbon":4363,"Ġaside":4364,"ĠOlympics":4365,"Ġgathered":4366,"ĠPennsylvania":4367,"Ġsmartphone":4368,"ĠMet":4369,"ĠHurricane":4370,"Ġprotected":4371,"Ġcommunications":4372,"Ġemerged":4373,"Ġaim":4374,"Ġstable":4375,"ides":4376,"GB":4377,"Ġentirely":4378,"Ġmissile":4379,"ĠGen":4380,"Ġunclear":4381,"Ġelectricity":4382,"ology":4383,"away":4384,"Ġlicense":4385,"ĠPittsburgh":4386,"Ġcameras":4387,"Ġmusical":4388,"Ġmanagers":4389,"57":4390,"Ġscores":4391,"Ġprofile":4392,"hel":4393,"¼":4394,"Ġshouldn":4395,"RA":4396,");":4397,"Ġpermanent":4398,"ome":4399,"Ġet":4400,"Ġmar":4401,"Ġfavor":4402,"Ġmaker":4403,"Ġdiscussions":4404,"ory":4405,"Ġsharp":4406,"Ġpleaded":4407,"Ġpassenger":4408,"quarter":4409,"Ġdem":4410,"Ġversus":4411,"Ġmainly":4412,"Ġeighth":4413,"ĠAirport":4414,"ĠCross":4415,"million":4416,"ĠNas":4417,"Ġcited":4418,"56":4419,"Ġyes":4420,"ĠBelow":4421,"arn":4422,"ĠTurkish":4423,"ĠSl":4424,"Ġstepped":4425,"Ġproducers":4426,"Ġovernight":4427,"Ġsounds":4428,"52":4429,"Ġ64":4430,"Ġ54":4431,"58":4432,"ĠClark":4433,"ĠRick":4434,"Ġgr":4435,"ĠMont":4436,"Ġbeer":4437,"une":4438,"Ġreporter":4439,"Ġcharity":4440,"Ġeating":4441,"Ġextend":4442,"Ġguess":4443,"NA":4444,"Ġhedge":4445,"Ġencouraged":4446,"owned":4447,"ĠMel":4448,"ĠKentucky":4449,"ace":4450,"Ġlineup":4451,"Ġhosts":4452,"Ġcapable":4453,"PR":4454,"ĠArts":4455,"Ġcontroversial":4456,"Ġhosted":4457,"ries":4458,"Ġroster":4459,"Ġfixed":4460,"ĠWalker":4461,"ged":4462,"Ġdisaster":4463,"Ġdispute":4464,"ĠDenver":4465,"ĠTrade":4466,"ute":4467,"ese":4468,"cy":4469,"Ġgrant":4470,"ĠMax":4471,"Ġdistance":4472,"isc":4473,"Ġeditor":4474,"ĠDave":4475,"Ġperformances":4476,"Ġlay":4477,"Ġvulnerable":4478,"ĠMurray":4479,"ĠâĤ¬":4480,"Ġmining":4481,"Ġ2004":4482,"level":4483,"ability":4484,"Ġauto":4485,"Ġfake":4486,"Ġattacked":4487,"ona":4488,"ups":4489,"ened":4490,"Ġfallen":4491,"Ġstations":4492,"ĠContact":4493,"itz":4494,"Ġincidents":4495,"Ġcomplaints":4496,"Ġoperates":4497,"Ġrefugees":4498,"Ġessential":4499,"ĠTest":4500,"Ġdemands":4501,"Ġroles":4502,"yr":4503,"Ġacts":4504,"Ġusual":4505,"ring":4506,"Ġhanded":4507,"ĠMatthew":4508,"hour":4509,"Ġindustries":4510,"Ġshoot":4511,"ĠAuthorities":4512,"Ġprobe":4513,"ĠUtah":4514,"ĠRBI":4515,"ĠAD":4516,"Ġprospect":4517,"outs":4518,"ĠUber":4519,"Ġbright":4520,"Ġmention":4521,"Ġsavings":4522,"ĠMiss":4523,"ONDON":4524,"Ġ1990":4525,"arm":4526,"ĠTen":4527,"These":4528,"Ġexplains":4529,"minute":4530,"85":4531,"Ġmaximum":4532,"Ġro":4533,"Ġrookie":4534,"Ġstudio":4535,"ĠCam":4536,"ĠGal":4537,"Ġdefend":4538,"hand":4539,"53":4540,"ĠOil":4541,"Ġserves":4542,"Ġsn":4543,"ios":4544,"ĠDefense":4545,"AB":4546,"Ġhired":4547,"Ġsupports":4548,"Ġpremium":4549,"ef":4550,"Ġfailing":4551,"ĠIndiana":4552,"Ġexp":4553,"Ġobjective":4554,"Ġaffordable":4555,"ĠCom":4556,"ĠThanks":4557,"Ġanywhere":4558,"Ġconfirm":4559,"ited":4560,"Ġrepresenting":4561,"Ġwitness":4562,"69":4563,"Ġclaiming":4564,"Ġviolation":4565,"Ġhistorical":4566,"med":4567,"Ġpreparing":4568,"ĠTech":4569,"Ġposts":4570,"OC":4571,"ĠGraham":4572,"ĠGl":4573,"ĠLions":4574,"ales":4575,"ĠID":4576,"Ġcorrect":4577,"ĠAntonio":4578,"Ġadvertising":4579,"Ġeastern":4580,"OW":4581,"Ġholdings":4582,"Ġpolls":4583,"ĠSH":4584,"Ġexecutives":4585,"ĠJewish":4586,"ĠGary":4587,"Ġprize":4588,"ĠCommissioner":4589,"Ġcells":4590,"ify":4591,"Ġlunch":4592,"Ġdemocracy":4593,"ĠEr":4594,"Ġregularly":4595,"Ġresulted":4596,"ĠAve":4597,"ĠPartners":4598,"Ġrewritten":4599,"Ġlo":4600,"Ġcooperation":4601,"ĠGulf":4602,"Ġsmoke":4603,"ĠMemorial":4604,"Ġwave":4605,"Ġfears":4606,"Ġkid":4607,"ĠGiants":4608,"Ġrecovered":4609,"row":4610,"ĠRadio":4611,"ĠBarcelona":4612,"Ġwonderful":4613,"ĠDow":4614,"Ġstream":4615,"ĠSimon":4616,"Ġdetail":4617,"Ġvolunteers":4618,"ĠInd":4619,"Ġforms":4620,"mann":4621,"ĠRay":4622,"oor":4623,"ĠTake":4624,"Ġrepresented":4625,"het":4626,"Ġblow":4627,"aged":4628,"RE":4629,"ĠMissouri":4630,"Ġcovering":4631,"Ġprofits":4632,"Ġconcluded":4633,"Ġthus":4634,"ĠColumbia":4635,"ode":4636,"ĠZimbabwe":4637,"Ġdisclosed":4638,"Ġlifted":4639,"ĠSean":4640,"ĠHarvey":4641,"ĠPlus":4642,"ces":4643,"ĠGreece":4644,"ĠLady":4645,"Ġdelay":4646,"Ġkitchen":4647,"ĠIndex":4648,"Ġbear":4649,"Ġputs":4650,"new":4651,"88":4652,"ĠAsh":4653,"Å¡":4654,"Ġperforming":4655,"law":4656,"ĠPart":4657,"Ġindicated":4658,"Ġannounce":4659,"Ġcompensation":4660,"Ġka":4661,"ĠScience":4662,"ris":4663,"Ġrecommendations":4664,"ĠSecond":4665,"Ġlights":4666,"Ġtemporary":4667,"urs":4668,"Ġwestern":4669,"stone":4670,"68":4671,"ĠDisney":4672,"Ġplayoffs":4673,"Ġjudges":4674,"Ġengineering":4675,"ĠPen":4676,"ĠPal":4677,"Ġobvious":4678,"ĠBridge":4679,"ĠEnd":4680,"ĠArab":4681,"Ġexcept":4682,"Ġhole":4683,"class":4684,"Ġcauses":4685,"Ġconnect":4686,"ĠAI":4687,"An":4688,"Ġchose":4689,"ĠElizabeth":4690,"min":4691,"Ġproper":4692,"ĠNHL":4693,"Ġraces":4694,"Ġinnovation":4695,"Ġsugar":4696,"600":4697,"ĠModi":4698,"illa":4699,"Ġtrillion":4700,"ĠSar":4701,"ĠAffairs":4702,"Ġimpossible":4703,"Ġguide":4704,"Ġcaptured":4705,"ĠSales":4706,"Ġspecies":4707,"51":4708,"Ġar":4709,"Ġmaster":4710,"Ġstayed":4711,"iro":4712,"ĠEconomic":4713,"Ġvast":4714,"ili":4715,"Ġpet":4716,"ye":4717,"77":4718,"Ġkeeps":4719,"ĠPhil":4720,"ĠEPS":4721,"ĠRegional":4722,"Ġsectors":4723,"Ġdesire":4724,"ĠStanley":4725,"¾":4726,"Ġunknown":4727,"Ġpot":4728,"ĠPR":4729,"Ġknowing":4730,"Ġflying":4731,"ĠTreasury":4732,"iers":4733,"enn":4734,"ably":4735,"Ġsick":4736,"Ġmanner":4737,"Ġmanufacturers":4738,"Ġchampions":4739,"gy":4740,"Part":4741,"ister":4742,"ĠMountain":4743,"Ġimagine":4744,"Ġportion":4745,"ĠCamp":4746,"Ġchemical":4747,"ible":4748,"ĠAnaly":4749,"ĠBureau":4750,"Ġpm":4751,"Ġupdated":4752,"Ġetc":4753,"ĠField":4754,"iles":4755,"Ġobtained":4756,"Ġstick":4757,"Ġcat":4758,"har":4759,"Ġmarked":4760,"Ġmedium":4761,"ĠDes":4762,"People":4763,"Ġwealth":4764,"ores":4765,"ĠBaltimore":4766,"Ġtip":4767,"Ġdismissed":4768,"ĠVictoria":4769,"ĠBrad":4770,"Ch":4771,"Ġ56":4772,"Ġstadium":4773,"eth":4774,"Ġthunder":4775,"Ġtested":4776,"Ġdrawn":4777,"Ġcounsel":4778,"ld":4779,"Ġspirit":4780,"uss":4781,"Ġtheme":4782,"my":4783,"Ġnecessarily":4784,"Ġelements":4785,"Ġcollected":4786,"ĠRes":4787,"ĠMaryland":4788,"ĠEnter":4789,"Ġfounded":4790,"ae":4791,"Ġpilot":4792,"Ġshoulder":4793,"PC":4794,"Ġargument":4795,"Ġyen":4796,"Ġreceiver":4797,"Ġharm":4798,"ĠET":4799,"Ġprotesters":4800,"Ġ72":4801,"ĠAaron":4802,"Ġed":4803,"Ġexpecting":4804,"\":\"":4805,"Ġbike":4806,"Äĩ":4807,"Ġluxury":4808,"half":4809,"ĠBarbara":4810,"Ġfoundation":4811,"Ġill":4812,"Ġsubmitted":4813,"Ġdeeply":4814,"Ġhospitals":4815,"ĠBJP":4816,"Ġshock":4817,"Ġplatforms":4818,"Ġsummary":4819,"ĠWhere":4820,"Ġcelebration":4821,"iff":4822,"Ġveterans":4823,"Ġachieved":4824,"fl":4825,"Ġactivists":4826,"ĠManager":4827,"Ġformal":4828,"Ġformed":4829,"Ġinvestigate":4830,"ĠKyle":4831,"Ġ:":4832,"ĠRa":4833,"ovic":4834,"Ġdrinking":4835,"Ġnetworks":4836,"ĠAlexander":4837,"ĠOs":4838,"Ġ)":4839,"Ġbomb":4840,"Ġrecalled":4841,"ito":4842,"ient":4843,"Ġrepresentatives":4844,"ĠChrist":4845,"ĠWay":4846,"Ġdeadly":4847,"Ġinvesting":4848,"ĠRussell":4849,"Ġconsumption":4850,"Ġharder":4851,"Ġbail":4852,"Ġcritics":4853,"Ġdanger":4854,"Ġdrew":4855,"ĠSol":4856,"Ġcopyright":4857,"ĠHenry":4858,"Ġbuyers":4859,"Ġresidential":4860,"Ġmaintenance":4861,"pr":4862,"Ġmarks":4863,"Ġages":4864,"Ġcovers":4865,"Ġton":4866,"Ġtitles":4867,"ĠPS":4868,"ĠEvans":4869,"Ġmigrants":4870,"Ġflights":4871,"Ġmonitoring":4872,"Ġaddressed":4873,"Ġvital":4874,"Ġcontrolled":4875,"Ġweapon":4876,"Ġinches":4877,"Ġreduction":4878,"Ġurban":4879,"Ġcoaching":4880,"Ġreducing":4881,"ila":4882,"Ġrealize":4883,"Ġmeat":4884,"Ġref":4885,"Ġoverseas":4886,"Ġblame":4887,"Ġterrorist":4888,"Ġstuck":4889,"ĠUs":4890,"esh":4891,"pro":4892,"Ġ58":4893,"ough":4894,"Ġexposure":4895,"ĠAbu":4896,"state":4897,"Ġproviders":4898,"Ġfore":4899,"Ġjet":4900,"bar":4901,"Ġownership":4902,"ret":4903,"Ġupset":4904,"Ġfacts":4905,"Ġpurchasing":4906,"Ġreforms":4907,"Ġriver":4908,"Ġsomebody":4909,"Ġguest":4910,"iy":4911,"Ġauction":4912,"ĠReading":4913,"Ġconsequences":4914,"Ġrepresentative":4915,"Ġappointment":4916,"add":4917,"Ġcollaboration":4918,"ĠTesla":4919,"ĠCohen":4920,"Ġengagement":4921,"Ġspeaks":4922,"EST":4923,"Ġexposed":4924,"Ġmaintained":4925,"rs":4926,"Ġdating":4927,"ĠProgram":4928,"board":4929,"Ġracing":4930,"Ġpension":4931,"ign":4932,"iti":4933,"ĠFive":4934,"Ġextensive":4935,"ĠHa":4936,"ĠPoint":4937,"ĠMexican":4938,"Ġexpanded":4939,"Ġtotally":4940,"Ġinvestigations":4941,"ĠOrleans":4942,"Ġcycle":4943,"ĠESPN":4944,"ifying":4945,"Ġcup":4946,"ĠAz":4947,"ĠInvestors":4948,"Ġengage":4949,"reg":4950,"Ġfought":4951,"Ġterrorism":4952,"Ġblocked":4953,"ĠOK":4954,"Äį":4955,"72":4956,"Ġdestroyed":4957,"«":4958,"Ġstaying":4959,"Ġafford":4960,"Ġappearances":4961,"ĠHills":4962,"Ġcrore":4963,"Ġstrategies":4964,"Ġtips":4965,"ĠSm":4966,"ĠFr":4967,"Ġbanned":4968,"ĠSon":4969,"ask":4970,"Ġlimits":4971,"Ġrecognition":4972,"Ġeligible":4973,"ĠGar":4974,"Ġvolatility":4975,"Ġlaid":4976,"nes":4977,"Ġgrade":4978,"ĠRE":4979,"ĠHart":4980,"Ġ57":4981,"oma":4982,"Ġuncertainty":4983,"Ġrecognized":4984,"ĠPC":4985,"Ġchosen":4986,"uz":4987,"Ġadviser":4988,"una":4989,"Ġassessment":4990,"Ġreveal":4991,"mo":4992,"After":4993,"ĠBro":4994,"ĠOff":4995,"Ġpeak":4996,"Ġreferred":4997,"ĠSC":4998,"Ġ2003":4999,"ification":5000,"Ġshutdown":5001,"ĠOfficials":5002,"ias":5003,"Ġextreme":5004,"Ġflood":5005,"Ġhockey":5006,"Ġwage":5007,"ĠNet":5008,"Ġdamaged":5009,"Ġreplacement":5010,"ĠMaria":5011,"Ġcreation":5012,"Ġguns":5013,"aci":5014,"Ġworker":5015,"do":5016,"Ġviewers":5017,"Ġseed":5018,"sts":5019,"Ġtouchdowns":5020,"Ġmistake":5021,"ray":5022,"ull":5023,"Ġpricing":5024,"Ġstrongly":5025,"Ġaims":5026,"ĠNavy":5027,"ĠEgypt":5028,"ker":5029,"Ġve":5030,"ĠSteven":5031,"Ġres":5032,"ational":5033,"Ġrequests":5034,"Ġemissions":5035,"ĠArena":5036,"uma":5037,"ĠAtlantic":5038,"hr":5039,"ĠAFP":5040,"ĠSquare":5041,"Ġcontribute":5042,"Ġfunction":5043,"Ġdec":5044,"ĠNelson":5045,"89":5046,"Ġreferendum":5047,"ĠPre":5048,"Ġapplied":5049,"ĠGMT":5050,"ĠIranian":5051,"ĠNigerian":5052,"ĠAny":5053,"NG":5054,"Ġacknowledged":5055,"Ġreferring":5056,"Ġventure":5057,"Ġimports":5058,"Ġblog":5059,"Ġfutures":5060,"OU":5061,"ĠUFC":5062,"Ġneither":5063,"Ġextension":5064,"hes":5065,"ĠMed":5066,"76":5067,"Ġsustainable":5068,"ains":5069,"Ġreputation":5070,"ĠVancouver":5071,"Ġbasically":5072,"acy":5073,"Ġsad":5074,"ĠFrancis":5075,"ĠKennedy":5076,"ĠNevada":5077,"ĠLu":5078,"ras":5079,"ĠAv":5080,"Ġrear":5081,"ĠHo":5082,"Ġproperly":5083,"abe":5084,"ĠHotel":5085,"Ġopinions":5086,"under":5087,"ĠStation":5088,"ĠFOR":5089,"ops":5090,"Ġadopted":5091,"ĠSwiss":5092,"ĠCountry":5093,"ĠTer":5094,"ĠAndy":5095,"Me":5096,"ĠCooper":5097,"ĠTigers":5098,"ĠCreek":5099,"Ġgay":5100,"iner":5101,"ĠAN":5102,"Ġbird":5103,"lla":5104,"ĠKate":5105,"ĠPet":5106,"ni":5107,"Ġprospects":5108,"ater":5109,"ites":5110,"Ġescape":5111,"lam":5112,"ake":5113,"Ġ1980":5114,"ĠLag":5115,"Ġsuccessfully":5116,"Ġdistricts":5117,"Ġministers":5118,"aries":5119,"Ġframe":5120,"ĠON":5121,"ĠEuro":5122,"ĠMarkets":5123,"Ġregister":5124,"Ġdefeated":5125,"Ġdevelopments":5126,"Ġninth":5127,"Ġquiet":5128,"Ġgenerated":5129,"Ġvaluable":5130,"Ġrecommended":5131,"ĠTheatre":5132,"ĠCap":5133,"bed":5134,"Ġreference":5135,"Ġease":5136,"oring":5137,"Ġ66":5138,"Ġimprovements":5139,"Ġelsewhere":5140,"ĠHillary":5141,"Ġdefender":5142,"ĠRight":5143,"zy":5144,"Ġcomprehensive":5145,"Ġspotted":5146,"ĠOakland":5147,"ĠOk":5148,"ĠSystem":5149,"ique":5150,"Ġpersons":5151,"Ġexist":5152,"Ġbroader":5153,"Ġclinical":5154,"Ġ2001":5155,"oul":5156,"Ġsecurities":5157,"ghan":5158,"Ġshelter":5159,"ero":5160,"ATED":5161,"Ġhosting":5162,"Ġselect":5163,"ĠKavanaugh":5164,"Ġrestrictions":5165,"osa":5166,"Ġyields":5167,"ĠLA":5168,"Ġ59":5169,"Ġwonder":5170,"Ġabsence":5171,"ür":5172,"ÅĤ":5173,"DP":5174,"Ġelectronic":5175,"Ġillegally":5176,"Ġmicro":5177,"ĠNEW":5178,"Ġhall":5179,"Ġaged":5180,"Ġtemperature":5181,"cast":5182,"atic":5183,"Ġlegacy":5184,"Ġaffairs":5185,"ji":5186,"ĠResources":5187,"Ġgang":5188,"winning":5189,"Ġattending":5190,"aro":5191,"Ġfriendly":5192,"aine":5193,"Ġcannabis":5194,"Ġairline":5195,"Ġnoting":5196,"Ġprofessionals":5197,"ĠFREE":5198,"RC":5199,"Ġfinancing":5200,"Ġindependence":5201,"ved":5202,"Ġresulting":5203,"Ġsteady":5204,"ĠWinter":5205,"uring":5206,"Ġhoped":5207,"98":5208,"Ġpresentation":5209,"aya":5210,"Ġrated":5211,"osh":5212,"ĠAnalysis":5213,"=":5214,"Ġdonations":5215,"IR":5216,"Ġcombat":5217,"ĠHoward":5218,"anda":5219,"79":5220,"Ġinvested":5221,"Ġexpanding":5222,"omb":5223,"ress":5224,"ble":5225,"Ġjournalist":5226,"ĠWoods":5227,"Ġcenters":5228,"ott":5229,"Ġstreaming":5230,"Ġterror":5231,"Ġsustained":5232,"ĠWWE":5233,"pre":5234,"ÅŁ":5235,"ait":5236,"Ġarrival":5237,"Ġresidence":5238,"Ġextent":5239,"Ġarrive":5240,"Ġ2002":5241,"Ġestablish":5242,"74":5243,"ĠArgentina":5244,"ĠDem":5245,"inn":5246,"aud":5247,"ĠNCAA":5248,"Ġquestioned":5249,"Ġballot":5250,"Ġmin":5251,"Ġlandscape":5252,"Ġhorse":5253,"Ġopponent":5254,"iel":5255,"Ġprompted":5256,"atory":5257,"Ġlift":5258,"Ġassociation":5259,"cher":5260,"Ġdefending":5261,"Ġtiny":5262,"Ġpoverty":5263,"ĠSafety":5264,"Ġpetition":5265,"ĠLimited":5266,"ĠCA":5267,"FC":5268,"Ãł":5269,"oni":5270,"Ġmonitor":5271,"ÃŃa":5272,"MA":5273,"Ġanswers":5274,"ĠMitchell":5275,"Ġbo":5276,"ĠShah":5277,"Ġsm":5278,"Ġmedal":5279,"ĠCivil":5280,"Ġrecognize":5281,"key":5282,"Ġpregnant":5283,"Ġspots":5284,"ante":5285,"Ġacademic":5286,"Ġinitiatives":5287,"Ġsecured":5288,"ĠCL":5289,"ils":5290,"Ġanticipated":5291,"Ġinvolvement":5292,"ĠMake":5293,"Ġinsisted":5294,"ĠWales":5295,"Ġclothing":5296,"Ġtracks":5297,"Ġsymptoms":5298,"Ġplate":5299,"ĠNY":5300,"Ġretailers":5301,"ĠPan":5302,"Ġfled":5303,"Ġquoted":5304,"Ġsaved":5305,"ĠCarter":5306,"Ġteaching":5307,"ĠTokyo":5308,"ĠCr":5309,"ĠSix":5310,"ĠPicture":5311,"Ġrecover":5312,"Ġcomedy":5313,"ree":5314,"Ġstrikes":5315,"ĠSanders":5316,"sel":5317,"Ġgraduate":5318,"Ġpending":5319,"St":5320,"Ġwarrant":5321,"Ġhonest":5322,"ĠGM":5323,"Ġnoticed":5324,"ĠGalaxy":5325,"ider":5326,"Ġproposals":5327,"Ġwore":5328,"Ġindeed":5329,"EM":5330,"ĠChannel":5331,"ances":5332,"ĠBrady":5333,"86":5334,"Ġgotten":5335,"Ġthrowing":5336,"ĠLeader":5337,"ĠVideo":5338,"71":5339,"Ġwelcomed":5340,"NEW":5341,"Ġfairly":5342,"Ġpromises":5343,"ĠSilver":5344,"Ġrape":5345,"Ġopener":5346,"ares":5347,"ĠSir":5348,"making":5349,"Ġcur":5350,"Ġrooms":5351,"73":5352,"Ġamounts":5353,"ĠIndustry":5354,"ĠDar":5355,"Ġ62":5356,"ted":5357,"Ġabroad":5358,"ĠMaybe":5359,"Ġreaders":5360,"oke":5361,"Ġpublication":5362,"ĠJean":5363,"Ġoperator":5364,"ĠHaving":5365,"ĠMil":5366,"life":5367,"Ġgenerate":5368,"ĠCraig":5369,"ĠMass":5370,"ĠBh":5371,"Ġrequested":5372,"Ġcrazy":5373,"ĠSpace":5374,"Ġcopy":5375,"Ġexport":5376,"Ġcontext":5377,"Ġbr":5378,"62":5379,"ĠRobinson":5380,"Ġcyber":5381,"ENT":5382,"BI":5383,"arg":5384,"Ġspeaker":5385,"Ġdramatic":5386,"ĠOl":5387,"ĠMill":5388,"Ġtrained":5389,"Ġediting":5390,"Ġsalary":5391,"Ġdirectors":5392,"Ġexplore":5393,"Ġlucky":5394,"Ġprominent":5395,"Ġbrothers":5396,"Ġneck":5397,"icht":5398,"ĠWatson":5399,"born":5400,"Ġproven":5401,"Ġprincipal":5402,"Ġedition":5403,"Ed":5404,"Ġswitch":5405,"maker":5406,"Ġrelative":5407,"mi":5408,"ĠBruce":5409,"ho":5410,"ĠScottish":5411,"water":5412,"ĠSport":5413,"ĠKings":5414,"ĠCollins":5415,"adi":5416,"Ġcelebrated":5417,"Ġclothes":5418,"Ġsunny":5419,"ĠCharlotte":5420,"ees":5421,"Ġscenes":5422,"ĠData":5423,"Ġwounded":5424,"Ġunusual":5425,"Ġrealized":5426,"ĠPlan":5427,"ĠTrans":5428,"ĠFC":5429,"Ġletters":5430,"Ġalerts":5431,"ĠWarren":5432,"DS":5433,"oss":5434,"pping":5435,"Ġsuspension":5436,"Ġbenchmark":5437,"ĠAcc":5438,"Ġalert":5439,"Ġpassion":5440,"ĠEst":5441,"Ġlatter":5442,"Ġstability":5443,"Ġarts":5444,"Ġpursue":5445,"ĠSeason":5446,"Ġfields":5447,"Ġmethod":5448,"63":5449,"Ġfolks":5450,"Ġexclusive":5451,"Ġcrews":5452,"Ġsessions":5453,"ĠMajor":5454,"ĠMount":5455,"Ġmap":5456,"Ġ=":5457,"Ġsituations":5458,"ĠBerlin":5459,"rey":5460,"Ġdates":5461,"Ġsheet":5462,"ĠLo":5463,"Ġfighters":5464,"ĠMart":5465,"Ġatmosphere":5466,"Ġillness":5467,"Ġcompeting":5468,"ĠChristopher":5469,"ĠRoy":5470,"mm":5471,"iano":5472,"Ġge":5473,"ĠRams":5474,"Ġconversations":5475,"ĠPa":5476,"ĠTel":5477,"Ġappreciate":5478,"78":5479,"ĠTotal":5480,"low":5481,"ĠStone":5482,"Ġopposite":5483,"Ġbarrel":5484,"Ġdevelopers":5485,"Ġexpress":5486,"Ġhighs":5487,"which":5488,"par":5489,"ĠVietnam":5490,"Ġblocks":5491,"Ġrecording":5492,"Ġadjusted":5493,"Ġret":5494,"ĠAR":5495,"Ġmilitants":5496,"Ġinnovative":5497,"ĠGhana":5498,"FR":5499,"Ġfantastic":5500,"Ġmortgage":5501,"ando":5502,"ĠLane":5503,"ises":5504,"ĠÂ":5505,"Ġhomeless":5506,"ĠKal":5507,"Ġapproached":5508,"Ġrounds":5509,"Ġmargins":5510,"ament":5511,"ĠMotor":5512,"Ġencouraging":5513,"ÂŃ":5514,"uru":5515,"Ġhandling":5516,"ĠMassachusetts":5517,"Ġplanet":5518,"ĠSpring":5519,"ĠBon":5520,"gu":5521,"Beat":5522,"Ġdrawing":5523,"ĠPhoenix":5524,"very":5525,"aid":5526,"ĠSte":5527,"ĠEntertainment":5528,"ĠRon":5529,"Ġassigned":5530,"ĠSA":5531,"News":5532,"Ġinterviews":5533,"ĠOh":5534,"media":5535,"vel":5536,"Ġpermission":5537,"Ġtransactions":5538,"Ġtraders":5539,"Ġsolo":5540,"Ġprovincial":5541,"Ġsuggesting":5542,"¡":5543,"Ġdiverse":5544,"Ġ67":5545,"Ġranks":5546,"ĠFre":5547,"Ġfavourite":5548,"Ġ63":5549,"Ġdifferences":5550,"Ġtargeting":5551,"Ġactors":5552,"Ġ76":5553,"icated":5554,"Ġcollect":5555,"akes":5556,"war":5557,"Ġcontained":5558,"ches":5559,"Ġlibrary":5560,"Ġsegments":5561,"ĠLine":5562,"ê":5563,"ual":5564,"Ġbags":5565,"Ġfactory":5566,"Ġear":5567,"Ġsomewhat":5568,"Ġrail":5569,"ĠUP":5570,"ula":5571,"ĠNiger":5572,"Ġlas":5573,"Ġimplementation":5574,"Ġemails":5575,"kel":5576,"wing":5577,"Ġadvised":5578,"--":5579,"istic":5580,"Ġdepth":5581,"Ġshoes":5582,"ĠJennifer":5583,"Ġvenue":5584,"Ġcontain":5585,"Ġhighlights":5586,"Ġcapabilities":5587,"Ġprocesses":5588,"Ġtradition":5589,"Ġcontacted":5590,"Ġproducing":5591,"Ġtrail":5592,"rem":5593,"Ġ600":5594,"Ġ68":5595,"AA":5596,"ĠBa":5597,"ĠSuch":5598,"ĠTyler":5599,"ipp":5600,"Ġsurvived":5601,"ami":5602,"ĠContinue":5603,"Ġcapture":5604,"bi":5605,"61":5606,"96":5607,"Ġthreatening":5608,"Ġkeen":5609,"dale":5610,"Ġtrailer":5611,"Ġstages":5612,"ĠGordon":5613,"Ġfinishing":5614,"Ġlegislative":5615,"Ġuseful":5616,"ĠGreek":5617,"ald":5618,"Ġgrounds":5619,"ĠDu":5620,"storms":5621,"ills":5622,"Ġexpense":5623,"Ġdetained":5624,"Today":5625,"Ġdiet":5626,"Ġwood":5627,"ĠCameron":5628,"Ġthrown":5629,"Ġcricket":5630,"Ġideal":5631,"with":5632,"Ġteammates":5633,"ours":5634,"Ġprojected":5635,"Ġpersonally":5636,"ĠBoy":5637,"rom":5638,"ĠPhilippines":5639,"win":5640,"ges":5641,"Ġcounties":5642,"ĠBaker":5643,"Ġprosecutor":5644,"Ġroof":5645,"met":5646,"Ġpartly":5647,"ĠMoon":5648,"eman":5649,"Ġfocusing":5650,"Ġfishing":5651,"than":5652,"ĠJeremy":5653,"ĠBad":5654,"ais":5655,"Ġcontrols":5656,"Ġtonnes":5657,"Ġshall":5658,"Ġ61":5659,"Ġgathering":5660,"ĠERA":5661,"Ġpresidency":5662,"Ġ85":5663,"ĠGas":5664,"Ġscenario":5665,"Ġquarters":5666,"Ġang":5667,"Ġsettled":5668,"ĠCommerce":5669,"Ġanybody":5670,"Ġgarden":5671,"ĠLibrary":5672,"Ġbet":5673,"Ġtopic":5674,"olo":5675,"Ġintense":5676,"87":5677,"Ġlinks":5678,"Ġmed":5679,"ĠAG":5680,"Ġflooding":5681,"ĠMurphy":5682,"PM":5683,"Ġfinds":5684,"Ġsensitive":5685,"pped":5686,"Ġcompletion":5687,"Ġminority":5688,"Ġvon":5689,"Ġstriking":5690,"rich":5691,"Ġbars":5692,"Ġefficient":5693,"Ġcontributions":5694,"Ġvisits":5695,"Ġattract":5696,"ĠMalaysia":5697,"ĠREL":5698,"Ġopens":5699,"Ġessentially":5700,"Ġreasonable":5701,"Ġsentiment":5702,"ĠMelbourne":5703,"Ġfitness":5704,"Ġfrequently":5705,"ĠRangers":5706,"Ġmuseum":5707,"ĠDNA":5708,"Ġcontrast":5709,"ĠAdams":5710,"ĠWin":5711,"Ġfalls":5712,"Ġimposed":5713,"250":5714,"ood":5715,"ĠRio":5716,"Ġchoices":5717,"Ġyellow":5718,"rin":5719,"ben":5720,"ĠStaff":5721,"ĠIndonesia":5722,"Ġcarries":5723,"Ġtourism":5724,"UM":5725,"ĠOrange":5726,"sell":5727,"Ġresolve":5728,"ĠMumbai":5729,"Ġpan":5730,"Ġimplement":5731,"Ġmidfielder":5732,"OP":5733,"Ġtensions":5734,"Ġ800":5735,"ĠLord":5736,"ĠLight":5737,"Ġlies":5738,"és":5739,"Ġparticipation":5740,"Ġtries":5741,"Ġsheriff":5742,"degree":5743,"Ġcongressional":5744,"Ġmode":5745,"Ġregulation":5746,"ĠJacob":5747,"ĠCrown":5748,"Ġbowl":5749,"ĠMississippi":5750,"Ġtheft":5751,"ĠKingdom":5752,"Ġresort":5753,"Ġroyal":5754,"Ġunemployment":5755,"PP":5756,"Ġnomination":5757,"ĠTR":5758,"Ġbehaviour":5759,"bank":5760,"ĠForest":5761,"WASHINGTON":5762,"ĠOthers":5763,"Ġslowly":5764,"Ġmenu":5765,"vo":5766,"ĠSy":5767,"ĠMetro":5768,"ĠLisa":5769,"Ġregistration":5770,"While":5771,"ĠJesus":5772,"Ġ250":5773,"Ġprocessing":5774,"Ġmonetary":5775,"ape":5776,"ener":5777,"ĠSystems":5778,"Ġdisappointed":5779,"Ġprint":5780,"uy":5781,"ħ":5782,"Ġdemanding":5783,"Ġincredibly":5784,"play":5785,"Ġsurveillance":5786,"ĠStandard":5787,"Ġperiods":5788,"Ġwrites":5789,"ĠLuke":5790,"ĠPalestinian":5791,"Ġwalks":5792,"Ġriding":5793,"Ġwaters":5794,"ĠSox":5795,"Ġtraveling":5796,"Ġtap":5797,"Ġorganized":5798,"Ġresource":5799,"Ġangry":5800,"Ġtiming":5801,"Ġempty":5802,"Ġmilk":5803,"Ġtherapy":5804,"ĠBrandon":5805,"mon":5806,"Ġnationwide":5807,"Ġnovel":5808,"ĠStorm":5809,"iet":5810,"ĠBre":5811,"Ġbegun":5812,"Ġdiplomatic":5813,"Ġads":5814,"ĠDC":5815,"ĠOb":5816,"ĠMontreal":5817,"ĠDown":5818,"ĠMilwaukee":5819,"Ġmeal":5820,"ĠPuerto":5821,"ĠMas":5822,"Ġjoy":5823,"Ġdeparture":5824,"ĠWright":5825,"Ġspoken":5826,"style":5827,"ĠAction":5828,"ĠComey":5829,"Ġdelivering":5830,"Ġtoll":5831,"Ġmidnight":5832,"ĠRevenue":5833,"Ġfiring":5834,"Ġstunning":5835,"Ġkicked":5836,"ĠOttawa":5837,"Ġefficiency":5838,"ĠLincoln":5839,"Ġtaste":5840,"ez":5841,"ĠWeather":5842,"ĠMorning":5843,"Ġhadn":5844,"Ġdiversity":5845,"ily":5846,"ĠAy":5847,"Ġargue":5848,"Ġerror":5849,"Ġtaught":5850,"Ġche":5851,"Ġoccasion":5852,"Ġinc":5853,"ĠOrlando":5854,"ĠOnline":5855,"Ġlegs":5856,"ĠNation":5857,"uck":5858,"Ġwidespread":5859,"ĠOcean":5860,"Ġconstantly":5861,"ĠLatin":5862,"Ġcomfort":5863,"Ġrely":5864,"uff":5865,"ĠCard":5866,"aring":5867,"Ġhumans":5868,"ĠThomson":5869,"aka":5870,"BIT":5871,"ĠReview":5872,"po":5873,"ú":5874,"Ġtrucks":5875,"Ġforecasts":5876,"view":5877,"Ġlongtime":5878,"ĠConstitution":5879,"Ġreserves":5880,"bit":5881,"Ġstressed":5882,"Ġcontribution":5883,"Ġchicken":5884,"ĠDE":5885,"Ġfat":5886,"ĠOscar":5887,"Ġcriticized":5888,"Ġtestimony":5889,"Ġapparent":5890,"Ġconstant":5891,"Ġcabinet":5892,"ĠDuke":5893,"Ġaspects":5894,"lic":5895,"ĠVol":5896,"Ġwing":5897,"Ġreb":5898,"ĠSessions":5899,"ĠSmart":5900,"car":5901,"ĠIm":5902,"Ġoperational":5903,"Ġregulators":5904,"ĠJimmy":5905,"eter":5906,"Ġnobody":5907,"ĠMarc":5908,"Ġliterally":5909,"Ġresistance":5910,"ĠKam":5911,"Ġsexually":5912,"Ġ69":5913,"uth":5914,"Ġviewed":5915,"Ġpicks":5916,"Ġdin":5917,"Ġtalented":5918,"Ġtennis":5919,"Ġstrengthen":5920,"Ġgl":5921,"ĠProtection":5922,"Ġinstalled":5923,"ways":5924,"ĠCampbell":5925,"ĠPortland":5926,"Ġintent":5927,"ĠPalace":5928,"Ġsecondary":5929,"Ġlocked":5930,"ĠPA":5931,"Ġlanded":5932,"Ġlength":5933,"Ġboosted":5934,"Ġpurchases":5935,"Ġcommand":5936,"ĠAsked":5937,"Ġspaces":5938,"Ġiconic":5939,"Ġrecommend":5940,"Ġduties":5941,"Ġseized":5942,"Ġdelayed":5943,"FA":5944,"AND":5945,"daq":5946,"Ġhiring":5947,"Ġoccur":5948,"DC":5949,"ĠMus":5950,"Ġag":5951,"Ġhopefully":5952,"ĠPenn":5953,"ards":5954,"Ġstriker":5955,"Ġrent":5956,"ĠTy":5957,"ĠBuffalo":5958,"ĠKy":5959,"Ġhike":5960,"pper":5961,"Ġ120":5962,"Ġop":5963,"Ġwheel":5964,"ĠIan":5965,"Ġchart":5966,"tt":5967,"Ġvolunteer":5968,"IG":5969,"person":5970,"ight":5971,"ĠBook":5972,"unt":5973,"ĠTechnologies":5974,"Now":5975,"Ġfavour":5976,"ĠGh":5977,"ĠQatar":5978,"ĠDutch":5979,"ĠGrant":5980,"ĠBan":5981,"rel":5982,"Ġagreements":5983,"Ġeducational":5984,"worth":5985,"ĠWard":5986,"700":5987,"Ġanymore":5988,"Ġrepair":5989,"Ġoperators":5990,"ĠLi":5991,"ots":5992,"ĠLouisiana":5993,"ĠWhether":5994,"Ġodds":5995,"Ġnoon":5996,"ĠStr":5997,"Ġfail":5998,"iser":5999,"Ġforever":6000,"Ġrecall":6001,"ĠPo":6002,"ĠHot":6003,"Ġdesigner":6004,"ido":6005,"LL":6006,"ĠControl":6007,"Ġsurvive":6008,"iam":6009,"Ġorganisation":6010,"ĠWork":6011,"Ġwider":6012,"Ġtank":6013,"work":6014,"ĠAS":6015,"Ġposting":6016,"Ġsuddenly":6017,"MC":6018,"ĠAL":6019,"ĠProfessor":6020,"ĠCoach":6021,"Ġrushed":6022,"Ġafraid":6023,"Ġactivist":6024,"that":6025,"ĠFilm":6026,"Ġbacking":6027,"Ġhousehold":6028,"Ġsignal":6029,"Ġaccurate":6030,"str":6031,"ĠThread":6032,"ĠBears":6033,"ATION":6034,"ĠAlliance":6035,"ĠMcDonald":6036,"ĠVenezuela":6037,"ogg":6038,"ĠWindows":6039,"makers":6040,"Ġutility":6041,"Ġrapidly":6042,"Ġattractive":6043,"Ġpa":6044,"ĠLarry":6045,"Ġmisconduct":6046,"Ġfreshman":6047,"Ġqualified":6048,"Ġcleared":6049,"Ġcrashed":6050,"Ġparticipating":6051,"Ġpages":6052,"Ġhighlight":6053,"Ġdialogue":6054,"ĠAlberta":6055,"Ġca":6056,"Ġwitnesses":6057,"ables":6058,"Ġfollowers":6059,"Ġensuring":6060,"Ġpromoting":6061,"Ġsearching":6062,"Ġremote":6063,"Ġclash":6064,"Ġfirefighters":6065,"Ġteen":6066,"ĠPlace":6067,"ĠNote":6068,"Ġregardless":6069,"ult":6070,"oney":6071,"ander":6072,"ional":6073,"ining":6074,"Ġdemanded":6075,"ĠCommunications":6076,"Ġconsideration":6077,"TC":6078,"ĠSoutheast":6079,"aga":6080,"ĠGarden":6081,"inger":6082,"ht":6083,"Ġbranch":6084,"Ġmouth":6085,"Ġaudio":6086,"Ġraw":6087,"Ġcoordinator":6088,"Ġexact":6089,"ĠHan":6090,"Ġdelays":6091,"ĠWal":6092,"ĠWells":6093,"Ġng":6094,"Ġhandful":6095,"Ġgirlfriend":6096,"Ġtypical":6097,"ĠWayne":6098,"ĠFranklin":6099,"Ġconstitutional":6100,"ĠChance":6101,"Ġblamed":6102,"rim":6103,"Ġpreliminary":6104,"Ġlie":6105,"da":6106,"ĠCapitol":6107,"Ġroutine":6108,"ĠNASA":6109,"Ġtre":6110,"ĠGolf":6111,"Ġsight":6112,"ĠDer":6113,"Ġreserve":6114,"150":6115,"Ġspeculation":6116,"Ġcompetitors":6117,"ĠMacron":6118,"ony":6119,"Ġovertime":6120,"Ġ71":6121,"Ġdepending":6122,"ĠWarner":6123,"Ġaccusations":6124,"ius":6125,"Ġpredicted":6126,"ĠCharlie":6127,"Ġeverywhere":6128,"Ġcable":6129,"ĠSaint":6130,"ĠRegion":6131,"Ġhero":6132,"ĠEmb":6133,"Ġkinds":6134,"Ġstarter":6135,"Ġsolve":6136,"ĠGuard":6137,"Ġloves":6138,"ĠDouglas":6139,"Ġfunded":6140,"ĠBrent":6141,"ĠAnyone":6142,"Ġsubstantial":6143,"ĠMarine":6144,"ĠMichelle":6145,"Ġcelebrating":6146,"Ġoffset":6147,"Ġbutton":6148,"gg":6149,"Ġmedicine":6150,"uri":6151,"Ġsomewhere":6152,"PD":6153,"Ġmon":6154,"Ġfires":6155,"final":6156,"oth":6157,"ined":6158,"Ġunderway":6159,"Ġmistakes":6160,"Ġgrateful":6161,"Ġcheap":6162,"È":6163,"Ġ95":6164,"Ġviolations":6165,"arr":6166,"Ġsurprising":6167,"Ġob":6168,"ĠNATO":6169,"Ġcontroversy":6170,"ĠSweden":6171,"Ġfuneral":6172,"Ġreviews":6173,"Ġpromotion":6174,"TY":6175,"Ġliberal":6176,"Ġpromising":6177,"ĠSP":6178,"How":6179,"Ġmemories":6180,"Ġbreast":6181,"zi":6182,"ights":6183,"Ġpattern":6184,"Ġoutdoor":6185,"ĠMu":6186,"Ġrush":6187,"ĠTheresa":6188,"ĠPol":6189,"Ġdescribe":6190,"ĠBand":6191,"ĠStewart":6192,"Ġ1999":6193,"ĠRaiders":6194,"mp":6195,"Ġprocedures":6196,"Ġplot":6197,"Ġhire":6198,"used":6199,"Ġ1970":6200,"Ġpicking":6201,"ĠSim":6202,"Ġregard":6203,"inal":6204,"backs":6205,"ĠHard":6206,"ĠLow":6207,"ĠAc":6208,"Is":6209,"Ġguarantee":6210,"ĠGiven":6211,"Ġbeta":6212,"ĠTre":6213,"Ġtrans":6214,"Ġretailer":6215,"Ġpurposes":6216,"ĠHol":6217,"Ġenjoying":6218,"Ġbrown":6219,"ĠPerry":6220,"Ġplea":6221,"MS":6222,"ĠDakota":6223,"ĠParker":6224,"Ġcommit":6225,"ĠLawrence":6226,"ĠMorris":6227,"ended":6228,"Ġvirtual":6229,"ÃĹ":6230,"Ġfruit":6231,"84":6232,"ĠHas":6233,"ishing":6234,"Ġdominated":6235,"ĠFA":6236,"Ġchannels":6237,"Ġunderstood":6238,"Ġcitizen":6239,"Ġchecks":6240,"ĠKenya":6241,"Ġdisabled":6242,"SD":6243,"Ġprotecting":6244,"Ġtweets":6245,"Ġsparked":6246,"ĠCO":6247,"§":6248,"ori":6249,"ĠGDP":6250,"ĠSer":6251,"ĠVisit":6252,"ĠMS":6253,"Ġbarely":6254,"Ġsand":6255,"Ġap":6256,"aging":6257,"Ġrel":6258,"ĠPerhaps":6259,"ĠMourinho":6260,"ĠJets":6261,"Ġdisclosure":6262,"Ġhighlighted":6263,"Ġimplemented":6264,"Ġcompliance":6265,"ĠAB":6266,"ĠAssistant":6267,"ĠCape":6268,"Ġfunny":6269,"Ġleverage":6270,"Ġmachines":6271,"Ġranging":6272,"Ġfastest":6273,"ĠRoberts":6274,"ĠPolicy":6275,"gar":6276,"Ġcollapse":6277,"ĠThrough":6278,"Ġrobbery":6279,"ĠHay":6280,"Ġelite":6281,"ĠDigital":6282,"ĠFun":6283,"ĠAlan":6284,"ement":6285,"Ġmit":6286,"Ġspin":6287,"Ġlistening":6288,"ĠDoug":6289,"ĠSaints":6290,"Ġinterior":6291,"Ġenhance":6292,"ĠCardinals":6293,"ever":6294,"Ġrobust":6295,"Ġinform":6296,"Ġsuffer":6297,"book":6298,"ĠMuslims":6299,"Ġagriculture":6300,"Ġkm":6301,"Ġdivers":6302,"ñ":6303,"ĠReg":6304,"Ġequivalent":6305,"Ġcraft":6306,"Ġsettle":6307,"Ġcontains":6308,"ĠMack":6309,"ĠDis":6310,"ĠFore":6311,"ĠSudan":6312,"ĠMail":6313,"ĠBrooklyn":6314,"izer":6315,"bn":6316,"Ġhundred":6317,"Ġexhibition":6318,"ĠHave":6319,"vin":6320,"Ġcivilians":6321,"ĠCincinnati":6322,"Some":6323,"ĠSE":6324,"Ġbat":6325,"ĠIns":6326,"Ġcalm":6327,"Ġtone":6328,"Ġnormally":6329,"Ġseeks":6330,"ĠAss":6331,"Ġmembership":6332,"Ġannually":6333,"Ġemployers":6334,"CO":6335,"Ġcomplicated":6336,"Ġheadlines":6337,"ĠLabor":6338,"Ġlifestyle":6339,"ĠRen":6340,"ĠRich":6341,"cent":6342,"ude":6343,"Ġawesome":6344,"Ġpaint":6345,"Ġrolling":6346,"Ġwalls":6347,"Ġlab":6348,"Ġtourists":6349,"care":6350,"Ġgear":6351,"izz":6352,"Ġcream":6353,"ĠTro":6354,"ices":6355,"Ġpack":6356,"Ġdiseases":6357,"ĠSpeaker":6358,"ĠOfficers":6359,"Ġsky":6360,"83":6361,"ĠBE":6362,"Ġcategories":6363,"Ġindicate":6364,"Ġru":6365,"ĠSony":6366,"ĠDun":6367,"ocks":6368,"Ġconcrete":6369,"ĠMadison":6370,"ĠSab":6371,"IV":6372,"Ġobserved":6373,"ria":6374,"Ġinterim":6375,"Ġencounter":6376,"ista":6377,"Ġanger":6378,"Ġrapid":6379,"mail":6380,"Ġdestination":6381,"ĩ":6382,"Ġbreaks":6383,"rell":6384,"ĠChase":6385,"Ġattorneys":6386,"Ġrolled":6387,"ĠSprings":6388,"ĠVillage":6389,"TO":6390,"HS":6391,"Ġcampaigns":6392,"ologist":6393,"ĠTax":6394,"ĠIII":6395,"Ġteach":6396,"Ġprovision":6397,"Ġrem":6398,"Ġshirt":6399,"Ġdeployed":6400,"Ġguidelines":6401,"Ġav":6402,"zer":6403,"Ġrushing":6404,"94":6405,"place":6406,"Man":6407,"Ġdivided":6408,"ĠGun":6409,"Ġwindows":6410,"Ġcomponents":6411,"aba":6412,"ĠSwitzerland":6413,"election":6414,"ĠTampa":6415,"ĠAri":6416,"ás":6417,"Ġhighway":6418,"Ġacres":6419,"Ġcrown":6420,"known":6421,"Ġinquiry":6422,"url":6423,"Ġexpertise":6424,"Ġpraised":6425,"yer":6426,"Ġconclusion":6427,"Ġabortion":6428,"Ġlady":6429,"Ġtribute":6430,"Ġunveiled":6431,"Ġbeaten":6432,"TE":6433,"ĠMot":6434,"unk":6435,"Ġtriple":6436,"Ġforcing":6437,"ĠTickets":6438,"uit":6439,"Ġiron":6440,"Ġscientific":6441,"ĠIP":6442,"Ġdiagnosed":6443,"Ġocean":6444,"wide":6445,"ĠCowboys":6446,"LC":6447,"Ġmethods":6448,"ĠFind":6449,"ĠDean":6450,"Ġfundamental":6451,"ĠGill":6452,"Ġfeelings":6453,"IO":6454,"hu":6455,"Ġfeedback":6456,"ote":6457,"Ġduo":6458,"fully":6459,"get":6460,"Ġproof":6461,"story":6462,"Ġlongest":6463,"Ġshops":6464,"ĠJong":6465,"ĠCro":6466,"ĠHawaii":6467,"91":6468,"ĠJake":6469,"ĠSusan":6470,"Ġsubmit":6471,"rav":6472,"Ġmodest":6473,"Ġlit":6474,"Ġattempting":6475,"Ġsits":6476,"Ġaddressing":6477,"93":6478,"ĠBi":6479,"Ġlying":6480,"ĠOrganization":6481,"ĠOak":6482,"oli":6483,"Ġfatal":6484,"Ġmountain":6485,"val":6486,"lu":6487,"ĠMaine":6488,"Ġcharging":6489,"Ġresigned":6490,"illo":6491,"Ġrecommendation":6492,"party":6493,"ĠWeb":6494,"ĠPanthers":6495,"Ġnoise":6496,"ĠBrussels":6497,"awa":6498,"Ġambassador":6499,"Ġaccessible":6500,"ĠCalgary":6501,"idd":6502,"ĠAirlines":6503,"gr":6504,"Ġnu":6505,"roy":6506,"ĠMars":6507,"ĠPoland":6508,"ĠJerry":6509,"ados":6510,"ĠRico":6511,"ĠMir":6512,"ĠFin":6513,"ious":6514,"Ġpacked":6515,"Ġinsider":6516,"President":6517,"ĠBull":6518,"ĠYemen":6519,"ĠConnecticut":6520,"Ġ73":6521,"Ġdepartments":6522,"Ġorganic":6523,"ĠSummer":6524,"ĠBet":6525,"ste":6526,"zo":6527,"rat":6528,"Ġalliance":6529,"Ġintervention":6530,"wan":6531,"ĠOR":6532,"Ġdefined":6533,"ĠÃł":6534,"ĠChiefs":6535,"Ġknocked":6536,"ared":6537,"Ġholes":6538,"Ġpulling":6539,"ĠTodd":6540,"ĠJamie":6541,"ĠSher":6542,"Ġsignature":6543,"ĠSur":6544,"Ġgym":6545,"ĠVladimir":6546,"ĠThailand":6547,"Ġgaming":6548,"Ġsaving":6549,"ceive":6550,"82":6551,"ĠBern":6552,"ĠDid":6553,"Ġhardware":6554,"ished":6555,"Ġconspiracy":6556,"ANS":6557,"ĠIntelligence":6558,"Ġassembly":6559,"Ġ101":6560,"Ġconcise":6561,"ĠManhattan":6562,"Ġbelief":6563,"Ġsurge":6564,"Ġdeserve":6565,"Ġconsistently":6566,"ĠNor":6567,"okes":6568,"ðŁ":6569,"ME":6570,"ĠAsset":6571,"Ġsubstance":6572,"Ġprefer":6573,"Ġburning":6574,"ĠNik":6575,"ook":6576,"ĠPinterest":6577,"Ġboyfriend":6578,"ĠHal":6579,"ĠMerkel":6580,"Ġintroduce":6581,"ĠLinkedIn":6582,"ĠFull":6583,"ĠFarm":6584,"Ġchildhood":6585,"ĠTransportation":6586,"Ġterrible":6587,"du":6588,"Ġintention":6589,"Ġseemingly":6590,"elle":6591,"Ġfoods":6592,"Ġtitled":6593,"Ġdual":6594,"Ġimport":6595,"Ġdeveloper":6596,"UL":6597,"ington":6598,"ĠDelta":6599,"?'":6600,"iness":6601,"Ġquit":6602,"ĠGarcia":6603,"ĠSri":6604,"Ġhip":6605,"ĠBrazilian":6606,"elt":6607,"ively":6608,"Ġstructures":6609,"Ġlabour":6610,"Ġneighbors":6611,"Ġtill":6612,"Ġsoil":6613,"Ġdropping":6614,"Ġnominee":6615,"Ġmeets":6616,"92":6617,"rant":6618,"isa":6619,"Ġluck":6620,"aa":6621,"jet":6622,"ĠTor":6623,"ĠCrime":6624,"Ġlane":6625,"Ġflu":6626,"Ġlaunching":6627,"ĠAutom":6628,"aks":6629,"Ġuniversities":6630,"Ġpollution":6631,"ĠAdvis":6632,"ĠMall":6633,"ls":6634,"Ġdeeper":6635,"Ġrepeated":6636,"Ġmeanwhile":6637,"Ġchip":6638,"Ġoutlets":6639,"Ġliked":6640,"Ġsal":6641,"Ġwelfare":6642,"ago":6643,"Ġmakers":6644,"ving":6645,"fer":6646,"Ġovercome":6647,"mb":6648,"Ġshocked":6649,"akers":6650,"Ġnonprofit":6651,"Ġdonated":6652,"eral":6653,"Ġresume":6654,"Ġlogo":6655,"Ġsubscription":6656,"Ġ74":6657,"ela":6658,"Ġaspect":6659,"html":6660,"Ġsorry":6661,"Ġupgrade":6662,"Ġstance":6663,"Ġfr":6664,"Ġpapers":6665,"Ġattacking":6666,"Ġmeaningful":6667,"81":6668,"ĠWeinstein":6669,"Ġcreates":6670,"Ġhonour":6671,"ĠReply":6672,"oph":6673,"Ġmarch":6674,"Ġsmile":6675,"Ġcomparison":6676,"will":6677,"ĠSanchez":6678,"Ġvoter":6679,"Ġtheory":6680,"Ġequally":6681,"ĠRoger":6682,"Ġperfectly":6683,"Ġlanding":6684,"Ġbillions":6685,"ĠBloomberg":6686,"Ġpermit":6687,"Ġfinals":6688,"Ġracial":6689,"Ġpregnancy":6690,"iled":6691,"ĠFederation":6692,"Ġforest":6693,"Ġtag":6694,"aul":6695,"Ġdrinks":6696,"Ġ(\"":6697,"ĠMobile":6698,"Ġtouched":6699,"Ġclock":6700,"Ġreg":6701,"Ġasylum":6702,"igan":6703,"Ġsenator":6704,"Ġ99":6705,"ĠKumar":6706,"Ġskill":6707,"Ġ1998":6708,"pa":6709,"ĠAf":6710,"Ġmood":6711,"ston":6712,"Ġhang":6713,"ĠMPs":6714,"Please":6715,"ĠEve":6716,"Ġdocumentary":6717,"Ġpersonality":6718,"ĠCast":6719,"Ġdiscount":6720,"bing":6721,"ĠBoeing":6722,"Ġdepend":6723,"Ġcrossing":6724,"EX":6725,"Ġsucceed":6726,"Ġhumanitarian":6727,"ĠMuhammad":6728,"Ġwages":6729,"Ġcolumn":6730,"Ġexternal":6731,"Ġstatistics":6732,"ĠTODAY":6733,"Ġtrips":6734,"Ġta":6735,"Ġpenalties":6736,"Ġwriters":6737,"Ġshipping":6738,"ĠIndians":6739,"Ġsalt":6740,"ĠIndustrial":6741,"ĠYankees":6742,"ĠDen":6743,"Ġrough":6744,"Ġbarrels":6745,"ĠHor":6746,"bert":6747,"ĠDep":6748,"Ġresign":6749,"97":6750,"Ġballs":6751,"ĠJun":6752,"ĠBab":6753,"Ġassociate":6754,"Ġstring":6755,"Ġhub":6756,"Ġorgan":6757,"ĠMarshall":6758,"ĠFIFA":6759,"ĠMun":6760,"ency":6761,"research":6762,"Ġpeers":6763,"Ġtall":6764,"ĠGoldman":6765,"Don":6766,"Ġparade":6767,"Ġparks":6768,"Ġdet":6769,"Ġdisappointing":6770,"Ġreflects":6771,"ĠLakers":6772,"Ġfiles":6773,"Ġrelatives":6774,"ĠUSD":6775,"ĠArticle":6776,"Ġcustom":6777,"ĠCarlos":6778,"Ġtracking":6779,"Ġmaintaining":6780,"ĠCur":6781,"ardo":6782,"ĠSkip":6783,"Ġattitude":6784,"Just":6785,"Ġinstitution":6786,"Ġnarrow":6787,"Ġsnap":6788,"Ġenterprise":6789,"Ġdrives":6790,"Ġ77":6791,"Ġcrop":6792,"Ġvirus":6793,"Ġcelebrity":6794,"Ġeconomies":6795,"ued":6796,"Ġsum":6797,"ĠDubai":6798,"ĠInsurance":6799,"Ĺ":6800,"ury":6801,"ĠUnfortunately":6802,"Ġclosure":6803,"ota":6804,"ĠPhilip":6805,"oms":6806,"Ġinvestigated":6807,"Ġgenerations":6808,"ĠETF":6809,"ĠKeith":6810,"ĠLater":6811,"isk":6812,"Ġpreferred":6813,"Ġdefault":6814,"Ġtowns":6815,"ĠRod":6816,"ĠDie":6817,"Ġintegrated":6818,"Ġacquiring":6819,"Ġvoices":6820,"Ġser":6821,"Ġpresents":6822,"ĠBR":6823,"ĠEmergency":6824,"Ġreligion":6825,"HA":6826,"Ġresponding":6827,"ĠThings":6828,"Ġbeef":6829,"ĠWithout":6830,"urd":6831,"ĠCarl":6832,"Ġadministrative":6833,"ĠWhich":6834,"Ġchallenged":6835,"Ġcooking":6836,"ivid":6837,"ĠFer":6838,"Ġtremendous":6839,"ĠTerry":6840,"iri":6841,"CS":6842,"ĠJunior":6843,"ĠReddit":6844,"Ġtea":6845,"Ġaccounting":6846,"lan":6847,"Ġdetention":6848,"Ġreplied":6849,"SI":6850,"ĠHel":6851,"ns":6852,"ĠProf":6853,"Ġramp":6854,"ĠConservative":6855,"Ġattendance":6856,"Ġspecialist":6857,"ĠFinal":6858,"Ġadvertisement":6859,"Ġacquire":6860,"ĠWhatsApp":6861,"Ġworkforce":6862,"ĠCalif":6863,"Ġspeakers":6864,"ĠEPA":6865,"Ġconviction":6866,"hire":6867,"ĠFisher":6868,"ĠIntel":6869,"Ġbin":6870,"ĠWas":6871,"Ġearth":6872,"vi":6873,"Ġhurricane":6874,"Ġholidays":6875,"Ġassume":6876,"Ġinvolve":6877,"Ġdynamic":6878,"ĠGre":6879,"Ġitem":6880,"Ġpound":6881,"Ġanxiety":6882,"ĠPrint":6883,"rop":6884,"Ġautomatically":6885,"Ġdiscrimination":6886,"ĠLam":6887,"ĠColl":6888,"Ġimpressed":6889,"Ġinvolves":6890,"ĠLes":6891,"ĠTri":6892,"ĠLook":6893,"ĠiOS":6894,"Ġgrab":6895,"ĠAngel":6896,"Ġstops":6897,"ĠPay":6898,"ĠECB":6899,"Ġbunch":6900,"Ġletting":6901,"ele":6902,"ĠAdditionally":6903,"Ġboards":6904,"NC":6905,"Ġtragedy":6906,"Ġpink":6907,"Ġgonna":6908,"ones":6909,"Ġrev":6910,"ĠIndependent":6911,"ĠCambridge":6912,"ĠPence":6913,"Ġprosecution":6914,"Ġdeputies":6915,"ĠAhmed":6916,"Ġlows":6917,"ĠAmy":6918,"ĠBuilding":6919,"mark":6920,"Ġsmooth":6921,"Ġsole":6922,"Ġwanting":6923,"ĠHeart":6924,"Ġobtain":6925,"ĠBus":6926,"Ġexchanges":6927,"friendly":6928,"Ġlabel":6929,"elect":6930,"ĠCompanies":6931,"owing":6932,"ĠCB":6933,"RI":6934,"ĠMaster":6935,"Ġliquid":6936,"ĠDanny":6937,"Ġproceeds":6938,"ĠLaura":6939,"card":6940,"Ġtears":6941,"Ġexploration":6942,"Ġdepression":6943,"ken":6944,"ĠFe":6945,"Ġlending":6946,"ĠYouth":6947,"ality":6948,"NS":6949,"Ġmoon":6950,"ĠTaiwan":6951,"Ġstruggles":6952,"Ġdiscovery":6953,"Ġqualify":6954,"Ġwireless":6955,"alia":6956,"Ġwitnessed":6957,"Ġheight":6958,"ĠGuy":6959,"left":6960,"KE":6961,"Ġfoul":6962,"ĠMohammed":6963,"Ġgrass":6964,"ĠNon":6965,"Ġswim":6966,"Ġbrilliant":6967,"you":6968,"ĠFlynn":6969,"Ġsinging":6970,"eria":6971,"UT":6972,"ĠMcCain":6973,"ĠSep":6974,"ĠWars":6975,"Ġburden":6976,"Ġpas":6977,"Ġabandoned":6978,"Ġint":6979,"ĠTurner":6980,"Ġcollective":6981,"ĠEnvironmental":6982,"ĠStudents":6983,"Ġofferings":6984,"Ġresignation":6985,"Ġexplosion":6986,"ĠKoh":6987,"ager":6988,"Ġthrows":6989,"Ġasks":6990,"light":6991,"Ġanyway":6992,"Ġyard":6993,"Ġcarrier":6994,"Ġwaves":6995,"backed":6996,"TR":6997,"oud":6998,"Ġbreach":6999,"Ġdated":7000,"Ġdressed":7001,"ĠDodgers":7002,"oles":7003,"Ġ78":7004,"Ġreads":7005,"Ġpredict":7006,"ĠJerusalem":7007,"ĠPT":7008,"Ġcrack":7009,"yan":7010,"Ġnights":7011,"eline":7012,"Ġconvinced":7013,"Ġlock":7014,"Ġcarefully":7015,"ĠMercedes":7016,"Ġultimate":7017,"Ġdist":7018,"Ġslight":7019,"ĠEdwards":7020,"Ġswing":7021,"iling":7022,"Ġknife":7023,"ĠNashville":7024,"IF":7025,"inder":7026,"udd":7027,"Ġsenators":7028,"ĠFurther":7029,"ĠXi":7030,"Ġstr":7031,"ĠOd":7032,"days":7033,"Ġcomm":7034,"Ġverdict":7035,"Ġconfirmation":7036,"king":7037,"ĠCS":7038,"Ġadvocates":7039,"Ġpride":7040,"Ġmemorial":7041,"ams":7042,"erman":7043,"Ġteenager":7044,"ĠNeil":7045,"uts":7046,"Ġsoul":7047,"see":7048,"post":7049,"Ġchest":7050,"fire":7051,"ĠLynch":7052,"Ġpeaceful":7053,"OND":7054,"ĠIndustries":7055,"ĠJuan":7056,"Ġrestore":7057,"Ġreliable":7058,"ming":7059,"agan":7060,"Source":7061,"ĠCabinet":7062,"Ġremarkable":7063,"ĠTrudeau":7064,"ĠEs":7065,"Ġintegrity":7066,"ove":7067,"fe":7068,"Ġproceedings":7069,"Ġconnections":7070,"Ġunprecedented":7071,"ĠGlen":7072,"ux":7073,"Ġearning":7074,"Ġingredients":7075,"Ġnominated":7076,"ĠBangladesh":7077,"made":7078,"Ġlessons":7079,"Ġbreakfast":7080,"ĠRelations":7081,"Ġloose":7082,"Al":7083,"Ġupgraded":7084,"ral":7085,"ĠPage":7086,"oto":7087,"ĠQueensland":7088,"Ġprocedure":7089,"ĠSmall":7090,"Ġrespective":7091,"Ġpictured":7092,"ĠBas":7093,"Ġpreparation":7094,"ĠMyanmar":7095,"Ġdonation":7096,"Ġvisible":7097,"iest":7098,"ĠBroadway":7099,"rick":7100,"ĠSchools":7101,"Ġarrests":7102,"ĠJessica":7103,"ĠBengal":7104,"Ġhell":7105,"Ġannouncing":7106,"Ġmail":7107,"ĠMcG":7108,"two":7109,"rest":7110,"OD":7111,"ĠBradley":7112,"Ġdoubled":7113,"Ġpledged":7114,"Ġcomeback":7115,"Ġextraordinary":7116,"Ġslide":7117,"Ġassess":7118,"Ġagricultural":7119,"ĠKay":7120,"Ġvendors":7121,"Ġnarrative":7122,"Ġreviewed":7123,"ĠPass":7124,"Ġinspiration":7125,"ĠHunter":7126,"Ġcalendar":7127,"ĠDiamond":7128,"Ġremoval":7129,"ners":7130,"ĠKap":7131,"Ġconsent":7132,"Ġvisual":7133,"Ġcheese":7134,"ĠTher":7135,"ĠFR":7136,"ĠShanghai":7137,"iah":7138,"ĠCole":7139,"AK":7140,"Ġranking":7141,"Ġcook":7142,"Ġhalftime":7143,"ĠStars":7144,"Ġroutes":7145,"aim":7146,"Ġestablishment":7147,"ĠMug":7148,"Ġsurvivors":7149,"urg":7150,"ĠBrett":7151,"Ġunexpected":7152,"ained":7153,"Ġrarely":7154,"ĠGall":7155,"Ġadvocate":7156,"ĠNad":7157,"Ġ911":7158,"Ġracist":7159,"erer":7160,"ĠRev":7161,"ĠSection":7162,"Ġhelpful":7163,"CT":7164,"agg":7165,"Ġgovernance":7166,"Ġfelony":7167,"Ġoptimistic":7168,"Ġelectoral":7169,"EG":7170,"town":7171,"Ġdaughters":7172,"Ġanswered":7173,"Ġthin":7174,"ĠClassic":7175,"Ġshareholder":7176,"ĠBlake":7177,"ĠFla":7178,"Ġparliamentary":7179,"dy":7180,"Ġcommented":7181,"Ġtri":7182,"Ġglobe":7183,"Ġmandate":7184,"Ġslipped":7185,"ĠTower":7186,"Ġoperated":7187,"gers":7188,"Ġassured":7189,"ĠMartinez":7190,"Ġdesigns":7191,"ĠModel":7192,"Ġstakeholders":7193,"Ġdefended":7194,"Ġseniors":7195,"Ġvacation":7196,"Ġglobally":7197,"ump":7198,"Not":7199,"Ġclip":7200,"Ġarticles":7201,"BR":7202,"km":7203,"ĠFront":7204,"PL":7205,"Ġadoption":7206,"Ġsudden":7207,"Ġframework":7208,"Ġhanging":7209,"gl":7210,"ĠSel":7211,"Ġmoderate":7212,"Ġreverse":7213,"income":7214,"cor":7215,"ĠGB":7216,"Ġphysically":7217,"Ġtransparency":7218,"ĠElectric":7219,"Ġrefugee":7220,"profile":7221,"iva":7222,"ately":7223,"ĠAC":7224,"Ġtransferred":7225,"Ġaffair":7226,"ĠAlaska":7227,"oria":7228,"ĠChange":7229,"Ġrepeat":7230,"Ġscreening":7231,"ender":7232,"ĠCas":7233,"ĠDav":7234,"Ġfocuses":7235,"Ġcommissioner":7236,"Ġupside":7237,"ĠKeep":7238,"ĠBlues":7239,"ently":7240,"Ġaut":7241,"Ġexperiencing":7242,"aman":7243,"Ġapprove":7244,"Ġmile":7245,"Ġcheaper":7246,"ĠWind":7247,"ĠStore":7248,"Ġgrabbed":7249,"Ġsons":7250,"Ġfighter":7251,"Ġum":7252,"ĠBased":7253,"don":7254,"Ġconstitution":7255,"finals":7256,"act":7257,"¢":7258,"Ġmill":7259,"Ġorganisations":7260,"ĠToyota":7261,"Ġyuan":7262,"Ġterrorists":7263,"Ġforth":7264,"Ġavailability":7265,"Ġentrance":7266,"Ġvolumes":7267,"Ġmult":7268,"plus":7269,"ĠColumbus":7270,"ĠSummit":7271,"Ġbabies":7272,"ĠMur":7273,"ĠGray":7274,"ĠChar":7275,"ĠButler":7276,"Ġpose":7277,"ĠNatural":7278,"ĠAtt":7279,"Ġdecrease":7280,"Ġtens":7281,"kt":7282,"Ġminds":7283,"Ġimpacted":7284,"Ġchapter":7285,"ĠOp":7286,"ĠHarrison":7287,"ĠRodriguez":7288,"Ġethnic":7289,"Ġtravelling":7290,"ĠBond":7291,"ader":7292,"core":7293,"Ġgallery":7294,"founder":7295,"ĠVill":7296,"Ġdecent":7297,"ĠHistory":7298,"ĠInt":7299,"ĠNa":7300,"ĠHad":7301,"Ġmainstream":7302,"ĠTs":7303,"Ġbottle":7304,"sen":7305,"Ġrecession":7306,"Ġsophomore":7307,"Ġsilence":7308,"cc":7309,"Ġqualifying":7310,"Ġcomplained":7311,"ĠRad":7312,"Ġactively":7313,"Ġbacks":7314,"ĠMusk":7315,"Ġcareful":7316,"Ġmeals":7317,"ĠDor":7318,"Ġmess":7319,"ĠBelgium":7320,"Ġke":7321,"ĠLopez":7322,"Ġbow":7323,"Ġhelicopter":7324,"was":7325,"Ġstone":7326,"kins":7327,"Ġunlike":7328,"Ġcollision":7329,"ĠAlt":7330,"HP":7331,"ĠMason":7332,"has":7333,"Ġclimbed":7334,"Ġindication":7335,"Ġhotels":7336,"Ġloud":7337,"ĠMilan":7338,"kes":7339,"Ġbadly":7340,"Ġtrials":7341,"Ġimpacts":7342,"ĠJane":7343,"Ġcrossed":7344,"Ġdiscussing":7345,"ĠSM":7346,"Ġpopularity":7347,"ĠWant":7348,"fall":7349,"Ġartificial":7350,"ĠBu":7351,"akh":7352,"Ġdominant":7353,"gov":7354,"Ġpremier":7355,"Ġexecution":7356,"gate":7357,"Ġswimming":7358,"Ġchat":7359,"Ġdevastating":7360,"acking":7361,"Ġreception":7362,"urt":7363,"Ġtheater":7364,"Ġgather":7365,"Ġtear":7366,"uro":7367,"Ġdemocratic":7368,"Ġrebels":7369,"Ġlifetime":7370,"Ġradical":7371,"uan":7372,"Ġtechniques":7373,"ache":7374,"ior":7375,"Ġcamps":7376,"Ġtelephone":7377,"ĠDublin":7378,"ĠBrand":7379,"ĠMarcus":7380,"aun":7381,"ĠRec":7382,"Ġ82":7383,"ban":7384,"Ġsafely":7385,"aku":7386,"aki":7387,"Ġbankruptcy":7388,"FF":7389,"Ġformat":7390,"Ġattached":7391,"ĠFame":7392,"ĠEdward":7393,"Ġmerger":7394,"ĠRepresentatives":7395,"izes":7396,"Ġhidden":7397,"Ġval":7398,"zz":7399,"Ġexcess":7400,"Ġscope":7401,"Ġdivorce":7402,"Ġburn":7403,"Ġrequirement":7404,"BB":7405,"ĠHand":7406,"Ġcons":7407,"Ġrisen":7408,"Ġtwitter":7409,"Ġoffseason":7410,"ĠSometimes":7411,"ĠInf":7412,"ĠAng":7413,"uer":7414,"report":7415,"Ġdreams":7416,"Ġ700":7417,"ips":7418,"ĠDream":7419,"Ġgifts":7420,"Ġsomehow":7421,"ĠTur":7422,"ĠRachel":7423,"can":7424,"Ġlog":7425,"ĠMedicaid":7426,"Ġles":7427,"Ġtired":7428,"ĠArkansas":7429,"Ġliquidity":7430,"ĠPhillips":7431,"ĠBTC":7432,"Ġhide":7433,"Ġpun":7434,"ĠRun":7435,"lyn":7436,"ĠUC":7437,"ĠDesign":7438,"ĠDev":7439,"Ġvaluation":7440,"Ġreveals":7441,"ĠChild":7442,"other":7443,"Ġposed":7444,"lee":7445,"Ġships":7446,"ĠTrue":7447,"Ġdescribes":7448,"Ġrunner":7449,"bro":7450,"Ġankle":7451,"Ġod":7452,"ĠAnnual":7453,"CL":7454,"Ġoverhaul":7455,"ned":7456,"Ġbold":7457,"Ġmo":7458,"ĠFalls":7459,"Ġemployed":7460,"ĠGro":7461,"Ġflash":7462,"ĠTD":7463,"Ġnervous":7464,"Ġintegration":7465,"Ġsmartphones":7466,"Ġmovements":7467,"nie":7468,"ition":7469,"ĠThird":7470,"Ģ":7471,"Ġmetres":7472,"Ġeconomist":7473,"omp":7474,"Ġteens":7475,"Ġeveryday":7476,"Ġinterviewed":7477,"Ġbriefly":7478,"],":7479,"uke":7480,"ĠFOX":7481,"Ġunderlying":7482,"ĠLuc":7483,"Ġcourses":7484,"ss":7485,"amed":7486,"°":7487,"ju":7488,"ĠBanks":7489,"Ġoutfit":7490,"illing":7491,"Ġtrafficking":7492,"Ġurging":7493,"Ġbelt":7494,"Ġrid":7495,"CP":7496,"Ġelderly":7497,"ĠGrowth":7498,"án":7499,"ĠSn":7500,"Ġsurrounded":7501,"Ġsisters":7502,"ĠIslam":7503,"Ġsynd":7504,"ĠCosta":7505,"di":7506,"ĠKl":7507,"Ġmanufacturer":7508,"holders":7509,"Ġelement":7510,"Ġload":7511,"Ġbooked":7512,"Ġaccompanied":7513,"ĠChamber":7514,"Ġbriefing":7515,"Oh":7516,"imi":7517,"ĠDefence":7518,"ĠCurrently":7519,"aking":7520,"Ġhandled":7521,"ĠCD":7522,"ĠBenjamin":7523,"Ġpocket":7524,"ĠKashmir":7525,"Ġlighting":7526,"aps":7527,"Ġ1997":7528,"ech":7529,"Ġaddiction":7530,"Ġbases":7531,"Ġpriorities":7532,"Ġhardly":7533,"ĠQuebec":7534,"ĠEarn":7535,"IES":7536,"ĠZach":7537,"ĠAlong":7538,"MI":7539,"Ġins":7540,"ĠRogers":7541,"ĠKan":7542,"ĠFuture":7543,"Ġtriggered":7544,"ĠUnit":7545,"Ġweighed":7546,"Ġpointing":7547,"Ġchocolate":7548,"ĠBrowns":7549,"ĠISIS":7550,"Ġgoalkeeper":7551,"Ġsaves":7552,"ĠAndre":7553,"burn":7554,"ĠCont":7555,"ĠNetherlands":7556,"Ġpolitically":7557,"ĠAshley":7558,"ĠWhit":7559,"aded":7560,"PH":7561,"Ġborders":7562,"ORE":7563,"Ġally":7564,"Trump":7565,"istan":7566,"ĠHunt":7567,"ĠCancer":7568,"ĠGrace":7569,"ĠTottenham":7570,"Ġ1960":7571,"ĠMarg":7572,"ĠBryan":7573,"ĠAgain":7574,"acing":7575,"Ġarguments":7576,"ĠSouthwest":7577,"Ġvocal":7578,"Ġjudgment":7579,"Ġengaging":7580,"Ġadopt":7581,"Ġrental":7582,"Ġlinebacker":7583,"ĠKardashian":7584,"Ġepisodes":7585,"..":7586,"Ġunt":7587,"Ġvowed":7588,"Ġ79":7589,"ule":7590,"Ġtransit":7591,"Ġoffshore":7592,"Ġsuppliers":7593,"Ġarguing":7594,"Ġsatellite":7595,"ĠLind":7596,"ĠTaliban":7597,"Buy":7598,"ĠCaribbean":7599,"ĠBarry":7600,"Ġauthors":7601,"ĠWolf":7602,"Ġviewing":7603,"ĠCubs":7604,"From":7605,"Ġ%":7606,"Ġcurrencies":7607,"Why":7608,"ĠBroncos":7609,"Ġtrick":7610,"Ġdiesel":7611,"ĠLiberal":7612,"FL":7613,"Ġtopics":7614,"Ġretain":7615,"ĠLiberty":7616,"Ġacquisitions":7617,"ced":7618,"Ġfre":7619,"Ġfleet":7620,"Ġcopper":7621,"ĠPot":7622,"jen":7623,"ĠElliott":7624,"ĠPyongyang":7625,"Ġobject":7626,"ĠUse":7627,"Ġmutual":7628,"MP":7629,"Ġev":7630,"Ġdeny":7631,"ĠEveryone":7632,"lling":7633,"Ġpays":7634,"Ġdrought":7635,"Ġcorn":7636,"Ġworkplace":7637,"rig":7638,"ĠMn":7639,"Ġadvisory":7640,"ĠCat":7641,"Ġchronic":7642,"ĠSteelers":7643,"Ġboxes":7644,"ĠNap":7645,"Ġdemonstrated":7646,"ĠTournament":7647,"Ġsymbol":7648,"ĠAfghan":7649,"ĠTan":7650,"ired":7651,"ĠEv":7652,"ĠConsumer":7653,"Ġmoral":7654,"ĠAdditional":7655,"Ġwebsites":7656,"Ġoccasions":7657,"Ġfate":7658,"Ġpitcher":7659,"Ġtaxpayers":7660,"Ġdeemed":7661,"ĠLibya":7662,"Ġpriced":7663,"Ġdistributed":7664,"ĠForum":7665,"Ġrice":7666,"Ġbloc":7667,"Ġprovisions":7668,"agh":7669,"Ġpen":7670,"Ġattracted":7671,"ĠEdmonton":7672,"Ġthousand":7673,"Ġpainting":7674,"Ġil":7675,"Ġcourtesy":7676,"Ġeliminate":7677,"Ġacc":7678,"Ġmeters":7679,"Ġreflected":7680,"Ġcomponent":7681,"Every":7682,"Ġsells":7683,"Ġfault":7684,"Ġburned":7685,"ĠKirk":7686,"ĠAnna":7687,"Ġappeals":7688,"Ġeggs":7689,"Ġfrequent":7690,"Ġtrigger":7691,"Ġrevised":7692,"ĠAngela":7693,"Ġ81":7694,"Ġsingles":7695,"Ġviral":7696,"Ġworries":7697,"ĠShould":7698,"profit":7699,"Ġraises":7700,"ĠBryant":7701,"ĠProduct":7702,"Ġtenure":7703,"Ġdiabetes":7704,"Ġcolour":7705,"azz":7706,"ĠGirls":7707,"Ġpractical":7708,"Ġblind":7709,"ancing":7710,"pictured":7711,"Ġfinale":7712,"ĠElection":7713,"Ġathletic":7714,"Ġpromoted":7715,"Ġflowers":7716,"Ġtrains":7717,"ario":7718,"Ġsufficient":7719,"IE":7720,"Ġexamples":7721,"Ġshed":7722,"Ġbirds":7723,"Ġchaos":7724,"Ġwound":7725,"Ġrocket":7726,"Ġwet":7727,"Ġsample":7728,"ĠNag":7729,"ĠOliver":7730,"Ġscrutiny":7731,"ĠSeven":7732,"ĠRoman":7733,"ĠFred":7734,"Ġweird":7735,"ĠTam":7736,"ĠSupport":7737,"ĠNathan":7738,"Ġstudying":7739,"Ġintroduction":7740,"Ġtons":7741,"cer":7742,"aus":7743,"ION":7744,"Ġcritic":7745,"ĠAh":7746,"alo":7747,"pur":7748,"Ġstorms":7749,"ĠMission":7750,"Ġcredits":7751,"Ġgrants":7752,"Ġcomp":7753,"Ġhearts":7754,"part":7755,"Ġpin":7756,"Ġsubsequent":7757,"Ġmad":7758,"ĠSacramento":7759,"woman":7760,"from":7761,"Ġoutcomes":7762,"Ġoldest":7763,"Ġdesperate":7764,"ĠTal":7765,"ĠDJ":7766,"ward":7767,"Ġaudiences":7768,"Ġimportantly":7769,"ĠEmily":7770,"sk":7771,"ĠHeat":7772,"ĠType":7773,"ĠPeace":7774,"Ġsuspicious":7775,"aly":7776,"ĠGET":7777,"ĠCAP":7778,"dis":7779,"ĠIraqi":7780,"ĠReed":7781,"Ġstrange":7782,"ĠParent":7783,"900":7784,"Ġglad":7785,"ĠTroy":7786,"ĠShort":7787,"Ġheritage":7788,"Ġarriving":7789,"ingly":7790,"Ġtransformation":7791,"Ġlease":7792,"Ġcollapsed":7793,"cha":7794,"ĠPatrol":7795,"Ġcomputers":7796,"Ġprinciples":7797,"Ġsporting":7798,"ĠHughes":7799,"mile":7800,"ĠCit":7801,"Ġdrilling":7802,"ĠBox":7803,"ÃŁ":7804,"bre":7805,"ĠOverall":7806,"Ġopioid":7807,"Ġdelighted":7808,"Ġhonored":7809,"ĠCold":7810,"Ġunions":7811,"ĠCou":7812,"ĠCircuit":7813,"Ġblast":7814,"sson":7815,"ĠHernandez":7816,"ĠLooking":7817,"Ġlegally":7818,"ĠWalmart":7819,"bridge":7820,"Ġmat":7821,"rad":7822,"ids":7823,"Ġdining":7824,"Ġrebound":7825,"abad":7826,"ĠRom":7827,"Ġimpose":7828,"ĠAlpha":7829,"ĠWeekly":7830,"TER":7831,"ĠJam":7832,"Ġabsolute":7833,"Ġinventory":7834,"ĠBilly":7835,"ĠKaren":7836,"ĠFriends":7837,"ĠCent":7838,"ĠVikings":7839,"ĠMuch":7840,"cell":7841,"ads":7842,"Ġph":7843,"Ġkiller":7844,"ĠMembers":7845,"Ġshooter":7846,"ĠInvestigators":7847,"ĠJoshua":7848,"Ġparticipated":7849,"Ġinnocent":7850,"ĠRichmond":7851,"itor":7852,"ĠDal":7853,"ĠOperator":7854,"Ġmakeup":7855,"Ġconf":7856,"ĠNEWS":7857,"ĠDef":7858,"Ġchase":7859,"ĠCost":7860,"mont":7861,"\":":7862,"Ġarrangements":7863,"stein":7864,"Ġretire":7865,"ĠLuis":7866,"Ġrenewed":7867,"ĠTownship":7868,"Ġchecked":7869,"arts":7870,"ĠCash":7871,"Ġcentres":7872,"chers":7873,"ĠSolutions":7874,"Ġlegend":7875,"ige":7876,"most":7877,"osed":7878,"ĠPor":7879,"Ġpremiere":7880,"FS":7881,"Ġmissiles":7882,"ĠLang":7883,"Ġsing":7884,"best":7885,"Ġtail":7886,"Ġriders":7887,"Picture":7888,"zen":7889,"ĠKent":7890,"Ġtransform":7891,"Ġwildlife":7892,"Ġsmoking":7893,"Ġpreseason":7894,"ĠLucas":7895,"ĠAnne":7896,"owski":7897,"Ġtape":7898,"Ġdisplayed":7899,"Ġforum":7900,"Ġanonymity":7901,"ĠIndianapolis":7902,"hips":7903,"acc":7904,"ĠMoreover":7905,"lers":7906,"area":7907,"ĠIndeed":7908,"Ġconducting":7909,"Ġinfection":7910,"Ġdealt":7911,"OB":7912,"asing":7913,"ĠGaza":7914,"itter":7915,"ĠKa":7916,"Ġhopeful":7917,"ĠSnow":7918,"Ġentitled":7919,"Ġaffecting":7920,"Ġeager":7921,"Ġcircle":7922,"Ġlaugh":7923,"ĠProsecutors":7924,"ĠDur":7925,"Ġbarriers":7926,"ĠPoll":7927,"oun":7928,"ĠPalm":7929,"chi":7930,"Ġsamples":7931,"Ġcompromise":7932,"atter":7933,"Ġenormous":7934,"Ġé":7935,"coming":7936,"ĠPharmaceutical":7937,"Ġrank":7938,"Let":7939,"Ġtransgender":7940,"ĠCloud":7941,"FO":7942,"ĠBor":7943,"Ġbonus":7944,"Ġordinary":7945,"ĠPres":7946,"ĠHIV":7947,"ires":7948,"OSE":7949,"Ġdancing":7950,"ĠHD":7951,"Ġversions":7952,"Ġ88":7953,"rate":7954,"Ġtackles":7955,"Ġknock":7956,"ĠEmma":7957,"Ġmotivated":7958,"ĠBennett":7959,"ĠBurn":7960,"Ġgrid":7961,"Ġembrace":7962,"ĠSpurs":7963,"Ġflows":7964,"ĠGer":7965,"Ġsponsored":7966,"Ġsurvival":7967,"ching":7968,"Ġ1995":7969,"Ġreward":7970,"Ġdepends":7971,"Ġpostseason":7972,"Ġloaded":7973,"Ġneutral":7974,"ĠPop":7975,"BL":7976,"Ġrevolution":7977,"ĠFreedom":7978,"Ġrecovering":7979,"Ġrequiring":7980,"ALL":7981,"ARE":7982,"Ġmini":7983,"lt":7984,"ĠFDA":7985,"Ġcarpet":7986,"ĠPrior":7987,"Ġadmission":7988,"ĠEver":7989,"ĠTribune":7990,"ĠRonaldo":7991,"Ġthick":7992,"Ġlanes":7993,"Ġ84":7994,"ĠMemphis":7995,"Ġopt":7996,"BO":7997,"Ġfaculty":7998,"ĠChad":7999,"ĠSUV":8000,"ĠHen":8001,"Ġeste":8002,"ĠHu":8003,"ĠAgriculture":8004,"store":8005,"ĠDrug":8006,"inter":8007,"Ġ1996":8008,"ident":8009,"Ġbackup":8010,"ĠHonda":8011,"ĠHope":8012,"oes":8013,"ums":8014,"amer":8015,"Ġbreath":8016,"Ġ110":8017,"Ġjoke":8018,"ĠAld":8019,"Ġwondering":8020,"ĠAssad":8021,"ĠRem":8022,"Ġfundraising":8023,"pot":8024,"è":8025,"Ġquestioning":8026,"Ġpent":8027,"ĠMoney":8028,"ĠMedicine":8029,"wick":8030,"ĠKnights":8031,"Ġbatting":8032,"ĠMos":8033,"Ġdesignated":8034,"isse":8035,"Ġspotlight":8036,"Ġlake":8037,"Ġcaution":8038,"Ġinmates":8039,"Ġlap":8040,"CE":8041,"ĠJavascript":8042,"ĠDeutsche":8043,"ĠFargo":8044,"Ġguaranteed":8045,"borough":8046,"Ġfunctions":8047,"ĠElementary":8048,"ĠChuck":8049,"Ġpitched":8050,"ĠKrist":8051,"Ġsteal":8052,"Ġchips":8053,"Ġalarm":8054,"Ġbeloved":8055,"scale":8056,"Ġassaulted":8057,"ĠPentagon":8058,"Ġtemporarily":8059,"Ġ93":8060,"Ġ>":8061,"ĠPortugal":8062,"ti":8063,"HL":8064,"Ġdecreased":8065,"Ġexistence":8066,"Ġisolated":8067,"Ġdeposit":8068,"Ġstudied":8069,"\")":8070,"Ġtrophy":8071,"ĠBrooks":8072,"Ġbattling":8073,"Ġweaker":8074,"ĠPrivate":8075,"ĠAccess":8076,"Ġvirtually":8077,"Ġshortage":8078,"Ġgaining":8079,"Ġbathroom":8080,"TON":8081,"Ġconcerning":8082,"Ġengineer":8083,"Ġbread":8084,"Ġdemonstrate":8085,"ĠDh":8086,"Ġhorses":8087,"Ġintersection":8088,"Ġcolors":8089,"Ġdelegation":8090,"Ġnotable":8091,"Ġwithdrawal":8092,"ĠDennis":8093,"Ġlocally":8094,"Ġcoastal":8095,"Ġcomply":8096,"ĠMoh":8097,"ĠAlbert":8098,"Ġclosest":8099,"ĠCITY":8100,"Ġ83":8101,"Ġcancelled":8102,"ĠðŁ":8103,"Ġsharply":8104,"RS":8105,"Ġproductivity":8106,"Ġbasket":8107,"SS":8108,"Ġadmit":8109,"ool":8110,"ination":8111,"ĠBB":8112,"Ġsur":8113,"ĠSteel":8114,"ĠTed":8115,"ĠPac":8116,"Ġpatterns":8117,"Ġlisting":8118,"Ġreplacing":8119,"ĠPradesh":8120,"Ġroots":8121,"Ġbroker":8122,"ĠWriting":8123,"Ġsued":8124,"Ġorganised":8125,"ĠThanksgiving":8126,"ĠNOT":8127,"Ġjournalism":8128,"uel":8129,"Ġkilometers":8130,"Ġhunt":8131,"berry":8132,"ĠMother":8133,"Ġlegitimate":8134,"Ġinput":8135,"ĠRel":8136,"ĠGuardian":8137,"Ar":8138,"Ġtransported":8139,"Ġbedroom":8140,"ashing":8141,"Ġbats":8142,"Ġcleaning":8143,"Ġwrapped":8144,"Pacific":8145,"Ġfence":8146,"Ġtestified":8147,"Ġ1994":8148,"Ġinterference":8149,"Ġmatching":8150,"Ġexpression":8151,"eta":8152,"ĠSpencer":8153,"Ġstrategist":8154,"who":8155,"Ġvictories":8156,"Ġ2022":8157,"Ġstakes":8158,"Ġbuses":8159,"ĠHousing":8160,"Ġeditorial":8161,"Ġ86":8162,"ĠBishop":8163,"Ġfrustrated":8164,"Ġappearing":8165,"http":8166,"IGHT":8167,"Ġmemo":8168,"Ġinsiders":8169,"Even":8170,"Ġclassroom":8171,"Ġchef":8172,"aining":8173,"].":8174,"ĠMcD":8175,"Ġ87":8176,"ĠPunjab":8177,"Ġancient":8178,"Ġresolved":8179,"Ġdying":8180,"Ġdestruction":8181,"Ġgoverning":8182,"Ġrestructuring":8183,"ĠPick":8184,"Ġmunicipal":8185,"Ġengines":8186,"ĠHudson":8187,"Æ":8188,"Ġrepeal":8189,"standing":8190,"Ġbound":8191,"ĠOS":8192,"ĠCommonwealth":8193,"Ġdescription":8194,"Ġhouseholds":8195,"Ġmal":8196,"Ġstopping":8197,"equ":8198,"Ġregulator":8199,"Ġcontaining":8200,"Ġremoving":8201,"Ġwithdraw":8202,"Ġburied":8203,"Ġlists":8204,"ĠGil":8205,"Ġlowered":8206,"Ġformally":8207,"ĠRound":8208,"asi":8209,"¥":8210,"lett":8211,"Ġprogressive":8212,"ĠFalcons":8213,"ĠRaw":8214,"gun":8215,"Ġcontributing":8216,"Ġhunting":8217,"Ġvalid":8218,"Ġexception":8219,"ĠPlayers":8220,"ĠTra":8221,"Ġracism":8222,"hing":8223,"chen":8224,"Ġdifferently":8225,"Ġchampionships":8226,"ĠEng":8227,"ĠNO":8228,"ĠAuto":8229,"ĠErdogan":8230,"iding":8231,"Ġwarming":8232,"Ġcivilian":8233,"ĠDam":8234,"Ġfantasy":8235,"ĠNav":8236,"itions":8237,"ĠDrew":8238,"ĠNancy":8239,"Ġtrapped":8240,"ĠRussians":8241,"ĠIC":8242,"Ġflexibility":8243,"ular":8244,"Ġviolated":8245,"ipped":8246,"Ġgarage":8247,"ĠDeep":8248,"Ġpraise":8249,"ĠLab":8250,"ĠPlayer":8251,"Ġjudicial":8252,"Ġdonate":8253,"Ġseparated":8254,"Ġreleases":8255,"nik":8256,"Ġexplanation":8257,"aph":8258,"Ġloyal":8259,"Ġstrongest":8260,"ĠShar":8261,"Ġrescued":8262,"Ġambitious":8263,"Ġclimb":8264,"Ġscared":8265,"Ġignored":8266,"cut":8267,"Ġstole":8268,"Ġweakness":8269,"ĠRidge":8270,"oa":8271,"LA":8272,"Ġdep":8273,"ĠPowell":8274,"Do":8275,"Ġprotein":8276,"Ġreiterated":8277,"ĠCox":8278,"aling":8279,"ĠUnlike":8280,"ĠKane":8281,"ĠMcConnell":8282,"Ġshowcase":8283,"Ġuniform":8284,"ower":8285,"Ġdiscover":8286,"stop":8287,"ipper":8288,"Ġtreatments":8289,"Ġgrocery":8290,"Ġsubscribers":8291,"lock":8292,"ple":8293,"Ġflew":8294,"ania":8295,"Ġstepping":8296,"ĠSoviet":8297,"Ġconsultant":8298,"ags":8299,"ĠLim":8300,"Ġ91":8301,"ĠCode":8302,"ports":8303,"box":8304,"Ġlakh":8305,"Ġreminder":8306,"ym":8307,"ĠTravis":8308,"Ġpure":8309,"now":8310,"ĠVR":8311,"Ġachievement":8312,"ĠEmirates":8313,"ĠThunder":8314,"Ġmerely":8315,"ĠCa":8316,"ĠAverage":8317,"ĠDa":8318,"Ġtopped":8319,"ĠCurry":8320,"Ġchemicals":8321,"Ġamendment":8322,"ĠBorder":8323,"ĠBat":8324,"Ġ130":8325,"Ġprogramming":8326,"Ġtele":8327,"ĠKarl":8328,"Ġaveraged":8329,"ĠSpe":8330,"world":8331,"PG":8332,"Ġfights":8333,"ĠPrincess":8334,"ĠCIA":8335,"ĠAbe":8336,"Ġacted":8337,"only":8338,"Ġinsight":8339,"Ġathlete":8340,"ĠTar":8341,"commerce":8342,"Ġaveraging":8343,"cr":8344,"ĠPalestinians":8345,"Well":8346,"Ġbull":8347,"Ġchoosing":8348,"Ġsurely":8349,"ĠSecret":8350,"Ġteammate":8351,"ĠAmendment":8352,"ĠBirmingham":8353,"Ġexcitement":8354,"strong":8355,"ĠSin":8356,"Ġdamages":8357,"rated":8358,"Ġrankings":8359,"Ġconservation":8360,"home":8361,"erm":8362,"ield":8363,"Ġdisorder":8364,"acher":8365,"Ġnaturally":8366,"atur":8367,"Ġpackages":8368,"Ġapproaches":8369,"icks":8370,"ourn":8371,"Ġodd":8372,"Ġshore":8373,"ĠBeing":8374,"Ġmagic":8375,"Ġtourist":8376,"largest":8377,"Ġwhenever":8378,"Ġlenders":8379,"Ġegg":8380,"ĠChair":8381,"Ġlets":8382,"Ġwarnings":8383,"į":8384,"Ġpol":8385,"Ġdrag":8386,"ĠAmb":8387,"ĠCle":8388,"ĠLouisville":8389,"ĠShaw":8390,"lands":8391,"Ġanthem":8392,"ĠTrail":8393,"Ġaccepting":8394,"anger":8395,"good":8396,"ĠBroad":8397,"ĠLebanon":8398,"ĠMillion":8399,"ĠHenderson":8400,"Ġwh":8401,"Ġdust":8402,"Ġ92":8403,"ĠMend":8404,"Ġchecking":8405,"ĠCow":8406,"sized":8407,"Ġautomatic":8408,"Ġcelebrates":8409,"Ġarena":8410,"Ġfinger":8411,"ĠHarvard":8412,"Ġfrustration":8413,"Ġstrict":8414,"Ġpreserve":8415,"Ġsleeping":8416,"Ġconverted":8417,"Ġinsights":8418,"Ġtra":8419,"Ġjailed":8420,"Ġchamber":8421,"Ġtoxic":8422,"ading":8423,"ĠTriple":8424,"grade":8425,"ĠRest":8426,"ĠHoly":8427,"oper":8428,"Ġdesk":8429,"Ġmatchup":8430,"Ġsteep":8431,"ĠGot":8432,"lay":8433,"ĠCab":8434,"aked":8435,"ĠFoster":8436,"Ġrunners":8437,"ĠNA":8438,"Ġdestroy":8439,"Ġsupportive":8440,"ĠRacing":8441,"Ġtrademark":8442,"Ġjacket":8443,"Ġhorror":8444,"ĠAle":8445,"Ġass":8446,"Ġsch":8447,"abb":8448,"Ġplanes":8449,"Ġimpression":8450,"ĠEarly":8451,"ĠPompe":8452,"Ġking":8453,"Ġsilent":8454,"ĠCuba":8455,"Ġmedication":8456,"ences":8457,"list":8458,"ailing":8459,"WA":8460,"ella":8461,"Ġprop":8462,"Ġhalt":8463,"Ġslowing":8464,"ĠFoods":8465,"Ġanonymous":8466,"kh":8467,"Ġtraveled":8468,"Ġcommunicate":8469,"Ġter":8470,"ĠHockey":8471,"ĠRobin":8472,"Ġswept":8473,"Ġclinic":8474,"ration":8475,"len":8476,"Ġau":8477,"Ġcareers":8478,"ĠSound":8479,"Ġaddresses":8480,"China":8481,"ĠSr":8482,"Ġexhibit":8483,"ĠMotors":8484,"ĠIl":8485,"Ġinstall":8486,"ĠOkay":8487,"Ġ>>":8488,"hood":8489,"stand":8490,"Ġaudit":8491,"Ġcake":8492,"Ġflames":8493,"bel":8494,"ĠMust":8495,"ĠManafort":8496,"Ġcommodity":8497,"night":8498,"ĠRoom":8499,"ĠLanka":8500,"Ġcommander":8501,"ln":8502,"Ġdatabase":8503,"ĠSet":8504,"Ġgraduated":8505,"ĠTarget":8506,"Ġoutbreak":8507,"rou":8508,"ĠPope":8509,"ĠEqu":8510,"Ġpolling":8511,"Ġdig":8512,"Ġbrutal":8513,"ĠBarn":8514,"Ġdefinition":8515,"Ġpit":8516,"Ġpickup":8517,"ĠBitcoin":8518,"ĠReid":8519,"Ġloving":8520,"ĠHerald":8521,"ĠCanadians":8522,"Ġneighbor":8523,"Ġdies":8524,"ione":8525,"ĠRef":8526,"big":8527,"Ġguards":8528,"including":8529,"ente":8530,"Ġpartially":8531,"Image":8532,"Ġbulk":8533,"Ġslot":8534,"ĠNorthwest":8535,"ĠBarclays":8536,"Ġairlines":8537,"iver":8538,"isi":8539,"Ġsubsidiary":8540,"Ġcont":8541,"ĠDaniels":8542,"Ġscript":8543,"Ġunfair":8544,"Ġscreens":8545,"Ġprof":8546,"ĠIrma":8547,"Ġ1992":8548,"Ġmandatory":8549,"ĠSant":8550,"Ġsuspicion":8551,"NES":8552,"ĠLauren":8553,"igen":8554,"Ġprevention":8555,"Ġtension":8556,"ema":8557,"Ġtasks":8558,"Ġshake":8559,"Ġexplosive":8560,"Ġaffects":8561,"Ġmum":8562,"ĠDog":8563,"rer":8564,"Ġopted":8565,"Ġtrio":8566,"Ġlesson":8567,"Ġautomotive":8568,"where":8569,"ĠMontgomery":8570,"Ġcouples":8571,"Ġ89":8572,"AF":8573,"Ġinfo":8574,"ĠForm":8575,"Ġspectrum":8576,"Ġbands":8577,"Ġokay":8578,"Ġstroke":8579,"ĠNetanyahu":8580,"Ġwealthy":8581,"ĠAround":8582,"ĠGlenn":8583,"sec":8584,"there":8585,"ickets":8586,"ĠBudget":8587,"ĠBMW":8588,"Ġflagship":8589,"rier":8590,"Ġpodcast":8591,"Ġpursuing":8592,"Ġpos":8593,"ĠIslands":8594,"ĠUrban":8595,"page":8596,"Ġemotions":8597,"ided":8598,"Ġdividends":8599,"Ġboom":8600,"Ġaccusing":8601,"ird":8602,"ĠNam":8603,"ava":8604,"Ġwishes":8605,"ĠNy":8606,"ĠStanford":8607,"Ġcriteria":8608,"ĠJews":8609,"Ġengineers":8610,"Ġaccuracy":8611,"Ġdisplays":8612,"Ġdeserves":8613,"ridge":8614,"omm":8615,"aur":8616,"Ġdramatically":8617,"Ġunity":8618,"speed":8619,"Ġdeclining":8620,"Ġpermits":8621,"ĠKn":8622,"Ġconsulting":8623,"aux":8624,"ATE":8625,"ĠWat":8626,"ĠEditor":8627,"sy":8628,"urn":8629,"ĠUsing":8630,"asc":8631,"ital":8632,"Ġcre":8633,"quality":8634,"Ġce":8635,"Ġenemy":8636,"Ġoffence":8637,"icket":8638,"ĠDick":8639,"ĠTH":8640,"ĠChampionships":8641,"Ġoverwhelming":8642,"rib":8643,"ku":8644,"rap":8645,"Ġhomer":8646,"acion":8647,"member":8648,"erv":8649,"aney":8650,"MB":8651,"eded":8652,"Ġpunishment":8653,"Ġnegotiate":8654,"ĠFile":8655,"stream":8656,"ĠHur":8657,"Ġnose":8658,"ĠFab":8659,"iter":8660,"Ġpainful":8661,"ITY":8662,"eren":8663,"Ġcollecting":8664,"Additional":8665,"Ġentrepreneurs":8666,"bal":8667,"Ġexploring":8668,"Ġguitar":8669,"Ġpartnerships":8670,"Ġfurniture":8671,"Ġauthorized":8672,"Ġeasing":8673,"shirt":8674,"ĠGross":8675,"Ġpolitician":8676,"ĠSimpson":8677,"Ġdrone":8678,"ĠKatie":8679,"Ġprofitability":8680,"ĠNHS":8681,"ĠSierra":8682,"ĠNorway":8683,"ASHINGTON":8684,"ific":8685,"Ġcondemned":8686,"team":8687,"ĠNebraska":8688,"Ġthrilled":8689,"iller":8690,"Ġpatrol":8691,"ĠWR":8692,"orm":8693,"Ġspectacular":8694,"ĠKnight":8695,"ĠTravel":8696,"nam":8697,"Ġmuscle":8698,"ĠRain":8699,"ĠColombia":8700,"Ġnursing":8701,"Ġmigration":8702,"ĠMitch":8703,"Ġreleasing":8704,"ĠBesides":8705,"ĠMul":8706,"Ġheadline":8707,"Ġcontemporary":8708,"Ġdev":8709,"ĠChan":8710,"Ġindicates":8711,"ĠAp":8712,"ĠLt":8713,"ĠMarvel":8714,"Ġremembered":8715,"®":8716,"ĠForces":8717,"ĠColin":8718,"ĠGabriel":8719,"Ġobjects":8720,"ĠRHP":8721,"kar":8722,"ĠKo":8723,"Ġsignals":8724,"Ġinner":8725,"real":8726,"RO":8727,"Ġromantic":8728,"cat":8729,"ĠKel":8730,"Ġgut":8731,"ĠBoys":8732,"Ġyoungest":8733,"ĠCeltics":8734,"Ġslated":8735,"Ġremind":8736,"Ġproductive":8737,"set":8738,"Co":8739,"ĠBailey":8740,"Ġrenewable":8741,"ĠCarson":8742,"ĠDj":8743,"ĠKos":8744,"Ġurge":8745,"Ġfin":8746,"Ġpursuit":8747,"ĠCON":8748,"ĠChapter":8749,"Ġpal":8750,"Ġgate":8751,"ĠPackers":8752,"ĠReports":8753,"ĠRugby":8754,"ĠMasters":8755,"MO":8756,"Ġ98":8757,"Ġcatches":8758,"ĠAgreement":8759,"ĠTillerson":8760,"ĠIce":8761,"Ġrumors":8762,"ĠLeonard":8763,"ĠDolphins":8764,"ĠLP":8765,"top":8766,"ĠCrist":8767,"ĠHon":8768,"Ġblaze":8769,"Ġrhetoric":8770,"ands":8771,"ady":8772,"David":8773,"igh":8774,"Ġbuzz":8775,"ĠStrong":8776,"Ġshocking":8777,"ĠRh":8778,"Ġnegotiating":8779,"Ġtender":8780,"ĠJohnny":8781,"ĠMario":8782,"Ġ97":8783,"ĠHeritage":8784,"Ġexists":8785,"Ġprayers":8786,"Ġlengthy":8787,"Ġsafer":8788,"ĠHalloween":8789,"ĠJared":8790,"ĠConnect":8791,"Ġbump":8792,"Ġstrain":8793,"Ġfilling":8794,"Ġtrauma":8795,"Ġcompleting":8796,"cht":8797,"Ġkillings":8798,"anne":8799,"GE":8800,"ĠRescue":8801,"Ġdealers":8802,"Ġlocals":8803,"ĠVictor":8804,"Ġtragic":8805,"Ġdelivers":8806,"orts":8807,"Ġrugby":8808,"Ġinstallation":8809,"asa":8810,"ĠBart":8811,"Ġjournal":8812,"school":8813,"ĠCome":8814,"ĠVeterans":8815,"Sun":8816,"Ġcrowds":8817,"Ġtransparent":8818,"Ġimplications":8819,"ĠHuawei":8820,"sex":8821,"Ġrallied":8822,"Ġresponses":8823,"Ġdebris":8824,"Ġconvention":8825,"Ġmothers":8826,"BE":8827,"ĠRoute":8828,"Ġrebel":8829,"ĠEmmanuel":8830,"aster":8831,"Ġunderstands":8832,"pound":8833,"ĠCastle":8834,"Ġ2021":8835,"rik":8836,"ĠGR":8837,"Ġconvince":8838,"ault":8839,"Ġpassionate":8840,"ĠSciences":8841,"Ġarrives":8842,"idad":8843,"Ġcelebrities":8844,"ends":8845,"ĠFans":8846,"Ġdish":8847,"ĠCorps":8848,"hat":8849,"Ġemployer":8850,"ĠHy":8851,"Ġpowered":8852,"Ġgrandmother":8853,"ĠFL":8854,"oured":8855,"VE":8856,"ĠInst":8857,"ĠPerez":8858,"Ġtune":8859,"Ġcitizenship":8860,"Ġignore":8861,"Ġdoubles":8862,"IB":8863,"Ġprogrammes":8864,"inda":8865,"Ġentities":8866,"ĠInterior":8867,"Ġprompting":8868,"Ġwire":8869,"Ġtheatre":8870,"%)":8871,"Ġheels":8872,"ĠJu":8873,"Ġdeposits":8874,"Ġtrash":8875,"mond":8876,"she":8877,"iana":8878,"Ġislands":8879,"ĠTommy":8880,"Ġpub":8881,"Ġdiscipline":8882,"ĠSW":8883,"Ġmusicians":8884,"Ġembassy":8885,"ĠQB":8886,"hander":8887,"UES":8888,"ĠFerguson":8889,"Ġblocking":8890,"ahn":8891,"Ġfines":8892,"Ġtactics":8893,"Ġbullet":8894,"Ġequipped":8895,"Ġescaped":8896,"ĠSil":8897,"ĠPack":8898,"ĠAthletic":8899,"ĠMic":8900,"ĠDoes":8901,"ĠCarr":8902,"ĠChargers":8903,"ĠKyl":8904,"Ġzones":8905,"µ":8906,"iki":8907,"Ġgreatly":8908,"ĠMD":8909,"Ġimmigrant":8910,"ĠConstruction":8911,"ĠBorn":8912,"iment":8913,"ĠWade":8914,"Ġvisa":8915,"Ġgenuine":8916,"Ġelectronics":8917,"ĠSat":8918,"Ġsponsors":8919,"ĠMontana":8920,"Ġspell":8921,"ĠSachs":8922,"ĠEt":8923,"Ġfoster":8924,"Ġlocker":8925,"Ġexplaining":8926,"ĠAge":8927,"Ġgunman":8928,"Ġsauce":8929,"Ġcry":8930,"Ġstimulus":8931,"Ġarray":8932,"Ġcompare":8933,"Ġboats":8934,"Ġext":8935,"iders":8936,"ĠAst":8937,"ĠParks":8938,"ester":8939,"Ġ94":8940,"Ġrelating":8941,"Ġvegetables":8942,"Ġaccountable":8943,"Ġhyper":8944,"ĠWim":8945,"Ġnewest":8946,"ĠRome":8947,"ĠChancellor":8948,"CBS":8949,"Ġbusinessman":8950,"ĠDelaware":8951,"Ġlands":8952,"court":8953,"aria":8954,"Ġapproaching":8955,"cker":8956,"ĠSalt":8957,"ĠMak":8958,"Ġtreating":8959,"Ġsubsequently":8960,"ĠEll":8961,"xton":8962,"Ġ180":8963,"Ġdetermination":8964,"ĠSalman":8965,"ĠJoel":8966,"Ġclassified":8967,"Ġspan":8968,"Ġearthquake":8969,"ranked":8970,"Ġ96":8971,"ĠTiger":8972,"Ġadvocacy":8973,"mit":8974,"Ġcolleges":8975,"ĠYeah":8976,"ĠCaptain":8977,"Ġorange":8978,"Ġprojections":8979,"Ġelectrical":8980,"ĠMA":8981,"olog":8982,"ĠNewcastle":8983,"oppers":8984,"Ġrepresentation":8985,"Ġlawsuits":8986,"just":8987,"aced":8988,"ĠRace":8989,"ĠAqu":8990,"ĠBills":8991,"Ġexclusively":8992,"ĠProfile":8993,"Ġhometown":8994,"ĠStan":8995,"Ġstarring":8996,"Ġdeciding":8997,"ĠRating":8998,"ĠMedicare":8999,"ĠTransport":9000,"Ġmystery":9001,"ĠTa":9002,"ĠPad":9003,"ĠSwedish":9004,"ĠCarroll":9005,"about":9006,"Ġtorn":9007,"Ġnurse":9008,"NE":9009,"Ġwaited":9010,"ĠJeffrey":9011,"ĠUntil":9012,"Ġbone":9013,"ĠBobby":9014,"Ġpronounced":9015,"Ġpharmaceutical":9016,"ĠGallery":9017,"ĠMatch":9018,"Ġeconomists":9019,"ĠMarketing":9020,"face":9021,"ĠPetroleum":9022,"ories":9023,"ĠMets":9024,"ĠCore":9025,"billion":9026,"Ġexamination":9027,"ĠPorter":9028,"2016":9029,"Ġgolden":9030,"Ġsem":9031,"ĠDuterte":9032,"ĠJefferson":9033,"ĠTehran":9034,"ĠLeicester":9035,"ĠDA":9036,"Ġadapt":9037,"ĠDame":9038,"ĠRic":9039,"Ġunchanged":9040,"ect":9041,"Ġsections":9042,"kg":9043,"igned":9044,"Ġfilings":9045,"Ġreact":9046,"Ġurgent":9047,"Ġvessels":9048,"Ġspark":9049,"Ġbutter":9050,"ĠCons":9051,"Ġstating":9052,"Ġcorporations":9053,"ĠHus":9054,"Ġdamaging":9055,"raw":9056,"Ġequality":9057,"Two":9058,"ĠMills":9059,"iu":9060,"Ġobligation":9061,"ĠBrook":9062,"arian":9063,"Re":9064,"Ġphotographs":9065,"Ġepic":9066,"ĠStudent":9067,"ĠTherefore":9068,"Ġgod":9069,"ĠFILE":9070,"iqu":9071,"Ġdescribing":9072,"Ġproceed":9073,"Ġcas":9074,"ĠKat":9075,"ĠBra":9076,"Ġadequate":9077,"Ġpassage":9078,"Ġthanked":9079,"USA":9080,"ĠNeither":9081,"ĠLegislature":9082,"Ġfinances":9083,"Ġinst":9084,"ĵ":9085,"ĠAngels":9086,"Ġvet":9087,"ĠDead":9088,"Ex":9089,"Ġkicks":9090,"force":9091,"Ġsoy":9092,"ĠWindsor":9093,"Ġenhanced":9094,"Ġ1993":9095,"ĠCzech":9096,"Ġgradually":9097,"ĠMagic":9098,"Ġshadow":9099,"Ġneighborhoods":9100,"ĠRivers":9101,"Ġrapper":9102,"ĠGirl":9103,"ĠRot":9104,"Ġcrackdown":9105,"fish":9106,"Ġpreventing":9107,"Ġproduces":9108,"ĠMi":9109,"Ġnotified":9110,"Ġunderground":9111,"WE":9112,"Ġadmits":9113,"Ġboxing":9114,"Ġrefer":9115,"Ġcommitments":9116,"ĠWoman":9117,"Ġdenies":9118,"col":9119,"ĠSide":9120,"Ġambulance":9121,"ĠRodgers":9122,"Ġaftermath":9123,"Ġdeck":9124,"irmed":9125,"Ġerrors":9126,"ĠConvention":9127,"Ġcurb":9128,"ĠShop":9129,"ĠThai":9130,"Ġma":9131,"Ġrespected":9132,"ĠMVP":9133,"Ġborrowing":9134,"Ġcruise":9135,"ĠSure":9136,"Ġsentencing":9137,"ĠObamacare":9138,"ĠIr":9139,"ĠSale":9140,"ĠPete":9141,"Ġopenly":9142,"Ġstartup":9143,"rock":9144,"Ġcargo":9145,"Ġtelecom":9146,"ĠDownload":9147,"Ġextending":9148,"ĠCurrent":9149,"Ġcompetitions":9150,"ĠKids":9151,"Ġshy":9152,"ĠKerry":9153,"ĠNever":9154,"ĠDevils":9155,"Ġprim":9156,"Con":9157,"Ġcurve":9158,"Ġassumed":9159,"Ġadjust":9160,"Ġimmune":9161,"UE":9162,"ĠUr":9163,"Ġconventional":9164,"Ġgrandchildren":9165,"ĠBol":9166,"Ad":9167,"ĠMaduro":9168,"fi":9169,"ĠUAE":9170,"ĠOrgan":9171,"Ġindicating":9172,"iem":9173,"ĠAgainst":9174,"ĠAmbassador":9175,"ĠSeoul":9176,"Ġcriminals":9177,"how":9178,"put":9179,"Ġreminded":9180,"Ġparked":9181,"lich":9182,"Ġcontinent":9183,"Ġmatched":9184,"ĠNicole":9185,"Ġgenetic":9186,"Ġhumanity":9187,"ĠTem":9188,"Ġindicator":9189,"Ġvessel":9190,"Ġdefendant":9191,"ĠGriffin":9192,"jan":9193,"Ġvend":9194,"boro":9195,"Ġbrokerage":9196,"ĠFall":9197,"Ġmere":9198,"VILLE":9199,"Ġlasted":9200,"ĠMind":9201,"Ġpatch":9202,"ĠInsider":9203,"ĠComm":9204,"Ġtechnique":9205,"ĠIM":9206,"ĠCavaliers":9207,"Ġshame":9208,"Ġmil":9209,"oot":9210,"irt":9211,"Ġcop":9212,"ĠLeon":9213,"Ġfrozen":9214,"Ġslip":9215,"pton":9216,"Ġpanels":9217,"Ġpitching":9218,"Ġleather":9219,"ĠLogan":9220,"ĠNearly":9221,"urch":9222,"Ġinstructions":9223,"ĠRow":9224,"ĠKurdish":9225,"this":9226,"Ġlegendary":9227,"su":9228,"Ġstabbed":9229,"sters":9230,"Ġteenage":9231,"def":9232,"Ġoversight":9233,"Ġvolatile":9234,"Ġtransmission":9235,"ĠSgt":9236,"ĠIndigenous":9237,"ĠOxford":9238,"ĠCasey":9239,"Ġcor":9240,"Ġsalaries":9241,"Ġsponsor":9242,"Ġprescription":9243,"mat":9244,"ĠLeeds":9245,"ĠPakistani":9246,"Ġevil":9247,"Ġtables":9248,"ĠAbdul":9249,"Ġexpectation":9250,"Ġlegislature":9251,"ĠLin":9252,"¹":9253,"Ġcontractor":9254,"Ġshifting":9255,"Ġgenerous":9256,"ĠEddie":9257,"Ġpuck":9258,"utt":9259,"Ġdubbed":9260,"Ġnowhere":9261,"Ġbetting":9262,"Ġdisclose":9263,"Ĥ":9264,"ĠFashion":9265,"ĠHarper":9266,"handed":9267,"isha":9268,"ĠReds":9269,"Ġachievements":9270,"ume":9271,"Ġshootings":9272,"Ġadvisers":9273,"ĠEaster":9274,"Ġinternationally":9275,"ĠWi":9276,"ĠGandhi":9277,"ĠChristians":9278,"Ġrecruiting":9279,"Ġexperiment":9280,"Ġsol":9281,"Ġdifficulties":9282,"Ġinfluential":9283,"Ġhybrid":9284,"Ġformation":9285,"ĠBoulevard":9286,"Ġflags":9287,"Ġformula":9288,"front":9289,"Ġinclusion":9290,"ĠNone":9291,"ICE":9292,"Ġfilming":9293,"ĠLou":9294,"ĠReynolds":9295,"Ġpump":9296,"Ġexceptional":9297,"ANG":9298,"ĠCorporate":9299,"SAN":9300,"ĠHealthcare":9301,"ĠUkrainian":9302,"aron":9303,"Ġpants":9304,"Ġdrops":9305,"ete":9306,"ĠStudies":9307,"Ġwounds":9308,"END":9309,"Ġshower":9310,"Ġreviewing":9311,"ĠGreater":9312,"Ġ»":9313,"itors":9314,"alled":9315,"Ġsqu":9316,"ĠRonald":9317,"ĠInv":9318,"Ġtougher":9319,"Ġbalanced":9320,"Ġlined":9321,"Ġprinciple":9322,"Ġ1950":9323,"Ġleak":9324,"Be":9325,"Ġcircuit":9326,"Ġunfortunate":9327,"ĠGran":9328,"ĠFish":9329,"Ġfriendship":9330,"asp":9331,"OO":9332,"Ġobligations":9333,"Ġcoup":9334,"OK":9335,"Ġbreakdown":9336,"Ġhook":9337,"Ġresearcher":9338,"inated":9339,"ĠMarie":9340,"ĠGab":9341,"ĠWA":9342,"quez":9343,"General":9344,"ĠSwift":9345,"Ġgust":9346,"ĠCarol":9347,"ĠCentury":9348,"ĠOPEC":9349,"ĠRd":9350,"ĠCop":9351,"Ġsubjects":9352,"ĠComments":9353,"ases":9354,"Ġrelation":9355,"ĠEnvironment":9356,"ı":9357,"Ġgasoline":9358,"ĠLog":9359,"Ġicon":9360,"Ġprofitable":9361,"ĠRetail":9362,"ANC":9363,"Ġappealing":9364,"Ġvillages":9365,"Ġpizza":9366,"Ġmall":9367,"Ġtower":9368,"ĠLinda":9369,"Ġaccomplished":9370,"Ġpod":9371,"Ġleaked":9372,"ĠWed":9373,"Ġmer":9374,"Ġopposing":9375,"!'":9376,"Ġstomach":9377,"Ġrevealing":9378,"Ġho":9379,"DF":9380,"ĠSterling":9381,"Ġsolely":9382,"Ġpres":9383,"ĠCy":9384,"ĠLatest":9385,"ĠPitt":9386,"ĠThink":9387,"Ġcapability":9388,"aled":9389,"Ġexecuted":9390,"alling":9391,"ĠSilva":9392,"Ġrestricted":9393,"Ġdeclaration":9394,"Ġkilometres":9395,"rol":9396,"Ġidentifying":9397,"Ġdonors":9398,"vent":9399,"Ġcostly":9400,"ense":9401,"ĠSeeking":9402,"OURCE":9403,"iving":9404,"Ġplacing":9405,"tech":9406,"Ġbottles":9407,"writer":9408,"ĠSeahawks":9409,"oming":9410,"ĠArthur":9411,"ously":9412,"bin":9413,"ĠVa":9414,"Ġbias":9415,"Ġliability":9416,"ift":9417,"rak":9418,"aves":9419,"Ġcautious":9420,"ĠPrize":9421,"iley":9422,"ĠSharma":9423,"global":9424,"Ġwars":9425,"sm":9426,"ĠRemember":9427,"wind":9428,"ĠRichardson":9429,"ĠSum":9430,"ĠVincent":9431,"ĠRice":9432,"inf":9433,"Ġconsultation":9434,"range":9435,"Ġbacteria":9436,"Ġarchitecture":9437,"Ġpole":9438,"ĠMach":9439,"Ġcattle":9440,"Ġabused":9441,"being":9442,"ĠHERE":9443,"Ġfame":9444,"Ġhearings":9445,"ĠBrit":9446,"Ġjoins":9447,"ĠMcGregor":9448,"Ġoppose":9449,"Ġcheer":9450,"itting":9451,"imes":9452,"Ġusage":9453,"Ġstint":9454,"Ġoutlet":9455,"Ġshoppers":9456,"ĠBaptist":9457,"Ġinappropriate":9458,"ĠALSO":9459,"Ġstealing":9460,"Ġpledge":9461,"ĠRan":9462,"Ġphotographer":9463,"Ġprevented":9464,"Ġ01":9465,"ĠEngineering":9466,"ĠProducts":9467,"Ġuniverse":9468,"ĠMcCarthy":9469,"¿":9470,"graded":9471,"Ġinspection":9472,"Ġind":9473,"Fi":9474,"aren":9475,"Ġprotections":9476,"Ġsorts":9477,"ĠWorks":9478,"Ġbillionaire":9479,"ĠGay":9480,"ĠiPad":9481,"IX":9482,"Ġdefendants":9483,"band":9484,"Ġfarms":9485,"Ġhom":9486,"gal":9487,"iant":9488,"Ġnortheast":9489,"ĠJoint":9490,"Ġcanceled":9491,"Ġtoys":9492,"Ġrein":9493,"ĠTumblr":9494,"pees":9495,"ĠAut":9496,"Police":9497,"Ġaide":9498,"Ġachieving":9499,"Ġmund":9500,"ĠCommercial":9501,"first":9502,"Ġanticipate":9503,"iac":9504,"Ġprobation":9505,"hem":9506,"Ġports":9507,"ĠKer":9508,"Ġsupplier":9509,"ĠFather":9510,"ĠAnti":9511,"ashed":9512,"ĠTable":9513,"bledon":9514,"Ġunf":9515,"ĠRash":9516,"ĠLeBron":9517,"Car":9518,"bu":9519,"ĠDerek":9520,"Ġaccounted":9521,"ĠPri":9522,"nings":9523,"Ġreceives":9524,"lev":9525,"Ġbilateral":9526,"ĠList":9527,"ĠLG":9528,"ĠJazz":9529,"Ġrestored":9530,"Ġbattles":9531,"ials":9532,"Ġoccupied":9533,"Ġrepairs":9534,"Ġradar":9535,"ĠMLB":9536,"ĠNC":9537,"Ġflexible":9538,"ĠCommand":9539,"Ġcoat":9540,"ĠVir":9541,"ĠColts":9542,"ĠBC":9543,"Ġtwin":9544,"Ġprisoners":9545,"Ġslowed":9546,"hop":9547,"ĠInn":9548,"Ġconflicts":9549,"Ġmeasured":9550,"Ġautonomous":9551,"ĠBow":9552,"Ġdisc":9553,"inson":9554,"ĠSche":9555,"aire":9556,"ĠSU":9557,"ĠPeterson":9558,"Ġdrafted":9559,"ĠPelosi":9560,"ĠSoon":9561,"Ġmechanism":9562,"Ġaccountability":9563,"ĠNortheast":9564,"Ġfo":9565,"Ġanalytics":9566,"ĠEverything":9567,"Ġperceived":9568,"bers":9569,"Ġcelebrations":9570,"Ġinstruments":9571,"Ġstrip":9572,"ĠJuventus":9573,"Ġunfortunately":9574,"ĠGA":9575,"Ġwrestling":9576,"Ġstatue":9577,"vis":9578,"five":9579,"Ġmarine":9580,"ĠSamuel":9581,"Ġresponsibilities":9582,"hill":9583,"Ġrecruit":9584,"Ġreferee":9585,"ĠRail":9586,"ĠEagle":9587,"ĠCongressional":9588,"Ġbreathing":9589,"Ġbass":9590,"hit":9591,"Ġspreading":9592,"Ġevacuated":9593,"Ġintellectual":9594,"Ġsovereign":9595,"ocked":9596,"Ġslammed":9597,"Ġformerly":9598,"Ġarch":9599,"Ġdifficulty":9600,"ĠAFC":9601,"ĠFresh":9602,"Ġinvite":9603,"oner":9604,"ĠMich":9605,"Ġpitches":9606,"stock":9607,"Ġinitiated":9608,"ĠKu":9609,"ĠFlorence":9610,"yd":9611,"ĠFast":9612,"Ġmusician":9613,"ĠChile":9614,"anga":9615,"Ġdairy":9616,"Ġcontractors":9617,"ador":9618,"ĠPlanning":9619,"Ġultra":9620,"Ġprayer":9621,"Ġsuggestions":9622,"ĠEk":9623,"Ġrandom":9624,"ĠSullivan":9625,"Ġsensor":9626,"Ġhomicide":9627,"ĠIncome":9628,"Ġsettings":9629,"Ġacknowledge":9630,"ĠStay":9631,"Ġterminal":9632,"Ġ1991":9633,"West":9634,"hard":9635,"arc":9636,"Ġcombine":9637,"Ġprivately":9638,"Ġbarrier":9639,"Ġmedian":9640,"Ġwhereas":9641,"ĠTitans":9642,"Ġincentives":9643,"Ġhistorically":9644,"Ġindictment":9645,"Ġhiding":9646,"ĠPDT":9647,"Ġrebuild":9648,"hol":9649,"Ġpour":9650,"Ġairports":9651,"ĠEdinburgh":9652,"Ġappoint":9653,"ĠJul":9654,"Ġconfusion":9655,"Ġdam":9656,"ork":9657,"Ġcalculated":9658,"Ġhood":9659,"ĠTemple":9660,"ĠYorkshire":9661,"EP":9662,"ented":9663,"Ġapology":9664,"awi":9665,"Ġfacilitate":9666,"ĠSheffield":9667,"Ġrides":9668,"Ġcompelling":9669,"ĠGonzalez":9670,"roll":9671,"ONG":9672,"UP":9673,"ĠAj":9674,"pen":9675,"ĠVar":9676,"ĠIPO":9677,"ĠAnimal":9678,"Ġshifted":9679,"Ġ140":9680,"Ġtobacco":9681,"El":9682,"ild":9683,"Ġuncertain":9684,"Un":9685,"Ġcaps":9686,"Ġrecreational":9687,"ĠTu":9688,"Ġenc":9689,"More":9690,"iko":9691,"ĠEverton":9692,"ĠWalk":9693,"Ġmurdered":9694,"Ġpur":9695,"Ġdivisions":9696,"ivo":9697,"Ġfarming":9698,"Ġcourage":9699,"ped":9700,"Ġcrying":9701,"Ġattributed":9702,"ée":9703,"Ġimplementing":9704,"ĠWang":9705,"Ġspeeds":9706,"alk":9707,"aming":9708,"eries":9709,"Ġavoided":9710,"ĠMessi":9711,"Ġconsiderable":9712,"rt":9713,"Ġinauguration":9714,"ĠPH":9715,"Ġsoldier":9716,"Ġore":9717,"ollywood":9718,"otive":9719,"ĠAuburn":9720,"ĠSav":9721,"ĠPut":9722,"Ġemphasis":9723,"Ġaf":9724,"owed":9725,"Ġdiagnosis":9726,"Ġcart":9727,"Ġassisted":9728,"ĠOrder":9729,"ĠEstate":9730,"Ġintends":9731,"ĠCommon":9732,"Ġadventure":9733,"Ġbeliefs":9734,"Ġlasting":9735,"cel":9736,"Ġdeployment":9737,"tra":9738,"ĠStories":9739,"Ġquote":9740,"Ġfeared":9741,"Ġconvenience":9742,"Ġoptimism":9743,"Ġscientist":9744,"ĠEnterprise":9745,"ĠRex":9746,"ĠFel":9747,"Ġposes":9748,"Ġroot":9749,"Ġevacuation":9750,"Ġpresidents":9751,"ĠRather":9752,"Ġgrave":9753,"ĠHeights":9754,"Ġjumping":9755,"driven":9756,"Ġaluminum":9757,"Ġholders":9758,"Ġboot":9759,"iber":9760,"Ġprecious":9761,"uation":9762,"FP":9763,"uses":9764,"Ġcommentary":9765,"Ġadvances":9766,"ĠNissan":9767,"Ġbronze":9768,"Ġinspire":9769,"Ġstarters":9770,"ĠEvan":9771,"rah":9772,"body":9773,"Ġcrops":9774,"Ġseeds":9775,"Ġharsh":9776,"ĠHomeland":9777,"Ġenabled":9778,"ological":9779,"Ġworkshop":9780,"Ġchains":9781,"amps":9782,"Ġamongst":9783,"ĠBear":9784,"Ġcertified":9785,"ĠJulie":9786,"Ġmountains":9787,"VA":9788,"Ġfed":9789,"Ġbuyer":9790,"ahl":9791,"ĠBos":9792,"ĠCrystal":9793,"Ġquest":9794,"ĠStein":9795,"Ġacceptable":9796,"Ġunbeaten":9797,"iring":9798,"ural":9799,"Ġuncomfortable":9800,"Ġpartial":9801,"Ġsacrifice":9802,"ĠGrande":9803,"Ġarrangement":9804,"Ġpackaging":9805,"screen":9806,"Ġmirror":9807,"Ġsweep":9808,"Ġconnecting":9809,"Ġpanic":9810,"ĠJacksonville":9811,"ĠKremlin":9812,"Ġorigin":9813,"Brien":9814,"Ġnorthwest":9815,"Ġcarriers":9816,"ĠRiley":9817,"Ġaud":9818,"Ġappreciation":9819,"Ġeliminated":9820,"ĠAnalyst":9821,"CR":9822,"Ġfirearm":9823,"Ġaccommodate":9824,"Ġstructural":9825,"Ġappealed":9826,"Ġcharter":9827,"ressing":9828,"Ġalike":9829,"white":9830,"Ġslowdown":9831,"Ġweigh":9832,"ĠPalmer":9833,"ound":9834,"ĠConn":9835,"Ġbranches":9836,"Ġace":9837,"Ġinsists":9838,"yo":9839,"ĠLynn":9840,"ĠCC":9841,"ĠWithin":9842,"Ġcoll":9843,"Ġsustain":9844,"Ġemerge":9845,"ĠBattle":9846,"VER":9847,"Ġaviation":9848,"Ġenables":9849,"ĠProduction":9850,"ĠGrove":9851,"Ġnationally":9852,"ĠBaldwin":9853,"rent":9854,"Ġfirearms":9855,"irm":9856,"Ġconsiders":9857,"ĠCosby":9858,"ĠMcK":9859,"ĠEnt":9860,"Ġincumbent":9861,"iance":9862,"Ġgiants":9863,"Ġkan":9864,"Ġminimal":9865,"ivity":9866,"ĠSay":9867,"ĠNass":9868,"Ġlovely":9869,"ĠFurthermore":9870,"Ġdisplaced":9871,"Ġcontacts":9872,"NY":9873,"Ġtechnological":9874,"ancy":9875,"Ġant":9876,"ope":9877,"ĠFY":9878,"Ġfavorable":9879,"ĠVirgin":9880,"Ġcasual":9881,"ĠLat":9882,"Ġpopulations":9883,"Ġromance":9884,"Ġforgotten":9885,"Ġfleeing":9886,"Ġspecialty":9887,"Ġdrill":9888,"Ġapplying":9889,"Ġcocaine":9890,"rea":9891,"Ġheroin":9892,"Ġsweeping":9893,"ĠMaj":9894,"Ġtroubled":9895,"Ġcolleague":9896,"Ġedged":9897,"omes":9898,"ĠHappy":9899,"´":9900,"Ġmilitant":9901,"boy":9902,"aver":9903,"Yes":9904,"llo":9905,"Ġsupporter":9906,"ĠSubscribe":9907,"ĠBird":9908,"ĠGibson":9909,"Ġhill":9910,"Ġnewspapers":9911,"ĠPHOTO":9912,"Ġouting":9913,"Ġdefine":9914,"Ġann":9915,"Ġrobot":9916,"Ġregret":9917,"ĠCould":9918,"raz":9919,"Ġceiling":9920,"Ġorganizers":9921,"ĠTw":9922,"Ġcriticised":9923,"ĠJoh":9924,"ĠJe":9925,"ĠBulls":9926,"Ġteeth":9927,"ĠRanch":9928,"ĠAndrea":9929,"Ġconservatives":9930,"Ġmag":9931,"vey":9932,"Ġpredecessor":9933,"ĠJPMorgan":9934,"Ġdraws":9935,"umber":9936,"Ġvaccine":9937,"ĠDas":9938,"Ġdisappeared":9939,"ĠIron":9940,"Ġlitigation":9941,"vert":9942,"Ġbelong":9943,"ĠRet":9944,"owers":9945,"rain":9946,"controlled":9947,"ĠKil":9948,"Ġrehab":9949,"ĠAustria":9950,"Ġprivilege":9951,"Ġbounce":9952,"Ġbout":9953,"ĠIslamist":9954,"Ġtaxi":9955,"ody":9956,".'\"":9957,"Ġdos":9958,"shire":9959,"Ġaccidents":9960,"Ġdemonstration":9961,"His":9962,"ĠBO":9963,"ĠICE":9964,"van":9965,"File":9966,"ĠManning":9967,"ounded":9968,"Ġdirections":9969,"lled":9970,"Ġoffences":9971,"Ġlaptop":9972,"ĠUniversal":9973,"Ġmilestone":9974,"ĠNarendra":9975,"Ġnotion":9976,"Ġuns":9977,"ĠLower":9978,"Ġmidfield":9979,"Ġoutper":9980,"trans":9981,"ĠJa":9982,"three":9983,"Adds":9984,"Ġpressures":9985,"Ġprohibited":9986,"Ġutilities":9987,"Ġbes":9988,"ĠReporter":9989,"Ġcommodities":9990,"leton":9991,"Ġslower":9992,"EE":9993,"auer":9994,"Ġtablet":9995,"sl":9996,"iously":9997,"Ġaiming":9998,"eland":9999,"ĠNEXT":10000,"tered":10001,"IVE":10002,"onic":10003,"May":10004,"ĠMilitary":10005,"Mark":10006,"Ġlender":10007,"mate":10008,"Ġaboard":10009,"they":10010,"Ġrespondents":10011,"Ġconversion":10012,"Ġsecuring":10013,"Ġentity":10014,"ĠHarbor":10015,"ĠCu":10016,"Ġcats":10017,"ĠACC":10018,"ĠIbrahim":10019,"GL":10020,"Ġinvitation":10021,"Ġcond":10022,"ĠRecords":10023,"ĠAdrian":10024,"Ġbrave":10025,"Ġmineral":10026,"Ġsooner":10027,"Ġsatisfied":10028,"Ġpets":10029,"Ġnotably":10030,"ı":10031,"Ġmarking":10032,"ĠRO":10033,"ĠHaw":10034,"ĠVis":10035,"Ġmarketplace":10036,"ĠNat":10037,"ĠForward":10038,"ĠLeft":10039,"Ġaggravated":10040,"ĠClose":10041,"acey":10042,"Ġlandmark":10043,"Ġdisruption":10044,"ĠChallenge":10045,"ĠDays":10046,"ĠCoun":10047,"ahan":10048,"Ġaides":10049,"South":10050,"ĠDylan":10051,"ĠRavens":10052,"ĠNature":10053,"lli":10054,"Ġdiplomats":10055,"350":10056,"ĠDrake":10057,"tag":10058,"Ġlicensed":10059,"ĠDenmark":10060,"Ġcancel":10061,"Ġinstant":10062,"DI":10063,"Ġpunch":10064,"ĠJenkins":10065,"Ġstrengthening":10066,"des":10067,"-$":10068,"Ġallegation":10069,"Ġsizes":10070,"iza":10071,"Ġmentally":10072,"ĠResidents":10073,"acked":10074,"Ġsensors":10075,",'\"":10076,"illion":10077,"ĠChampion":10078,"Ġexcessive":10079,"Ġhum":10080,"ĠComp":10081,"rend":10082,"ĠLakes":10083,"Ġburst":10084,"Ġtrainer":10085,"Ġclearing":10086,"ĠSilicon":10087,"Ġ350":10088,"DE":10089,"ĠGates":10090,"ĠHorn":10091,"ests":10092,"ĠCourtesy":10093,"Ġbipartisan":10094,"Ġhabits":10095,"ĠAlexa":10096,"walk":10097,"Ġsnapped":10098,"ĠEight":10099,"itis":10100,"zel":10101,"Ġcustoms":10102,"Ġsouthwest":10103,"Ġvary":10104,"Because":10105,"Ġpayout":10106,"Ġaccelerate":10107,"ĠBarr":10108,"tu":10109,"Ġfined":10110,"cost":10111,"ĠTheater":10112,"ĠCorbyn":10113,"Ġstem":10114,"Ġundermine":10115,".;":10116,"Ġstays":10117,"Ġbreakthrough":10118,"Ġturnover":10119,"hot":10120,"Ġtriumph":10121,"Ġpainted":10122,"ĠWinnipeg":10123,"ĠKas":10124,"ĠStuart":10125,"irk":10126,"Am":10127,"Ġtrusted":10128,"aze":10129,"ĠLate":10130,"Ġaccessories":10131,"Ġmemorable":10132,"ĠFool":10133,"Ġrotation":10134,"ĠBulldogs":10135,"ĠChen":10136,"Ġpoised":10137,"ĠMonte":10138,"ĠClarke":10139,"leading":10140,"Ġvenues":10141,"Ġbeneficial":10142,"ĠLiam":10143,"ĠBrothers":10144,"ĠNeed":10145,"Ġconc":10146,"olly":10147,"ĠJulian":10148,"ogue":10149,"Ġfounding":10150,"Ġsidelines":10151,"Ġdeclare":10152,"ĠMember":10153,"Ġexamine":10154,"abs":10155,"Ġboundaries":10156,"ĠBrisbane":10157,"Ġlaunches":10158,"lor":10159,"ĠGa":10160,"Ġthr":10161,"expected":10162,"wal":10163,"ĠBarnes":10164,"Ġclashes":10165,"content":10166,"ĠClemson":10167,"iger":10168,"Mar":10169,"Ġaccord":10170,"Ġsoutheast":10171,"ģ":10172,"ĠStarbucks":10173,"osing":10174,"Ġseasonal":10175,"icking":10176,"Ġloyalty":10177,"Ġtent":10178,"ĠDy":10179,"Ġevident":10180,"Ġlobby":10181,"Ġtours":10182,"Ġbombing":10183,"uations":10184,"Ġrises":10185,"Ġdemonstrations":10186,"ĠWATCH":10187,"pin":10188,"Ġdeb":10189,"ĠDraft":10190,"rog":10191,"Ġseal":10192,"ĠPerformance":10193,"ĠLGBT":10194,"Ġsed":10195,"Ġgig":10196,"nan":10197,"Ġrainfall":10198,"Ġfabric":10199,"Ġmanages":10200,"Ġlifting":10201,"ĠMagazine":10202,"ĠCriminal":10203,"Ġhikes":10204,"Ġcatching":10205,"Ġ1989":10206,"OG":10207,"Ġdisappointment":10208,"Ġir":10209,"ĠEV":10210,"stown":10211,"pass":10212,"120":10213,"Ġmedals":10214,"ĠSimmons":10215,"Ġinaugural":10216,"ĠCorn":10217,"Ġmotorcycle":10218,"lets":10219,"ĠSkype":10220,"ét":10221,"Ġscary":10222,"opp":10223,"thirds":10224,"ĠMohamed":10225,"Ġteenagers":10226,"ANK":10227,"Ġserver":10228,"Ġouts":10229,"Ġdishes":10230,"four":10231,"dr":10232,"ĠOt":10233,"ĠSandy":10234,"ĠShane":10235,"orters":10236,"SH":10237,"Ġtouching":10238,"ĠNike":10239,"ĠHBO":10240,"driving":10241,"Ġplug":10242,"ĠBaseball":10243,"eling":10244,"hn":10245,"ulate":10246,"eed":10247,"ĠChristine":10248,"ĠGlobe":10249,"Ġethics":10250,"ĠTrevor":10251,"iya":10252,"Ġ360":10253,"Ġawaiting":10254,"Ġcounterpart":10255,"Ġsubsidies":10256,"pointers":10257,"Ġspy":10258,"ILL":10259,"Ġtakeover":10260,"ĠBeyond":10261,"Ġsurprisingly":10262,"TION":10263,"ĠSong":10264,"Ġni":10265,"Ġcommonly":10266,"Ġjack":10267,"Ġsubstitute":10268,"ews":10269,"Ġrecalls":10270,"ĠCommons":10271,"Ġsin":10272,"del":10273,"ĠMod":10274,"Ġpressing":10275,"ĠTelevision":10276,"ĠInside":10277,"ª":10278,"Ġbacklash":10279,"Ġcredible":10280,"ĠJenner":10281,"ĠPu":10282,"ĠStevens":10283,"ĠWE":10284,"Last":10285,"Ġinsurers":10286,"ĠJoin":10287,"bled":10288,"digit":10289,"Ġflooded":10290,"ĠShore":10291,"ĠTrophy":10292,"zing":10293,"ĠImmigration":10294,"Ġsuperior":10295,"IAN":10296,"Ġcasino":10297,"Ġenabling":10298,"Ġmeantime":10299,"Ġperformers":10300,"Ġproportion":10301,"Ġlawmaker":10302,"ĠConf":10303,"Ġconvert":10304,"Ġfarmer":10305,"Ġbu":10306,"ĠGE":10307,"ĠRepresentative":10308,"ĠBannon":10309,"ĠHelp":10310,"PT":10311,"formed":10312,"ĠSuperintendent":10313,"Ġfrustrating":10314,"ĠRegister":10315,"ĠPolitical":10316,"Ġboots":10317,"ĠRu":10318,"ĠSha":10319,"Ġinstrument":10320,"tor":10321,"ĠBelt":10322,"ĠWalsh":10323,"Ġrecipe":10324,"ilt":10325,"ĠClean":10326,"iors":10327,"Ġtwenty":10328,"iler":10329,"nder":10330,"Ġwinger":10331,"Ġwheat":10332,"ĠAviation":10333,"Ġcorrupt":10334,"Ġconnectivity":10335,"ĠVen":10336,"order":10337,"esc":10338,"break":10339,"Ġmetals":10340,"Ġtraditionally":10341,"Ġbell":10342,"Ġviolating":10343,"rough":10344,"Ġintroducing":10345,"Ġguided":10346,"ĠMol":10347,"Ġdesert":10348,"ĠBree":10349,"Le":10350,"ĠZone":10351,"ĠGlass":10352,"ĠEUR":10353,"ĠYahoo":10354,"Ġlaps":10355,"Ġdiffer":10356,"ĠHold":10357,"Ġtimely":10358,"Ġsuccessor":10359,"Ġcomic":10360,"Ġbears":10361,"Ġlicence":10362,"Ġreject":10363,"Ġsophisticated":10364,"Too":10365,"Ġobjectives":10366,"ĠId":10367,"urers":10368,"Ġraid":10369,"COM":10370,"Ġelect":10371,"ĠHampshire":10372,"Ġlens":10373,"Ġdesigners":10374,"Ġpresently":10375,"ĠRCMP":10376,"ĠEgyptian":10377,"ĠWalter":10378,"ĠWallace":10379,"Ġ2025":10380,"utics":10381,"ried":10382,"Ġrefuse":10383,"Ġsiblings":10384,"ĠNothing":10385,"Ġdressing":10386,"Ġnerve":10387,"AST":10388,"Ġuncertainties":10389,"Ġtale":10390,"ĠTalk":10391,"Ġissuing":10392,"shot":10393,"ĠTak":10394,"Ġacid":10395,"ĠNintendo":10396,"Ġwash":10397,"pd":10398,"ĠClaire":10399,"ĠScot":10400,"Ġsuits":10401,"ĠBayern":10402,"gest":10403,"Ġapplicable":10404,"Ġinteraction":10405,"ĠEnforcement":10406,"ĠRohingya":10407,"Ġjan":10408,"Ġunited":10409,"ĠCoalition":10410,"Ġlegislators":10411,"Ġdetectives":10412,"ĠSing":10413,"ĠBetween":10414,"ĠPoly":10415,"pool":10416,"mal":10417,"Ġreply":10418,"Ġschemes":10419,"ĠHolmes":10420,"ĠSenators":10421,"ĠVerizon":10422,"Ġwelcoming":10423,"ĠCricket":10424,"ĠMarco":10425,"ĠYears":10426,"ĠLiving":10427,"Ġcounterparts":10428,"ĠParadise":10429,"ĠTrad":10430,"#":10431,"iw":10432,"ĠSoccer":10433,"umbled":10434,"Ġdeceased":10435,"heim":10436,"Ġevaluation":10437,"Ġwrap":10438,"Ġmild":10439,"aji":10440,"ĠUCLA":10441,"ĠNative":10442,"president":10443,"ĠXbox":10444,"Ġenterprises":10445,"ĠSlam":10446,"oga":10447,"Rock":10448,"piece":10449,"ĠColeman":10450,"Ġcomparable":10451,"uba":10452,"Ġprovinces":10453,"ĠFormula":10454,"ipt":10455,"ô":10456,"Ġtick":10457,"ĠIMF":10458,"anch":10459,"atta":10460,"rew":10461,"However":10462,"LS":10463,"etta":10464,"ĠCustoms":10465,"SU":10466,"Ġpublishing":10467,"Ġinch":10468,"Ġkills":10469,"¤":10470,"ĠSus":10471,"ĠBeth":10472,"Ġsteam":10473,"jpg":10474,"pointer":10475,"Ġturnovers":10476,"Ġpowder":10477,"ĠUSB":10478,"ĠWildlife":10479,"ĠDirect":10480,"atively":10481,"ĠFerrari":10482,"Ġpleasure":10483,"ĠMatthews":10484,"Ġski":10485,"ography":10486,"ĠVermont":10487,"ĠMargaret":10488,"ĠMunich":10489,"Ġlayer":10490,"ĠProperty":10491,"Ġeconomics":10492,"ĠCrew":10493,"UK":10494,"Ġunnecessary":10495,"ĠGlasgow":10496,"Ġsealed":10497,"Ġclarity":10498,"Ġsurplus":10499,"ĠCanyon":10500,"ĠApart":10501,"Ġacceptance":10502,"ĠEllis":10503,"uster":10504,"rid":10505,"ĠHawks":10506,"Ġstatewide":10507,"Ġthreaten":10508,"ĠJail":10509,"Ġinclusive":10510,"Ġmud":10511,"Ġpat":10512,"Ġbitter":10513,"Ġalternatives":10514,"Ġaffiliate":10515,"Ġevaluate":10516,"ĠBaby":10517,"Ġperception":10518,"tim":10519,"Ġrefusing":10520,"Ġgrey":10521,"Ġarguably":10522,"Ġfirmly":10523,"ĠDark":10524,"Ġexcuse":10525,"ĠRaymond":10526,"Ġballots":10527,"inton":10528,"Ġ125":10529,"ĠCatherine":10530,"Ġsacks":10531,"ĠDeb":10532,"Ġworkout":10533,"web":10534,"Ġbatteries":10535,"breaking":10536,"ML":10537,"Ġunacceptable":10538,"ĠValentine":10539,"ĠYOU":10540,"ĠRT":10541,"Ġjurisdiction":10542,"Ġexamined":10543,"strom":10544,"ĠPocket":10545,"Ġcement":10546,"Ġuniversal":10547,"ĠOz":10548,"Ġkit":10549,"Ġchurches":10550,"Ġsuburban":10551,"ĠKushner":10552,"ĠDavidson":10553,"Sports":10554,"email":10555,"Ġrealistic":10556,"Ġintend":10557,"ĠGrey":10558,",''":10559,"Ġscholarship":10560,"Ġphilosophy":10561,"Ġwheels":10562,"Ġmotivation":10563,"eway":10564,"match":10565,"ĠDate":10566,"John":10567,"Ġcontrolling":10568,"750":10569,"aven":10570,"Ġfilmed":10571,"Ġ160":10572,"ĠBrock":10573,"ĠDetails":10574,"Ġlogistics":10575,"Ġassumptions":10576,"ĠStep":10577,"Ġfails":10578,"ĠNotre":10579,"Ġjuice":10580,"Ġcounting":10581,"Ġphotograph":10582,"Ġfortunate":10583,"Ġestablishing":10584,"ĠNJ":10585,"ĠWorkers":10586,"ĠQuinn":10587,"ĠHeather":10588,"Ġtimeline":10589,"Ġimported":10590,"ĠNASCAR":10591,"Ġexercises":10592,"Ġsearched":10593,"ĠRalph":10594,"alf":10595,"Ġgene":10596,"Ġdependent":10597,"én":10598,"iate":10599,"ĠBristol":10600,"Ġhung":10601,"Ġtropical":10602,"Ġintensity":10603,"ĠIdaho":10604,"ĠMull":10605,"Ġsuite":10606,"Ġblockchain":10607,"cz":10608,"ovich":10609,"Ġworn":10610,"ĠLE":10611,"AV":10612,"emi":10613,"Ġidentification":10614,"Ġtunnel":10615,"ĠARE":10616,"ĠArm":10617,"Ġoutrage":10618,"Ġtwist":10619,"uka":10620,"ĠGra":10621,"Ġjets":10622,"ĠThus":10623,"Ġcompound":10624,"Ġfinancially":10625,"2019":10626,"asse":10627,"Ġspare":10628,"ĠNoah":10629,"ĠMade":10630,"ĠMom":10631,"Ġphenomenon":10632,"Ġnurses":10633,"Ġoutlined":10634,"Ġpolit":10635,"ĠCarm":10636,"Ġleagues":10637,"Ġmath":10638,"Ġmodified":10639,"Ġwillingness":10640,"ĠAmanda":10641,"Ġgrandfather":10642,"Of":10643,"DR":10644,"Ġdip":10645,"ĠRAM":10646,"ĠChristie":10647,"Ġargues":10648,"ĠEX":10649,"ĠNine":10650,"ĠScroll":10651,"ĠTHIS":10652,"Pro":10653,"Ġkeys":10654,"Ġprocessor":10655,"Ġscam":10656,"ĠTraining":10657,"Ġhoney":10658,"Ĵ":10659,"Ġfacebook":10660,"ĠLegal":10661,"Ġaging":10662,"Ġspiritual":10663,"ĠHost":10664,"Ġlung":10665,"ĠUSC":10666,"Ġdirt":10667,"Ġfe":10668,"after":10669,"ĠDiana":10670,"Ġounce":10671,"date":10672,"ĠFinals":10673,"Ķ":10674,"Ġthorough":10675,"Ġviable":10676,"Ġanytime":10677,"Ġfost":10678,"orter":10679,"ware":10680,"ĠHolland":10681,"ĠMand":10682,"ĠSend":10683,"2013":10684,"ĠVolkswagen":10685,"Ġsuitable":10686,"ifies":10687,"Ġcomedian":10688,"Ġneighbours":10689,"ĠKnow":10690,"Ġcurious":10691,"ĠTwenty":10692,"ĠPrevention":10693,"ĠStephanie":10694,"Ġpilots":10695,"Ġstored":10696,"Ġdire":10697,"Ġfits":10698,"ision":10699,"ĠShell":10700,"Ġshifts":10701,"Ġpepper":10702,"Ġattendees":10703,"ĠName":10704,"hers":10705,"rip":10706,"Ġwatchdog":10707,"andy":10708,"Ġbio":10709,"Ġpublisher":10710,"powered":10711,"ĠCM":10712,"rian":10713,"ĠRand":10714,"wise":10715,"ĠJesse":10716,"Ġladies":10717,"ĠMetropolitan":10718,"ĠMicro":10719,"Ġkicking":10720,"Ġmeg":10721,"Ġclouds":10722,"Ġtrim":10723,"wear":10724,"ĠML":10725,"Ġconsists":10726,"Ġrig":10727,"Ġhonestly":10728,"GS":10729,"ĠNicholas":10730,"Ġcope":10731,"Ġpublish":10732,"working":10733,"bur":10734,"ĠNar":10735,"olds":10736,"aja":10737,"ĠSad":10738,"Ġclicking":10739,"Ġbids":10740,"ĠZuckerberg":10741,"Ġ900":10742,"Ġexam":10743,"ivers":10744,"Ġpray":10745,"Ġreader":10746,"ĠSeth":10747,"inem":10748,"Ġconfront":10749,"stra":10750,"AW":10751,"ĠGian":10752,"Ġaccordance":10753,"Ġinteract":10754,"ĠSharks":10755,"Ġfireworks":10756,"gment":10757,"illy":10758,"Ġconst":10759,"ARY":10760,"Ġprizes":10761,"Ġshoulders":10762,"Ġaccessed":10763,"Ġecosystem":10764,"Ġlicensing":10765,"La":10766,"Ġdedication":10767,"Ġdé":10768,"Ġyouths":10769,"lem":10770,"Ġtoy":10771,"ĠProm":10772,"ounding":10773,"rod":10774,"Ġ1000":10775,"ishes":10776,"Over":10777,"Ġgaps":10778,"Ġmissions":10779,"Ġrailway":10780,"Day":10781,"orp":10782,"ĠSchumer":10783,"Ġeclipse":10784,"Ġshell":10785,"ĠBY":10786,"Many":10787,"ĠRecord":10788,"Ġdrunk":10789,"ayan":10790,"Ġsuggestion":10791,"Ġdefenders":10792,"ĠNewton":10793,"Ġdisputes":10794,"Ġevolution":10795,"Ġcredibility":10796,"ĠTenn":10797,"Ġplain":10798,"size":10799,"cont":10800,"Ġlone":10801,"Ġfingers":10802,"BUR":10803,"ĠInvestigation":10804,"ĠQualcomm":10805,"var":10806,"Ġcountless":10807,"ĠRebecca":10808,"½":10809,"abi":10810,"Ġreflecting":10811,"ĠTurn":10812,"Ġinteractive":10813,"Ġincentive":10814,"second":10815,"offs":10816,"ĠBerkeley":10817,"ĠTexans":10818,"Ġheated":10819,"Ġscorer":10820,"ĠSharif":10821,"Ġmigrant":10822,"west":10823,"ĠHoliday":10824,"Ġwrist":10825,"Ġchairs":10826,"Ġrecommends":10827,"ĠWildcats":10828,"ĠPed":10829,"ĠQuarter":10830,"ĠIV":10831,"ĠArch":10832,"Ġstandings":10833,"Ġbombs":10834,"Ġcapped":10835,"Can":10836,"Ġcaring":10837,"ĠLah":10838,"lim":10839,"Ġdragged":10840,"ĠBeat":10841,"DB":10842,"Ġaired":10843,"Ġjeans":10844,"action":10845,"Ġgenerating":10846,"ĠGir":10847,"risk":10848,"lon":10849,"stage":10850,"âĤ¬":10851,"earing":10852,"ĠTogether":10853,"Ġreun":10854,"ĠCorey":10855,"ĠBak":10856,"Ġprestigious":10857,"Ġapplicants":10858,"here":10859,"ĠMattis":10860,"Ġridiculous":10861,"ĠLess":10862,"Ġrains":10863,"Ġpresenting":10864,"anti":10865,"Ġdisabilities":10866,"Ġapartments":10867,"storm":10868,"ĠHem":10869,"Ġhabit":10870,"ĠRuth":10871,"ĠNPR":10872,"nut":10873,"Ġappreciated":10874,"Ġseparation":10875,"uda":10876,"Ġminus":10877,"ĠPhotos":10878,"Ġblew":10879,"ĠVoice":10880,"Ġrallies":10881,"Ġfond":10882,"ĠTaking":10883,"yt":10884,"FE":10885,"ĠTory":10886,"ressed":10887,"ĠLy":10888,"Ġrocks":10889,"ĠRah":10890,"Ġelementary":10891,"nis":10892,"ĠPresidential":10893,"Ġnutrition":10894,"Ġbaseman":10895,"Ġsuperstar":10896,"ĠWa":10897,"lar":10898,"Ġstaged":10899,"ĠLearn":10900,"Ġbroadcaster":10901,"Ġboasts":10902,"Ġdoubts":10903,"rum":10904,"Ġbare":10905,"cap":10906,"Ġclimbing":10907,"ĠSelect":10908,"ĠCant":10909,"ĠNord":10910,"ĠBeck":10911,"ĠKad":10912,"ello":10913,"Ġenforce":10914,"ĠZe":10915,"ked":10916,"elly":10917,"ĠLED":10918,"ĠOperations":10919,"ĠLuk":10920,"Ġcertificate":10921,"Ġdeter":10922,"Ġspill":10923,"Ġgrain":10924,"league":10925,"Up":10926,"ĠKid":10927,"using":10928,"ĠJays":10929,"Ġoccasionally":10930,"ĠMI":10931,"yes":10932,"Ġdetect":10933,"Ġpropaganda":10934,"Ġneighboring":10935,"sub":10936,"avan":10937,"ĠAstros":10938,"oti":10939,"threatening":10940,"Ġshorter":10941,"INGS":10942,"Ġfeeding":10943,"Ġelevated":10944,"ĠWenger":10945,"Ġundergo":10946,"Ġpsychological":10947,"Ġautom":10948,"NP":10949,"anks":10950,"ĠNokia":10951,"Ġdrones":10952,"Ġrecognised":10953,"Ġheroes":10954,"agen":10955,"Ġparole":10956,"ĠBah":10957,"Ġhomeowners":10958,"ĠSweet":10959,"Ġinstances":10960,"ĠParish":10961,"ĠSL":10962,"Ġunw":10963,"Ġdelicious":10964,"¯":10965,"ĠInvestments":10966,"ĠPhilippine":10967,"inos":10968,"Ġmes":10969,"Ġbite":10970,"Ġcornerback":10971,"ĠHat":10972,"Ġdeserved":10973,"ologists":10974,"[":10975,"Ġwrongdoing":10976,"ĠTrent":10977,"ĠVe":10978,"ĠDeal":10979,"Mr":10980,"Ġovers":10981,"Ġhonors":10982,"ĠITV":10983,"Ġpayroll":10984,"Ġconfused":10985,"Ġelaborate":10986,"ange":10987,"World":10988,"ĠResort":10989,"ilia":10990,"ĠKr":10991,"Ġconclude":10992,"First":10993,"ĠDR":10994,"Ġpeer":10995,"Ġrunway":10996,"ĠPotter":10997,"cons":10998,"bad":10999,"si":11000,"ĠClimate":11001,"ĠHoll":11002,"Ġweighing":11003,"Ġepidemic":11004,"ĠBible":11005,"Ġhon":11006,"Ġrenew":11007,"Ġgambling":11008,"ĠNationals":11009,"itable":11010,"ĠOutlook":11011,"Ġreactions":11012,"ĠCos":11013,"ĠDana":11014,"India":11015,"ĠAirbus":11016,"power":11017,"watch":11018,"Ġstyles":11019,"Ġordinance":11020,"Ġcam":11021,"Ġinvent":11022,"ĠDurant":11023,"Ġexchanged":11024,"Ġyoga":11025,"ĠMichel":11026,"ĠWyoming":11027,"ĠPhase":11028,"ĠHannah":11029,"Ġtem":11030,"Ġfare":11031,"omer":11032,"Ġtrails":11033,"Ġquietly":11034,"ĠFourth":11035,"Ġwise":11036,"Ġappetite":11037,"Ġpedestrian":11038,"Ġfierce":11039,"hin":11040,"ako":11041,"Ġvacant":11042,"Ġdynamics":11043,"Ġbust":11044,"ĠGT":11045,"century":11046,"Ġpermitted":11047,"Ġfog":11048,"Ġrecruitment":11049,"ĠDue":11050,"Ġbro":11051,"Ġsil":11052,"ĠOpp":11053,"Ġphrase":11054,"ĠChip":11055,"ĠBase":11056,"Ġjazz":11057,"Ġenemies":11058,"Ġremainder":11059,"bles":11060,"Ġ105":11061,"ĠGur":11062,"Ġretiring":11063,"ĠCour":11064,"ĠSi":11065,"Ġinevitable":11066,"ĠAdvisory":11067,"ĠCampaign":11068,"ĠPeninsula":11069,"base":11070,"Ġjustify":11071,"inen":11072,"North":11073,"Ġfreezing":11074,"Ġphotography":11075,"Ġappointments":11076,"ĠTree":11077,"Os":11078,"Ġdivide":11079,"ĠMMA":11080,"Ġdeclines":11081,"ĠAbbott":11082,"ACH":11083,"ĠJah":11084,"Ġspr":11085,"Ġskilled":11086,"ĠTry":11087,"ANT":11088,"ael":11089,"ĠMcN":11090,"Ġtariff":11091,"generation":11092,"ĠMans":11093,"Or":11094,"Ġraped":11095,"Ġdisability":11096,"Ġnominations":11097,"Ġhappiness":11098,"ĠLSU":11099,"ĠInterstate":11100,"ĠDance":11101,"ĠMaking":11102,"Ġbailout":11103,"oro":11104,"ĠObviously":11105,"Ġinbox":11106,"football":11107,"hy":11108,"ĠCase":11109,"Ġentertaining":11110,"Ġhardest":11111,"ĠOpposition":11112,"Ġflip":11113,"ĠPirates":11114,"anu":11115,"ĠKlopp":11116,"Ġballistic":11117,"Ġprinted":11118,"ĠNFC":11119,"UST":11120,"Ġglasses":11121,"Ġrum":11122,"ĠDuncan":11123,"hal":11124,"Ġpreview":11125,"BER":11126,"dec":11127,"Ġsustainability":11128,"Ġaff":11129,"Ġhungry":11130,"service":11131,"avi":11132,"Ġsometime":11133,"Ġmod":11134,"ĠLib":11135,"oko":11136,"Ġfundraiser":11137,"Ġcrowded":11138,"mates":11139,"Ġcreativity":11140,"ĠHell":11141,"Ġtreaty":11142,"ĠSoftware":11143,"ĠRandy":11144,"ĠPolish":11145,"sa":11146,"ardi":11147,"Ġcab":11148,"ĠCamera":11149,"Ġlicenses":11150,"Ġ1988":11151,"Ġcontinuous":11152,"Ġpaired":11153,"Ġtally":11154,"Ġgrip":11155,"cho":11156,"Ġsurged":11157,"Ġpodium":11158,"Ġcontrary":11159,"SL":11160,"ĠResearchers":11161,"cing":11162,"Ġmi":11163,"Ġdisputed":11164,"Ġgrades":11165,"Ġseverely":11166,"ĠMcL":11167,"ondo":11168,"Ġshelters":11169,"Ġdomain":11170,"ĠSwitch":11171,"Ġtestify":11172,"case":11173,"omet":11174,"atch":11175,"ĠAff":11176,"Ġcasting":11177,"berger":11178,"Ġintimate":11179,"erc":11180,"plan":11181,"ĠPast":11182,"ĠUt":11183,"Ġapologized":11184,"ĠDet":11185,"alle":11186,"Ġwhilst":11187,"Ġpel":11188,"Ġexecute":11189,"Ġharmful":11190,"ĠRB":11191,"onda":11192,"ĠFul":11193,"II":11194,"Those":11195,"Ġcryptocurrency":11196,"Ġrealise":11197,"ĠAthens":11198,"ĠApplication":11199,"ORD":11200,"Ġmidst":11201,"ĠSem":11202,"Ġmessaging":11203,"Ġcousin":11204,"ĠMarsh":11205,"ĠAlmost":11206,"uto":11207,"wire":11208,"ĠManaging":11209,"Ġsends":11210,"ĠDerby":11211,"Ġpad":11212,"Ġdevoted":11213,"ĠWorking":11214,"ĠWestminster":11215,"Ġdirty":11216,"ements":11217,"ĠLew":11218,"door":11219,"Ġadvisor":11220,"ival":11221,"Ġsubscribe":11222,"Ġcredited":11223,"Ġpressed":11224,"Ġbrick":11225,"Ġrehabilitation":11226,"Ġ\"[":11227,"erry":11228,"Ġtransformed":11229,"arp":11230,"Ġreceivers":11231,"ĠFan":11232,"ĠKris":11233,"ĠCharlottesville":11234,"Ġste":11235,"Ġconstructed":11236,"Ġbroadly":11237,"ĠBetter":11238,"ĠJanet":11239,"Ġenthusiasm":11240,"ĠIrving":11241,"ĠConst":11242,"Everyone":11243,"agn":11244,"ĠCrawford":11245,"Ġregards":11246,"ĠBurns":11247,"Ġjokes":11248,"erg":11249,"ARD":11250,"apped":11251,"Ġtravelled":11252,"ĠPoor":11253,"ĠHolly":11254,"Ġcontainer":11255,"Ġinfected":11256,"Ġlean":11257,"ĠWould":11258,"Ġmagnitude":11259,"ĠDou":11260,"minded":11261,"Ġpastor":11262,"Ġwherever":11263,"ulation":11264,"Ġ1986":11265,"ĠMegan":11266,"Ġgraphic":11267,"Ġtalents":11268,"Ġkn":11269,"ĠEC":11270,"ĠMcM":11271,"ĠKon":11272,"eni":11273,"ĠEsc":11274,"inas":11275,"ĠNom":11276,"Ġchasing":11277,"arl":11278,"ĠHungary":11279,"Ġmainland":11280,"ĠDist":11281,"utes":11282,"Ġrubber":11283,"iat":11284,"ĠMorrison":11285,"ushing":11286,"iny":11287,"Ġcopies":11288,"ĠFat":11289,"agged":11290,"Ġfloating":11291,"ĠCurtis":11292,"Ġfatally":11293,"ĠManuel":11294,"Ġgraduates":11295,"nar":11296,"ĠKenny":11297,"Ġretreat":11298,"Ġretro":11299,"ĠPierre":11300,"listed":11301,"ĠDale":11302,"ding":11303,"Ġintentions":11304,"Ġsentences":11305,"ĠSere":11306,"Ġinvasion":11307,"Ġpremiums":11308,"ĠGardner":11309,"Ġshipments":11310,"Ġcol":11311,"bell":11312,"ilo":11313,"Ġworthy":11314,"Ġinterceptions":11315,"Ġcomplain":11316,"icle":11317,"ĠTah":11318,"ĠMt":11319,"ĠSyracuse":11320,"Since":11321,"aches":11322,"ĠCand":11323,"Ġinteractions":11324,"ĠShawn":11325,"nc":11326,"Ġtheaters":11327,"ART":11328,"Th":11329,"Ġalter":11330,"aley":11331,"imo":11332,"Ġresponders":11333,"kan":11334,"ĠDarren":11335,"Ġdeliveries":11336,"PI":11337,"125":11338,"Ġlaughing":11339,"ĠPatterson":11340,"Ġinfections":11341,"Ġtur":11342,"130":11343,"Ġhackers":11344,"Ġwarn":11345,"Ġfreeze":11346,"Ġscreaming":11347,"ĠEcho":11348,"ĠDom":11349,"MAN":11350,"ĠJoy":11351,"Ġbeneath":11352,"ĠHalf":11353,"Ġpatent":11354,"Ġugly":11355,"Ġlip":11356,"Ġnominees":11357,"ĠGrade":11358,"Ġinfluenced":11359,"Ġabilities":11360,"Ġlimiting":11361,"Ġsmell":11362,"Ġesc":11363,"ĠBernard":11364,"cs":11365,"ĠMyers":11366,"oted":11367,"Black":11368,"Ġlim":11369,"Ġsworn":11370,"ĠBlair":11371,"anes":11372,"ĠEvent":11373,"Ġmature":11374,"Ġpositioned":11375,"Ġerupted":11376,"grand":11377,"ĠTell":11378,"Ġbackdrop":11379,"Ġyeah":11380,"ĠClear":11381,"Ġsignificance":11382,"Ġpatience":11383,"ĠWing":11384,"Ġhorrible":11385,"Ġdeploy":11386,"ipe":11387,"Ġbitcoin":11388,"Ġcommitting":11389,"Ġdismiss":11390,"ĠBlood":11391,"ĠMeyer":11392,"selling":11393,"Ġregarded":11394,"Ġlottery":11395,"ĠLuther":11396,"Ġpipe":11397,"Ġcro":11398,"ĠANC":11399,"ĠSolar":11400,"Ġsimilarly":11401,"Ġham":11402,"ĠHonor":11403,"tar":11404,"gin":11405,"ĠArmstrong":11406,"Ġbrowser":11407,"agon":11408,"via":11409,"Ġentries":11410,"Ġinfl":11411,"Ġgraduation":11412,"Ġalleges":11413,"ĠLoading":11414,"Ġsuperb":11415,"ially":11416,"Ġadministrator":11417,"uls":11418,"Ġartistic":11419,"ĠANGEL":11420,"ĠBang":11421,"Ġfossil":11422,"¨":11423,"Ġpoly":11424,"ĠGuardiola":11425,"ĠPerth":11426,"Ġeducate":11427,"Cl":11428,"Ġcommittees":11429,"Ġforthcoming":11430,"Ġadjustments":11431,"count":11432,"Ġincoming":11433,"brook":11434,"ĠMinneapolis":11435,"Ġgown":11436,"ĠCroatia":11437,"host":11438,"Ġcompetitor":11439,"Ġlyrics":11440,"Ġbelonging":11441,"ĠFrances":11442,"ĠHaley":11443,"ĠBruins":11444,"Ġmask":11445,"ĠPv":11446,"dollar":11447,"Ġbowling":11448,"Ġjewelry":11449,"ĠJulia":11450,"Ġbroadband":11451,"ĠBhar":11452,"ĠArmed":11453,"vy":11454,"government":11455,"kov":11456,"Ġpremises":11457,"Ġjersey":11458,"Ġapplies":11459,"ĠFreeman":11460,"Ġgrows":11461,"ĠEquity":11462,"Ġmaterially":11463,"Ġfigured":11464,"ience":11465,"Ġmajors":11466,"ĠYe":11467,"ĠHey":11468,"oned":11469,"aping":11470,"Ġtoilet":11471,"ĠConnor":11472,"Ġavoiding":11473,"pos":11474,"Once":11475,"ĠRockets":11476,"ĠSnapchat":11477,"Go":11478,"Ġsolidarity":11479,"ĠAffordable":11480,"Ġdial":11481,"ĠOmar":11482,"xt":11483,"ĠVatican":11484,"anta":11485,"ĠSuperior":11486,"Ġbeaches":11487,"ĠKi":11488,"Ã¥":11489,"KY":11490,"Ġgro":11491,"ĠEmpire":11492,"Ġoccurs":11493,"Ġjoked":11494,"Ġquotes":11495,"ĠSaskatchewan":11496,"pert":11497,"Ġmaintains":11498,"olt":11499,"Ġupgrades":11500,"ĠCho":11501,"ĠAlexis":11502,"ĠHundreds":11503,"ĠBud":11504,"Ġcenturies":11505,"ĠInvestor":11506,"ĠGomez":11507,"Ġconceded":11508,"Ġexpressing":11509,"ĠIBM":11510,"Ġadvancing":11511,"ĠDollar":11512,"jer":11513,"Ġexceed":11514,"author":11515,"rist":11516,"seat":11517,"ĠPrimary":11518,"ĠForbes":11519,"ĠAlzheimer":11520,"Ġdevastated":11521,"Ġawful":11522,"ĠStudio":11523,"Ġbullpen":11524,"Ġmobility":11525,"Ġanalyze":11526,"lie":11527,"AFP":11528,"iche":11529,"ĠRoyals":11530,"Ġcoupled":11531,"Ġdug":11532,"ĠRing":11533,"Ġenvironments":11534,"national":11535,"ĠCongo":11536,"Ġalleging":11537,"wn":11538,"ulating":11539,"Ġur":11540,"Ġreaches":11541,"ĠPine":11542,"Ġthreshold":11543,"Ġtournaments":11544,"Ġheating":11545,"ĠGard":11546,"ĠHamas":11547,"Ġ«":11548,"ĠHolding":11549,"Ġpossibilities":11550,"ĠHassan":11551,"ĠMohammad":11552,"Ġoffenders":11553,"Ġautomated":11554,"Ġrealised":11555,"ouse":11556,"building":11557,"ĠDub":11558,"ĠGeneva":11559,"Ġfacial":11560,"ĠRestaurant":11561,"ĠNg":11562,"Ġtot":11563,"Ġgrace":11564,"ĠCP":11565,"Ġposter":11566,"hart":11567,"ĠNi":11568,"Ġreaff":11569,"Ġprov":11570,"Ġ111":11571,"ĠAid":11572,"Ġscrap":11573,"izers":11574,"ogen":11575,"Ġtissue":11576,"Ġvibrant":11577,"Ġrider":11578,"CD":11579,"ĠKitchen":11580,"Ġgenre":11581,"¬":11582,"depth":11583,"kind":11584,"Ġendorsed":11585,"Ġsimultaneously":11586,"Ġintern":11587,"ĠDrag":11588,"Ġembraced":11589,"Ġcounted":11590,"uj":11591,"ĠOg":11592,"Ġphysician":11593,"ĠIR":11594,"IST":11595,"ĠKir":11596,"Ġhacking":11597,"ĠSources":11598,"astic":11599,"growing":11600,"ĠWake":11601,"Ġhint":11602,"Ġcompiled":11603,"Ġreign":11604,"Ġcinema":11605,"Ġboosting":11606,"Ġaccommodation":11607,"ĠEuropa":11608,"Ġsubsidiaries":11609,"Ġclosures":11610,"ĠBil":11611,"ĠBou":11612,"wh":11613,"ĠAw":11614,"FT":11615,"hole":11616,"ĠNova":11617,"ĠNSW":11618,"Ġrap":11619,"Ġencourages":11620,"GR":11621,"ds":11622,"ĠMuk":11623,"ĠSurvey":11624,"ĠReagan":11625,"oning":11626,"Ġneighbouring":11627,"ĠMcCl":11628,"acht":11629,"Ġfinishes":11630,"ĠEsp":11631,"pat":11632,"Ġdestinations":11633,"ĠWagner":11634,"Ġconfronted":11635,"square":11636,"Ġpie":11637,"brand":11638,"hl":11639,"Ġabsent":11640,"Ġsurf":11641,"Ġrifle":11642,"ĠSS":11643,"ĠDeath":11644,"wich":11645,"Ġbeds":11646,"ĠLock":11647,"ĠAgu":11648,"atives":11649,"jee":11650,"Ġoral":11651,"Ġbudgets":11652,"Ġinspiring":11653,"IONS":11654,"works":11655,"Ġspirits":11656,"Ġcabin":11657,"Ġsatisfaction":11658,"Ġvoluntary":11659,"ĠMunicipal":11660,"Ġdeportation":11661,"ĠWriter":11662,"ĠVI":11663,"VERTISEMENT":11664,"/.":11665,"ĠSouthampton":11666,"aces":11667,"ĠHelen":11668,"ĠHum":11669,"110":11670,"Ġgarbage":11671,"through":11672,"Ġkingdom":11673,"MT":11674,"augh":11675,"Ġbizarre":11676,"ĠStarting":11677,"Ġwooden":11678,"ĠProgress":11679,"iron":11680,"sten":11681,"ĠSergio":11682,"ĠHR":11683,"Ġturnout":11684,"ĠAmericas":11685,"ĠSara":11686,"Ġagrees":11687,"apper":11688,"Ġbra":11689,"Ġrecycling":11690,"oom":11691,"Ġflee":11692,"Ġdistinct":11693,"IAL":11694,"aha":11695,"Ġfever":11696,"ĠPartnership":11697,"ĠYu":11698,"ĠPixel":11699,"ĠBlock":11700,"ĠMelissa":11701,"igg":11702,"Ġdecides":11703,"ĠNorman":11704,"Ġmas":11705,"held":11706,"ĠPD":11707,"Ġsheer":11708,"ĠDim":11709,"ĠCass":11710,"Ġcolumnist":11711,"ĠBros":11712,"Ġturnaround":11713,"ĠValue":11714,"ĠBachelor":11715,"awn":11716,"Ġassignment":11717,"ested":11718,"ĠJudiciary":11719,"Ġdiamond":11720,"Ġmus":11721,"Ġindigenous":11722,"lines":11723,"Ġ1984":11724,"igroup":11725,"ict":11726,"ĠJaguars":11727,"Ġlun":11728,"Ġprofiles":11729,"Ġcomputing":11730,"ĠBelgian":11731,"ĠLloyd":11732,"ĠGoing":11733,"Ġdisp":11734,"Ġ1987":11735,"eder":11736,"ĠVin":11737,"Ġgovern":11738,"Ġblend":11739,"ĠSebastian":11740,"ĠMidwest":11741,"iga":11742,"Ġspl":11743,"Ġtopping":11744,"Ġnetworking":11745,"ĠEmer":11746,"Ġoxygen":11747,"ĠInterest":11748,"ĠMoy":11749,"Ġtrader":11750,"Ġbay":11751,"Ġsticking":11752,"ĠMovement":11753,"Ġbidding":11754,"tax":11755,"Ġacademy":11756,"ĠMO":11757,"ĠSpirit":11758,"Ġhealing":11759,"wen":11760,"ĠPrix":11761,"cal":11762,"ĠOperating":11763,"Ġinstantly":11764,"ĠTonight":11765,"Ġsacked":11766,"Ġautomation":11767,"umps":11768,"ĠNey":11769,"March":11770,"ĠBuck":11771,"Ġconcentration":11772,"Here":11773,"Ġtravelers":11774,"Ġprotective":11775,"ĠMoody":11776,"Ġentrepreneur":11777,"Ġfac":11778,"kowski":11779,"Ġpreparations":11780,"Ġdominate":11781,"Ġspray":11782,"Ġdisturbing":11783,"ĠFraser":11784,"ĠCody":11785,"ashi":11786,"ĠPel":11787,"Ġrisky":11788,"Ġawkward":11789,"ĠVA":11790,"ails":11791,"Ġangle":11792,"Ġundergoing":11793,"Ġalbums":11794,"Ġafterwards":11795,"ĠNaw":11796,"uge":11797,"enter":11798,"ĠSussex":11799,"ĠRecently":11800,"Ġlikelihood":11801,"large":11802,"Ġsnaps":11803,"ibr":11804,"ĠMalcolm":11805,"Ġcru":11806,"Ġaltogether":11807,"Ġsetup":11808,"Ġtorture":11809,"Ġfiber":11810,"Ġquarterbacks":11811,"ĠGetting":11812,"ipping":11813,"ĠNorwegian":11814,"ĠMiles":11815,"ĠArnold":11816,"ĠDisease":11817,"Ġtends":11818,"ife":11819,"ĠCaroline":11820,"Ġnavigate":11821,"Ġbrush":11822,"ĠAssociates":11823,"Ġbath":11824,"ĠCenters":11825,"ĠMC":11826,"Ġtaxpayer":11827,"comp":11828,"Ġaccomplish":11829,"ĠTraffic":11830,"ĠBru":11831,"Ġgreenhouse":11832,"ĠMalaysian":11833,"ĠPur":11834,"ased":11835,"ĠKnicks":11836,"aters":11837,"Ġalt":11838,"ICK":11839,"Ġcalculations":11840,"Ġmindset":11841,"unch":11842,"Ġgu":11843,"Ġsteadily":11844,"Ġfiction":11845,"ĠPap":11846,"forming":11847,"ĠActor":11848,"ĠBerry":11849,"imp":11850,"ĠUpper":11851,"Ġassessed":11852,"Ġlawn":11853,"ĠRoh":11854,"Ġclearance":11855,"funded":11856,"Ġpret":11857,"ĠHom":11858,"VS":11859,"ĠTourism":11860,"ĠRy":11861,"ĠGonz":11862,"ĠStudios":11863,"Ġanchor":11864,"Ġrecognise":11865,"Ġcooperate":11866,"enny":11867,"aza":11868,"ĠMeet":11869,"Ġeventual":11870,"SW":11871,"ĠCounsel":11872,"ĠSave":11873,"Ġlucrative":11874,"Ġslim":11875,"ĠGreens":11876,"Ġchemistry":11877,"ĠSheikh":11878,"Ġbridges":11879,"business":11880,"ĠSaf":11881,"ĠGy":11882,"Ġprotocol":11883,"Ġnephew":11884,"ĠBrands":11885,"ĠCulture":11886,"orship":11887,"Ġ(£":11888,"ĠDell":11889,"astics":11890,"Ġproving":11891,"ĠMann":11892,"aca":11893,"Ġindoor":11894,"ĠUganda":11895,"ĠRomney":11896,"ĠStage":11897,"Ġward":11898,"ĠAmber":11899,"haw":11900,"Ġtw":11901,"Ġbullying":11902,"ĠCAR":11903,"Ġassociates":11904,"ĠHopkins":11905,"Ġsuburb":11906,"Ġaggressively":11907,"Ġpostponed":11908,"Ġbas":11909,"Ġburglary":11910,"ĠFound":11911,"Ġfloors":11912,"Any":11913,"Ġjam":11914,"Ġvisibility":11915,"Ġbenefited":11916,"ĠAud":11917,"aying":11918,"iku":11919,"ĠPas":11920,"ĠGPS":11921,"ĠOwens":11922,"Ġreluctant":11923,"ĠOlivia":11924,"ols":11925,"Ġemotion":11926,"ĠHeavy":11927,"Ġhostile":11928,"Ġfavorites":11929,"Ġfeat":11930,"ĠCord":11931,"ĠGO":11932,"Ġindicted":11933,"idal":11934,"ĠIL":11935,"Ħ":11936,"acer":11937,"ICH":11938,"oda":11939,"Ġrecipients":11940,"Ġtribal":11941,"Ġresist":11942,"ĠCritics":11943,"Ġsang":11944,"ĠMath":11945,"ĠBrighton":11946,"ĠKw":11947,"Ġlimitations":11948,"Ġinterception":11949,"onde":11950,"ĠRobertson":11951,"Ġenjoys":11952,"site":11953,"Ġwings":11954,"ĠCeltic":11955,"Ġrelaxed":11956,"Share":11957,"Ġwarrants":11958,"oco":11959,"Ġcritically":11960,"GC":11961,"Ġcute":11962,"Ġlaying":11963,"itude":11964,"ĠMediterranean":11965,"Ġwatches":11966,"Ġdisagree":11967,"ĠReturn":11968,"ARC":11969,"people":11970,"Ġtwelve":11971,"Ġoverdose":11972,"ĠLot":11973,"ĠFROM":11974,"ĠPeters":11975,"Ġadministrators":11976,"Ġslam":11977,"jar":11978,"OH":11979,"ĠInitiative":11980,"Ġteamed":11981,"ĠMajority":11982,"June":11983,"ĠPlaza":11984,"lake":11985,"Ġglimpse":11986,"Ġrings":11987,"Ġos":11988,"Ġmentor":11989,"have":11990,"Ġlanguages":11991,"Ġuncle":11992,"agu":11993,"ĠWine":11994,"ĠCategory":11995,"ĠIng":11996,"Ġcontests":11997,"ĠRosen":11998,"ĠWhatever":11999,"Ġdenying":12000,"ean":12001,"Ġspec":12002,"Ġgrad":12003,"Ġtenants":12004,"show":12005,"ĠGregory":12006,"Ġcontention":12007,"Ġunanimously":12008,"ĠPin":12009,"fa":12010,"ĠPink":12011,"Ġswitched":12012,"acre":12013,"ĠTrading":12014,"VP":12015,"ĠMaple":12016,"Neill":12017,"Ġdiscounts":12018,"alls":12019,"Ġsounded":12020,"Ġrumours":12021,"ĠCre":12022,"hall":12023,"ĠTele":12024,"Ġthankful":12025,"Ġsurveyed":12026,"UB":12027,"Ġdignity":12028,"Ġnod":12029,"Ġmisleading":12030,"ĠTX":12031,"ĠBurke":12032,"Ġmounting":12033,"Ġskies":12034,"Ġbesides":12035,"ĠGarrett":12036,"tha":12037,"Ġintelligent":12038,"Ġtanks":12039,"apping":12040,"ĠRat":12041,"aint":12042,"Ġentertain":12043,"ĠAbdullah":12044,"Ġsink":12045,"ĠLan":12046,"ĠManufacturing":12047,"NFL":12048,"Ġthemes":12049,"ĠHaven":12050,"ĠDavies":12051,"ĠKerr":12052,"ĠLen":12053,"Ġcourtroom":12054,"Ġfailures":12055,"Ġlately":12056,"ĠElectronics":12057,"Ġgorgeous":12058,"Ġnotification":12059,"Ġ2030":12060,"aved":12061,"Ġdeer":12062,"economic":12063,"ĠStatistics":12064,"Ġconfrontation":12065,"Ġgovernors":12066,"ĠHaram":12067,"ĠLGBTQ":12068,"Ġprocessed":12069,"ĠDuchess":12070,"Ġdowns":12071,"Ġpork":12072,"Ġhumor":12073,"ocese":12074,"Ġneeding":12075,"Ġmidterm":12076,"ĠOval":12077,"Ġcorners":12078,"Ġtablets":12079,"eds":12080,"vere":12081,"Ġattacker":12082,"Paul":12083,"pee":12084,"ĠAlice":12085,"Ġrenowned":12086,"Ġ09":12087,"ocking":12088,"Ġcreditors":12089,"ĠPedro":12090,"ĠPhone":12091,"Ġsurveys":12092,"ĠWelsh":12093,"Ġcow":12094,"Ġbuilds":12095,"Ġ000":12096,"ĠAzerbaijan":12097,"ĠYad":12098,"Ġinfant":12099,"Ġmotorists":12100,"Ġpoorly":12101,"Ġmedications":12102,"Ġstupid":12103,"ĠCastro":12104,"user":12105,"antly":12106,"alty":12107,"ĠCond":12108,"issa":12109,"ĠIvan":12110,"Ġcostume":12111,"Ġ08":12112,"Ġhence":12113,"Ġdangers":12114,"Ġbullish":12115,"Life":12116,"Ġflavor":12117,"ĠCharleston":12118,"Ġbikes":12119,"Ġworkshops":12120,"Ġarranged":12121,"Ġcontender":12122,"Ġsequel":12123,"ĠPlant":12124,"Ġdonor":12125,"Ġfactories":12126,"rict":12127,"ellen":12128,"Ġrobots":12129,"ĠWor":12130,"ĠDirectors":12131,"ĠPeru":12132,"Ġqueen":12133,"ĠTimothy":12134,"ĠToo":12135,"Ġobservers":12136,"Ġears":12137,"Ġbel":12138,"link":12139,"uns":12140,"Ġhomers":12141,"Ġadjacent":12142,"Ġconfidential":12143,"Ġstunned":12144,"iden":12145,"illed":12146,"ESS":12147,"Ġconvenient":12148,"ĠLindsey":12149,"por":12150,"upp":12151,"Ġborrow":12152,"ĠAhmad":12153,"ORT":12154,"Ġrelate":12155,"ĠSelf":12156,"ĠVanguard":12157,"utter":12158,"ĠBranch":12159,"ĠBolton":12160,"bat":12161,"Ġoutright":12162,"fighters":12163,"ĠBed":12164,"Ġpes":12165,"inski":12166,"Ġgunshot":12167,"Ġprinting":12168,"ĠSent":12169,"vern":12170,"Ġharvest":12171,"Ġbubble":12172,"Ġrefund":12173,"Ġfuels":12174,"Ġdive":12175,"Ġdiplomat":12176,"Ġpile":12177,"ĠVery":12178,"rot":12179,"ĠSearch":12180,"ĠJoyce":12181,"ĠPruitt":12182,"ĠLevel":12183,"ĠBP":12184,"ĠLac":12185,"had":12186,"Ġexpenditure":12187,"ĠMadd":12188,"Ġpockets":12189,"ĠClippers":12190,"ĠDear":12191,"ĠGive":12192,"Ġhal":12193,"Ġvertical":12194,"Ġwholesale":12195,"what":12196,"ĠSpringfield":12197,"ayed":12198,"ĠSom":12199,"Ġsecrets":12200,"Ġcharts":12201,"iar":12202,"ibility":12203,"LAND":12204,"Ġbearing":12205,"Ġprom":12206,"Ġtab":12207,"Ġsheets":12208,"ĠGL":12209,"Ġendless":12210,"opening":12211,"ĠOwen":12212,"Ġunderneath":12213,"ĠErik":12214,"ĠDACA":12215,"Ġsteering":12216,"Ġfootprint":12217,"ĠRoma":12218,"ĠDucks":12219,"ĠEllen":12220,"ĠProfessional":12221,"ĠGardens":12222,"Ġgoalie":12223,"Ġshine":12224,"Ġturmoil":12225,"Ġhunger":12226,"ĠâĢĭ":12227,"active":12228,"hey":12229,"Ġblessed":12230,"ason":12231,"oping":12232,"ĠThousands":12233,"Ġdose":12234,"ĠLor":12235,"Ġevolved":12236,"Ġcharities":12237,"ĠPE":12238,"ĠRub":12239,"ws":12240,"Ġmist":12241,"ĠShen":12242,"Ġbiological":12243,"ĠTweet":12244,"Ġcollections":12245,"Ġsubstantially":12246,"inner":12247,"Ġbattled":12248,"ĠCong":12249,"Hold":12250,"wp":12251,"Ġwells":12252,"Ġsake":12253,"Ġunrest":12254,"ĠKurt":12255,"Ġripped":12256,"itation":12257,"Ġneighbourhood":12258,"Ġinv":12259,"Ġcad":12260,"ĠCuban":12261,"ĠWealth":12262,"Ġtuition":12263,"Ġdeclaring":12264,"sch":12265,"orne":12266,"Ġwondered":12267,"ĠChaff":12268,"Ġdealer":12269,"ĠNumber":12270,"Mobile":12271,"Ġscratch":12272,"Ġprepares":12273,"ĠSens":12274,"ĠIstanbul":12275,"ĠPanama":12276,"ĠCay":12277,"Ġallocation":12278,"itutional":12279,"Ġhar":12280,"ĠNazi":12281,"ĠSund":12282,"Ġwarehouse":12283,"Ġbackyard":12284,"ĠIll":12285,"Ġunlawful":12286,"ĠReform":12287,"Ġbasement":12288,"ĠHi":12289,"ĠPictures":12290,"Ġtransfers":12291,"ĠSell":12292,"Ġfluid":12293,"Ġambitions":12294,"wife":12295,"Ġintensive":12296,"Ġsteals":12297,"Ġfestive":12298,"ĠHayes":12299,"Ġrestoration":12300,"Ġbranded":12301,"Journal":12302,"Ġmacro":12303,"Ġconsole":12304,"ĠMelania":12305,"ĠRahul":12306,"Ġdisposal":12307,"Ġcult":12308,"Ġpetrol":12309,"Ġtires":12310,"Ġkidnapping":12311,"Ġ115":12312,"Ġswap":12313,"ĠSud":12314,"Ġblown":12315,"ĠHindu":12316,"ĠBeckham":12317,"ĠGul":12318,"Ġfixture":12319,"Ġwisdom":12320,"Ġmines":12321,"fort":12322,"Ġrivers":12323,"ĠCyber":12324,"Ġtouches":12325,"race":12326,"Ġrelax":12327,"Ġcrashes":12328,"Ġconstituency":12329,"Ġ1979":12330,"Ġbureau":12331,"Ġinterface":12332,"Ġdetected":12333,"ĠBio":12334,"Ġhighlighting":12335,"ames":12336,"Ġcorresponding":12337,"great":12338,"Ġgray":12339,"Ġadvantages":12340,"ĠME":12341,"ĠAbbas":12342,"Ġnaked":12343,"rington":12344,".),":12345,"ĠFace":12346,"third":12347,"Ġtranscript":12348,"ples":12349,"Good":12350,"ĠArctic":12351,"Ġtolerance":12352,"reat":12353,"green":12354,"ĠMik":12355,"Ġoutreach":12356,"Ġrolls":12357,"Ġgen":12358,"Ġsupplied":12359,"Ġguarantees":12360,"aug":12361,"Ġsemif":12362,"ounds":12363,"running":12364,"Ġfitting":12365,"ĠRisk":12366,"iveness":12367,"family":12368,"Ġti":12369,"ĠIsaac":12370,"Ġdump":12371,"ĠPatricia":12372,"Ġpassport":12373,"ĠRhode":12374,"Who":12375,"log":12376,"Ġstat":12377,"Ġrat":12378,"ango":12379,"SB":12380,"ĠMaur":12381,"Ġsmiling":12382,"Ġstrikeouts":12383,"Ġpupils":12384,"Ġcomplications":12385,"ĠAdvanced":12386,"ĠMonetary":12387,"ĠTall":12388,"ĠALL":12389,"Ġcontributor":12390,"ĠAdvertising":12391,"Ġhorrific":12392,"Ġcompeted":12393,"ĠKenneth":12394,"Ġhailed":12395,"Ġbones":12396,"Ġbolster":12397,"ĠBoss":12398,"Ġhospitalized":12399,"ĠTelegraph":12400,"ĠIndependence":12401,"Ġdr":12402,"ĠHang":12403,"Ġdocumented":12404,"Ġsubtle":12405,"invest":12406,"Ġbounced":12407,"ĠMAN":12408,"Ġprofession":12409,"Ń":12410,"Ġexcellence":12411,"ĠInspector":12412,"ĠBL":12413,"Ġdisrupt":12414,"ĠWinston":12415,"ĠCommunist":12416,"ĠSharon":12417,"Ġmechanical":12418,"Ġtreats":12419,"Ġdesperately":12420,"ĠIndy":12421,"ĠGi":12422,"ĠComposite":12423,"ĠHeath":12424,"aser":12425,"ĠCardiff":12426,"ilit":12427,"Ġeased":12428,"Ġprospective":12429,"Ġcommissioned":12430,"Ġtire":12431,"Ġalign":12432,"Ġgesture":12433,"Ġweakened":12434,"URE":12435,"SN":12436,"Ġnationals":12437,"Ġrelies":12438,"ĠIRS":12439,"ĠCount":12440,"Ġmedicines":12441,"Ġcongress":12442,"Ġstranger":12443,"Qu":12444,"lessly":12445,"ĠQueens":12446,"ĠAlleg":12447,"uing":12448,"ĠWy":12449,"ĠMiguel":12450,"idi":12451,"Ġcivic":12452,"ĠPetro":12453,"endo":12454,"Obviously":12455,"Ġreflection":12456,"ĠStop":12457,"ĠFitzgerald":12458,"placed":12459,"shore":12460,"Ġcorrectly":12461,"ĠNE":12462,"amy":12463,"ĠCT":12464,"some":12465,"ĠMb":12466,"oi":12467,"ĠHogan":12468,"ĠInnovation":12469,"ĠVilla":12470,"ĠCAN":12471,"ĠCemetery":12472,"into":12473,"Ġquestionable":12474,"Ġcreator":12475,"rug":12476,"Ġsemifinals":12477,"mission":12478,"Ġcle":12479,"ĠWaters":12480,"ĠNixon":12481,"ĠBT":12482,"Ġassuming":12483,"ĠJer":12484,"ĠClay":12485,"pack":12486,"ĠCool":12487,"may":12488,"Ġdecor":12489,"Ġspike":12490,"ĠSomalia":12491,"ĠKarn":12492,"ĠDamascus":12493,"Shares":12494,"Ġsus":12495,"ĠMoss":12496,"Ġ1985":12497,"Ġsuperintendent":12498,"ĠResults":12499,"Ġspends":12500,"prom":12501,"Ġshipped":12502,"Ġlaundering":12503,"ĠLeslie":12504,"Ġmeteor":12505,"Ġabandon":12506,"Ġdeliberately":12507,"ĠSentinel":12508,"Ġfascinating":12509,"Ġenrollment":12510,"ĠExperts":12511,"ĠSimilarly":12512,"ĠCuomo":12513,"bor":12514,"Ġune":12515,"neutral":12516,"Ġhamstring":12517,"Ġnegotiated":12518,"zes":12519,"ĠLeo":12520,"ĠDoctor":12521,"Ġcurriculum":12522,"ĠFocus":12523,"Ġtravels":12524,"Ġbeverage":12525,"ĠIncluding":12526,"tz":12527,"type":12528,"ĠRange":12529,"Ġfloods":12530,"Ġcoached":12531,"Ġdominance":12532,"letico":12533,"ĠRafael":12534,"Ġpredictions":12535,"Ġprosperity":12536,"ĠCav":12537,"Ġclinics":12538,"ĠBanking":12539,"ĠComing":12540,"ears":12541,"ĠKaepernick":12542,"ĠBlvd":12543,"Ġretained":12544,"isions":12545,"Ġko":12546,"Ġensemble":12547,"Ġprecise":12548,"Ġcompact":12549,"MD":12550,"ĠJet":12551,"ached":12552,"ĠTru":12553,"ĠBass":12554,"ĠIcon":12555,"Ġexcluding":12556,"sur":12557,"Ġconstruct":12558,"Ġvoiced":12559,"pan":12560,"Ġinability":12561,"Ġexc":12562,"Ġmate":12563,"Ġtrailing":12564,"Ġsuccessive":12565,"Ġbets":12566,"Ġgauge":12567,"Ġminorities":12568,"ĠIND":12569,"ĠVel":12570,"ĠGP":12571,"oid":12572,"bon":12573,"Ġpred":12574,"Ġdash":12575,"Ġperformer":12576,"Ġoccasional":12577,"aken":12578,"mes":12579,"America":12580,"Ġliver":12581,"Sp":12582,"Big":12583,"Ġwildfires":12584,"ĠJackie":12585,"ĠLed":12586,"ĠFinland":12587,"Ġjurors":12588,"olic":12589,"urance":12590,"ĠEdge":12591,"open":12592,"Ġscenarios":12593,"Ġglory":12594,"entry":12595,"ĠCoffee":12596,"rep":12597,"ĠChand":12598,"ĠVas":12599,"ĠIslamabad":12600,"Ġbur":12601,"ĠFle":12602,"ĠEdition":12603,"Ġshoe":12604,"ï¸ı":12605,"**":12606,"tle":12607,"ĠEb":12608,"keeping":12609,"ĠBasketball":12610,"ĠVon":12611,"ĠCF":12612,"MENT":12613,"amm":12614,"ĠFernando":12615,"Ġcompares":12616,"ĠDouble":12617,"Ġconvictions":12618,"Ġatop":12619,"Ġcops":12620,"Ġremembers":12621,"Ġlacking":12622,"dom":12623,"itate":12624,"ĠBeauty":12625,"Ġdevelops":12626,"ĠGor":12627,"Ġfunctional":12628,"ĠCOUNTY":12629,"ĠUpon":12630,"Ġsprint":12631,"Ġinjection":12632,"Ġminors":12633,"ĠTamil":12634,"ĠGat":12635,"101":12636,"ety":12637,"Ġdrum":12638,"Ġtasked":12639,"Ġpact":12640,"Ġ170":12641,"MR":12642,"ĠRamos":12643,"Ġcandy":12644,"Sc":12645,"iced":12646,"Ġsupermarket":12647,"Ġworrying":12648,"Ġsellers":12649,"ĠTag":12650,".:":12651,"Ġmixture":12652,"oting":12653,"Bl":12654,"ĠLl":12655,"ĠJal":12656,"ican":12657,"ĠBid":12658,"country":12659,"ĠStrategy":12660,"Ġadverse":12661,"Ġplunged":12662,"ĠMit":12663,"Ġstark":12664,"aton":12665,"Ġbooking":12666,"Tr":12667,"Ġcontainers":12668,"Ġvintage":12669,"ĠPit":12670,"Ġsurfaced":12671,"Ġindependently":12672,"Ġdetection":12673,"ĠBeyon":12674,"Ġcasualties":12675,"Ġstabbing":12676,"oved":12677,"Ġbarred":12678,"Ġthereby":12679,"Ġpartnered":12680,"Ġposing":12681,"ĠShannon":12682,"ĠChapel":12683,"Ġtechnically":12684,"uous":12685,"»":12686,"ometer":12687,"Ġwildfire":12688,"share":12689,"heart":12690,"Ġammunition":12691,"Ġthrive":12692,"ĠStre":12693,"GP":12694,"cé":12695,"ĠMonaco":12696,"goal":12697,"ĠUm":12698,"ĠHSBC":12699,"ĠHilton":12700,"ĠViv":12701,"ĠKell":12702,"Ġdecisive":12703,"Ġmotive":12704,"amo":12705,"feld":12706,"ĠWH":12707,"iry":12708,"ulu":12709,"ĠSchneider":12710,"Ġcampaigning":12711,"Ġseparately":12712,"igo":12713,"ĠED":12714,"ĠRamirez":12715,"Ġmetro":12716,"ĠPatel":12717,"ĠChi":12718,"ĠAudi":12719,"Ġcharacteristics":12720,"Ġrestart":12721,"Ġkeyboard":12722,"ĠSD":12723,"his":12724,"biz":12725,"ĠSoft":12726,"ĠGrammy":12727,"Ġcontested":12728,"Ġweekends":12729,"Ġ112":12730,"Ġcycling":12731,"Ġhealthier":12732,"ija":12733,"Ġheader":12734,"Ġemploy":12735,"İ":12736,"Ġshortages":12737,"ĠAsk":12738,"ĠIvanka":12739,"Ġpartisan":12740,"Ġflowing":12741,"Ġcave":12742,"ENS":12743,"Ġups":12744,"read":12745,"ouch":12746,"Ġ102":12747,"Ġforming":12748,"bot":12749,"bie":12750,"Ġenrolled":12751,"Ġconcussion":12752,"Ġaffidavit":12753,"Ġmysterious":12754,"uries":12755,"ĠMang":12756,"Ġauthentic":12757,"Ġmetrics":12758,"ĠTwins":12759,"Ġprep":12760,"IJ":12761,"Ġdesired":12762,"ĠDiv":12763,"wall":12764,"ĠTab":12765,"Ġcompet":12766,"Ġrelied":12767,"Ġinequality":12768,"Ġmanual":12769,"ĠBucks":12770,"agging":12771,"Ġcorporation":12772,"Ġbanner":12773,"Ġgraphics":12774,"Ġaccurately":12775,"ĠMeeting":12776,"Ġconsult":12777,"ser":12778,"Ġprotesting":12779,"Ġhurting":12780,"omed":12781,"tes":12782,"Ġrode":12783,"Ġstartups":12784,"Ġhanding":12785,"ĠNest":12786,"Ġconsistency":12787,"anned":12788,"dem":12789,"ĠLyon":12790,"ĠCompetition":12791,"Ġtricky":12792,"Ġcos":12793,"ĠBengals":12794,"arry":12795,"Ġunderwent":12796,"ĠKit":12797,"à":12798,"uploads":12799,"Ġskate":12800,"Ġ''":12801,"Ġjun":12802,"ĠContent":12803,"focused":12804,"lat":12805,"ĠExp":12806,"ought":12807,"Ġnightmare":12808,"ĠExpect":12809,"Ġprecisely":12810,"ĠMonica":12811,"Ġlobbying":12812,"ĠChester":12813,"ĠInvest":12814,"Former":12815,"Ġimminent":12816,"ĠNL":12817,"Ġcomparing":12818,"ĠChes":12819,"ede":12820,"ĠNobel":12821,"mers":12822,"ĠKin":12823,"ĠBoko":12824,"ount":12825,"Ġthoroughly":12826,"Ġscattered":12827,"sharing":12828,"markets":12829,"ĠMis":12830,"Ġambition":12831,"Ġpreference":12832,"Ġeffectiveness":12833,"rio":12834,"Ġheavyweight":12835,"Ġovert":12836,"anya":12837,"ĠKanye":12838,"ishi":12839,"Ġrewards":12840,"uled":12841,"bach":12842,"Ġemphasized":12843,"Ġapologize":12844,"ĠRecent":12845,"!!":12846,"Ġanimated":12847,"ĠExxon":12848,"Ġfruits":12849,"Ġstripped":12850,"fold":12851,"ĠIndonesian":12852,"ller":12853,"Ġdementia":12854,"Ġkidney":12855,"Ġhalted":12856,"years":12857,"Ġconcerts":12858,"Ġrefers":12859,"ĠFri":12860,"Your":12861,"irl":12862,"Ġleap":12863,"jud":12864,"ĠHugh":12865,"ĠFO":12866,"Ġsore":12867,"Ġkil":12868,"ĠMate":12869,"cci":12870,"Ġsetback":12871,"Ġtightening":12872,"keeper":12873,"ĠAlbany":12874,"Ġpolicymakers":12875,"Ġdisorders":12876,"ĠCBC":12877,"ĠDiaz":12878,"Ġmaps":12879,"Ġroutinely":12880,"Ġverify":12881,"Ġbash":12882,"ĠJinping":12883,"Ġdisasters":12884,"ĠMonroe":12885,"ĠLouise":12886,"JP":12887,"ĠNevertheless":12888,"Ġconcessions":12889,"ĠPog":12890,"going":12891,"ĠFifth":12892,"ĠJill":12893,"ICT":12894,"ĠFM":12895,"ĠSugar":12896,"ĠBarb":12897,"Ġmidway":12898,"Ġtin":12899,"ĠPic":12900,"ĠPL":12901,"Ġleaks":12902,"Ġgrief":12903,"Ġtattoo":12904,"`":12905,"Ġment":12906,"ĠNu":12907,"Ġmarry":12908,"Ġdiving":12909,"Ġ1982":12910,"Ġcoin":12911,"ĠPoc":12912,"Ġstarred":12913,"ĠRiverside":12914,"Ġsidelined":12915,"Ġminers":12916,"STON":12917,"Ġbelongs":12918,"ĠSantos":12919,"ĠTechnical":12920,"aco":12921,"Ġadvise":12922,"Ġstreams":12923,"Ġcooler":12924,"ĠHE":12925,"Ġordering":12926,"ĠTask":12927,"ĠACT":12928,"ĠAnton":12929,"Ġcertification":12930,"ĠLeafs":12931,"ĠTS":12932,"ĠSerbia":12933,"azi":12934,"inks":12935,"ĠEST":12936,"Ġrelay":12937,"°":12938,"Ġdisappearance":12939,"ĠRomania":12940,"Ġoven":12941,"Ġowed":12942,"ĠStrip":12943,"ulated":12944,"UC":12945,"ITE":12946,"bling":12947,"Then":12948,"ppy":12949,"Ġunlimited":12950,"Ġcalories":12951,"Ġmerchandise":12952,"Ġblonde":12953,"ĠSpicer":12954,"performing":12955,"Ġimpl":12956,"Ġplates":12957,"Ġmosque":12958,"Ġdemon":12959,"Ġought":12960,"Ġdumped":12961,"Ġtracked":12962,"even":12963,"Ġstabil":12964,"imet":12965,"ĠLiga":12966,"ugh":12967,"ther":12968,"agar":12969,"Ġarchitect":12970,"Ġallocated":12971,"ĠJoey":12972,"Ġmarathon":12973,"master":12974,"ĠBert":12975,"Ġast":12976,"ĠEbola":12977,"ĠConservation":12978,"nic":12979,"Ġparallel":12980,"Ġinmate":12981,"Ġlocate":12982,"Ġdistribute":12983,"guard":12984,"Ġtackling":12985,"ential":12986,"Ġvi":12987,"Ġcups":12988,"Ġrhythm":12989,"Ġendured":12990,"ĠHub":12991,"ois":12992,"ĠLiberals":12993,"ĠRedskins":12994,"ĠEP":12995,"ĠKnox":12996,"fr":12997,"Ġmassacre":12998,"oka":12999,"Ġcompl":13000,"raft":13001,"ĠPublished":13002,"Ġattraction":13003,"ĠStephens":13004,"ility":13005,"ĠPul":13006,"ĠCapt":13007,"Ġexploded":13008,"Ġexceeded":13009,"lying":13010,"Ġcal":13011,"Mart":13012,"Ġpaintings":13013,"inate":13014,"ĠBrendan":13015,"Ġfortune":13016,"onductor":13017,"Ġphysicians":13018,"ĠStudy":13019,"ĠBul":13020,"ĠModern":13021,"HD":13022,"ĠBour":13023,"Ġtying":13024,"Ġ1967":13025,"Ġlighter":13026,"Ġtoss":13027,"inspired":13028,"Ġgreeted":13029,"Ġcycl":13030,"Ġverified":13031,"Ġmerit":13032,"sign":13033,"lder":13034,"Ġdebts":13035,"ĠSnyder":13036,"Ġamendments":13037,"Ġindicators":13038,"ĠDortmund":13039,"then":13040,"ĠListen":13041,"ĠFB":13042,"ref":13043,"ĠIoT":13044,"ĠBrewers":13045,"ĠLeadership":13046,"ĠNicolas":13047,"ĠBody":13048,"Ġsam":13049,"ĠAdvisor":13050,"Ġcord":13051,"Ġabuses":13052,"ĠPortuguese":13053,"Ġflown":13054,"VR":13055,"Ġconsumed":13056,"Ġreass":13057,"Ġalien":13058,"Ġrivalry":13059,"ĠREPORT":13060,"ĠRush":13061,"Ġdirecting":13062,"Ġsearches":13063,"ĠHP":13064,"ĠRoll":13065,"ĠFay":13066,"ĠClare":13067,"Ġhaul":13068,"Ġriot":13069,"Ġsettlements":13070,"Ġnorm":13071,"Ġaccelerated":13072,"ĠLok":13073,"Ġclever":13074,"Ġhyd":13075,"Ġstats":13076,"ĠHull":13077,"kers":13078,"Ġbuys":13079,"uter":13080,"Ġfue":13081,"https":13082,"UD":13083,"Ġisolation":13084,"Ġsuspend":13085,"ĠRules":13086,"ĠCircle":13087,"ĠHopefully":13088,"played":13089,"â̳":13090,"ĠPRE":13091,"sim":13092,"edd":13093,"ĠProperties":13094,"Ġbeans":13095,"Ġrevive":13096,"ĠBir":13097,"oug":13098,"Ġmob":13099,"Ġshowdown":13100,"iman":13101,"Ġpap":13102,"Ġvol":13103,"wu":13104,"Ġdiver":13105,"Ġpill":13106,"ĠMarlins":13107,"ĠLamar":13108,"Ġpersistent":13109,"Ġcondolences":13110,"ĠThor":13111,"Ab":13112,"Ġimpress":13113,"ĠRaptors":13114,"Ġreferences":13115,"Ġstiff":13116,"ĠBash":13117,"eding":13118,"Ġmurders":13119,"ĠGene":13120,"ĠManila":13121,"Ġbrokers":13122,"Ms":13123,"start":13124,"ĠDhabi":13125,"etz":13126,"Ġsubmission":13127,"ĠSchmidt":13128,"ĠPersonal":13129,"ĠBeverly":13130,"ĠMovie":13131,"ĠLamb":13132,"Ġplacement":13133,"Ġfolk":13134,"Ġfrequency":13135,"Ġplanted":13136,"Ġtwins":13137,"prov":13138,"rec":13139,"Ġpermanently":13140,"Ġcoordination":13141,"ĠCart":13142,"Ġobstacles":13143,"Ġliterature":13144,"Ġtu":13145,"Ġchill":13146,"ĠReserved":13147,"Ġlovers":13148,"ĠOutside":13149,"Ġslideshow":13150,"ĠGru":13151,"Ġty":13152,"Ġsalad":13153,"Ġlaboratory":13154,"ĠHolt":13155,"Ġ103":13156,"urb":13157,"ĠOrganisation":13158,"ĠAndrews":13159,"Ġrecipient":13160,"arch":13161,"Ġbleeding":13162,"ĠPand":13163,"Ġoverturned":13164,"Ġlistened":13165,"Ġclause":13166,"Ġnationalist":13167,"Ġresumed":13168,"ĠCout":13169,"ĠPride":13170,"Ġlayers":13171,"ĠBella":13172,"Ġreversed":13173,"Ġpriest":13174,"ĠFX":13175,"Ġalbeit":13176,"Ġhalfway":13177,"Ġcotton":13178,"ĠCarey":13179,"ĠTE":13180,"OCK":13181,"Ġbuck":13182,"ributes":13183,"ea":13184,"Ġfancy":13185,"ĠBuc":13186,"Ġbans":13187,"uters":13188,"Ġliabilities":13189,"ĠSou":13190,"ĠBernie":13191,"Ġintervene":13192,"food":13193,"ĠNDP":13194,"Ġinsist":13195,"Ġcontracted":13196,"hawk":13197,"),\"":13198,"ĠDawn":13199,"Ġmol":13200,"Ġcommissioners":13201,"Ġstranded":13202,"Ġoverwhelmed":13203,"Ġrecipes":13204,"Ġva":13205,"Ġrad":13206,"Ġscare":13207,"rez":13208,"Ġeliminating":13209,"Ġresc":13210,"ĠBreak":13211,"chn":13212,"Ġdelight":13213,"iot":13214,"Ġfreely":13215,"TI":13216,"ĠBluetooth":13217,"ĠMonth":13218,"ĠFlor":13219,"ĠFreddie":13220,"Ġtrailed":13221,"Ġinvestigative":13222,"Ġimposing":13223,"Ġattracting":13224,"awk":13225,"ĠSherman":13226,"Ġsucceeded":13227,"Ġvent":13228,"Ġreconciliation":13229,"ĠCel":13230,"ĠThroughout":13231,"ĠDowntown":13232,"ĠBrother":13233,"Ġtraditions":13234,"Ġmir":13235,"Ġstamp":13236,"tery":13237,"etti":13238,"isch":13239,"tic":13240,"Ġbanning":13241,"loss":13242,"ĠSpeedway":13243,"Ġstalled":13244,"ĠEN":13245,"ASH":13246,"thing":13247,"ĠAppeals":13248,"rac":13249,"Ġdistress":13250,"ĠConservatives":13251,"ĠPremium":13252,"usa":13253,"Ġslump":13254,"imm":13255,"ĠSupp":13256,"ĠWong":13257,"Ġdistant":13258,"Ġ104":13259,"Ġtide":13260,"ĠNorfolk":13261,"ĠYang":13262,"Ġsmashed":13263,"ĠBarrett":13264,"inho":13265,"Ġrobbed":13266,"ĠFarmers":13267,"filled":13268,"BT":13269,"Ġautumn":13270,"Ġtemple":13271,"ĠJacobs":13272,"Ġprecipitation":13273,"ĠHours":13274,"ĠFlight":13275,"Ġbeside":13276,"ĠOre":13277,"!)":13278,"ĠTurnbull":13279,"Ġpig":13280,"Ġcooling":13281,"Ġservers":13282,"oriented":13283,"Ġlocks":13284,"ĠSears":13285,"aving":13286,"ĠQuick":13287,"ĠGlob":13288,"ĠMining":13289,"Ġhorizon":13290,"arians":13291,"ĠOm":13292,"writing":13293,"Ġbelieving":13294,"Ġbon":13295,"Ġmounted":13296,"Ġpunt":13297,"ucci":13298,"uzz":13299,"cul":13300,"Ġkiss":13301,"ĠOnt":13302,"ĠCyprus":13303,"Ġrelying":13304,"Ġpiano":13305,"Ġcure":13306,"Ġcontinuously":13307,"ĠNobody":13308,"ĠBund":13309,"osis":13310,"ĠAurora":13311,"ĠBach":13312,"ĠKendall":13313,"Ġechoed":13314,"iable":13315,"Ġconscious":13316,"Ġmonster":13317,"omo":13318,"proof":13319,"ĠNate":13320,"Ġfilmmaker":13321,"ĠNaj":13322,"Ġvendor":13323,"ĠFoot":13324,"ĠChang":13325,"ĠFest":13326,"Ġselfie":13327,"Ġenters":13328,"ĠConor":13329,"ĠMosul":13330,"ĠWHAT":13331,"Ġwa":13332,"ĠGamb":13333,"osta":13334,"Ġcautioned":13335,"ĠTucker":13336,"ĠAirways":13337,"Ġvisitor":13338,"Ġ·":13339,"ĠRevolution":13340,"aching":13341,"Ġearliest":13342,"ĠQuality":13343,"Ġshorts":13344,"ube":13345,"ĠOperation":13346,"ĠSabha":13347,"Ġstrengths":13348,"ikes":13349,"Ġsexy":13350,"Ġrot":13351,"ibles":13352,"Ġcolours":13353,"THE":13354,"ailed":13355,"Ġwoke":13356,"ĠEmbassy":13357,"Ġinfamous":13358,"rov":13359,"State":13360,"â̦.":13361,"Ġpond":13362,"Ġcapt":13363,"fore":13364,"De":13365,"Ġedited":13366,"self":13367,"Hey":13368,"Ġportrait":13369,"ĠManufact":13370,"ĠStand":13371,"Ġcontenders":13372,"':":13373,"acker":13374,"Ġwithdrawn":13375,"ĠBraves":13376,"ĠHosp":13377,"changing":13378,"ĠBag":13379,"Ġadjustment":13380,"ĠCousins":13381,"ĠAAP":13382,"Ġfi":13383,"Ġoutdoors":13384,"Ġlacked":13385,"BM":13386,"ĠWHO":13387,"ĠPST":13388,"ĠLuck":13389,"Ġassisting":13390,"ĠGround":13391,"ĠTeen":13392,"ĠOle":13393,"Ġembarrassing":13394,"ĠWalt":13395,"ĠVision":13396,"ĠFal":13397,"ĠZoo":13398,"ĠWorth":13399,"ĠFloyd":13400,"ĠGujarat":13401,"Ġtipped":13402,"Ġfam":13403,"ĠDad":13404,"Ġworship":13405,"Ġtyre":13406,"Ġrebuilding":13407,"Ġqualities":13408,"ĠLives":13409,"Ġbeats":13410,"Ġ450":13411,"Ġexisted":13412,"ĠGeorg":13413,"Ġpoured":13414,"rows":13415,"ĠOx":13416,"ĠSid":13417,"Ġmac":13418,"Ġteaches":13419,"ĠEli":13420,"alla":13421,"Ġdownside":13422,"ĠBend":13423,"non":13424,"ĠArmenia":13425,"Ġcultures":13426,"ĠMae":13427,"Ġduration":13428,"ĠAthletics":13429,"Ġjuvenile":13430,"Ġlid":13431,"Ġbankers":13432,"Ġoverview":13433,"wy":13434,"Ġorbit":13435,"Vs":13436,"because":13437,"Ps":13438,"ĠFran":13439,"Ġtouring":13440,"Ġwary":13441,"Ġ106":13442,"Ġlaser":13443,"ĠVij":13444,"âĦ¢":13445,"Ġsurrender":13446,"press":13447,"rees":13448,"NO":13449,"ĠShortly":13450,"ĠKor":13451,"edu":13452,"Ġhatred":13453,"Ġtee":13454,"Ġfamously":13455,"Ġkeeper":13456,"ND":13457,"Ġreduces":13458,"HC":13459,"Ġhay":13460,"Ġunnamed":13461,"ĠTes":13462,"Ġattackers":13463,"ĠFew":13464,"ĠRichards":13465,"Ġ1968":13466,"Ġspeeches":13467,"Ġcybersecurity":13468,"ĠInfrastructure":13469,"Ġ07":13470,"ENCE":13471,"uties":13472,"Ġanxious":13473,"ĠGang":13474,"Ġannouncements":13475,"lette":13476,"oret":13477,"ĠRockies":13478,"ĠEmployees":13479,"ĠThrones":13480,"Ġhugely":13481,"Ġclin":13482,"ĠHob":13483,"Ġfraction":13484,"ĠOfficial":13485,"ĠMariners":13486,"ĠElse":13487,"Ġsanctuary":13488,"ĠPhotograph":13489,"Ġreopen":13490,"lf":13491,"hm":13492,"vest":13493,"Ġspeeding":13494,"Ġtooth":13495,"ĠShi":13496,"ĠTitle":13497,"ĠMes":13498,"ĠJobs":13499,"fair":13500,"ĠDanish":13501,"ĠMalik":13502,"Ġlaughed":13503,"Ġnavy":13504,"ĠActress":13505,"ĠWilliamson":13506,"overs":13507,"Ġreckless":13508,"Ġjo":13509,"otic":13510,"Ġassaulting":13511,"Ġpri":13512,"ĠPi":13513,"Ġlesser":13514,"Ġtit":13515,"Ġdat":13516,"Ġnail":13517,"ĠMarathon":13518,"ĠGren":13519,"ĠDol":13520,"Ġjointly":13521,"Ġamended":13522,"mine":13523,"ĠBashar":13524,"ĠHyundai":13525,"Ġuncovered":13526,"Ġeducated":13527,"atti":13528,"pres":13529,"ĠBRE":13530,"Ġya":13531,"Bank":13532,"odd":13533,"lit":13534,"ĠLinks":13535,"Ġswitching":13536,"itte":13537,"ĠSind":13538,"erved":13539,"Ġ**":13540,"Ġpositively":13541,"Ġfrankly":13542,"Ġrevenge":13543,"ĠTrinity":13544,"ĠCDC":13545,"Ġthreatens":13546,"Ġhammer":13547,"NET":13548,"ĠMut":13549,"Ġsy":13550,"Ġunidentified":13551,"icken":13552,"Ġdrills":13553,"Ġtense":13554,"Ġforeigners":13555,"OST":13556,"Ġethical":13557,"ĠDurham":13558,"ĠQual":13559,"Ġterritories":13560,"Ġid":13561,"hor":13562,"enders":13563,"Mc":13564,"OV":13565,"percent":13566,"Ġdom":13567,"Ġupward":13568,"Ġamb":13569,"Ġvisas":13570,"zan":13571,"Ãĥ":13572,"Ġundocumented":13573,"Ġsuburbs":13574,"Ġhydro":13575,"ĠJob":13576,"ĠAdelaide":13577,"oya":13578,"ĠSR":13579,"ĠMick":13580,"Ġconsolidation":13581,"Ġemotionally":13582,"ĠHop":13583,"Her":13584,"Ġloses":13585,"ĠMoto":13586,"eled":13587,"Ġregulated":13588,"ental":13589,"Ġencountered":13590,"Ġhop":13591,"ĠTrafford":13592,"Ġsticks":13593,"Ġveto":13594,"Ġexpose":13595,"Ġstretched":13596,"fin":13597,"inance":13598,"chair":13599,"ĠGareth":13600,"ĠPil":13601,"ĠHammond":13602,"Ġserial":13603,"omy":13604,"Ġcellphone":13605,"ĠClara":13606,"Ġreacted":13607,"ĠNic":13608,"ĠHomes":13609,"ĠBroadcasting":13610,"ĠFut":13611,"ĠSupply":13612,"assing":13613,"ĠNewman":13614,"Ġcharitable":13615,"ĠClayton":13616,"Ġsovereignty":13617,"Ġconvincing":13618,"ĠPrincipal":13619,"ĠHigher":13620,"ĠCut":13621,"ĠCarrie":13622,"ĠSpot":13623,"Sometimes":13624,"ĠJar":13625,"ĠConsider":13626,"ieu":13627,"Ġrefinery":13628,"Ġbloody":13629,"wheel":13630,"Ġcryptocurrencies":13631,"Fund":13632,"ĠSunderland":13633,"ĠEvents":13634,"âĢĭ":13635,"Ġaccidentally":13636,"deep":13637,"Ġfranc":13638,"bec":13639,"ĠHartford":13640,"Ġstellar":13641,"wright":13642,"kick":13643,"UG":13644,"ĠBeast":13645,"Ġrefusal":13646,"ĠRoberto":13647,"ĠDixon":13648,"ĠDiane":13649,"name":13650,"asts":13651,"ĠCharter":13652,"Ġfueled":13653,"Ġcontents":13654,"Ġaccessing":13655,"Ġtroubles":13656,"Ġtops":13657,"Ġdebuted":13658,"icating":13659,"Ġinvestigator":13660,"Ġsubscribing":13661,"Ġcoordinated":13662,"ĠFil":13663,"six":13664,"teen":13665,"Ġwithdrew":13666,"ĠGilbert":13667,"Ġ1983":13668,"arsity":13669,"Ġimagination":13670,"Ġhandgun":13671,"ĠAlibaba":13672,"Ġbug":13673,"Ġ107":13674,"ĠCOMP":13675,"ĠSomething":13676,"Ġreliability":13677,"ĠFCC":13678,"ĠFowler":13679,"Ġsingled":13680,"nom":13681,"Ġknocking":13682,"Ġmeddling":13683,"Ġdetermining":13684,"reports":13685,"Ġshade":13686,"ĠSN":13687,"anto":13688,"Ġcomplaining":13689,"ĠNan":13690,"WS":13691,"Ġyoungsters":13692,"Il":13693,"ĠKaw":13694,"ĠProp":13695,"ĠCell":13696,"ĠHurricanes":13697,"Ġpublicity":13698,"ĠXin":13699,"rial":13700,"ICO":13701,"Ġsupervision":13702,"ĠSpotify":13703,"ĠNewport":13704,"Ġprince":13705,"anche":13706,"Ġsubscriber":13707,"ĠVic":13708,"ACT":13709,"ĠRaf":13710,"ĠActing":13711,"Ġcollusion":13712,"pet":13713,"isl":13714,"Ġcommerce":13715,"Health":13716,"ĠAbraham":13717,"pri":13718,"Ġlightweight":13719,"Ġinsurer":13720,"Like":13721,"Ġhelmet":13722,"Ġevac":13723,"look":13724,"ĠNaval":13725,"160":13726,"ĠFleet":13727,"vol":13728,"Ġexpired":13729,"ĠKlein":13730,"ĠEmmy":13731,"ABLE":13732,"ĠMorocco":13733,"ĠTrip":13734,"uted":13735,"Ġnos":13736,"ĠVista":13737,"mas":13738,"ĠRocky":13739,"ĠFlint":13740,"enberg":13741,"ĠBrow":13742,"Ġsignatures":13743,"Ġpolar":13744,"ajo":13745,"Ġendorsement":13746,"Ġreservations":13747,"LIN":13748,"anny":13749,"elli":13750,"last":13751,"Ġoversee":13752,"cm":13753,"ĠOilers":13754,"Are":13755,"Ġjudiciary":13756,"onte":13757,"ĠTrack":13758,"Ġsupervisor":13759,"erk":13760,"isher":13761,"Ġintact":13762,"Ġslid":13763,"icals":13764,"paid":13765,"ĠMAR":13766,"lement":13767,"ĠLiu":13768,"ĠLarge":13769,"ĠWings":13770,"pect":13771,"ĠRum":13772,"Ġanalyzed":13773,"Ġemploys":13774,"arte":13775,"ims":13776,"ĠEventually":13777,"Ġaffiliated":13778,"Ġhospitality":13779,"ĠSprint":13780,"Ġresolutions":13781,"Ġliquor":13782,"ĠNAFTA":13783,"ANY":13784,"Ġradiation":13785,"ĠProv":13786,"Ġpause":13787,"ĠTMZ":13788,"Ġelbow":13789,"Ġresilience":13790,"ĠParents":13791,"mus":13792,"ĠSafe":13793,"Ġinterpretation":13794,"Ġraced":13795,"IND":13796,"KR":13797,"Ġhinted":13798,"ĠErin":13799,"ĠBahrain":13800,"Ġcredentials":13801,"eless":13802,"Ġprocurement":13803,"ĠWebb":13804,"ĠLowe":13805,"ĠNak":13806,"ĠLearning":13807,"zh":13808,"Ġdipped":13809,"ĠSuite":13810,"Ġmisdemeanor":13811,"ALE":13812,"Ġstrengthened":13813,"ĠSophie":13814,"Ġconfirms":13815,"Ġrac":13816,"gey":13817,"Ġshootout":13818,"Ġble":13819,"Ġcircles":13820,"ĠChef":13821,"Ġcomprised":13822,"ĠSantiago":13823,"Ġfeud":13824,"beat":13825,"Ġstaffers":13826,"Ġacute":13827,"ski":13828,"Ġpolled":13829,"ĠKur":13830,"ĠJen":13831,"ĠUltimately":13832,"anded":13833,"ĠHoney":13834,"Ġannounces":13835,"Ġamateur":13836,"around":13837,"Ġfunctioning":13838,"group":13839,"ĠSqu":13840,"Where":13841,"Ġvoid":13842,"ĠSandra":13843,"isers":13844,"Ġhelicopters":13845,"ĠGym":13846,"ĠWol":13847,"mouth":13848,"Ġsubjected":13849,"ici":13850,"ually":13851,"ĠWash":13852,"ĠLindsay":13853,"ĠVers":13854,"Ġjumps":13855,"Ġneglect":13856,"ĠKuwait":13857,"fund":13858,"ĭ":13859,"ather":13860,"lly":13861,"ei":13862,"Although":13863,".''":13864,"Ġunhappy":13865,"Ġpills":13866,"Ġmagical":13867,"Ġdro":13868,"Ġinviting":13869,"ĠJohnston":13870,"oving":13871,"450":13872,"ĠMerc":13873,"Ġadmitting":13874,"Ġinsisting":13875,"ĠCru":13876,"ĠResource":13877,"oir":13878,"Ġcomplexity":13879,"ĠRoth":13880,"ĠCher":13881,"July":13882,"raf":13883,"Ġaggregate":13884,"Ġhelm":13885,"uclear":13886,"olan":13887,"Ġoffenses":13888,"ĠWolves":13889,"ĠFu":13890,"ĠPierce":13891,"Ġemailed":13892,"ĠStra":13893,"Ġpedestrians":13894,"ĠER":13895,"ĠConway":13896,"Ġblowing":13897,"CLOSE":13898,"hab":13899,"ĠGreene":13900,"Ġconfessed":13901,"ĠTorres":13902,"ĠHolocaust":13903,"Ġrepay":13904,"Ġdemonstrates":13905,"ĠPool":13906,"gent":13907,"Ġdeleted":13908,"Ġ$$":13909,"ĠSO":13910,"Ġdri":13911,"ĠNeg":13912,"ĠVP":13913,"ĠPF":13914,"ĠPrep":13915,"Ġorganizing":13916,"icker":13917,"Ġmanufactured":13918,"enson":13919,"adas":13920,"Ġwines":13921,"Ġmachinery":13922,"Ġspecialists":13923,"ĠDetective":13924,"ĠDL":13925,"Op":13926,"Ġquicker":13927,"ĠPenguins":13928,"Engine":13929,"zone":13930,"Ġsequence":13931,"ĠLost":13932,"Ġwarmer":13933,"ĠEthiopia":13934,"Ġaffirmed":13935,"fest":13936,"resses":13937,"Ġsoap":13938,"Ġbooth":13939,"Ġnotorious":13940,"amin":13941,"Ġpursued":13942,"ĠCer":13943,"ĠSB":13944,"Ġlivestock":13945,"Ġtrace":13946,"Ġrespects":13947,"arden":13948,"April":13949,"Ġ128":13950,"ĠSaid":13951,"ennial":13952,"Ġnamely":13953,"ĠBot":13954,"Ġ108":13955,"ĠLem":13956,"nell":13957,"Ġconfirming":13958,"Ġlogged":13959,"Ġprofound":13960,"elo":13961,"ĠChambers":13962,"RT":13963,"Ġnewer":13964,"Ġsideline":13965,"ĠCardinal":13966,"este":13967,"Ġnarrowly":13968,"Ġcompromised":13969,"Ġpolicing":13970,"Ġporn":13971,"Ġarc":13972,"Ġlearnt":13973,"INE":13974,"step":13975,"ĠDomin":13976,"Ġwaist":13977,"Ġboycott":13978,"mitted":13979,"iffs":13980,"ground":13981,"ĠMaterials":13982,"Ġceasefire":13983,"Right":13984,"ĠZen":13985,"estyle":13986,"Thank":13987,"ĠOnePlus":13988,"ĠMLS":13989,"Ġconstituents":13990,"oster":13991,"ĠProsecutor":13992,"Ġpriorit":13993,"ĠDebbie":13994,"ĠExpand":13995,"uv":13996,"Ġintegrate":13997,"Ġimmun":13998,"Ġdisciplinary":13999,"ĠImm":14000,"Ġja":14001,"Ġgardens":14002,"ĠHim":14003,"obe":14004,"Ġhitter":14005,"Ġbullets":14006,"Ġevolving":14007,"ĠScientists":14008,"Michael":14009,"ĠDO":14010,"Ġunbelievable":14011,"Ġlooming":14012,"Ġdownturn":14013,"Ġmentality":14014,"Ġreopened":14015,"Ġash":14016,"ĠChapman":14017,"Ġloop":14018,"ĠUT":14019,"ĠTier":14020,"Ġunaware":14021,"Ġgratitude":14022,"Ġperforms":14023,"olk":14024,"Ġ\"(":14025,"Ġlacks":14026,"Ġinstructed":14027,"ĠRecreation":14028,"sample":14029,"Ġrequesting":14030,"Canada":14031,"Ġsupposedly":14032,"ĠHardy":14033,"Ġholder":14034,"change":14035,"ĠDominic":14036,"ĠXavier":14037,"Ġlig":14038,"Ġcandid":14039,"ĠRab":14040,"Ġconferences":14041,"ĠBurton":14042,"Dr":14043,"Ġmunicipalities":14044,"Ġcrushed":14045,"Ġseekers":14046,"ĠCitizens":14047,"Ġheightened":14048,"ĠCasino":14049,"Ġdesktop":14050,"Ġwhoever":14051,"ĠImpact":14052,"Ġcocktail":14053,"Ġphilanthrop":14054,"ĠSAN":14055,"ĠPreston":14056,"Ġobesity":14057,"Ġrestrict":14058,"ĠKab":14059,"ĠProvidence":14060,"Ġscar":14061,"ĠChart":14062,"Ġbosses":14063,"ĠRate":14064,"Ġsav":14065,"pay":14066,"Ġtransplant":14067,"ĠNoble":14068,"child":14069,"Ġconclusions":14070,"FI":14071,"Ġsack":14072,"Ġexperimental":14073,"holder":14074,"oca":14075,"herty":14076,"ĠMT":14077,"Ġcatcher":14078,"LY":14079,"Ġgrams":14080,"reet":14081,"Ġadaptation":14082,"Ġhumble":14083,"Ġbot":14084,"Ġidentical":14085,"ication":14086,"ifer":14087,"ĠCrow":14088,"Ġregain":14089,"ĠLightning":14090,"Ġkg":14091,"Ġcomposed":14092,"Ġcorrespondent":14093,"Ġreunion":14094,"Ġobserve":14095,"Ġcomprising":14096,"Ġimpeachment":14097,"Ġresh":14098,"Ġlemon":14099,"ĠSnap":14100,"Ġproprietary":14101,"een":14102,"ourt":14103,"Ġdetective":14104,"Ġlabels":14105,"Ġcorridor":14106,"ĠClinic":14107,"Ġarra":14108,"ĠPearl":14109,"Ġinformal":14110,"ĠUnd":14111,"ĠVenezuelan":14112,"Ġpeninsula":14113,"Ġdefeating":14114,"Ġsyndrome":14115,"iere":14116,"Ġspite":14117,"bag":14118,"aran":14119,"Ġspecialized":14120,"ĠAA":14121,"ĠLyn":14122,"Ġinstrumental":14123,"Smith":14124,"Ġpivotal":14125,"Ġnightclub":14126,"ĠCob":14127,"Ġcolorful":14128,"Ġartwork":14129,"Ġ1981":14130,"Ġdawn":14131,"erville":14132,"uated":14133,"ief":14134,"Ġlinking":14135,"ĠOw":14136,"Ġappreci":14137,"Ġreductions":14138,"elling":14139,"Ġsalmon":14140,"bb":14141,"ĠPhillip":14142,"yle":14143,"Ġassure":14144,"Ġdiscretion":14145,"Ġefficiently":14146,"ĠMau":14147,"abil":14148,"Ġintentionally":14149,"Ġactivated":14150,"Ġimmense":14151,"ĠStrategic":14152,"Ġcheating":14153,"ĠTrend":14154,"ĠSamantha":14155,"Ġcomple":14156,"Ġhack":14157,"ĠSerie":14158,"ĠText":14159,"Ġstylish":14160,"ĠFaith":14161,"ĠGST":14162,"Ġexterior":14163,"Ġblessing":14164,"Ġblanket":14165,"Ġcooked":14166,"Ġretaliation":14167,"Ġtro":14168,"Ġshelves":14169,"rose":14170,"ĠGram":14171,"Ġsho":14172,"ĠArgentine":14173,"Ġclerk":14174,"specific":14175,"Ġagreeing":14176,"Ġstandout":14177,"black":14178,"Ġtrending":14179,"Ġviolate":14180,"Get":14181,"ño":14182,"ĠOpt":14183,"ĠFrankfurt":14184,"ĠFranco":14185,"eness":14186,"Ġlining":14187,"Ġzoo":14188,"oil":14189,"lia":14190,"rab":14191,"Ġorganize":14192,"Ġwoods":14193,"Ġscan":14194,"Ġurgency":14195,"Ġoccurring":14196,"Ġreliance":14197,"Ġconcepts":14198,"Ġeligibility":14199,"0000":14200,"ĠBrief":14201,"Ġabusive":14202,"ĠBench":14203,"Ġrub":14204,"ĠDil":14205,"Ġmount":14206,"Ġmaturity":14207,"ĠNut":14208,"nee":14209,"enc":14210,"Ġgunfire":14211,"ĠKill":14212,"Ġgates":14213,"Ġflower":14214,"iol":14215,"Ġshaped":14216,"Ġundoubtedly":14217,"Ġbackgrounds":14218,"ĠComplex":14219,"\":{\"":14220,"Ġnaming":14221,"Ġmonument":14222,"Ġoh":14223,"Ġembedded":14224,"Ġbang":14225,"ĠKro":14226,"Ġaggression":14227,"ĠMits":14228,"During":14229,"ĠEp":14230,"iners":14231,"ĠAnaheim":14232,"Ġrom":14233,"Ġoutgoing":14234,"Ġfulfill":14235,"Ġreminds":14236,"Ġren":14237,"à¤":14238,"ĠSue":14239,"Ġrefresh":14240,"Ġlif":14241,"Ġfil":14242,"ĠLead":14243,"Ġregulate":14244,"ĠTeachers":14245,"Ġclarify":14246,"obs":14247,"Ġblasted":14248,"ĠAx":14249,"Ġflavors":14250,"Ġmega":14251,"Ġhurdles":14252,"Ġinspector":14253,"ĠSalvador":14254,"Ġprescribed":14255,"Ġrenovation":14256,"OUR":14257,"Ġutil":14258,"ĠBradford":14259,"Ġwasted":14260,"Ġlineman":14261,"Ġpalm":14262,"icate":14263,"Ġoverseeing":14264,"otted":14265,"ĠRapids":14266,"Ġjustified":14267,"aby":14268,"Ġextends":14269,"Ġoath":14270,"bow":14271,"ĠRivera":14272,"Jan":14273,"ĠImran":14274,"Ġforests":14275,"ĠShel":14276,"ĠBrun":14277,"Ġaerial":14278,"ĠNOW":14279,"PAR":14280,"Ġbeverages":14281,"ettel":14282,"Ġfragile":14283,"Ġcodes":14284,"Į":14285,"abel":14286,"Watch":14287,"road":14288,"Ġdismissal":14289,"ĠRosa":14290,"Ġcrunch":14291,"²":14292,"Ġinnovations":14293,"Ġhabitat":14294,"Ġforefront":14295,"ĠKoch":14296,"ĠChevrolet":14297,"Ġwheelchair":14298,"Ġconsiderably":14299,"Ġexpenditures":14300,"Ġtexts":14301,"Ġprompt":14302,"Ġskating":14303,"Ġpetroleum":14304,"ĠICC":14305,"Ġvit":14306,"fit":14307,"Ġprolonged":14308,"ĠLucy":14309,"Ġcho":14310,"Ġrocked":14311,"ĠBrom":14312,"Ġfreed":14313,"Ġyours":14314,"ĠEden":14315,"Ġmonitored":14316,"asted":14317,"Ġoversees":14318,"ieri":14319,"Ġideology":14320,"ĠFine":14321,"tering":14322,"Top":14323,"Ġdamp":14324,"uta":14325,"Ġlethal":14326,"Ġpurple":14327,"udge":14328,"ĠChemical":14329,"ĠPetersburg":14330,"Ġwarns":14331,"Ġcollectively":14332,"Ġâ":14333,"Ġplaintiffs":14334,"ĠBoris":14335,"Ġsheep":14336,"oves":14337,"ĠAuthor":14338,"Ġcampuses":14339,"Ġdestroying":14340,"Ġgloves":14341,"Ġcease":14342,"Ġdelegates":14343,"Ġpreceded":14344,"realDonaldTrump":14345,"Ġforwards":14346,"erton":14347,"ĠBuzzFeed":14348,"Ġoccupation":14349,"ĠLegion":14350,"Ġstir":14351,"Ġshale":14352,"Ġterrific":14353,"Ġnewborn":14354,"Ġstandoff":14355,"OWN":14356,"Ġmuscles":14357,"ĠHerman":14358,"ĠLiz":14359,"ĠExperience":14360,"ĠSuccess":14361,"ĠHispanic":14362,"ĠCCTV":14363,"Ġcomplement":14364,"ĠBing":14365,"Ġprem":14366,"ĠJohannes":14367,"Ġdent":14368,"itar":14369,"ĠHein":14370,"ĠNicola":14371,"Ġconcludes":14372,"ĠKhal":14373,"Ġparish":14374,"Ġshaking":14375,"ĠSchw":14376,"mod":14377,"ĠLil":14378,"ña":14379,"ĠBog":14380,"ĠFight":14381,"Ġgre":14382,"Ġfel":14383,"Ġheal":14384,"err":14385,"TM":14386,"airo":14387,"health":14388,"Ġswings":14389,"Ġtier":14390,"anka":14391,"ribune":14392,"emouth":14393,"ĠBloom":14394,"Ġowing":14395,"Tech":14396,"Ġdough":14397,"Ġbatch":14398,"ĠLion":14399,"ĠZamb":14400,"Ġcrashing":14401,"ĠXL":14402,"ppers":14403,"ĠDoctors":14404,"ĠSor":14405,"video":14406,"Ġcigarettes":14407,"ĠBoxing":14408,"Ġconstitute":14409,"Ġconcentrate":14410,"ĠArmenian":14411,"Ġsemester":14412,"position":14413,"emic":14414,"ĠNYC":14415,"ĠCampus":14416,"Ġalternate":14417,"Ġexped":14418,"Ġpublishers":14419,"2015":14420,"Ġunanimous":14421,"ĠPrevious":14422,"Ġwellness":14423,"ĠCreative":14424,"edy":14425,"AGE":14426,"ĠCavs":14427,"Ġ1978":14428,"Ġfu":14429,"ĠTata":14430,"ĠChoice":14431,"Ġwoes":14432,"ĠCable":14433,"Ġ~":14434,"ĠGem":14435,"Ġconsolidated":14436,"ĠManitoba":14437,"Cloud":14438,"Ġrounded":14439,"ĠVentura":14440,"Ġshark":14441,"Ġdresses":14442,"Ġtraction":14443,"eda":14444,"Ġdiv":14445,"Ġdental":14446,"Wh":14447,"ĠGig":14448,"ĠBoyd":14449,"ĠTransit":14450,"Ġtelevised":14451,"SON":14452,"ĠVince":14453,"Ġcloses":14454,"apt":14455,"ĠWheeler":14456,"ĠTyson":14457,"Ġforensic":14458,"Ġpunished":14459,"Ġseas":14460,"Ġnavigation":14461,"Ġprecedent":14462,"Ġextremist":14463,"Ġcomposite":14464,"PO":14465,"Ġsurvivor":14466,"ĠVale":14467,"gars":14468,"HT":14469,"ĠRiyadh":14470,"Ġrevival":14471,"ĠPayne":14472,"Ġcollaborative":14473,"ĠCustomers":14474,"ĠPf":14475,"Ġproves":14476,"erve":14477,"Ġelev":14478,"ĠPaper":14479,"Ġchore":14480,"Ġthriller":14481,"Ġstraw":14482,"cock":14483,"Gu":14484,"Ġaligned":14485,"ĠChronicle":14486,"Ġshouting":14487,"Ġ1976":14488,"Ġlightning":14489,"Ġworlds":14490,"ĠOpening":14491,"enton":14492,"ĠAna":14493,"ĠGol":14494,"ĠTechn":14495,"lis":14496,"Ġorientation":14497,"ĠArri":14498,"ĠPG":14499,"ross":14500,"Ġsank":14501,"LOS":14502,"ĠAllison":14503,"Ġsmiles":14504,"USD":14505,"Ġkits":14506,"Bar":14507,"ĠBri":14508,"Ġounces":14509,"ĠNielsen":14510,"eno":14511,"Ġ109":14512,"Ġnorms":14513,"Ġskip":14514,"180":14515,"Ġmonitors":14516,"2012":14517,"Ġincorporate":14518,"Ġmechanisms":14519,"ĠHack":14520,"ĠBomb":14521,"ĠGavin":14522,"ĠNatalie":14523,"Ġdiscusses":14524,"Ġassembled":14525,"Ġcognitive":14526,"owner":14527,"Ġgenuinely":14528,"Ġdisappear":14529,"ĠAK":14530,"Ġstal":14531,"Ġsoup":14532,"ĠFinn":14533,"Ġcares":14534,"Ġfinest":14535,"Ġtuned":14536,"ende":14537,"ĠStefan":14538,"Ġaccompanying":14539,"î":14540,"Maybe":14541,"Ġoffender":14542,"TT":14543,"Ġ212":14544,"Ġvolleyball":14545,"needed":14546,"Ġquo":14547,"Ġdim":14548,"ĠHistorical":14549,"ĠLance":14550,"gmail":14551,"ĠGate":14552,"Ġdemonstrators":14553,"Ġdy":14554,"cia":14555,"ĠSteele":14556,"ĠJoan":14557,"ĠKerala":14558,"KA":14559,"ĠElectoral":14560,"Ġpaths":14561,"ø":14562,"Ne":14563,"Ġaccepts":14564,"Ġlowering":14565,"Ġportions":14566,"ĠValencia":14567,"Ġfestivals":14568,"Ġgeneric":14569,"usk":14570,"ĠVernon":14571,"ĠOrioles":14572,"Ġrenewal":14573,"Ġbelonged":14574,"Ġbreathe":14575,"Ġ220":14576,"Ġrecruited":14577,"Ġlogic":14578,"Ġrecreation":14579,"Ġverbal":14580,"ĠHaz":14581,"double":14582,"Ġfavourites":14583,"Ġfundamentals":14584,"ĠSoc":14585,"360":14586,"SO":14587,"Ġalerted":14588,"Ġbriefed":14589,"ĠBruno":14590,"Ġseating":14591,"Ġfreight":14592,"ĠAmer":14593,"Ġwished":14594,"table":14595,"growth":14596,"ĠWent":14597,"Ġhilarious":14598,"Ġthroat":14599,"bet":14600,"gon":14601,"Ġample":14602,"hee":14603,"ĠHood":14604,"ĠIceland":14605,"ĠAnkara":14606,"iang":14607,"Ġpracticing":14608,"azer":14609,"Ġleaf":14610,"Ġhottest":14611,"Ġmarginal":14612,"Ġrevelations":14613,"ĠPrices":14614,"ĠLar":14615,"times":14616,"Ġhandles":14617,"ĠNaz":14618,"Ġinstitute":14619,"Ġtranslate":14620,"ĠJP":14621,"Ġsoared":14622,"Ġconsume":14623,"ĠTap":14624,"ĠCelebrity":14625,"ĠMayweather":14626,"ĠOracle":14627,"Ġmor":14628,"ANA":14629,"Ġpaperwork":14630,"aste":14631,"Ġdil":14632,"Ġdecorated":14633,"Ġpromotional":14634,"ĠMerrill":14635,"Ġappliances":14636,"ĠCOP":14637,"Ġlips":14638,"ĠBrennan":14639,"ĠMile":14640,"ĠNetworks":14641,"ĠComment":14642,"ĠIb":14643,"ĠAgg":14644,"IDE":14645,"Ġinitiate":14646,"Ġknockout":14647,"Ġbargain":14648,"Ġaccordingly":14649,"bee":14650,"ĠGerald":14651,"Ġproblematic":14652,"Ġtrap":14653,"Ġfinalists":14654,"addy":14655,"would":14656,"Ġstrictly":14657,"ĠRamsey":14658,"Ġdownward":14659,"Ġextract":14660,"Ġfamed":14661,"ĠOUT":14662,"Ġinduct":14663,"ĠAuckland":14664,"Ġpoetry":14665,"mos":14666,"ĠGuinea":14667,"management":14668,"ohan":14669,"ĠGuide":14670,"aily":14671,"umping":14672,"Ġenacted":14673,"ĠEye":14674,"vision":14675,"umi":14676,"aped":14677,"Ġbicycle":14678,"ĠHouth":14679,"ĠNAS":14680,"Ġtapped":14681,"wer":14682,"otti":14683,"EA":14684,"Ġsurprises":14685,"ĠUpdate":14686,"ĠPun":14687,"ĠMiz":14688,"ĠOro":14689,"Ġcostumes":14690,"title":14691,"Ġsurviving":14692,"According":14693,"themed":14694,"ĠPeoples":14695,"Se":14696,"Ġassociations":14697,"hett":14698,"Time":14699,"Ġessay":14700,"Ġmu":14701,"ĠScore":14702,"ĠSpani":14703,"ĠSEE":14704,"Ġmales":14705,"Ġrage":14706,"EU":14707,"ĠYellow":14708,"rupt":14709,"Ġapparel":14710,"Ġsweat":14711,"Ġnearest":14712,"zman":14713,"Ġanticipation":14714,"Ġinjuring":14715,"Ġousted":14716,"chan":14717,"ĠAlert":14718,"Ġber":14719,"atal":14720,"Com":14721,"Ġ04":14722,"Ġafterward":14723,"edge":14724,"ĠBooker":14725,"lex":14726,"ĠWhole":14727,"Ġtoughest":14728,"ĠMaharashtra":14729,"lier":14730,"ĠTennis":14731,"Ġhandy":14732,"ĠMetal":14733,"ĠiTunes":14734,"ĠDiscovery":14735,"Ġcompassion":14736,"ĠLIVE":14737,"Ġeconomically":14738,"Ġendangered":14739,"GO":14740,"Ġmound":14741,"word":14742,"ĠTouch":14743,"ogo":14744,"Ġincomes":14745,"when":14746,"ĠAside":14747,"Ġscandals":14748,"Ġfunctionality":14749,"ĠAer":14750,"Ġcouncils":14751,"Ġdenial":14752,"140":14753,"Ġimplied":14754,"Ġoutfits":14755,"Ġsuited":14756,"Ġ1973":14757,"ĠPizza":14758,"Ġdebates":14759,"record":14760,"Ġhype":14761,"ĠRus":14762,"ĠRobbie":14763,"Ġtouted":14764,"ĠSharp":14765,"Ġbeings":14766,"Ġslavery":14767,"encies":14768,"ĠRooney":14769,"Ġnan":14770,"Ġraids":14771,"Ġinstructor":14772,"Market":14773,"Ġshook":14774,"Ġdeliberate":14775,"ĠNorthwestern":14776,"ĠEss":14777,"Ġwhatsoever":14778,"ĠConfederate":14779,"YS":14780,"ĠCameroon":14781,"ĠFlip":14782,"Yeah":14783,"Ġwashing":14784,"mand":14785,"ĠLex":14786,"Ġissuance":14787,"Ġniche":14788,"Ġfold":14789,"ĠWendy":14790,"Ġhy":14791,"Ġbucket":14792,"ĠVW":14793,"ĠCairo":14794,"ĠSK":14795,"ĠKang":14796,"Ġintake":14797,"Ġhills":14798,"anz":14799,"©":14800,"ugu":14801,"ĠFortunately":14802,"ĠMarqu":14803,"Ġimprisonment":14804,"oking":14805,"Ġdistributors":14806,"zie":14807,"Ġstip":14808,"ĠWire":14809,"Ġcouncillors":14810,"Ġsue":14811,"ĠRegardless":14812,"ĠEnc":14813,"Ġbaking":14814,"ĠVenture":14815,"Ġintriguing":14816,"Ġupheld":14817,"ĠActive":14818,"Ġgenes":14819,"ĠDawson":14820,"ĠPreviously":14821,"ĠRac":14822,"Ġmetric":14823,"Files":14824,"ĠiPhones":14825,"ĠWelcome":14826,"Ġburns":14827,"ĠScreen":14828,"ashes":14829,"ĠApr":14830,"Ġtheories":14831,"san":14832,"ĠRenault":14833,"ĠSinger":14834,"Ġfounders":14835,"Russian":14836,"ĠBelfast":14837,"Ġimagined":14838,"ĠPlanet":14839,"ĠCatalan":14840,"ĠRochester":14841,"Ġevolve":14842,"ĠOT":14843,"Ġpassword":14844,"Ġhomelessness":14845,"Ġbacklog":14846,"Ġpresenter":14847,"Ġfal":14848,"ISH":14849,"ĠEM":14850,"icked":14851,"Ġunlock":14852,"city":14853,"Ġnegotiation":14854,"Ġdancers":14855,"dan":14856,"ĠCOL":14857,"VC":14858,"boat":14859,"Ġoverly":14860,"deal":14861,"lander":14862,"Ġdiss":14863,"ICS":14864,"Ġfifty":14865,"Ġowe":14866,"Ġprisons":14867,"ifications":14868,"wo":14869,"ĠAu":14870,"Ġapiece":14871,"ĠCourtney":14872,"Ġ1975":14873,"Ġsurpass":14874,"Ġidentities":14875,"Ġintegral":14876,"Ġdocumentation":14877,"Ġelegant":14878,"ĠIg":14879,"Ġdear":14880,"Ġ113":14881,"ĠGupta":14882,"Ġcontentious":14883,"rish":14884,"Ġclues":14885,"Ġadditions":14886,"Ġep":14887,"rus":14888,"Ġcentered":14889,"ĠPhillies":14890,"father":14891,"Ġborough":14892,"Ġbuttons":14893,"Ġdeported":14894,"ĠREC":14895,"ĠAlready":14896,"eh":14897,"hur":14898,"Ġupbeat":14899,"omen":14900,"Ġdetailing":14901,"Ġwr":14902,"Ġvaried":14903,"ĠEconomics":14904,"Ġensures":14905,"ĠCivic":14906,"Ġunpaid":14907,"sold":14908,"ĠHil":14909,"ĠMult":14910,"ĠRising":14911,"ĠMini":14912,"Ġneuro":14913,"Ġpenal":14914,"Ġneighbour":14915,"ĠChavez":14916,"Ġjew":14917,"ĠVIP":14918,"Connor":14919,"ĠTalking":14920,"Ġcorrection":14921,"Ġstandpoint":14922,"roads":14923,"ĠWool":14924,"Ġverification":14925,"Ġmic":14926,"olf":14927,"Ġexemption":14928,"Ġfilter":14929,"Ġballoon":14930,"leases":14931,"ician":14932,"ĠSpr":14933,"Ġtoe":14934,"Ġunconstitutional":14935,"Ġmanslaughter":14936,"Ġtossed":14937,"ĠMeg":14938,"ATIONS":14939,"ACK":14940,"ĠRouge":14941,"ĠHansen":14942,"ĠHook":14943,"Out":14944,"ĠHorse":14945,"ĠBath":14946,"ĠAlways":14947,"Ġincorporated":14948,"Ġconjunction":14949,"ĠFit":14950,"Ġexamining":14951,"Ġwallet":14952,"Ġensured":14953,"Ġacclaimed":14954,"ippers":14955,"Ġbeneficiaries":14956,"Ġunexpectedly":14957,"Ġexploit":14958,"ĠWillie":14959,"Ġcomb":14960,"ĠWalton":14961,"rica":14962,"icky":14963,"Ġate":14964,"ĠPadres":14965,"Ġrib":14966,"Ġsnacks":14967,"ĠFernandez":14968,"ĠMachine":14969,"ction":14970,"Ġillnesses":14971,"ĠHoffman":14972,"ĠSpaceX":14973,"Ġju":14974,"Ġswift":14975,"Ġembark":14976,"ĠRailway":14977,"Ġmeasuring":14978,"agers":14979,"arsh":14980,"Ġessence":14981,"angle":14982,"Ġolive":14983,"ĠCommander":14984,"iggs":14985,"Ġrewarded":14986,"Ġdispatched":14987,"Ġplayground":14988,"½":14989,"ĠProgramme":14990,"Ġstudios":14991,"Ġskeptical":14992,"ĠOlymp":14993,"ĠKeys":14994,"ĠSunshine":14995,"amba":14996,"ĠDonna":14997,"Ġlightly":14998,"Ġobtaining":14999,"Ġpoisoning":15000,"Ġaz":15001,"Ġ1972":15002,"Ġunconscious":15003,"ECT":15004,"Ġlied":15005,"ĠKaz":15006,"Ġ06":15007,"ĠMoving":15008,"Ġnum":15009,"oral":15010,"Ġassessments":15011,"Ġscholarships":15012,"Ġevacuate":15013,"ĠSunni":15014,"Ġquake":15015,"Ġfort":15016,"ques":15017,"ĠAlonso":15018,"Ġthread":15019,"Ġsqueeze":15020,"arat":15021,"oly":15022,"ĠAlphabet":15023,"uting":15024,"icio":15025,"ĠRetirement":15026,"ither":15027,"Ġasleep":15028,"Ġpairs":15029,"Ġmanufacture":15030,"ĠHazard":15031,"Ġsidewalk":15032,"Ġwears":15033,"ĠCraft":15034,"emen":15035,"ieth":15036,"Ġbypass":15037,"ĠLancaster":15038,"Ġflour":15039,"charge":15040,"ĠCLICK":15041,"Ġpotatoes":15042,"ĠKarachi":15043,"Ġvalley":15044,"Ġsights":15045,"Ġfallout":15046,"ords":15047,"BN":15048,"Ġsunshine":15049,"Ġundertaken":15050,"Ġcontestants":15051,"Ġaccomplishments":15052,"Ġconditioning":15053,"Ġcel":15054,"ĠHalifax":15055,"Ġaccent":15056,"***":15057,"Ġpitchers":15058,"Ġadopting":15059,"Ġjustices":15060,"Ġrip":15061,"ince":15062,"Ġelimination":15063,"Ġaerospace":15064,"ĠBeer":15065,"ĠBasin":15066,"Ġunwanted":15067,"goers":15068,"isco":15069,"ĠTwin":15070,"ĠDesert":15071,"rix":15072,"Ġdarkness":15073,"ĠDunn":15074,"City":15075,"pop":15076,"Ġ1969":15077,"ataka":15078,"Ġtal":15079,"Ġautism":15080,"ĠMcLaren":15081,"ĠUEFA":15082,"Ġclassrooms":15083,"ĠLeave":15084,"Americans":15085,"las":15086,"Ġqui":15087,"Ġundefeated":15088,"otto":15089,"ĠNRA":15090,"ĠPorsche":15091,"Ġnuts":15092,"oys":15093,"ĠMethodist":15094,"Ġatt":15095,"Ġtweeting":15096,"children":15097,"eller":15098,"Ġinquiries":15099,"Ġmillennials":15100,"ĠWembley":15101,"INS":15102,"Ġautopsy":15103,"ĠElon":15104,"ĠHicks":15105,"ugg":15106,"Ġwreck":15107,"ĠComcast":15108,"Ġstones":15109,"public":15110,"ĠKem":15111,"bedroom":15112,"ļ":15113,"itated":15114,"Ġsemic":15115,"uman":15116,"Cal":15117,"ANN":15118,"ĠGaz":15119,"Ġundisclosed":15120,"ĠPlanned":15121,"ĠYale":15122,"ĠIST":15123,"lies":15124,"ĠStanding":15125,"Ġrelieved":15126,"EO":15127,"Ġgraduating":15128,"park":15129,"ĠâĢķ":15130,"Ġpensions":15131,"rave":15132,"ĠWonder":15133,"AZ":15134,"Ġcosting":15135,"Ġeditors":15136,"Ġtotaled":15137,"Ġspacecraft":15138,"meter":15139,"Ġ02":15140,"ĠNikki":15141,"sworth":15142,"ĠCrit":15143,"asha":15144,"Ġknees":15145,"Ġhats":15146,"uity":15147,"ĠPanther":15148,"Ġtan":15149,"ĠBuzz":15150,"ĠGlad":15151,"ĠPleasant":15152,"SM":15153,"Ġtricks":15154,"Ġplac":15155,"ĠDanielle":15156,"Ġours":15157,"Ġwashed":15158,"haven":15159,"Ġdrain":15160,"ĠUttar":15161,"Ġapple":15162,"Ġjunk":15163,"Ġturkey":15164,"ĠDug":15165,"Ġdiplomacy":15166,"Ġempire":15167,"Ġpinch":15168,"Ġferry":15169,"ĠDustin":15170,"Ġ03":15171,"Ġelder":15172,"Everything":15173,"ĠProgressive":15174,"ution":15175,"VI":15176,"dam":15177,"Ġlever":15178,"ĠAustralians":15179,"Ġconsequence":15180,"itan":15181,"Ġcondemn":15182,"Ġneg":15183,"ĠOverview":15184,"Ġsuccesses":15185,"Ġprobable":15186,"ĠMirror":15187,"mor":15188,"verse":15189,"Ġevaluating":15190,"ĠBes":15191,"Ġimm":15192,"Ġharness":15193,"Ġresilient":15194,"ĠBuild":15195,"Ġstraightforward":15196,"ADE":15197,"Ġgrandparents":15198,"Ġmarched":15199,"ĠKiev":15200,"Ġchiefs":15201,"oha":15202,"Ġvest":15203,"kn":15204,"enda":15205,"ĠSev":15206,"Ġbatters":15207,"ĠJos":15208,"ĠQue":15209,"ĠCourse":15210,"ĠCorner":15211,"ĠMess":15212,"Ġmourn":15213,"keepers":15214,"ĠRegina":15215,"Everybody":15216,"Ġtrajectory":15217,"Ġdefenseman":15218,"ĠArticles":15219,"Ġspur":15220,"ĠPhD":15221,"Ġpipes":15222,"Ġduck":15223,"Ġcombining":15224,"ĠHit":15225,"ĠGeorgetown":15226,"ĠBee":15227,"Cor":15228,"Ġcomposition":15229,"Ġconnects":15230,"ĠMARK":15231,"taker":15232,"Ġcertainty":15233,"Ġhefty":15234,"ĠHezbollah":15235,"ĠShip":15236,"Ġmalicious":15237,"AI":15238,"Ġbits":15239,"Ġstyl":15240,"Ġimpaired":15241,"ĠCBI":15242,"Despite":15243,"othe":15244,"ĠRyder":15245,"ĠAlf":15246,"ifa":15247,"Ind":15248,"Ġblaming":15249,"ĠToledo":15250,"EW":15251,"ĠEssex":15252,"iated":15253,"ĠAberdeen":15254,"ANCE":15255,"Ġpossess":15256,"Ġsuperhero":15257,"Ġoverhead":15258,"quet":15259,"ĠRicky":15260,"Ġdock":15261,"ĠTelecom":15262,"Ġshelf":15263,"³":15264,"Ġmaritime":15265,"Ġportrayed":15266,"ĠYesterday":15267,"Ġcollided":15268,"Ġcookies":15269,"ĠCul":15270,"Ġindexes":15271,"Ġnaval":15272,"oval":15273,"105":15274,"ĠWeber":15275,"chief":15276,"arma":15277,"ĠRey":15278,"Ġauditor":15279,"ĠMarion":15280,"ĠMartha":15281,"ĠSally":15282,"Ġsedan":15283,"ĠAlison":15284,"nce":15285,"Es":15286,"ĠParade":15287,"Ġpharmacy":15288,"ĠKre":15289,"loe":15290,"cks":15291,"Ġmitigate":15292,"Ġdesigning":15293,"Ġ2024":15294,"Ġportable":15295,"Ġimproves":15296,"ĠAMD":15297,"Ġexcluded":15298,"CON":15299,"ĠOscars":15300,"Ġfixtures":15301,"comb":15302,"ĠBerg":15303,"Ġbother":15304,"Ġboring":15305,"Ġobservation":15306,"ĠCad":15307,"Ġrecordings":15308,"ĠCultural":15309,"Ġweaken":15310,"Ġaccuse":15311,"ĠAbd":15312,"abor":15313,"115":15314,"uffle":15315,"Ġhighways":15316,"atham":15317,"empt":15318,"ĠDeer":15319,"ĠEDT":15320,"ĠWait":15321,"athan":15322,"Ġaccumulated":15323,"Ġguilt":15324,"Ġexempt":15325,"Ġdiluted":15326,"ĠJamal":15327,"Ġshit":15328,"cross":15329,"Ġeve":15330,"Ġshirts":15331,"Ġsatisfy":15332,"ĠPaulo":15333,"AH":15334,"sic":15335,"ĠChloe":15336,"ĠCities":15337,"ĠSwansea":15338,"Ġprecision":15339,"ĠTracy":15340,"ping":15341,"Ġcontinually":15342,"Ġdemographic":15343,"Ġcliff":15344,"Ġjaw":15345,"isted":15346,"ĠDevelop":15347,"ĠAJ":15348,"Ġaisle":15349,"ĠLionel":15350,"Ġpredominantly":15351,"Ġmel":15352,"Ġlifelong":15353,"hs":15354,"Ġshouted":15355,"lad":15356,"Ġdest":15357,"Ġpacks":15358,"ĠKath":15359,"ĠCruise":15360,"fired":15361,"oder":15362,"hua":15363,"Ġgoodbye":15364,"Ġinterfere":15365,"eca":15366,"Ġré":15367,"atum":15368,"itas":15369,"ĠLodge":15370,"ĠWald":15371,"Ġmidday":15372,"umble":15373,"asting":15374,"©":15375,"ĠLeg":15376,"ĠNepal":15377,"Ġchased":15378,"idge":15379,"Ġconv":15380,"Ġfraudulent":15381,"Ġopera":15382,"Ġshr":15383,"ĠUniverse":15384,"ĠJerome":15385,"Ġ1977":15386,"ĠDancing":15387,"ĠRS":15388,"±":15389,"eks":15390,"Ġchic":15391,"Ġpunish":15392,"Ġpropose":15393,"arin":15394,"ĠChop":15395,"ĠAhead":15396,"ĠGallagher":15397,"ĠBangkok":15398,"ĠShelby":15399,"ĠNS":15400,"Ġcheek":15401,"onia":15402,"Ġrelegation":15403,"ĠHind":15404,"ĠCory":15405,"Ġfingerprint":15406,"Ġstrive":15407,"Ġmm":15408,"igs":15409,"Ġholy":15410,"Ġfavored":15411,"ĠSomeone":15412,"ĠLatino":15413,"ĠPatt":15414,"Ġchallenger":15415,"ĠCotton":15416,"Sw":15417,"itten":15418,"ĠXI":15419,"ĠStat":15420,"ĠDIS":15421,"Ġautomakers":15422,"Ġevaluated":15423,"ĠArc":15424,"Ġpersuade":15425,"Af":15426,"Ġreunited":15427,"Ġabs":15428,"Ġbride":15429,"Ġpurely":15430,"uce":15431,"uded":15432,"Ġsettling":15433,"Ġlodged":15434,"Ġfixing":15435,"Ġsuccession":15436,"ĠAlfred":15437,"ĠAlvarez":15438,"mac":15439,"ĠFont":15440,"Ġcontra":15441,"affle":15442,"Ġcopied":15443,"Ġmasses":15444,"ĠElections":15445,"ĠThan":15446,"Ġsoaring":15447,"jay":15448,"Ġsuing":15449,"Ġconcentrated":15450,"Ġconvey":15451,"Ġ240":15452,"gs":15453,"ĠNeal":15454,"Ġnasty":15455,"ĠLB":15456,"odi":15457,"ĠSergei":15458,"Ġthumb":15459,"Ġservants":15460,"Ġrevelation":15461,"Ġdischarge":15462,"ĠBright":15463,"ĠBent":15464,"ĠChrysler":15465,"mill":15466,"ĠImagine":15467,"Ġreceptions":15468,"Ġpersonalities":15469,"Ġsilly":15470,"ĠLoc":15471,"ĠZero":15472,"HI":15473,"rice":15474,"Ġgar":15475,"far":15476,"enh":15477,"ĠBiden":15478,"ĠEntreprene":15479,"Ġassumption":15480,"Ġnicely":15481,"ĠEither":15482,"|":15483,"ĠNW":15484,"ĠKens":15485,"ĠNolan":15486,"Ġowning":15487,"atures":15488,"ĠPastor":15489,"ĠRegistration":15490,"Ġexperiments":15491,"Ġassurance":15492,"Ġhashtag":15493,"oint":15494,"ĠBin":15495,"Ġqualification":15496,"center":15497,"Ġausterity":15498,"ĠPers":15499,"Ġscoop":15500,"Ġpros":15501,"ĠFields":15502,"Ġfur":15503,"ĠJas":15504,"Ġplanting":15505,"security":15506,"ĠTrain":15507,"ĠKathy":15508,"demand":15509,"ĠLev":15510,"Ġtut":15511,"tier":15512,"QU":15513,"Ġexploitation":15514,"Ġignoring":15515,"ĠSex":15516,"Ġadapted":15517,"Ġdisastrous":15518,"Ġempower":15519,"Ġcreators":15520,"ĠLay":15521,"ĠDragon":15522,"ĠWyn":15523,"Ġ1974":15524,"acious":15525,"performance":15526,"ĠTiffany":15527,"isting":15528,"Ġindividually":15529,"ĠLeading":15530,"ĠSask":15531,"Ġcatastrophic":15532,"Ġpunched":15533,"ĠVienna":15534,"Ġsurgical":15535,"Gr":15536,"odo":15537,"Ġgem":15538,"ĠMinority":15539,"Ġmice":15540,"ĠHistoric":15541,"ĠKot":15542,"caster":15543,"Ġsuff":15544,"journal":15545,"Ġpresumably":15546,"ĠBit":15547,"inary":15548,"Ġbre":15549,"Ġenhancing":15550,"Ġgru":15551,"ĠRunning":15552,"hardt":15553,"Ġtroubling":15554,"Ġpumps":15555,"ĠProspect":15556,"etic":15557,"Ġmartial":15558,"Ġcouncillor":15559,"atra":15560,"ths":15561,"ĠSark":15562,"ĠChamp":15563,"scoring":15564,"ĠWel":15565,"rup":15566,"Ġterrifying":15567,"ĠCatch":15568,"Ġinspections":15569,"Ġpornography":15570,"bra":15571,"ĠKeeping":15572,"Ġbanker":15573,"angers":15574,"ĠCrimea":15575,"ĠDisclosure":15576,"iba":15577,"Ġturf":15578,"Ġschedules":15579,"ĠJorge":15580,"ĠAcross":15581,"Ġsolving":15582,"Ġsensation":15583,"ĠWW":15584,"cial":15585,"atz":15586,"Ġlion":15587,"Ġcertificates":15588,"itive":15589,"ĠWes":15590,"ĠPrison":15591,"ĠPlayStation":15592,"duty":15593,"Ġvariable":15594,"Ġstrangers":15595,"istrates":15596,"vs":15597,"Ġreigning":15598,"Ġsliding":15599,"ĠShin":15600,"Ġtelecommunications":15601,"Ġinstalling":15602,"Ġrecogn":15603,"Ġsubway":15604,"too":15605,"ĠMcKin":15606,"ĠStoke":15607,"Ġsensitivity":15608,"bas":15609,"Ġsan":15610,"Ġ(-":15611,"ĠSuarez":15612,"Ġaverages":15613,"ammu":15614,"ĠFen":15615,"Ġrefined":15616,"outh":15617,"Ġcob":15618,"ĠLaz":15619,"essa":15620,"Ġpositioning":15621,"Three":15622,"Ġoils":15623,"Ġassaults":15624,"Ġcompanion":15625,"ĠFlash":15626,"ĠMam":15627,"ĠTill":15628,"Ġblues":15629,"ĠJae":15630,"ĠPier":15631,"Ġbedrooms":15632,"ĠHawkins":15633,"ĠCornell":15634,"Ġanswering":15635,"Ġsec":15636,"Ġrecognizes":15637,"Red":15638,"ĠJamaica":15639,"Ġinsurgents":15640,"Ġbrace":15641,"Ġra":15642,"ĠTai":15643,"ocation":15644,"ignment":15645,"Ġreasonably":15646,"inating":15647,"Ġbonuses":15648,"Ġsandwich":15649,"Ġinadequate":15650,"Ġdelicate":15651,"Ġadorable":15652,"Ġpalace":15653,"Ġsmallest":15654,"Ġpractically":15655,"ĠCrosby":15656,"Ġlevy":15657,"Ġlend":15658,"boards":15659,"shaped":15660,"Ġvulnerability":15661,"ĠKelley":15662,"Ġsponsorship":15663,"ract":15664,"Ġslew":15665,"Ġfederation":15666,"ĠLal":15667,"acies":15668,"ĠFamilies":15669,"Ġproposing":15670,"Ġhyp":15671,"elected":15672,"inkle":15673,"ĠSays":15674,"ĠApollo":15675,"ĠWis":15676,"imer":15677,"Ġcombines":15678,"Ġtim":15679,"ĠQuestion":15680,"Ġborrowers":15681,"Ġswiftly":15682,"ĠMagn":15683,"Ġheadphones":15684,"Russia":15685,"Ġtongue":15686,"Ġbye":15687,"nn":15688,"Ġseller":15689,"ĠWord":15690,"Tom":15691,"ĠDevin":15692,"ĠSurrey":15693,"Ġquad":15694,"Ġcourthouse":15695,"gi":15696,"ĠGrill":15697,">":15698,"Ġrational":15699,"ĠFlames":15700,"ĠCham":15701,"Ġvacuum":15702,"ĠRays":15703,"Ġescalating":15704,"Ġouter":15705,"Ġstretches":15706,"ĠSpeed":15707,"Ġnegatively":15708,"Ġabsorb":15709,"ĠAustrian":15710,"Ġslice":15711,"ĠDiet":15712,"Ġbun":15713,"Ġtactical":15714,"ĠCBD":15715,"Ġedges":15716,"Ġnest":15717,"Ġstrained":15718,"ulates":15719,"ĠTina":15720,"Net":15721,"ķ":15722,"ĠGos":15723,"God":15724,"White":15725,"Ġproudly":15726,"usion":15727,"ĠArlington":15728,"ĠNear":15729,"ĠMaxwell":15730,"Ġbomber":15731,"Ġcared":15732,"Ġapprovals":15733,"Ġexams":15734,"ĠEconomy":15735,"Ġposters":15736,"ĠHampton":15737,"ĠPere":15738,"ĠContract":15739,"Ġhoused":15740,"Ġinstruction":15741,"ĠJess":15742,"Ġacre":15743,"Ġcongestion":15744,"ĠGener":15745,"Ġdioxide":15746,"Ġvar":15747,"ĠAlexandria":15748,"ĠSpider":15749,"Ġcoins":15750,"Ġ225":15751,"Ġterritorial":15752,"ĠSPD":15753,"Ġfloat":15754,"null":15755,"Ġcalculate":15756,"ĠDin":15757,"eto":15758,"Ġcows":15759,"Ġpunct":15760,"Ġexpire":15761,"Ġkidnapped":15762,"Ġcou":15763,"Ġattitudes":15764,"ĠLeh":15765,"ĠHero":15766,"ĠKabul":15767,"Ġcubic":15768,"Ġdigits":15769,"ĠRES":15770,"Ġpipelines":15771,"icide":15772,"ĠSingle":15773,"Ġhurts":15774,"ĠMaz":15775,"ĠPak":15776,"Ġslate":15777,"Ġmultimedia":15778,"ADA":15779,"Mexico":15780,"ĠRelease":15781,"chard":15782,"Ġgarlic":15783,"ĠFletcher":15784,"Ġaforementioned":15785,"Ġ05":15786,"ĠParkway":15787,"Ġfirefighter":15788,"Ġcounseling":15789,"utions":15790,"Cap":15791,"Ġconsultants":15792,"ĠMeh":15793,"ouring":15794,"ĠDI":15795,"mic":15796,"phones":15797,"Ġencounters":15798,"ĠHapp":15799,"Ġcartoon":15800,"flight":15801,"Ġundertake":15802,"ĠHans":15803,"Ġplunge":15804,"ĠParenthood":15805,"Ġkickoff":15806,"ĠCelsius":15807,"ĠRas":15808,"ĠDund":15809,"ounce":15810,"Ġpurse":15811,"Ġmortality":15812,"Ġbrains":15813,"Ġconglomerate":15814,"ĠObserver":15815,"ĠSector":15816,"ĠApparently":15817,"Ġblank":15818,"iston":15819,"Ġweighs":15820,"gro":15821,"ĠPaw":15822,"ĠCOM":15823,"ĠPurdue":15824,"Ġnetted":15825,"ĠLinux":15826,"Mike":15827,"Ġfaithful":15828,"Ġmagazines":15829,"Ġheadquartered":15830,"ĠIps":15831,"Ġindications":15832,"Look":15833,"ĠElite":15834,"Ġsupreme":15835,"Ġchunk":15836,"ĠSz":15837,"ĠVine":15838,"rise":15839,"ĠYas":15840,"general":15841,"ĠOpera":15842,"Ġpriests":15843,"Assad":15844,"Ġaunt":15845,"Ġwhopping":15846,"enzie":15847,"Ġvegan":15848,"Ġinflux":15849,"ĠConsult":15850,"Ġwaiver":15851,"Having":15852,"inning":15853,"Ġproximity":15854,"Ġclassical":15855,"ĠIslanders":15856,"Ġadvertisers":15857,"ĠCe":15858,"ĠSochi":15859,"Ġmemoir":15860,"ĠPlaying":15861,"yers":15862,"Ġstud":15863,"Ġobservations":15864,"Ġadmire":15865,"Ġhiking":15866,"Ġbatter":15867,"Ġconfusing":15868,"Ġprecaution":15869,"kil":15870,"clusive":15871,"opoulos":15872,"ĠWestbrook":15873,"ĠTanzania":15874,"ĠCedar":15875,"usted":15876,"Ġdestructive":15877,"ĠIndies":15878,"osi":15879,"ĠAmid":15880,"Ġintercepted":15881,"Ġpartnering":15882,"Ġsubstances":15883,"ĠSuns":15884,"Ġpromotes":15885,"bird":15886,"Gen":15887,"aper":15888,"ĠEy":15889,"Ġterrain":15890,"Ġ1930":15891,"zon":15892,"Ġbreed":15893,"broken":15894,"uchin":15895,"ĠPrim":15896,"ĠRoland":15897,"Ġfitted":15898,"Ġprotects":15899,"Ġ114":15900,"RP":15901,"Ġdisrupted":15902,"ĠBaylor":15903,"oren":15904,"ĠKeen":15905,"Ġmansion":15906,"Ġgrassroots":15907,"ĠVictory":15908,"Ġbarn":15909,"Ġdepreciation":15910,"oped":15911,"immer":15912,"Ġgarnered":15913,"ĠLip":15914,"ĠTob":15915,"Ġcreatures":15916,"ooter":15917,"Ġconsortium":15918,"obi":15919,"ĠMonster":15920,"arks":15921,"turn":15922,"Ġsketch":15923,"Ġpredicting":15924,"Ġminimize":15925,"ĠEthan":15926,"anson":15927,"ĠAdjusted":15928,"ĠHornets":15929,"ĠNZ":15930,"ĠKathleen":15931,"ĠKier":15932,"ĠMercury":15933,"Ġghost":15934,"Ġhaw":15935,"ĠDemand":15936,"ĠCollection":15937,"ĠFortune":15938,"Ġcruel":15939,"Ġfurious":15940,"ĠKun":15941,"ĠSalem":15942,"Ġunsuccessful":15943,"ĠLomb":15944,"ĠFury":15945,"ahi":15946,"Ġenthusiastic":15947,"Ġsurgeries":15948,"ACE":15949,"Ġroller":15950,"ĠStamford":15951,"Being":15952,"Dec":15953,"check":15954,"Ġaffection":15955,"Ġgifted":15956,"Ġenerg":15957,"Ġvarying":15958,"ĠCharl":15959,"Ġsolved":15960,"ĠNV":15961,"Ġlaptops":15962,"Ġkindness":15963,"mart":15964,"ĠPenny":15965,"Ġ116":15966,"ĠFeder":15967,"ĠCisco":15968,"Ġeducators":15969,"Ġminim":15970,"Ġgangs":15971,"Ġfestivities":15972,"ĠOriginal":15973,"yre":15974,"rying":15975,"Ġtighter":15976,"ĠMalta":15977,"Ġshield":15978,"interest":15979,"Ġbuoy":15980,"Ġsupplement":15981,"ĠSof":15982,"Ġok":15983,"Ġprosecuted":15984,"Ġinterventions":15985,"Ġseize":15986,"Ġcaravan":15987,"ĠCarlson":15988,"ĠEnterprises":15989,"ĠChristina":15990,"ĠWellington":15991,"Ġaltered":15992,"TP":15993,"Ġexpresses":15994,"Ġcomfortably":15995,"Ġstaffing":15996,"afa":15997,"itu":15998,"saving":15999,"Ġinflammation":16000,"hatt":16001,"ĠMiranda":16002,"icious":16003,"Ġgrabbing":16004,"ĠANY":16005,"Ġobjections":16006,"Ġdot":16007,"cle":16008,"Ġrelates":16009,"Ġtribe":16010,"Ġboarding":16011,"ĠEpisode":16012,"ĠEnjoy":16013,"arding":16014,"Ġathletics":16015,"Ġflies":16016,"Ġmortgages":16017,"ruct":16018,"Ġink":16019,"ĠKC":16020,"ĠSecondary":16021,"Ġfer":16022,"ĠQaeda":16023,"OA":16024,"Frank":16025,"track":16026,"ĠChandler":16027,"Ġenv":16028,"ĠLeaders":16029,"ĠKemp":16030,"Ġunsafe":16031,"sponsored":16032,"San":16033,"ĠUsers":16034,"PE":16035,"ĠAccount":16036,"otta":16037,"ĠMix":16038,"ĠCindy":16039,"En":16040,"Ġ175":16041,"Ġoverlooked":16042,"Ġpublications":16043,"Ġrewarding":16044,"Ġexplicit":16045,"Ġnotch":16046,"Ġspecifics":16047,"Ġdesignation":16048,"ĠAppeal":16049,"Ġcontingent":16050,"Ġcage":16051,"ĠKol":16052,"ĠJohns":16053,"ĠReach":16054,"ĠTin":16055,"ĠAfricans":16056,"Ġprec":16057,"ĠRural":16058,"ĠDw":16059,"Ġuphold":16060,"Ġsuffers":16061,"Ġweed":16062,"inst":16063,"Ġcancellation":16064,"ĠShaun":16065,"Ġleve":16066,"Ġdivisive":16067,"Ġhel":16068,"Ġfatigue":16069,"ĠSchwartz":16070,"ĠKirst":16071,"Ġarise":16072,"Ġgrandson":16073,"ĠLawson":16074,"Ġcollaborate":16075,"Ġparticipant":16076,"ĠBryce":16077,"Ġinfield":16078,"mid":16079,"Ġut":16080,"Ġnotices":16081,"Ġsneak":16082,"ĠPAR":16083,"Chris":16084,"Ġutilize":16085,"ĠByron":16086,"ĠZhang":16087,"PF":16088,"Ġoverwhelmingly":16089,"Ġvegetable":16090,"Ġabsurd":16091,"ĠChem":16092,"etime":16093,"Ġenvoy":16094,"Ġlover":16095,"length":16096,"Ġrevolutionary":16097,"ĠYam":16098,"Ġshutting":16099,"mt":16100,"super":16101,"ĠToby":16102,"ĠCoca":16103,"Ġproposition":16104,"Ġembracing":16105,"Ġversatile":16106,"ĠWalking":16107,"Ġillicit":16108,"Ġnude":16109,"Ġunpredictable":16110,"take":16111,"Ġgotta":16112,"ĠXiaomi":16113,"Ġinstit":16114,"ĠPep":16115,"ĠPearson":16116,"Ġrejection":16117,"stead":16118,"Ġmut":16119,"Ġoutspoken":16120,"ĠBaghdad":16121,"ĠFly":16122,"Ġwholly":16123,"ĠRM":16124,"ĠFa":16125,"Ġcleaner":16126,"frey":16127,"ĠHab":16128,"ĠLiber":16129,"Ġwhereabouts":16130,"Ġchefs":16131,"Ġalumni":16132,"Ġstopp":16133,"dd":16134,"forward":16135,"rast":16136,"ĠNash":16137,"ĠCort":16138,"Ġpotent":16139,"Ġmold":16140,"Ġdistinctive":16141,"chip":16142,"ĠBrunswick":16143,"Ġpopulist":16144,"Ġplagued":16145,"eka":16146,"ĠIOC":16147,"ugs":16148,"ĠDob":16149,"Ġmagn":16150,"asser":16151,"hew":16152,"Ġcapturing":16153,"oos":16154,"Ġcrystal":16155,"Ġalarming":16156,"Ġ135":16157,"iating":16158,"Ġnap":16159,"umar":16160,"ĠExpl":16161,"Ġupgrading":16162,"Ġdecl":16163,"Ġoverturn":16164,"ARK":16165,"linked":16166,"ĠContinued":16167,"Ġslumped":16168,"ĠGaga":16169,"iful":16170,"ĠPosted":16171,"ĠRecommended":16172,"Ġsnake":16173,"Ġexplosives":16174,"Ġhind":16175,"Ġcontempt":16176,"Ġmock":16177,"NBA":16178,"Ġstall":16179,"Ġorganisers":16180,"Ġingredient":16181,"Ġblockbuster":16182,"ĠStream":16183,"ĠLeah":16184,"Pic":16185,"Ġventures":16186,"oman":16187,"Ġweakening":16188,"Ġmaximize":16189,"Ġdigging":16190,"uez":16191,"Ġdistinction":16192,"ĠMali":16193,"Ġcontaminated":16194,"Ġhij":16195,"Ġcrafts":16196,"Fl":16197,"Ġcloset":16198,"ĠRapp":16199,"Ġtowers":16200,"Ġamenities":16201,"Ġopioids":16202,"Ġcontend":16203,"load":16204,"ĠJol":16205,"ĠBooks":16206,"Ġsim":16207,"Ġthrilling":16208,"Ġmeter":16209,"ĠMultiple":16210,"Ġarbitration":16211,"Ġcracked":16212,"Pl":16213,"Ġphotographers":16214,"Te":16215,"ĠSidd":16216,"Ġexplored":16217,"170":16218,"Ġpleasant":16219,"ĠCapitals":16220,"ĠRi":16221,"ĠRandall":16222,"overed":16223,"Ġchar":16224,"ĠEverybody":16225,"ĠPolitics":16226,"Ġmoisture":16227,"Ġthriving":16228,"ĠScotia":16229,"arded":16230,"imb":16231,"ĠFantasy":16232,"Ġcemetery":16233,"ĠPath":16234,"eur":16235,"ĠSec":16236,"ĠPlatform":16237,"Ġdeparted":16238,"ĠVIDEO":16239,"ĠPant":16240,"ĠSyn":16241,"Ġ230":16242,"bleacher":16243,"live":16244,"Ġprob":16245,"Ġgymn":16246,"Ġjudged":16247,"orns":16248,"Ġstemming":16249,"umbling":16250,"ĠHew":16251,"ĠCheryl":16252,"Ġconsciousness":16253,"cos":16254,"ĠTate":16255,"CNN":16256,"Ġrecognizing":16257,"meg":16258,"Ġpant":16259,"ulk":16260,"MM":16261,"ĠPrescott":16262,"ĠMarcel":16263,"anas":16264,"Ġhappier":16265,"mag":16266,"ĠLov":16267,"Ġspreads":16268,"ĠSample":16269,"Ġpopped":16270,"HR":16271,"ĠMitt":16272,"Ġ00":16273,"Ġlabeled":16274,"Ġaspirations":16275,"?)":16276,"Ġloads":16277,"ĠBritt":16278,"hurst":16279,"ĠTeams":16280,"Ġextremists":16281,"ĠClement":16282,"lings":16283,"shirts":16284,"cheon":16285,"ĠDEL":16286,"ĠLocation":16287,"Ġpresentations":16288,"ĠFalcon":16289,"Ġtoddler":16290,"kl":16291,"Ġprone":16292,"Ġcommemor":16293,"ĠStanton":16294,"201":16295,"Ġranges":16296,"Ġfielder":16297,"Ġattends":16298,"rade":16299,"Ġproactive":16300,"Ġhostage":16301,"ĠGriffith":16302,"ockey":16303,"ĠAdding":16304,"ĠAFL":16305,"gas":16306,"istics":16307,"Ġsurgeon":16308,"Ġtsunami":16309,"2014":16310,"Ġconstraints":16311,"cu":16312,"Ġsurrendered":16313,"azed":16314,"ĠAirbnb":16315,"650":16316,"zed":16317,"Ġinjustice":16318,"dog":16319,"full":16320,"ĠHear":16321,"Ġsprawling":16322,"Ġhomeland":16323,"ĠSG":16324,"anced":16325,"Ġpools":16326,"ĠCE":16327,"Ġbeers":16328,"AE":16329,"ĠJac":16330,"Ġrecurring":16331,"Writing":16332,"Ġgenius":16333,"ĠFrost":16334,"Ġgrounded":16335,"Ġallege":16336,"lessness":16337,"Ġjumper":16338,"Ġvicious":16339,"Ġsecretly":16340,"Ġhacked":16341,"ĠAmsterdam":16342,"ibu":16343,"Ġ1971":16344,"ĠRosenstein":16345,"nick":16346,"arge":16347,"Ġladder":16348,"elled":16349,"Ġsatellites":16350,"Ġassassination":16351,"ĠDepot":16352,"built":16353,"Ġunrelated":16354,"maid":16355,"ĠDod":16356,"ĠVanderbilt":16357,"Ġboundary":16358,"ĠStafford":16359,"ĠBry":16360,"Ġtribunal":16361,"Ġoutings":16362,"Ġquantity":16363,"imming":16364,"ĠBlacks":16365,"Br":16366,"eri":16367,"uffed":16368,"Ġexplicitly":16369,"ĠBieber":16370,"AKING":16371,"Ġphotographed":16372,"ĠPolit":16373,"Ġpremature":16374,"hered":16375,"ĠVi":16376,"Ġmarsh":16377,"casters":16378,"ĠKra":16379,"Ġdried":16380,"Ġcafe":16381,"eting":16382,"Ġshaping":16383,"aram":16384,"orf":16385,"Ġrichest":16386,"Ġhurricanes":16387,"Ġcommands":16388,"Gl":16389,"anth":16390,"Ġstunt":16391,"Ġyearly":16392,"Ġdefeats":16393,"Ġconsultancy":16394,"call":16395,"Ġlag":16396,"adh":16397,"ĠPalestine":16398,"Ġcustomized":16399,"ĠScar":16400,"ĠWesley":16401,"ready":16402,"Ġpersist":16403,"Ġpacking":16404,"ono":16405,"Ġdischarged":16406,"Ġpouring":16407,"sburg":16408,"Ġreconsider":16409,"ĠMethod":16410,"enez":16411,"cill":16412,"Ġsecular":16413,"pers":16414,"Ġple":16415,"ELS":16416,"ĠMine":16417,"Ġpushes":16418,"Us":16419,"Ġframes":16420,"ĠNets":16421,"ĠSiem":16422,"ĠHitler":16423,"kill":16424,"Ġrented":16425,"Ġcharm":16426,"Ġpulls":16427,"ĠTide":16428,"Ġinsufficient":16429,"itted":16430,"Care":16431,"iera":16432,"Ġcouch":16433,"aders":16434,"ext":16435,"ĠCitizen":16436,"Ġlogical":16437,"ĠMeadows":16438,"ĠDenis":16439,"ĠDrivers":16440,"Ġrepublic":16441,"Ġadvising":16442,"Ġparamedics":16443,"insky":16444,"illard":16445,"encia":16446,"Ġkh":16447,"Ġrh":16448,"Ġfinalized":16449,"Ġreins":16450,"ĠFarrell":16451,"Ġsteer":16452,"Ġproxy":16453,"unes":16454,"ĠSoul":16455,"ĠCopper":16456,"ĠKenyan":16457,"amped":16458,"conference":16459,"sted":16460,"ĠLon":16461,"Ġreplay":16462,"ĠBle":16463,"Ġvibe":16464,"Ġportfolios":16465,"sea":16466,"Ġbeautifully":16467,"Ġairs":16468,"ĠRap":16469,"ĠKatrina":16470,"Ġberth":16471,"gold":16472,"ĠIsaiah":16473,"iques":16474,"elson":16475,"Ġrelentless":16476,"ĠHighland":16477,"ĠPhilippe":16478,"ĠFol":16479,"Ġenduring":16480,"enz":16481,"Ġaer":16482,"icing":16483,"ĠHTC":16484,"Ġdoping":16485,"ĠAlb":16486,"Ġsom":16487,"icia":16488,"Ġcoroner":16489,"Ġdamn":16490,"Ġ119":16491,"Ġwiped":16492,"ĠAuditor":16493,"hern":16494,"ĠJew":16495,"endra":16496,"osp":16497,"ĠRory":16498,"Ġshapes":16499,"ĠPablo":16500,"Ġforemost":16501,"ĠHos":16502,"ĠCunningham":16503,"145":16504,"ĠRecovery":16505,"!!!":16506,"western":16507,"Ġimaging":16508,"ĠRookie":16509,"ĠMTV":16510,"Ġunc":16511,"ĠSporting":16512,"Ġpatrons":16513,"ĠCoverage":16514,"ĠObservatory":16515,"Ġfishermen":16516,"ĠProvince":16517,"ĠAston":16518,"ĠOsh":16519,"ĠWeekend":16520,"Ġrecruits":16521,"Ġdensity":16522,"FM":16523,"ĠGorsuch":16524,"ĠErie":16525,"lining":16526,"Ġshowcased":16527,"ĠRubio":16528,"Ġchaotic":16529,"Ġattractions":16530,"Ġhug":16531,"ĠHerbert":16532,"ĠRespond":16533,"Ġhappily":16534,"Ġtor":16535,"ĠOTHER":16536,"runner":16537,"ĠShakespeare":16538,"Ġstretching":16539,"ĠJudy":16540,"wyn":16541,"ĠCafe":16542,"Ġgreens":16543,"ĠHend":16544,"Ġglam":16545,"iation":16546,"ĠKingston":16547,"Ġincremental":16548,"Live":16549,"ĠBraun":16550,"USS":16551,"reb":16552,"Ġimperative":16553,"Ġsympathy":16554,"Ġrefuge":16555,"Ġadministered":16556,"rance":16557,"ĠLiberia":16558,"Ġmobil":16559,"heads":16560,"Ġinevitably":16561,"ĠEugene":16562,"ĠBerkshire":16563,"ĠHarbour":16564,"ĠTrends":16565,"TB":16566,"Ġdeficits":16567,"Ġlistings":16568,"Ġreadings":16569,"Ġtumor":16570,"Ġoffic":16571,"opy":16572,"Ġdistracted":16573,"Ġappropriately":16574,"ĠWillis":16575,"Ġskirt":16576,"ĠTea":16577,"Ġshades":16578,"Ġbargaining":16579,"Ġretention":16580,"ĠConcert":16581,"ĠMeteor":16582,"ĠCustom":16583,"Ġinputs":16584,"ĠSah":16585,"enta":16586,"Love":16587,"ĠBurg":16588,"ĠCynthia":16589,"ĠMoses":16590,"ubb":16591,"Ġpeoples":16592,"dh":16593,"ĠFro":16594,"bean":16595,"Ġcigarette":16596,"tta":16597,"umm":16598,"Ġphenomenal":16599,"Ġyelling":16600,"Ġinaug":16601,"Ġconven":16602,"ĠGore":16603,"request":16604,"Ġcolonial":16605,"ĠAleppo":16606,"Ġdemolition":16607,"Ġamounted":16608,"Ġstaggering":16609,"Ġclips":16610,"Ġinconsistent":16611,"ĠMilton":16612,"ĠWireless":16613,"ĠReno":16614,"ĠPerkins":16615,"Ġunusually":16616,"Ġmemor":16617,"Ġhectares":16618,"Ġlat":16619,"central":16620,"ĠDig":16621,"ĠMarina":16622,"ĠPartner":16623,"daily":16624,"your":16625,"Reilly":16626,"Ġpope":16627,"phy":16628,"Ġassessing":16629,"ĠRodrigo":16630,"wi":16631,"Ġcompatible":16632,"imate":16633,"Ġgentle":16634,"ĠRhodes":16635,"Brexit":16636,"ieve":16637,"Ġbreaches":16638,"Ġchopped":16639,"Ġcancers":16640,"VEL":16641,"Ġsluggish":16642,"ĠUltra":16643,"ĠUl":16644,"Ġcrises":16645,"ONE":16646,"ĠEquipment":16647,"Ġcater":16648,"Ġadjourn":16649,"Ġreadily":16650,"ĠRolling":16651,"ĠBott":16652,"inel":16653,"ĠRule":16654,"Ġgrind":16655,"ĠHussain":16656,"ussie":16657,"Ġdepressed":16658,"ĠImperial":16659,"ongo":16660,"Ġuniforms":16661,"Ġ117":16662,"Ġchambers":16663,"ĠDum":16664,"ifi":16665,"ĠBetty":16666,"ĠTA":16667,"Ġpromotions":16668,"itary":16669,"Ġcried":16670,"Ġbranding":16671,"ĠBahamas":16672,"ĠDat":16673,"Ġantibiotics":16674,"ĠAus":16675,"Ġumbrella":16676,"Ġgradual":16677,"Ġaltercation":16678,"Ġlure":16679,"ĠJakarta":16680,"Ġunified":16681,"chin":16682,"ettes":16683,"ĠRwanda":16684,"ulations":16685,"Ġbrink":16686,"Ġbroadcasting":16687,"ĠArtist":16688,"Ġrecon":16689,"Ġaqu":16690,"ĠServ":16691,"999":16692,"ĠParticipants":16693,"ĠVentures":16694,"fight":16695,"Ġactivism":16696,"Ġstructured":16697,"Ġportal":16698,"Ġtendency":16699,"ĠAssociate":16700,"Ġcalf":16701,"ĠOrd":16702,"ĠTi":16703,"ĠFrancois":16704,"uary":16705,"ĠVik":16706,"urchase":16707,"Ġfried":16708,"Ġbooming":16709,"Ġparticles":16710,"amas":16711,"INA":16712,"Super":16713,"supp":16714,"urring":16715,"ĠWatts":16716,"affer":16717,"ĠDEC":16718,"Ġroadway":16719,"border":16720,"Ġsequ":16721,"entially":16722,"ieg":16723,"Ġcamping":16724,"Ġ750":16725,"Ġcycles":16726,"ĠReese":16727,"ĠFellow":16728,"isters":16729,"ĠVehicle":16730,"kies":16731,"ĠJonas":16732,"Ġfoundations":16733,"ĠNigel":16734,"Ġstab":16735,"Ġcongressman":16736,"ĠWichita":16737,"antes":16738,"Ġprogression":16739,"Ġditch":16740,"lik":16741,"Ġsid":16742,"Ġele":16743,"ĠMund":16744,"Ġstairs":16745,"lete":16746,"Ġlingering":16747,"Ġsadly":16748,"Ġay":16749,"Em":16750,"Ġdeadliest":16751,"soon":16752,"Ġtangible":16753,"Ġabusing":16754,"Ġcomprises":16755,"vil":16756,"ĠBun":16757,"Ġdoubling":16758,"Ġcommun":16759,"Ġslogan":16760,"Ġloading":16761,"Ġshallow":16762,"Ġattributes":16763,"Che":16764,"Ġcheering":16765,"Ġrefuses":16766,"cam":16767,"bes":16768,"hon":16769,"ĠSpartans":16770,"cept":16771,"ĠComputer":16772,"ĠCanberra":16773,"ĠWARNING":16774,"Ġstuffed":16775,"block":16776,"ĠJennings":16777,"ĠAU":16778,"atin":16779,"Ġom":16780,"Ġbachelor":16781,"Ġprediction":16782,"ĠWinner":16783,"agne":16784,"Ġrob":16785,"ĠKatherine":16786,"Ġli":16787,"ĠHumph":16788,"ĠPEOPLE":16789,"IRO":16790,"Cola":16791,"Ġguitarist":16792,"isen":16793,"ĠHighlights":16794,"Ġwelcomes":16795,"Ġprisoner":16796,"Ġpsychology":16797,"Ġextradition":16798,"Ġrou":16799,"ĠLund":16800,"Ġthoughtful":16801,"RY":16802,"orman":16803,"Alex":16804,"Ġlaughter":16805,"Ġfumble":16806,"Ġsynthetic":16807,"Ġdigit":16808,"ĠRoc":16809,"ĠFactory":16810,"ellery":16811,"ishment":16812,"ilar":16813,"ĠEarl":16814,"ĠSutton":16815,"ĠJur":16816,"ĠAllan":16817,"ĠKoreans":16818,"uki":16819,"Ġculinary":16820,"PU":16821,"Stock":16822,"stars":16823,"ĠDayton":16824,"beck":16825,"Ġinstability":16826,"ĠBring":16827,"Ġbreeding":16828,"Ġmiracle":16829,"bons":16830,"Ġdonating":16831,"ĠKick":16832,"ĠSag":16833,"afi":16834,"Ġharassed":16835,"asm":16836,"Their":16837,"inity":16838,"Ġacademics":16839,"Ġstatute":16840,"ĠAmit":16841,"Ġpressured":16842,"east":16843,"\"),":16844,"iso":16845,"220":16846,"Ġairplane":16847,"ĠMcCabe":16848,"ctions":16849,"ĠMesa":16850,"Ġsensational":16851,"ĠFE":16852,"ĠNeigh":16853,"Ġbribery":16854,"Ġflaws":16855,"Ġfemales":16856,"Ġmisses":16857,"ĠColor":16858,"ĠVietnamese":16859,"ĠMental":16860,"Unfortunately":16861,"ĠPont":16862,"Ġ1940":16863,"dry":16864,"ĠGazette":16865,"ĠAns":16866,"Ġwhistle":16867,"Ġsymbolic":16868,"Ġpossessions":16869,"ĠDriver":16870,"Ġbracket":16871,"ĠReign":16872,"oji":16873,"Ġoct":16874,"Ġtube":16875,"ĠFelix":16876,"Ġtranslated":16877,"Ġpromptly":16878,"ĠErnest":16879,"arth":16880,"Ġdumb":16881,"Ġinfluences":16882,"taking":16883,"Ġprivat":16884,"erers":16885,"Ġmalware":16886,"Ġpredictable":16887,"Ġtighten":16888,"Ġheights":16889,"Ġfairness":16890,"facing":16891,"Ġrematch":16892,"Ġpoet":16893,"Ġfundamentally":16894,"Ġcoveted":16895,"Ġlivelihood":16896,"ĠABOUT":16897,"Ġsourced":16898,"Ġdeferred":16899,"Ġslashed":16900,"ĠSchultz":16901,"Ġtriggering":16902,"ĠShiv":16903,"Ġlithium":16904,"ahead":16905,"Ġleisure":16906,"Ġbackpack":16907,"ilateral":16908,"ĠNuclear":16909,"ĠLeone":16910,"ĠNice":16911,"Ġenthusiasts":16912,"September":16913,"Ġenroll":16914,"ĠWear":16915,"erey":16916,"angs":16917,"such":16918,"Ġunpopular":16919,"Ġdisciplined":16920,"Ġshrinking":16921,"ĠBrewing":16922,"ĠReally":16923,"Ġdirective":16924,"175":16925,"Ġnotifications":16926,"Ġfortunes":16927,"ĠHour":16928,"ĠGan":16929,"ĠChurchill":16930,"ĠDodge":16931,"ĠJeep":16932,"Ġsour":16933,"Ġderived":16934,"Ġft":16935,"riv":16936,"Ġlaundry":16937,"Ġfentanyl":16938,"ĠSioux":16939,"achi":16940,"workers":16941,"Ġworkload":16942,"rooms":16943,"ĠQU":16944,"ĠTruth":16945,"Ġdefenses":16946,"Ġdunk":16947,"IJ":16948,"Ġderby":16949,"ĠMotion":16950,"ĠMayo":16951,"ĠIke":16952,"Ġpreferences":16953,"Ġped":16954,"elman":16955,"moon":16956,"Ġshoots":16957,"ĠNoel":16958,"Ġmilit":16959,"ĠCambodia":16960,"ĠMLA":16961,"Ġhonoured":16962,"fast":16963,"Ġalgorithms":16964,"Ġstormed":16965,"NT":16966,"Benz":16967,"Ġvaccines":16968,"Ġmarching":16969,"Ġ118":16970,"ĠWilmington":16971,"GM":16972,"coin":16973,"Ġunderwater":16974,"ĠClearly":16975,"Ġorgans":16976,"mir":16977,"Ġdenounced":16978,"pless":16979,"imal":16980,"ĠKom":16981,"Ġfatalities":16982,"Ġyoungster":16983,"Ġthirty":16984,"Ġinternally":16985,"222":16986,"Ġdemonstrating":16987,"Ġbusiest":16988,"Ġperpetrators":16989,"Ġstun":16990,"Both":16991,"ĠMcCoy":16992,"gn":16993,"ĠDalton":16994,"ĠDAY":16995,"Ġsacred":16996,"Ġconsuming":16997,"Ġ(+":16998,"ĠPioneer":16999,"ĠApplications":17000,"ĠBolt":17001,"ĠBarkley":17002,"ĠExpo":17003,"ĠLore":17004,"ĠPrivacy":17005,"ĠHarley":17006,"Ġtractor":17007,"Ġtenth":17008,"ĠHaiti":17009,"ÃŃn":17010,"ĠTVs":17011,"ĠCathedral":17012,"Ġunite":17013,"Ġbinding":17014,"oks":17015,"ĠJenny":17016,"Ġcaller":17017,"ĠIngram":17018,"ĠPrairie":17019,"Ġrunoff":17020,"Ġasserted":17021,"icit":17022,"ĠSie":17023,"102":17024,"ĠMB":17025,"Ġobstruction":17026,"Ġgroom":17027,"Ġtolerate":17028,"Ġcans":17029,"forth":17030,"Ġvillain":17031,"Ġdefining":17032,"ĠFrenchman":17033,"otte":17034,"Ġcontr":17035,"clock":17036,"onder":17037,"Ġprolific":17038,"ĠElectronic":17039,"ĠSak":17040,"annie":17041,"ASS":17042,"Ġmultinational":17043,"Associated":17044,"IZ":17045,"ĠBelle":17046,"Ġmand":17047,"asis":17048,"Mac":17049,"Ġpretend":17050,"ĠCommunication":17051,"Ġheartbreaking":17052,"ĠShepherd":17053,"ĠBIG":17054,"mph":17055,"ĠShield":17056,"ĠLiv":17057,"ĠStatus":17058,"Ġbikini":17059,"Ġranch":17060,"Ġpeacefully":17061,"ITCH":17062,"bourne":17063,"ĠVariety":17064,"Ġstationed":17065,"Ġhed":17066,"Ġexhausted":17067,"Ġsurpassed":17068,"Ġcatalyst":17069,"Ġsmuggling":17070,"uating":17071,"Ġ123":17072,"Ġdup":17073,"ĠSul":17074,"conf":17075,"jit":17076,"Ġmaiden":17077,"asta":17078,"ĠCalvin":17079,"borne":17080,"Ġgrim":17081,"Ġtort":17082,"cott":17083,"olas":17084,"NR":17085,"Ġbreakout":17086,"ĠHun":17087,"ĠGuatemala":17088,"Ġhistorian":17089,"ĠLawyers":17090,"ĠDisplay":17091,"Ġobstruct":17092,"ĠOsborne":17093,"Ġtherapies":17094,"ĠAub":17095,"Ġinjunction":17096,"stroke":17097,"Ġseafood":17098,"Ġhazardous":17099,"ĠWolver":17100,"ĠViolence":17101,"ĠBillion":17102,"ĠLetter":17103,"ĠWorldwide":17104,"Real":17105,"Ġexpires":17106,"Ġflawed":17107,"European":17108,"Ġrigorous":17109,"ĠSimilar":17110,"ĠSurface":17111,"ĠEF":17112,"mys":17113,"ĠFunds":17114,"ographer":17115,"Ġtribes":17116,"Ġspouse":17117,"Ġunsure":17118,"aways":17119,"Ġtrainers":17120,"arie":17121,"ĠZar":17122,"ĠComedy":17123,"ĠLit":17124,"ĠNoon":17125,"Ġgallon":17126,"Ġconsulate":17127,"ĠBras":17128,"iology":17129,"onies":17130,"ĠBelichick":17131,"ĠRoot":17132,"ĠLux":17133,"ĠSed":17134,"ĠTos":17135,"Ġinherited":17136,"tw":17137,"Ġdeaf":17138,"Ġdriveway":17139,"jah":17140,"ĠScientific":17141,"ĠNottingham":17142,"both":17143,"awan":17144,"Ġnut":17145,"ĠLebanese":17146,"ĠAAA":17147,"ĠSuzuki":17148,"ĠBU":17149,"ells":17150,"Ġspecify":17151,"ĠNotes":17152,"Ġvoluntarily":17153,"ĠMolly":17154,"Ġoutskirts":17155,"Ġbehaviors":17156,"Ġmilitia":17157,"Ġsplash":17158,"Ġpersonalized":17159,"ĠFiat":17160,"ĠKind":17161,"ĠTruck":17162,"py":17163,"ĠWIN":17164,"dist":17165,"itational":17166,"APP":17167,"ĠPelicans":17168,"ĠGam":17169,"mel":17170,"Ġmandated":17171,"Ġbalances":17172,"ĠWizards":17173,"iary":17174,"ĠAvailable":17175,"Ġkay":17176,"jin":17177,"eyed":17178,"Ġsterling":17179,"Ġconcealed":17180,"ĠFedEx":17181,"ĠPO":17182,"ĠJacqu":17183,"anted":17184,"eme":17185,"ĠDefensive":17186,"manship":17187,"Ġreliever":17188,"Ġshortstop":17189,"Ġphot":17190,"ĠGain":17191,"ĠConcern":17192,"due":17193,"Ġalgorithm":17194,"fell":17195,"ĠMountains":17196,"icians":17197,"Ġhonoring":17198,"Ġuploaded":17199,"Ġtore":17200,"GH":17201,"orde":17202,"ĠCoin":17203,"ĠAven":17204,"Ġliterary":17205,"Before":17206,"Ġtactic":17207,"Ġsocially":17208,"ĠSik":17209,"Ġthermal":17210,"Ġhor":17211,"price":17212,"Ġrooted":17213,"arrow":17214,"Ġcirculating":17215,"Ġlaughs":17216,"ĠLines":17217,"lig":17218,"Ġjudgement":17219,"....":17220,"Ġsewer":17221,"Ġdancer":17222,"ĠPens":17223,"Ġsig":17224,"ische":17225,"wives":17226,"Ġgran":17227,"ĠBron":17228,"ĠHyde":17229,"yards":17230,"Ġcandidacy":17231,"Ġhey":17232,"Ġcontributors":17233,"ĠUpdated":17234,"Ġ190":17235,"Ġhalls":17236,"Ġemphas":17237,"ĠCherry":17238,"Ġrim":17239,"Ġbilled":17240,"Ġbaked":17241,"ĠPopular":17242,"lb":17243,"Ġgravity":17244,"Under":17245,"Ġreservation":17246,"organ":17247,"ĠPict":17248,"ĠWhitney":17249,"Ġonboard":17250,"NEY":17251,"ĠBreaking":17252,"Ġflagged":17253,"rar":17254,"ĠBasic":17255,"ĠDomestic":17256,"ĠPent":17257,"Ġvigilant":17258,"Ġzoning":17259,"Fire":17260,"Ġcorrected":17261,"isbury":17262,"ĠLaure":17263,"ĠDevon":17264,"print":17265,"ĠTopics":17266,"ĠFuel":17267,"Ġcirculation":17268,"ĠPratt":17269,"Ġskiing":17270,"Ġtornado":17271,"dep":17272,"ĠUnless":17273,"ifting":17274,"Ġfool":17275,"should":17276,"Ġinspectors":17277,"Ġprotested":17278,"Ġba":17279,"ussia":17280,"Ġspun":17281,"grass":17282,"phone":17283,"Ġpotato":17284,"ĠBehind":17285,"cil":17286,"Ġconcession":17287,"Ġapplause":17288,"ĠChin":17289,"Ġceremonies":17290,"pit":17291,"Ġtraumatic":17292,"Ġbasics":17293,"Ġparameters":17294,"ĠMoz":17295,"ĠAIDS":17296,"Ph":17297,"Ġjudging":17298,"Ġlecture":17299,"Ġmunicipality":17300,"Ġcardiac":17301,"ogan":17302,"pir":17303,"could":17304,"Channel":17305,"Ġshattered":17306,"ĠAV":17307,"continental":17308,"chie":17309,"ibi":17310,"ĠOy":17311,"Mon":17312,"ĠCN":17313,"WC":17314,"Ġdistributor":17315,"ĠSavannah":17316,"Ġcleaned":17317,"ĠFlores":17318,"Ġembarrassed":17319,"Ġclay":17320,"Ġvolcano":17321,"Ġstressful":17322,"Ġsummoned":17323,"ĠSeg":17324,"Ġstatistical":17325,"ĠShak":17326,"Ġadequately":17327,"worthy":17328,"fighting":17329,"alan":17330,"Ġnecessity":17331,"Ġresidency":17332,"Ġsober":17333,"arius":17334,"ĠTaj":17335,"mount":17336,"wards":17337,"Ġaesthetic":17338,"Coin":17339,"ĠDew":17340,"were":17341,"SK":17342,"Ġpowerhouse":17343,"Ġcleanup":17344,"ĠWITH":17345,"ĠHers":17346,"ĠRao":17347,"ĠFlyers":17348,"Ġdominating":17349,"issued":17350,"ĠMcGr":17351,"Ġinsurgency":17352,"Ġburial":17353,"ĠPlains":17354,"ensive":17355,"ĠPresent":17356,"Mo":17357,"Ġnerves":17358,"Ġsmoothly":17359,"staff":17360,"Ġrestoring":17361,"ĠGeneration":17362,"Ġcommuters":17363,"ĠLegend":17364,"ĠGad":17365,"lied":17366,"Ġissuer":17367,"ĠDozens":17368,"Ġphases":17369,"ĠWu":17370,"ĠTunisia":17371,"ĠPacers":17372,"Ġdur":17373,"ĠIG":17374,"annon":17375,"sided":17376,"Ġvo":17377,"ĠNI":17378,"Ġvitamin":17379,"Ġsoc":17380,"Ġimmunity":17381,"Ġgenerates":17382,"ĠMcGu":17383,"Ġexplores":17384,"Ġassistants":17385,"Ġstems":17386,"ushed":17387,"ĠZak":17388,"ĠOwners":17389,"Ġvariant":17390,"ardy":17391,"ĠNewark":17392,"ĠCatalonia":17393,"Ġautonomy":17394,"Ġgreet":17395,"Ġawait":17396,"ĠLuckily":17397,"ĠTicket":17398,"ĠSTOR":17399,"asy":17400,"Ġincorrect":17401,"Ġconsisting":17402,"Ġperspectives":17403,"ĠQuint":17404,"Ġtotaling":17405,"Ġnortheastern":17406,"Ġcharacterized":17407,"Ġsurfaces":17408,"nation":17409,"Ġprevents":17410,"ĠSho":17411,"Ġelectorate":17412,"Ġshortfall":17413,"chy":17414,"aws":17415,"ĠAddress":17416,"Ġdefensively":17417,"quel":17418,"chester":17419,"Ġterr":17420,"ahu":17421,"lined":17422,"ĠNev":17423,"unn":17424,"Def":17425,"pc":17426,"ĠSig":17427,"Ġnonetheless":17428,"ĠSundays":17429,"ĠBAS":17430,"Ġpolicemen":17431,"ĠGoal":17432,"apa":17433,"Ġrope":17434,"Ġoutage":17435,"ĠPaso":17436,"Ġsadness":17437,"ĠGrowing":17438,"ĠKyr":17439,"Ġale":17440,"ĠBreitbart":17441,"ĠVia":17442,"ĠBrig":17443,"idence":17444,"Ġ145":17445,"quire":17446,"Ġdistraction":17447,"ĠOdd":17448,"ĠSimply":17449,"ĠNin":17450,"Ġcompetent":17451,"ded":17452,"iper":17453,"ĠKaty":17454,"ĠSolomon":17455,"Ġfeeds":17456,"ĠMort":17457,"ĠRica":17458,"affe":17459,"Ġcooperating":17460,"Ġarrivals":17461,"Ġdelete":17462,"ĠAth":17463,"Ġtrustees":17464,"Ġtub":17465,"Ġsaga":17466,"otes":17467,"ĠCJ":17468,"Ġexited":17469,"stakes":17470,"Ġinflu":17471,"2000":17472,"ĠDonovan":17473,"ĠNur":17474,"Ġoutline":17475,"Ġaudition":17476,"oked":17477,"ĠJag":17478,"money":17479,"Ġcardiovascular":17480,"song":17481,"ĠOften":17482,"ĠGoff":17483,"ĠOaks":17484,"Will":17485,"acon":17486,"Ġ?":17487,"Har":17488,"ĠLambert":17489,"atoon":17490,"ĠAF":17491,"ĠMavericks":17492,"nia":17493,"ĠChennai":17494,"\"},\"":17495,"Ġpairing":17496,"mad":17497,"ause":17498,"ĠRide":17499,"111":17500,"ĠFallon":17501,"ĠHyder":17502,"ĠPiper":17503,"Ġfilmmakers":17504,"icon":17505,"ĠBeau":17506,"Ġbutt":17507,"lot":17508,"Ġrifles":17509,"Ġsunglasses":17510,"ĠTRA":17511,"Ġmagnetic":17512,"arty":17513,"ĠYo":17514,"ĠWeight":17515,"?!":17516,"ether":17517,"Ġaspir":17518,"Ġhunters":17519,"Ġcontamination":17520,"Ben":17521,"political":17522,"],\"":17523,"ĠBever":17524,"Ġmonuments":17525,"won":17526,"auc":17527,"Ġexpressions":17528,"Ġlakes":17529,"iao":17530,"abin":17531,"Ġpleading":17532,"Ġdiscounted":17533,"Ġdisappoint":17534,"ĠTW":17535,"craft":17536,"Ġsocieties":17537,"ĠAugusta":17538,"Ġbott":17539,"Ġmarker":17540,"ĠWrestling":17541,"CBC":17542,"athy":17543,"ĠAZ":17544,"Ġfabulous":17545,"valued":17546,"Ġoptical":17547,"Ġshaken":17548,"OSS":17549,"ĠImp":17550,"ĠAUD":17551,"inals":17552,"Ġrevital":17553,"Ġcontroller":17554,"Ġgrasp":17555,"uling":17556,"ĠFrederick":17557,"ague":17558,"bull":17559,"ĠLadies":17560,"Ġdisruptive":17561,"Ġbenefiting":17562,"Ġverge":17563,"ĠDak":17564,"Ġgrabs":17565,"ĠPAC":17566,"GN":17567,"ĠMcMahon":17568,"rob":17569,"ĠEspecially":17570,"ĠChrome":17571,"ĠBundesliga":17572,"104":17573,"Ġliberty":17574,"ĠSF":17575,"Ġvarieties":17576,"East":17577,"Ġgrowers":17578,"Ġsocialist":17579,"Ġunemployed":17580,"AMI":17581,"Ġtotals":17582,"ĠGib":17583,"Ġdefect":17584,"ĠOrtiz":17585,"ĠPerfect":17586,"Ġpraying":17587,"ISS":17588,"Ġul":17589,"Ġthrust":17590,"osc":17591,"ĠOtherwise":17592,"Ġobsessed":17593,"Ġ650":17594,"ĠWebsite":17595,"Ġspectators":17596,"ĠScout":17597,"ĠBoone":17598,"ĠDillon":17599,"Ġabortions":17600,"lect":17601,"utz":17602,"Ġvillagers":17603,"Ġaccelerating":17604,"Ġslap":17605,"Ġvague":17606,"Ġjurisdictions":17607,"League":17608,"ĠUruguay":17609,"Ġobstacle":17610,"Ġmanufactures":17611,"Ġcampaigned":17612,"ĠAdvance":17613,"ĠNort":17614,"emer":17615,"Ġ1964":17616,"Ġirre":17617,"Ġprog":17618,"ĠFeatured":17619,"Ġcommute":17620,"Ġhandset":17621,"akis":17622,"ĠArs":17623,"tail":17624,"iker":17625,"Ġcrafted":17626,"Ġupl":17627,"ĠMarcos":17628,"Looking":17629,"Ġseated":17630,"ĠBoat":17631,"Ġreadiness":17632,"ĠLLP":17633,"otechnology":17634,"facebook":17635,"ĠScouts":17636,"ĠEar":17637,"ĠAdv":17638,"ĠDemocracy":17639,"NI":17640,"oci":17641,"ĠSnapdragon":17642,"Saturday":17643,"ĠPra":17644,"ĠCoastal":17645,"ĠVoters":17646,"ĠLeigh":17647,"ohn":17648,"orry":17649,"Ġtechnicians":17650,"armed":17651,"Ġshrink":17652,"Ġspinning":17653,"agram":17654,"320":17655,"liner":17656,"ĠContest":17657,"ĠCountries":17658,"Ġfarewell":17659,"ĠCW":17660,"aris":17661,"Ġstorytelling":17662,"Ġpasser":17663,"Ġsailing":17664,"control":17665,"Ġdissent":17666,"ĠRih":17667,"Ġedit":17668,"Ġspoilers":17669,"itched":17670,"ĠBentley":17671,"Ġcant":17672,"mn":17673,"ĠMacy":17674,"Ġindefinitely":17675,"Ġvill":17676,"Ġmeth":17677,"ĠEL":17678,"Ġoptional":17679,"Ġremark":17680,"ĠVanessa":17681,"ã":17682,"Ġmasks":17683,"ĠProvincial":17684,"Ġculprit":17685,"ĠTol":17686,"Ġsnack":17687,"ĠInfinity":17688,"ĠPub":17689,"Ġbrakes":17690,"Ġclar":17691,"Ġinception":17692,"love":17693,"Ġwonders":17694,"Ġforged":17695,"ĠCEOs":17696,"Ġspecifications":17697,"irst":17698,"ension":17699,"ĠMarin":17700,"det":17701,"Ġordeal":17702,"ĠFeed":17703,"December":17704,"Ġstrokes":17705,"fect":17706,"orial":17707,"Ġshowcasing":17708,"Ġstack":17709,"UAL":17710,"ĠAlexandra":17711,"Ġpoison":17712,"ĠFry":17713,"ĠCars":17714,"Ġprototype":17715,"ĠUSDA":17716,"ĠIF":17717,"flows":17718,"Ġtailored":17719,"ĠGear":17720,"Ġmyth":17721,"Ġplatinum":17722,"seven":17723,"founded":17724,"encing":17725,"ĠTip":17726,"ĠMald":17727,"Ġgeopolitical":17728,"112":17729,"Ġenqu":17730,"ĠNR":17731,"ĠNadu":17732,"leen":17733,"ĠTat":17734,"Ġcolon":17735,"ĠSize":17736,"Ġvis":17737,"Ġbere":17738,"ĠAnnie":17739,"ĠWatkins":17740,"Ġpumping":17741,"cur":17742,"ĠBates":17743,"Ġslug":17744,"miss":17745,"Ġforecasting":17746,"source":17747,"Ġacknowledges":17748,"Ġprosecute":17749,"Ġtestament":17750,"Ġcum":17751,"ems":17752,"Ġsocks":17753,"ĠSame":17754,"Ġcompetitiveness":17755,"Ġdefinitive":17756,"Ġintensified":17757,"Ġsatisfying":17758,"Ġphysics":17759,"ĠHarden":17760,"Ġsubsidy":17761,"Men":17762,"ĠPaddock":17763,"Ġworkouts":17764,"ĠSaw":17765,"Ġcrisp":17766,"ĠBezos":17767,"ĠVote":17768,"Ġguiding":17769,"anged":17770,"Ġstaple":17771,"ŀ":17772,"ules":17773,"ĠAvengers":17774,"Ġoptim":17775,"ĠBuffett":17776,"Ġtimetable":17777,"oust":17778,"HE":17779,"ĠGrab":17780,"Have":17781,"cca":17782,"Ġwaived":17783,"Ġretaining":17784,"Ġaber":17785,"Ġoffline":17786,"Ġvigil":17787,"books":17788,"ĠRein":17789,"Ġacknowledging":17790,"ĠDoyle":17791,"Ġproteins":17792,"Ġmixing":17793,"ĠAlcohol":17794,"ĠJD":17795,"Ġsyn":17796,"Ġthieves":17797,"Ġhomemade":17798,"Ġfeminist":17799,"ĠRoosevelt":17800,"ĠCoal":17801,"Ġwishing":17802,"ĠSIGN":17803,"ĠLad":17804,"Ġempathy":17805,"ĠBrooke":17806,"ĠMash":17807,"inations":17808,"''":17809,"ulators":17810,"Ġdrastically":17811,"Ġfloral":17812,"ĠGuild":17813,"Ġundercover":17814,"ĠLaboratory":17815,"ĠRank":17816,"Ġrestraining":17817,"Ġparagraph":17818,"Ġpersona":17819,"ĠEmployment":17820,"ogs":17821,"ĠGw":17822,"ĠMedal":17823,"Ġwildly":17824,"fare":17825,"ĠCNBC":17826,"photo":17827,"Ġtransforming":17828,"Ġtermination":17829,"still":17830,"INT":17831,"Ġbal":17832,"ĠEconom":17833,"ĠLarson":17834,"Ġheck":17835,"Ġquantitative":17836,"Ġemergence":17837,"esta":17838,"Ġknot":17839,"Ġwhale":17840,"ĠðŁĺ":17841,"Ġperimeter":17842,"Ġempowerment":17843,"Ġmg":17844,"Ġrents":17845,"Ġrefreshing":17846,"Ġleasing":17847,"Ġpatents":17848,"andi":17849,"Ġfathers":17850,"Ġunse":17851,"Ġprocessors":17852,"Down":17853,"Ġreversal":17854,"veh":17855,"andal":17856,"ĠKov":17857,"Blue":17858,"Ġspecializes":17859,"Link":17860,"ĠConsidering":17861,"ĠEdmund":17862,"Ġneo":17863,"agger":17864,"rg":17865,"Ġseverity":17866,"Ġcour":17867,"RL":17868,"ĠTeresa":17869,"Ġgallons":17870,"Ġacquitted":17871,"Ġaccompl":17872,"Ġcracks":17873,"Ġsciences":17874,"Club":17875,"Ġpredicts":17876,"ĠVu":17877,"Ġhints":17878,"ĠZack":17879,"Ġrefurb":17880,"Ġdestabil":17881,"ĠSamar":17882,"ĠInfo":17883,"fs":17884,"Ġratios":17885,"Ġinherent":17886,"ĠContinental":17887,"Ġtreasure":17888,"Ġcaucus":17889,"Ġenact":17890,"orporated":17891,"ineries":17892,"Ġtastes":17893,"main":17894,"Ġsq":17895,"ickson":17896,"corruption":17897,"ulture":17898,"ĠGoodman":17899,"ĠLing":17900,"ĠSup":17901,"Ġexposing":17902,"immers":17903,"Ġresponds":17904,"heimer":17905,"Air":17906,"ĠFigures":17907,"Ġlongstanding":17908,"ĠAnalytics":17909,"Ġenforced":17910,"Ġnickname":17911,"Ġclinch":17912,"ĠCarpenter":17913,"ĠPharma":17914,"Ġconstructive":17915,"Ġgel":17916,"ĠSham":17917,"ĠTOP":17918,"ĠDerrick":17919,"ör":17920,"birds":17921,"ĠTong":17922,"ĠBatman":17923,"ĠRouhani":17924,"ĠOlive":17925,"ĠRiv":17926,"Ġdessert":17927,"Ġguides":17928,"Ġsag":17929,"Ġchemotherapy":17930,"Ġslept":17931,"ĠFranc":17932,"ĠDunk":17933,"writers":17934,"ĠÃĹ":17935,"Ġ401":17936,"Ġoutfielder":17937,"ĠHamburg":17938,"izu":17939,"Ġscr":17940,"Ġcomparisons":17941,"Ġwhites":17942,"Ġtraits":17943,"Ġcollateral":17944,"LEY":17945,"ideshow":17946,"Ġstatutory":17947,"Ġruin":17948,"Ġsituated":17949,"tem":17950,"Ġinject":17951,"rage":17952,"550":17953,"Ġfactions":17954,"ĠNaomi":17955,"cutting":17956,"Ġcommunicating":17957,"Ġrailroad":17958,"Ġsparking":17959,"Ġrespiratory":17960,"ĠWebster":17961,"ĠCarbon":17962,"Ġundertaking":17963,"Ġcomposer":17964,"ĠFigure":17965,"Ġspecified":17966,"Video":17967,"uber":17968,"Ġsexuality":17969,"lected":17970,"ĠBurger":17971,"ĠCards":17972,"SR":17973,"ĠLie":17974,"Ġrecount":17975,"Ġexceeding":17976,"Ġquoting":17977,"ĠJama":17978,"ĠVictorian":17979,"Ġsway":17980,"ĠGes":17981,"ĠSI":17982,"ĠKazakhstan":17983,"Ġaccusation":17984,"etr":17985,"Ah":17986,"Ġproc":17987,"Ġlamb":17988,"ĠMorales":17989,"ĠLily":17990,"Ġderail":17991,"Ġcontributes":17992,"iddle":17993,"ĠConcord":17994,"Ġelectr":17995,"Ġequip":17996,"Ġquantum":17997,"Ġthereafter":17998,"Ġarrange":17999,"Ġraided":18000,"ĠMove":18001,"ĠSang":18002,"ĠGaming":18003,"Ġbiology":18004,"ĠAmnesty":18005,"Ġdemise":18006,"ĠBarton":18007,"Ġqualifier":18008,"ANI":18009,"Ġundersc":18010,"Ġroyalty":18011,"ĠINC":18012,"Ġsne":18013,"ariat":18014,"ĠWan":18015,"Ġcluster":18016,"quin":18017,"Ġwhales":18018,"ĠFear":18019,"ĠBrew":18020,"Ġdeport":18021,"airs":18022,"Ġcensus":18023,"OUS":18024,"Ġrespectful":18025,"bone":18026,"Ġwaivers":18027,"friend":18028,"Ġsystemic":18029,"ĠDion":18030,"James":18031,"ĠAdmission":18032,"Ġstigma":18033,"ĠTIME":18034,"Ġunderpin":18035,"ĠWitnesses":18036,"Ġdigs":18037,"Ġgenocide":18038,"Ġstaging":18039,"rolled":18040,"Ġspecially":18041,"oop":18042,"Ġbaseline":18043,"ĠRF":18044,"avis":18045,"Ġvocals":18046,"COL":18047,"LD":18048,"Ġimpending":18049,"ĠCaldwell":18050,"Ġaluminium":18051,"Ġstra":18052,"ĠTayyip":18053,"Ġadmissions":18054,"falls":18055,"Ġrealizing":18056,"oen":18057,"ĠRV":18058,"ĠMog":18059,"Ġadvocating":18060,"ĠPepper":18061,"lived":18062,"ĠWick":18063,"Facebook":18064,"ĠSpect":18065,"Ġshout":18066,"Ġfractured":18067,"vet":18068,"Ġ1966":18069,"Ġcompensate":18070,"ĠVolume":18071,"Ġcategor":18072,"ĠHuntington":18073,"Free":18074,"OUGH":18075,"local":18076,"Sch":18077,"uti":18078,"Ġburger":18079,"Ġbush":18080,"Ġimpacting":18081,"Ġfrost":18082,"tti":18083,"ĠFresno":18084,"onz":18085,"shaw":18086,"ĠLibyan":18087,"Ġassert":18088,"ĠLegacy":18089,"ĠIE":18090,"ĠKinder":18091,"ĠHorizon":18092,"Ġtum":18093,"Ġsignaled":18094,"ĠFors":18095,"Ġspeedy":18096,"rang":18097,"ĠFT":18098,"Ġselecting":18099,"Ġpale":18100,"WD":18101,"Ġprobability":18102,"OUND":18103,"istrate":18104,"Ġsens":18105,"ocating":18106,"Ġinterpret":18107,"Ġpuzzle":18108,"Ġinland":18109,"Ġmanipulation":18110,"Sal":18111,"Ġfulfilling":18112,"ĠMcMaster":18113,"Make":18114,"jun":18115,"giving":18116,"ĠNiagara":18117,"Ġscholars":18118,"ALT":18119,"ĠSteam":18120,"omin":18121,"ĠSau":18122,"ĠDowning":18123,"Ġgy":18124,"ĠTit":18125,"ĠLav":18126,"ĠPepsi":18127,"Ġdumping":18128,"ĠDetect":18129,"ĠTDs":18130,"ĠKob":18131,"ĠSY":18132,"Ġpioneer":18133,"Ġ_":18134,"Ġclarified":18135,"ĠTests":18136,"opic":18137,"ĠMN":18138,"ĠBowman":18139,"umin":18140,"Ġwidow":18141,"Ġrallying":18142,"ĠPull":18143,"Ġprojection":18144,"Ġescalation":18145,"Ġlibraries":18146,"ĠFounder":18147,"ĠHugo":18148,"ĠStyle":18149,"Ġfreelance":18150,"Ġlisteners":18151,"Ġdiscovering":18152,"ĠPlans":18153,"Ġfranchises":18154,"ĠPam":18155,"Ġfarther":18156,"UI":18157,"opers":18158,"103":18159,"ublished":18160,"keys":18161,"aky":18162,"Ġinnov":18163,"¦":18164,"ĠDrum":18165,"Ġwraps":18166,"ĠCongressman":18167,"ĠVenus":18168,"fake":18169,"ĠBronx":18170,"ĠDinner":18171,"faced":18172,"Ġbackward":18173,"inge":18174,"Ġarsenal":18175,"ĠAce":18176,"uden":18177,"fre":18178,"Ġspa":18179,"ĠSaunders":18180,"ĠMatter":18181,"ĠSpons":18182,"Ġconsultations":18183,"ĠRuss":18184,"Ġsculpture":18185,"Ġuncommon":18186,"Nov":18187,"pg":18188,"otherapy":18189,"Ġgol":18190,"ĠBlazers":18191,"Ġadvises":18192,"ĠRegulatory":18193,"ĠBoyle":18194,"Äģ":18195,"Ġcuisine":18196,"Ġencouragement":18197,"yp":18198,"eny":18199,"ĠOrchestra":18200,"ĠChicken":18201,"Ġ1965":18202,"ĠPret":18203,"ĠCooperation":18204,"ĠDevices":18205,"ĠRodney":18206,"ĠHonduras":18207,"ĠEgg":18208,"Ġchurn":18209,"Ġclutch":18210,"ĠBernstein":18211,"Ġain":18212,"Ġformidable":18213,"ĠFacility":18214,"Ġpag":18215,"mons":18216,"bol":18217,"Ġliteracy":18218,"Ġsubmissions":18219,"ĠHulu":18220,"ĠConstitutional":18221,"ĠIsh":18222,"ĠPaula":18223,"olve":18224,"Ġabundance":18225,"ĠAla":18226,"ĠEcuador":18227,"Ġreconstruction":18228,"Ġcrush":18229,"reek":18230,"ĠÂŃ":18231,"ibo":18232,"Ġpracticed":18233,"Ġpac":18234,"rett":18235,"Ġpasta":18236,"Ġresp":18237,"ĠFlag":18238,"pal":18239,"Ġcommenting":18240,"Ġrecap":18241,"âĢĶâĢĶ":18242,"ĠToy":18243,"ĠMeredith":18244,"Ġreceipt":18245,"Ġseparating":18246,"ĠMap":18247,"Ġmogul":18248,"ĠBurlington":18249,"Ġger":18250,"Ġcoordinate":18251,"grad":18252,"Ġescalated":18253,"Ġproceeded":18254,"turned":18255,"Ġupt":18256,"hum":18257,"ĠWere":18258,"Whether":18259,"Ġenjoyable":18260,"energy":18261,"Ġprohibit":18262,"Ġhurdle":18263,"Ġdivorced":18264,"Ġcommentator":18265,"GT":18266,"ATH":18267,"Ġtravellers":18268,"Ġpopulated":18269,"ĠVo":18270,"ĠRebels":18271,"Ġspurred":18272,"Ġideological":18273,"Ġelephant":18274,"keyes":18275,"Pat":18276,"Ġlinger":18277,"Ġreps":18278,"Ġcocktails":18279,"ĠKristen":18280,"istically":18281,"Ġgunmen":18282,"Ġ1920":18283,"Ġquart":18284,"National":18285,"Ġexceptions":18286,"kat":18287,"priced":18288,"ĠHarold":18289,"ĠPistons":18290,"Ġcompounds":18291,"Ġmouse":18292,"Ġexhibits":18293,"ĠBurk":18294,"Ġclassmates":18295,"Ġcirculated":18296,"Ġattributable":18297,"ĠBaton":18298,"Ġorganizer":18299,"Ġdurable":18300,"Ġsingers":18301,"ĠOman":18302,"Ġhydrogen":18303,"Ġslash":18304,"Ġaccidental":18305,"ĠAbrams":18306,"KS":18307,"itty":18308,"Ġrust":18309,"Ġselections":18310,"porting":18311,"ĠEmanuel":18312,"XX":18313,"ĠThornton":18314,"Ġcolumns":18315,"Ġsentiments":18316,"fun":18317,"Ġplight":18318,"ĠSister":18319,"ĠMaggie":18320,"hya":18321,"Daniel":18322,"Ġplung":18323,"orio":18324,"ĠYorker":18325,"ĠSaturdays":18326,"Ġloc":18327,"aye":18328,"illon":18329,"ĠConsulting":18330,"pled":18331,"ĠZin":18332,"ĠFarms":18333,"ĠGiuliani":18334,"ĠMIN":18335,"ĠHanson":18336,"ĠComplete":18337,"ourke":18338,"oche":18339,"ĠJord":18340,"Ġprofessors":18341,"ĠWILL":18342,"ĠCron":18343,"Ġdorm":18344,"Ġcracking":18345,"tur":18346,"ORS":18347,"Ant":18348,"Ġdeduction":18349,"ĠSIM":18350,"igue":18351,"ĠValent":18352,"ĠEthereum":18353,"ĠSunny":18354,"ĠExtra":18355,"ivan":18356,"ĠFo":18357,"Ġleases":18358,"ibe":18359,"Ġ1800":18360,"Ġslapped":18361,"emaker":18362,"Ġfa":18363,"rien":18364,"ĠPeriod":18365,"ĠES":18366,"ĠBlu":18367,"Ġpreserving":18368,"Ġsmarter":18369,"mans":18370,"Ġgest":18371,"zu":18372,"nu":18373,"Ġdivest":18374,"roc":18375,"ĠFlood":18376,"Given":18377,"ĠNorton":18378,"Ġgranting":18379,"Ġdealings":18380,"Ġgeographic":18381,"esa":18382,"Ġcub":18383,"Ġcriticizing":18384,"ĠCub":18385,"Ġsurroundings":18386,"ĠInternal":18387,"Ġsle":18388,"Ġcrushing":18389,"ĠPP":18390,"izations":18391,"ĠAbdel":18392,"Joe":18393,"ĠVisitors":18394,"ĠCarly":18395,"INGTON":18396,"ĠGC":18397,"ĠWB":18398,"Ġgently":18399,"·":18400,"though":18401,"ĠAlto":18402,"Ġresting":18403,"ĠPerson":18404,"ĠTon":18405,"Ġbore":18406,"ĠClar":18407,"Ġmot":18408,"Ġbathrooms":18409,"ĠTypically":18410,"Ġdisconnect":18411,"Ġtightly":18412,"ĠHarvest":18413,"ĠHed":18414,"ĠGermans":18415,"atar":18416,"Ġkeynote":18417,"Ġimproper":18418,"fil":18419,"Ġintens":18420,"iev":18421,"Ġmedi":18422,"Ġtenant":18423,"Ġfootsteps":18424,"uli":18425,"Ġlegalization":18426,"106":18427,"ĠLexington":18428,"folio":18429,"Ġ½":18430,"ĠRita":18431,"Ġbattered":18432,"inka":18433,"ĠJavaScript":18434,"ĠMusical":18435,"ĠTalent":18436,"Ġlounge":18437,"Ġintimidation":18438,"ikh":18439,"ĠFam":18440,"Ġtherapeutic":18441,"Ġbalancing":18442,"Ġrocky":18443,"liners":18444,"ĠPredators":18445,"Ġregistering":18446,"Ġdiligence":18447,"ĠRover":18448,"ĠDot":18449,"Ġterminated":18450,"ĠEdu":18451,"Ġcharming":18452,"ĠPLAY":18453,"ĠFact":18454,"ĠCi":18455,").\"":18456,"ĠWrestle":18457,"hun":18458,"Ġopenings":18459,"Ġfou":18460,"Ġ126":18461,"spe":18462,"ĠAW":18463,"Ġbud":18464,"ĠTemper":18465,"ĠOrthodox":18466,"Ġprogressed":18467,"tre":18468,"Ġtasting":18469,"Ġscrutin":18470,"ĠLima":18471,"Ġlayout":18472,"Ġlitter":18473,"ijk":18474,"ĠParkinson":18475,"ĠAnfield":18476,"Ġdevelopmental":18477,"Ġheaven":18478,"ĠWoodward":18479,"index":18480,"Ġpistol":18481,"Ġreson":18482,"ĠWS":18483,"Ġemb":18484,"ĠLap":18485,"ĠPle":18486,"lington":18487,"ĠSit":18488,"Ġabruptly":18489,"ĠSenegal":18490,"ĠYates":18491,"aceutical":18492,"ĠJak":18493,"ĠHastings":18494,"iste":18495,"ĠDB":18496,"ĠAgent":18497,"Ġpreservation":18498,"ĠLank":18499,"ĠSuffolk":18500,"Ġboo":18501,"essed":18502,"Ġempowering":18503,"enne":18504,"Ġrecycled":18505,"Ġstrateg":18506,"Ġbrake":18507,"135":18508,"ĠStef":18509,"ĠFlake":18510,"ĠGregg":18511,"ĠRent":18512,"Ġinstallment":18513,"FW":18514,"ĠCran":18515,"obo":18516,"ml":18517,"ĠJade":18518,"Ġaccuses":18519,"ĠNvidia":18520,"Ġburg":18521,"High":18522,"Ġbothered":18523,"ĠBenn":18524,"Ġinterrupted":18525,"Ġtrek":18526,"Ġserv":18527,"Ġpatron":18528,"Ġdictator":18529,"owa":18530,"jad":18531,"ĠTulsa":18532,"Ġboil":18533,"Ġdisplaying":18534,"Ġcinem":18535,"awaited":18536,"¸":18537,"Ġreacts":18538,"ĠDee":18539,"ĠGron":18540,"igation":18541,"Ġservic":18542,"capt":18543,"Ġinsane":18544,"ĠVeteran":18545,"umen":18546,"End":18547,"ĠCream":18548,"Ġextremism":18549,"ĠMalone":18550,"Col":18551,"Ġsafeguard":18552,"Ġtomatoes":18553,"die":18554,"Ġchamp":18555,"zero":18556,"ĠPRES":18557,"Ġchoir":18558,"Ġpediatric":18559,"Ġprivileged":18560,"Ġdownstream":18561,"Business":18562,"ĠFighting":18563,"atable":18564,"Ġsums":18565,"Ġinsult":18566,"arten":18567,"ĠWikiLeaks":18568,"Ġpads":18569,"Ġretali":18570,"ĠHunts":18571,"Ġindie":18572,"ĠShields":18573,"ĠMortgage":18574,"oses":18575,"ampton":18576,"ĠVideos":18577,"ĠPER":18578,"itionally":18579,"ĠKimmel":18580,"sum":18581,"trade":18582,"acity":18583,"marked":18584,"ĠAngus":18585,"Ġtemper":18586,"Ġseizure":18587,"Ġfictional":18588,"utton":18589,"eva":18590,"Rs":18591,"Ġintra":18592,"ĠRequest":18593,"ppe":18594,"ĠeBay":18595,"ĠUSS":18596,"Ġ1500":18597,"Ġpossessing":18598,"Ġbacon":18599,"ĠSexual":18600,"ĠBuff":18601,"Ġslaughter":18602,"Ġjur":18603,"zhou":18604,"suit":18605,"ĠCha":18606,"ĠBuk":18607,"crime":18608,"ĠEasy":18609,"ĠChain":18610,"aq":18611,"ĠPall":18612,"flation":18613,"225":18614,"oup":18615,"109":18616,"ĠMcKenzie":18617,"Ġclearer":18618,"ĠDogs":18619,"oration":18620,"Ġsubs":18621,"Follow":18622,"ĠShirley":18623,"Ġadjusting":18624,"ĠEFF":18625,"Ġflipped":18626,"Ġconform":18627,"ĠLaurent":18628,"Ġcircular":18629,"ĠNOR":18630,"Ġmort":18631,"Ġtexture":18632,"avour":18633,"Ġflex":18634,"ĠHedge":18635,"ðŁĺ":18636,"Ġtrophies":18637,"ĠINV":18638,"Ġboast":18639,"ĠTyr":18640,"ĠNichols":18641,"ĠSpa":18642,"Ġcheered":18643,"Ġprey":18644,"reach":18645,"Ġbreached":18646,"ĠRegions":18647,"ĠLyft":18648,"ĠTul":18649,"ĠKore":18650,"Ġendure":18651,"ĠCover":18652,"\").":18653,"ĠSavage":18654,"ère":18655,"reens":18656,"Ġnic":18657,"sector":18658,"Ġweaknesses":18659,"Ġreboot":18660,"Ġ210":18661,"Ġimagery":18662,"ĠFrem":18663,"Ġclue":18664,"ĠLars":18665,"Ġfaction":18666,"hetic":18667,"Ġallied":18668,"ĠMarvin":18669,"Ġmethodology":18670,"ĠTN":18671,"Ġutter":18672,"Ġ270":18673,"ĠVolvo":18674,"oline":18675,"ĠACLU":18676,"Ġindirect":18677,"Ġminer":18678,"ĠBale":18679,"ĠStrange":18680,"ĠFuller":18681,"Ġexpelled":18682,"ĠTropical":18683,"Ġremotely":18684,"ĠTIM":18685,"Ġinnocence":18686,"Ġconfined":18687,"Ġfares":18688,"Ġprevalent":18689,"Ġdesp":18690,"House":18691,"azar":18692,"Ġgestures":18693,"ĠCES":18694,"ĠDM":18695,"eal":18696,"ĠÐ":18697,"Ġburnt":18698,"Ġframed":18699,"ĠDani":18700,"Ġhol":18701,"ĠCannes":18702,"ĠHayden":18703,"Ġwardrobe":18704,"ĠAssange":18705,"ĠSamp":18706,"bay":18707,"sky":18708,"ĠHence":18709,"ĠGrizzlies":18710,"rates":18711,"laws":18712,"ĠMandela":18713,"ĠHoover":18714,"rics":18715,"charged":18716,"Ġexclude":18717,"Ġpassive":18718,"Ġcontinuation":18719,"Ġblunt":18720,"Ġvac":18721,"ĠEmerging":18722,"rench":18723,"tv":18724,"ĠHollow":18725,"ĠOC":18726,"Ġadvisors":18727,"Ġrendered":18728,"ĠBernardino":18729,"ĠSupporters":18730,"ronic":18731,"Ġchancellor":18732,"Ġ1963":18733,"Ġuranium":18734,"Ġak":18735,"ĠOptions":18736,"ermott":18737,"ĠBerger":18738,"ibia":18739,"Ġexplosions":18740,"Ġimpairment":18741,"Ġhail":18742,"Ġalley":18743,"Ġcruelty":18744,"ĠClarence":18745,"Ġvariations":18746,"Ġrealm":18747,"Ġrenovations":18748,"ĠNorwich":18749,"Ġbelongings":18750,"Ġmerchants":18751,"ĠMinisters":18752,"ĠDodd":18753,"Ġviewer":18754,"Ġneutrality":18755,"quer":18756,"ĠPrinceton":18757,"dead":18758,"arest":18759,"GET":18760,"ĠCanadiens":18761,"ĠIgn":18762,"clear":18763,"Mal":18764,"ĠBridges":18765,"ĠHayward":18766,"Ġremarked":18767,"ingle":18768,"Ġsob":18769,"Ġdepart":18770,"beans":18771,"Ġpreserved":18772,"ĠFairfax":18773,"Ġforgot":18774,"ĠBeh":18775,"Rob":18776,"Ġcooperative":18777,"ullah":18778,"Ġmates":18779,"Ġrang":18780,"Ġthigh":18781,"Ġabducted":18782,"Ġchaired":18783,"ĠHearts":18784,"Ġidentifies":18785,"ĠBuckingham":18786,"ijn":18787,"ĠJab":18788,"Ġclashed":18789,"feed":18790,"sites":18791,"ĠCareer":18792,"exp":18793,"ĠBuccaneers":18794,"scape":18795,"Ġupdating":18796,"Ġintentional":18797,"ĠGuam":18798,"ĠBreakfast":18799,"ĠHag":18800,"Media":18801,"Ġtapping":18802,"Ġpics":18803,"Ġeaten":18804,"Ġpremise":18805,"Kim":18806,"ĠStorage":18807,"Ġextensively":18808,"Ġoutrageous":18809,"ĠSadly":18810,"Global":18811,"¢":18812,"leaning":18813,"CM":18814,"Ġeasiest":18815,"ument":18816,"Ġ122":18817,"Ġdaunting":18818,"ISE":18819,"Ġsunset":18820,"Ġreset":18821,"Ġbent":18822,"Trust":18823,"ĠCaleb":18824,"ĠRut":18825,"ĠBast":18826,"ETS":18827,"iencies":18828,"Ġpu":18829,"ature":18830,"Ġrealities":18831,"omi":18832,"Ġsoda":18833,"Ġunveil":18834,"ĠGoldberg":18835,"opes":18836,"Ġuprising":18837,"ĠMR":18838,"Ġendorse":18839,"Ġsail":18840,"Ġconverting":18841,"Ġglamorous":18842,"ĠHollande":18843,"108":18844,"isky":18845,"Ġcushion":18846,"240":18847,"Ġadventures":18848,"Ġantitrust":18849,"ĠStockholm":18850,"pace":18851,"ĠVald":18852,"ĠTransfer":18853,"ERT":18854,"ĠMcInt":18855,"Ġsurging":18856,"ogn":18857,"Ġlauded":18858,"ĠZam":18859,"ĠRough":18860,"TOR":18861,"Ġwed":18862,"Ġorigins":18863,"ĠEld":18864,"oso":18865,"Ġsupplying":18866,"ĠPetty":18867,"ĠTwe":18868,"ĠDenise":18869,"ĠBec":18870,"Ġbehave":18871,"Ġ121":18872,"estone":18873,"ĠBoulder":18874,"ĠBlackhawks":18875,"ĠWyatt":18876,"Ġfiguring":18877,"ĠDeborah":18878,"agi":18879,"significant":18880,"Ġasthma":18881,"Ġmessy":18882,"mpire":18883,"Ġax":18884,"Ġaspiring":18885,"ĠNH":18886,"ĠGina":18887,"heavy":18888,"ĠVick":18889,"ÃŃs":18890,"something":18891,"Ġbodily":18892,"Ġunauthorized":18893,"ĠActually":18894,"ĠOH":18895,"Ġmicrophone":18896,"allah":18897,"Ġrampant":18898,"Ġrelocated":18899,"Ġwidening":18900,"ĠCait":18901,"nel":18902,"ĠBlackBerry":18903,"Ġprofessionally":18904,"ĠInterestingly":18905,"Ġbarbecue":18906,"Ġresisting":18907,"ĠNunes":18908,"disc":18909,"Ġgroundbreaking":18910,"orable":18911,"ĠRegulation":18912,"Ġborrowed":18913,"Ġleaking":18914,"Ġlengths":18915,"Ġunveiling":18916,"houses":18917,"Ġ155":18918,"ĠBillboard":18919,"icion":18920,"Times":18921,"ĠZoe":18922,"ĠAbby":18923,"bus":18924,"ĠMinutes":18925,"ributed":18926,"Ġparap":18927,"Ġfertil":18928,"ABC":18929,"ĠIsle":18930,"Ġtherapist":18931,"Ġgubernatorial":18932,"ĠAust":18933,"ĠLoan":18934,"Bo":18935,"ĠNRL":18936,"rag":18937,"Clear":18938,"Ġrevision":18939,"Ġflesh":18940,"BD":18941,"iji":18942,"Ġproductions":18943,"Ġcoconut":18944,"ĠMcCorm":18945,"ĠDash":18946,"Ġgeography":18947,"hearted":18948,"Ġarson":18949,"Ġgoaltender":18950,"Ġbelly":18951,"Ġqualifications":18952,"ĠActiv":18953,"Ġhooked":18954,"ĠHungarian":18955,"Ġprotocols":18956,"inking":18957,"Ġfronts":18958,"ĠKuala":18959,"ĠToys":18960,"ĠFitness":18961,"Ġwarfare":18962,"Ġoutp":18963,"ĠQuestions":18964,"Ġwel":18965,"ĠShan":18966,"ĠMorton":18967,"ĠRomero":18968,"Ġglance":18969,"ĠTay":18970,"Ġsneakers":18971,"ĠSymphony":18972,"Ġinspect":18973,"enna":18974,"Nobody":18975,"Ġscrapped":18976,"ĠDeVos":18977,"ĠDominican":18978,"Ġplanets":18979,"anova":18980,"Ġnotify":18981,"Ġincurred":18982,"Ġunders":18983,"Ġdetainees":18984,"ĠMarriott":18985,"electric":18986,"ĠKes":18987,"union":18988,"ĠWatt":18989,"ATING":18990,"Ġslipping":18991,"Ġraft":18992,"Ġresisted":18993,"Ġcred":18994,"tern":18995,"Ġflurry":18996,"Line":18997,"Ġconsulted":18998,"Ġanalyzing":18999,"107":19000,"ĠWide":19001,"¶":19002,"human":19003,"ĠFEMA":19004,"Ġsmash":19005,"Ġcorps":19006,"Ġbarric":19007,"Ġcollar":19008,"ĠTB":19009,"without":19010,"ĠCanucks":19011,"Ġneedle":19012,"ĠSidney":19013,"ĠLauderdale":19014,"Ġglove":19015,"ilee":19016,"pic":19017,"Ġbenef":19018,"ĠHydro":19019,"ĠDisc":19020,"ĠArg":19021,"Ġtermin":19022,"Ġsympath":19023,"Ġpest":19024,"ĠCoff":19025,"Ġadvancement":19026,"social":19027,"pol":19028,"ĠEmails":19029,"Ġstacked":19030,"ibly":19031,"ĠAlbion":19032,"Ġfist":19033,"hero":19034,"ĠMarian":19035,"asia":19036,"Ġtownship":19037,"Ġslick":19038,"Ġmodeling":19039,"achers":19040,"ĠArgent":19041,"ĠSUN":19042,"arde":19043,"Ġpinned":19044,"Ġhitters":19045,"Ġdare":19046,"ictions":19047,"arily":19048,"Ġsting":19049,"Ġprimaries":19050,"appointed":19051,"Ġformats":19052,"Ġglitter":19053,"Ġpatches":19054,"Ġstrategically":19055,"Ġaka":19056,"Ġyielded":19057,"BY":19058,"Ġjeopard":19059,"ĠVand":19060,"Ġcrowned":19061,"Ġoccupants":19062,"Ġtanker":19063,"ĠVisa":19064,"Great":19065,"Ġseasoned":19066,"ĠAviv":19067,"Ġfiery":19068,"Ġderivatives":19069,"Ġdiverted":19070,"Ġacqu":19071,"Ġsandwiches":19072,"ĠLorenzo":19073,"Ġpardon":19074,"ĠBarber":19075,"ĠAgricultural":19076,"ĠPhilly":19077,"Ġregrets":19078,"ĠMillions":19079,"ĠFrazier":19080,"Ġtreasury":19081,"ĠKenn":19082,"Ġdestined":19083,"olved":19084,"Back":19085,"leader":19086,"lyss":19087,"ĠReyes":19088,"001":19089,"bags":19090,"ĠStandards":19091,"ĠExcellence":19092,"ĠMaid":19093,"ĠAnthem":19094,"FIELD":19095,"Ġrevived":19096,"ĠQuad":19097,"Ġdistinguished":19098,"Ġweighted":19099,"Ġritual":19100,"Ġinvites":19101,"wana":19102,"iture":19103,"ĠCI":19104,"ĠMAY":19105,"Ġunfairly":19106,"ĠKP":19107,"ĠMidlands":19108,"Ġmint":19109,"uers":19110,"Ġcatalog":19111,"arant":19112,"Ġlosers":19113,"Ġscheduling":19114,"esar":19115,"Ġtransferring":19116,"Ġbankrupt":19117,"Ġmethamphetamine":19118,"ĠEsk":19119,"ĠTreatment":19120,"ĠResponse":19121,"Ġhomework":19122,"ĠBald":19123,"Ġembarrassment":19124,"Ġpoorest":19125,"ĠPlatinum":19126,"ĠFac":19127,"Ġunleashed":19128,"Ġbrighter":19129,"002":19130,"Ġdisl":19131,"ĠLowry":19132,"ived":19133,"ĠDemon":19134,"ĠNonetheless":19135,"arro":19136,"ĠCONT":19137,"ifted":19138,"ĠFreder":19139,"isson":19140,"Ġrout":19141,"ARA":19142,"Ġswinging":19143,"Oct":19144,"Ġliable":19145,"Ġleaning":19146,"Ġlungs":19147,"380":19148,"ĠProcess":19149,"ĠCov":19150,"terrorism":19151,"Ġresistant":19152,"Ġpumped":19153,"Ġtripled":19154,"Semitism":19155,"ĠMia":19156,"Ġpenetration":19157,"ĠLutheran":19158,"BU":19159,"odes":19160,"Ġspanning":19161,"utch":19162,"Trans":19163,"ĠVolunteers":19164,"Ġpathway":19165,"Ġinfectious":19166,"Ġdrastic":19167,"ĠEngineers":19168,"Ġprincess":19169,"acts":19170,"usting":19171,"utive":19172,"achel":19173,"DO":19174,"Ġpave":19175,"ĠHerrera":19176,"Ġnearing":19177,"help":19178,"Ġembarked":19179,"Ġmodes":19180,"ĠDriving":19181,"Ġopting":19182,"Best":19183,"Ġbehavioral":19184,"Ġcables":19185,"App":19186,"otion":19187,"ĠExt":19188,"ĠSinclair":19189,"ĠInsp":19190,"Ġsinking":19191,"Next":19192,"ĠLumpur":19193,"ĠShadow":19194,"Donald":19195,"itals":19196,"Ġmentions":19197,"floor":19198,"Ġconsiderations":19199,"ĠSquad":19200,"ĠPlate":19201,"dos":19202,"Friday":19203,"Hopefully":19204,"arre":19205,"Ġalum":19206,"\":\"/":19207,"Ġfet":19208,"anza":19209,"Ġdign":19210,"ĠNguyen":19211,"ĠRutgers":19212,"ĠSew":19213,"Ġfilters":19214,"ofi":19215,"Ġunavailable":19216,"ranking":19217,"Ġrefining":19218,"ĠUNC":19219,"Ġmax":19220,"yll":19221,"Ġhandsome":19222,"Ġutterly":19223,"See":19224,"ĠStores":19225,"Ke":19226,"ĠAdvoc":19227,"ordon":19228,"umbles":19229,"Ġbugs":19230,"olar":19231,"ĠCork":19232,"Ġtoken":19233,"Ġauthorization":19234,"Ġconscience":19235,"Ġrepl":19236,"edi":19237,"owitz":19238,"iven":19239,"Ġlieu":19240,"Ġlifts":19241,"Lean":19242,"Ġmagnificent":19243,"ĠFilms":19244,"onents":19245,"Ġ***":19246,"Green":19247,"ĠAdvocate":19248,"ĠArrow":19249,"Ġblows":19250,"Ġexploited":19251,"fly":19252,"ĠAmar":19253,"ĠNOTICE":19254,"Ġsincere":19255,"found":19256,"ĠRud":19257,"Ġcy":19258,"ĠHeidi":19259,"Ġempowered":19260,"Ġweakest":19261,"ĠKru":19262,"Credit":19263,"aunted":19264,"Ġexotic":19265,"aning":19266,"Ġaw":19267,"ĠMulti":19268,"Ġanimation":19269,"850":19270,"ĠCounter":19271,"ĠNit":19272,"alli":19273,"Ġcapitalize":19274,"Ġexecuting":19275,"Ġdescent":19276,"ovi":19277,"ĠKimberly":19278,"headed":19279,"Ġmentioning":19280,")-":19281,"ĠSpecifically":19282,"ayette":19283,"ihad":19284,"ĠIss":19285,"Ġdisagreed":19286,"ĠKum":19287,"Ġurges":19288,"Ġpermitting":19289,"Ġpy":19290,"isp":19291,"Ġhygiene":19292,"Ġmourning":19293,"Ġcyclists":19294,"cats":19295,"FER":19296,"cycl":19297,"Ġnewcomers":19298,"Ġplead":19299,"Ġmend":19300,"secret":19301,"fan":19302,"Ġtranslates":19303,"unit":19304,"ĠTank":19305,"drive":19306,"ĠSite":19307,"Ġacceleration":19308,"ĠEnrique":19309,"ĠElaine":19310,"Ġstaring":19311,"Ġbackwards":19312,"Ġot":19313,"Ġvot":19314,"ĠHK":19315,"Ġfian":19316,"ĠLockheed":19317,"Ġmanifest":19318,"ĠZurich":19319,"pad":19320,"ĠRav":19321,"flow":19322,"Ġmoms":19323,"ĠSolid":19324,"ĠReady":19325,"aughlin":19326,"Ġreminding":19327,"ĠCOR":19328,"Ġoptimal":19329,"ĠCrisis":19330,"Ġcholesterol":19331,"ĠGerard":19332,"Ġfest":19333,"Ġsanction":19334,"Ġdragging":19335,"inent":19336,"ĠBravo":19337,"Ġamend":19338,"aval":19339,"Ġpoem":19340,"Ġinvasive":19341,"Ġlandsc":19342,"leigh":19343,"Ġheadache":19344,"ĠMuse":19345,"ĠTurning":19346,"girl":19347,"cess":19348,"Ġfalsely":19349,"Ġplaintiff":19350,"Ġheavier":19351,"Ġrumored":19352,"Ġeleven":19353,"ĠConsumers":19354,"ĠOriginally":19355,"ĠStatement":19356,"bors":19357,"Ġrevoked":19358,"ĠOmaha":19359,"Fox":19360,"ĠKle":19361,"Ġvault":19362,"Ġoutdated":19363,"umes":19364,"ĠArk":19365,"Ġapologised":19366,"Ġrockets":19367,"ĠMarines":19368,"Ġcaptures":19369,"ĠMW":19370,"ĠWalters":19371,"ĠFactor":19372,"Ġensuing":19373,"ĠSession":19374,"oons":19375,"Ġ132":19376,"gt":19377,"ĠPoints":19378,"Ġexhaust":19379,"ĠOsaka":19380,"heed":19381,"Ġhandic":19382,"amber":19383,"inging":19384,"Ġll":19385,"Ġescorted":19386,"Ġfloated":19387,"Ġmerge":19388,"Ġcompliment":19389,"ĠVC":19390,"Ġinsulin":19391,"ĠDebt":19392,"ça":19393,"Ġpens":19394,"Ġassertion":19395,"Ġredevelopment":19396,"moderate":19397,"Ġleftist":19398,"ĠBA":19399,"Ġherd":19400,"Ġinsecurity":19401,"liter":19402,"Ġcommence":19403,"ĠCaucus":19404,"Ġnovels":19405,"ĠChevron":19406,"Ġerosion":19407,"ĠNicholson":19408,"ĠRoof":19409,"ĠVolunteer":19410,"Ġcompelled":19411,"Ġcongratulated":19412,"ĠPanel":19413,"Ġov":19414,"idelity":19415,"Ġspect":19416,"Ġbee":19417,"ĠAssistance":19418,"Ġterrified":19419,"iew":19420,"Ġweekday":19421,"ĠHiggins":19422,"special":19423,"ubs":19424,"anton":19425,"Ġbribes":19426,"Ġneat":19427,"ĠCliff":19428,"Ġdisqualified":19429,"ĠND":19430,"Ġvers":19431,"andra":19432,"Ġgraft":19433,"value":19434,"Ġportray":19435,"Ġdaytime":19436,"ksh":19437,"Ġconsist":19438,"Ġhonesty":19439,"ĠTimber":19440,"ĠNich":19441,"Ġinvented":19442,"ĠBuch":19443,"Ġskull":19444,"Ġtags":19445,"Ġ124":19446,"ighth":19447,"Ġrelaxing":19448,"Online":19449,"Ġsanctioned":19450,"Sport":19451,"ĠCove":19452,"Ġcomics":19453,"MW":19454,"AMA":19455,"mother":19456,"Home":19457,"ĠCustomer":19458,"Ġstrides":19459,"ĠWins":19460,"Ġrollout":19461,"ĠWeaver":19462,"Ġshuttle":19463,"Ġsteak":19464,"Ġglorious":19465,"ĠToll":19466,"Ġtrustee":19467,"Ġinstallations":19468,"ĠOpportunity":19469,"Ġoper":19470,"horse":19471,"Ġaided":19472,"irus":19473,"Ġsleek":19474,"Ġyelled":19475,"ĠSocialist":19476,"Ġapplaud":19477,"ĠWah":19478,"Ġdevote":19479,"Ġdh":19480,"Ġarchitectural":19481,"ĠMAC":19482,"centric":19483,"ĠSense":19484,"illas":19485,"ĠArchbishop":19486,"glass":19487,"Ġallowance":19488,"Ġbundle":19489,"andon":19490,"eight":19491,"ĠKare":19492,"haus":19493,"ĠAndreas":19494,"Ġdoll":19495,"RAM":19496,"Ġvolunteering":19497,"ĠRaleigh":19498,"Ġbees":19499,"Ġnickel":19500,"Ġgenerosity":19501,"Ġhomeowner":19502,"ĠLieutenant":19503,"Ġlandfall":19504,"ĠRenew":19505,"ĠGiving":19506,"ĠContribut":19507,"aret":19508,"ulf":19509,"Ġreinforce":19510,"ĠSalv":19511,"ĠVenice":19512,"Ġfreedoms":19513,"ĠTools":19514,"Ġ1962":19515,"ĠWarm":19516,"majority":19517,"Ġpleas":19518,"oding":19519,"plant":19520,"Ġtow":19521,"ĠBlanc":19522,"ĠPipeline":19523,"ĠMoor":19524,"Ġrefrain":19525,"ĠExplore":19526,"language":19527,"cers":19528,"ĠWT":19529,"sent":19530,"ĠNun":19531,"Ġplastics":19532,"acas":19533,"Ġdisruptions":19534,"Ġdiscomfort":19535,"enko":19536,"Ġimprisoned":19537,"Copyright":19538,"Ġmyriad":19539,"Ġparenting":19540,"Ġspree":19541,"NBC":19542,"Ġonion":19543,"ĠIsraelis":19544,"ĠRA":19545,"Ġrelocate":19546,"113":19547,"ĠHir":19548,"ĠDre":19549,"ĠDry":19550,"ĠONE":19551,"ĠAdministrator":19552,"Ġprints":19553,"ĠGret":19554,"Ġundergraduate":19555,"ĠLif":19556,"avers":19557,"ĠCarney":19558,"Ġapex":19559,"Ġlenses":19560,"Ġliberals":19561,"gb":19562,"ĠWhereas":19563,"Ġcountryside":19564,"amine":19565,"ĠTerminal":19566,"Ġintr":19567,"ĠTrey":19568,"ALS":19569,"Ġcontinental":19570,"Ġselfies":19571,"FILE":19572,"ĠUnity":19573,"Ġauthoritarian":19574,"Ġoriginated":19575,"ĠExcept":19576,"yna":19577,"Ġmonet":19578,"Ġundermining":19579,"ĠGS":19580,"pi":19581,"iq":19582,"Ġslides":19583,"ĠSummary":19584,"Ġpains":19585,"cluding":19586,"Ġequation":19587,"locked":19588,"Ġfraternity":19589,"Ġwithstand":19590,"Ġdevastation":19591,"Ġdemo":19592,"late":19593,"Ġpunches":19594,"Ġgeared":19595,"nen":19596,"ĠBowie":19597,"attle":19598,"Ġpolitic":19599,"ĠGle":19600,"mented":19601,"ĠCoordinator":19602,"Ġupwards":19603,"ĠMega":19604,"angled":19605,"Ġengineered":19606,"Ġluggage":19607,"ĠWen":19608,"ĠSergeant":19609,"Ġkindergarten":19610,"ĠPortsmouth":19611,"uddin":19612,"ket":19613,"oba":19614,"Ġoscill":19615,"esse":19616,"ĠOlson":19617,"ĠBorough":19618,"Ġsupplements":19619,"ĠEvening":19620,"ANE":19621,"Ġlava":19622,"Ġgearing":19623,"setting":19624,"urgical":19625,"asty":19626,"ĠDaytona":19627,"Ġbrewery":19628,"Ġpledges":19629,"rounder":19630,"ulous":19631,"ĠHancock":19632,"rex":19633,"Ġram":19634,"Ġproceeding":19635,"ĠMurdoch":19636,"Ġdowngrade":19637,"Ġstatues":19638,"Ġdebated":19639,"ĠSleep":19640,"Ġ144":19641,"ĠRuby":19642,"ĠFi":19643,"123":19644,"ĠArabic":19645,"Ġlasts":19646,"ĠIvy":19647,"ĠWid":19648,"rown":19649,"stick":19650,"?'\"":19651,"ĠSTEM":19652,"Ġsensible":19653,"htar":19654,"Ġharbor":19655,"Ġcra":19656,"ĠAlbum":19657,"ĠCarnival":19658,"Ġimplies":19659,"agement":19660,"ĠInitially":19661,"Ġchooses":19662,"Jeff":19663,"ĠHig":19664,"Ġtam":19665,"Ġlump":19666,"ucks":19667,"Ġrepatri":19668,"ĠMercy":19669,"zza":19670,"Ġ365":19671,"ĠRicardo":19672,"ogram":19673,"Ġundergone":19674,"system":19675,"Ġtel":19676,"ĠKee":19677,"ully":19678,"istas":19679,"Ġgrains":19680,"ĠTomorrow":19681,"ĠRC":19682,"ĠTurk":19683,"Ġfreshmen":19684,"ĠAway":19685,"ĠSach":19686,"ĠUltimate":19687,"Ġoffensively":19688,"ismo":19689,"Ġteaser":19690,"ĠJud":19691,"Ġlegitimacy":19692,"opt":19693,"ĠCobb":19694,"Ġrejecting":19695,"ĠSolo":19696,"ĠArcher":19697,"Ġsoutheastern":19698,"ĠPlain":19699,"ĠLoss":19700,"Ġminerals":19701,"ĠMari":19702,"Ġscrambling":19703,"ĠPeak":19704,"Ġhavoc":19705,"rings":19706,"Ġunofficial":19707,"ĠHaj":19708,"director":19709,"ĠCanal":19710,"ĠNSA":19711,"ĠEaton":19712,"ĠPART":19713,"ĠCommissioners":19714,"Ġwellbeing":19715,"resa":19716,"Ġunderstandable":19717,"dates":19718,"ĠSorry":19719,"Ġastonishing":19720,"Ġrevise":19721,"ĠEc":19722,"ĠLack":19723,"endi":19724,"endale":19725,"also":19726,"Ġcolder":19727,"Ġheel":19728,"Ġcellular":19729,"Conn":19730,"ĠThur":19731,"Ġmassage":19732,"olla":19733,"clus":19734,"Ġtoilets":19735,"ĠCelebr":19736,"Ġtackled":19737,"Ġchorus":19738,"ETA":19739,"anca":19740,"ĠOLED":19741,"Ġpunk":19742,"ĠBrain":19743,"ĠNuggets":19744,"Ġseamless":19745,"make":19746,"atted":19747,"ĠRog":19748,"ĠPatch":19749,"Ġruined":19750,"Ins":19751,"Ġconsolidate":19752,"Ġgospel":19753,"ĠCaption":19754,"Ġoverweight":19755,"Ġscreened":19756,"ĠKraft":19757,"ĠBain":19758,"breaker":19759,"ĠFeinstein":19760,"ĠDoc":19761,"Ġdeepest":19762,"ĠOL":19763,"Ġtunes":19764,"Ġrightly":19765,"ĠLanc":19766,"ĠBrotherhood":19767,"Ġpoultry":19768,"ĠPure":19769,"Ġstimulate":19770,"Ġdiscourse":19771,"ĠStark":19772,"Ġmuseums":19773,"ention":19774,"Ġtaxation":19775,"ĠAkron":19776,"ayer":19777,"ĠKirby":19778,"farm":19779,"oser":19780,"Ġcommend":19781,"Ġunarmed":19782,"ensions":19783,"Ġsuperst":19784,"Ġoceans":19785,"Ġmisuse":19786,"LO":19787,"ĠByrne":19788,"ĠMaritime":19789,"Ġdense":19790,"Ġexcuses":19791,"Ġsuppose":19792,"ĠMarks":19793,"Ġrainy":19794,"Ġreplicate":19795,"Ġboutique":19796,"ĠRenaissance":19797,"jas":19798,"icted":19799,"Ġreferenced":19800,"ĠTir":19801,"ĠHatch":19802,"ĠCry":19803,"ĠPayPal":19804,"Ġfulfil":19805,"ĠHawaiian":19806,"come":19807,"ĠThirty":19808,"Ġ260":19809,"ĠYak":19810,"Ġangles":19811,"Ġlandlord":19812,"Ġlavish":19813,"Women":19814,"ĠNT":19815,"Ġreinforced":19816,"Ġprevail":19817,"ĠCommunities":19818,"Ġfootwear":19819,"Ġassurances":19820,"Ġlb":19821,"Ġairing":19822,"Ġresorts":19823,"ĠFiji":19824,"ĠShay":19825,"Ġprevailing":19826,"many":19827,"Ġimpe":19828,"ĠDul":19829,"Ġsymbols":19830,"zb":19831,"ĠCere":19832,"Ġapplauded":19833,"Ġsoundtrack":19834,"Ġdrunken":19835,"ĠEuropeans":19836,"Ġherds":19837,"moving":19838,"WR":19839,"ĠHindi":19840,"Ġwaking":19841,"Jo":19842,"Andrew":19843,"rosse":19844,"ĠLegislative":19845,"Ġdisgrace":19846,"Nothing":19847,"ĠBulgaria":19848,"Ġhumidity":19849,"Ġtranslation":19850,"Ġmeasurements":19851,"Ġvying":19852,"ĠBrid":19853,"Max":19854,"Ġdir":19855,"unci":19856,"Ġdefines":19857,"Ġperfection":19858,"ancers":19859,"Matt":19860,"ĠShinzo":19861,"ĠPresidents":19862,"Ġginger":19863,"onna":19864,"existing":19865,"rika":19866,"enced":19867,"ĠBray":19868,"Ġgall":19869,"Ġdisrespect":19870,"ĠCumber":19871,"Ġcontestant":19872,"ucky":19873,"anticipated":19874,"abled":19875,"LLOW":19876,"Bel":19877,"ĠKear":19878,"Ġstoryline":19879,"Ġrigs":19880,"ĠScots":19881,"ĠChap":19882,"ĠThankfully":19883,"Ġcommunist":19884,"ĠAdviser":19885,"Ġregist":19886,"Ġannoying":19887,"ĠDVD":19888,"Ġethic":19889,"ĠFilipino":19890,"ĠAdidas":19891,"Ġbilling":19892,"Ġalleviate":19893,"Ġsmoked":19894,"Ġhazard":19895,"EV":19896,"Ag":19897,"baum":19898,"Ġdoses":19899,"Ġoutcry":19900,"Ġinclined":19901,"Ġpsychologist":19902,"itzer":19903,"January":19904,"Ġmornings":19905,"aught":19906,"Ġsurreal":19907,"ĠCannon":19908,"avy":19909,"ĠCris":19910,"cf":19911,"Ġinterpreted":19912,"Ġpersecution":19913,"vation":19914,"Ġupfront":19915,"ĠWaste":19916,"Ġmills":19917,"Ġbombings":19918,"ĠHeaven":19919,"ĠFlat":19920,"Ġboxer":19921,"Ġavenues":19922,"Invest":19923,"ĠZika":19924,"Ġbackstage":19925,"idas":19926,"eston":19927,"ead":19928,"Ġbishops":19929,"Ġrender":19930,"Ġfootballer":19931,"Ġspilled":19932,"Only":19933,"Ġsaddened":19934,"ĠAbove":19935,"inator":19936,"tro":19937,"onen":19938,"ĠAMC":19939,"Ġstringent":19940,"Ġfooting":19941,"ĠGhost":19942,"Ġtexting":19943,"ĠCPI":19944,"ĠUW":19945,"Ġaccol":19946,"iries":19947,"ĠFlex":19948,"ĠCarolyn":19949,"Andre":19950,"Ġsiege":19951,"Muslim":19952,"Ġautomobile":19953,"reci":19954,"Ġdean":19955,"atre":19956,"Ġwax":19957,"Ġwo":19958,"ĠDuffy":19959,"Ġfiance":19960,"Ġfib":19961,"Ġeagle":19962,"ĠCatal":19963,"Ġinfants":19964,"Ġsubmitting":19965,"Ġdownhill":19966,"Ġstaffer":19967,"ĠLights":19968,"Ġeater":19969,"ĠCaliforn":19970,"Ġsupervisors":19971,"ĠPy":19972,"Ġcondemnation":19973,"Ġsci":19974,"Ġhated":19975,"Ġtil":19976,"ĠLavrov":19977,"Ġsab":19978,"Ġmotors":19979,"Ġlogging":19980,"ĠOwn":19981,"Ġpi":19982,"Ġrepeating":19983,"ĠDOJ":19984,"enary":19985,"ĠChow":19986,"fat":19987,"Ġbalcony":19988,"orie":19989,"NING":19990,"ĠUnified":19991,"Neil":19992,"Bill":19993,"ĠSims":19994,"uten":19995,"LV":19996,"ĠEMS":19997,"Ġsip":19998,"Ġreplaces":19999,"ichi":20000,"ĠFig":20001,"ĠCharity":20002,"Ġpeek":20003,"Ġrack":20004,"Ġcousins":20005,"Ġresolving":20006,"Ġthrone":20007,"ĠEngine":20008,"ĠChak":20009,"Ġlamented":20010,"Ġwipe":20011,"Ġnutrients":20012,"ĠChat":20013,"AMP":20014,"ĠOprah":20015,"uming":20016,"serving":20017,"Ġfir":20018,"Ġlandlords":20019,"neck":20020,"Ġupload":20021,"Ġunspecified":20022,"Ġicy":20023,"´":20024,"Ġze":20025,"Ġprohibits":20026,"ĠFI":20027,"Res":20028,"ĠEff":20029,"hell":20030,"umbo":20031,"Ġreceipts":20032,"Ġoperatives":20033,"stant":20034,"Ġwives":20035,"ĠCinema":20036,"Ġnegligence":20037,"Ġgases":20038,"ĠLau":20039,"Ġbrew":20040,"August":20041,"never":20042,"Ġpenned":20043,"Ġincomplete":20044,"ĠZh":20045,"esi":20046,"Ġranged":20047,"apolis":20048,"Ġwithdrawing":20049,"ĠLevi":20050,"ĠLevy":20051,"ĠDaly":20052,"Ġdelaying":20053,"ĠMSNBC":20054,"ĠCyrus":20055,"ĠNutrition":20056,"NN":20057,"Ġwinding":20058,"Ġglow":20059,"ĠMY":20060,"Ġgoodwill":20061,"ĠMON":20062,"Ġslots":20063,"ĠNina":20064,"ĠFIR":20065,"ĠLTE":20066,"ĠInnov":20067,"dev":20068,"ctic":20069,"Ġanalyses":20070,"ĠBangalore":20071,"Ġtales":20072,"Ġovercame":20073,"ĠThurs":20074,"Ġcherry":20075,"ĠNou":20076,"ĠFlowers":20077,"1000":20078,"updated":20079,"rieve":20080,"ĠBeautiful":20081,"iak":20082,"Ġplayback":20083,"Ġheadset":20084,"Ġashamed":20085,"Min":20086,"Ġadm":20087,"ĠLucky":20088,"ĠTucson":20089,"Ġentirety":20090,"ranging":20091,"ĠVance":20092,"kered":20093,"image":20094,"ĠGord":20095,"War":20096,"Ġsimilarities":20097,"dig":20098,"ĠJude":20099,"Ġlonely":20100,"hra":20101,"ĠStaples":20102,"ĠACA":20103,"Ġmeasurement":20104,"Ġcooper":20105,"ATER":20106,"ĠMeng":20107,"Ġbarring":20108,"190":20109,"ĠBatt":20110,"Ġreproductive":20111,"ĠRowe":20112,"Ġsubsid":20113,"Ġslogans":20114,"ugar":20115,"ĠKeller":20116,"ingham":20117,"fuel":20118,"Ġhid":20119,"afe":20120,"Ġindul":20121,"cash":20122,"Ġstressing":20123,"ĠMIT":20124,"Ġtrump":20125,"ancer":20126,"ĠPes":20127,"ĠMint":20128,"Ġcrossover":20129,"ĠWeiss":20130,"ĠElvis":20131,"ĠPermanent":20132,"ĠKhalid":20133,"Ġunjust":20134,"Ġexceptionally":20135,"Ġfut":20136,"Ġavid":20137,"ĠEthics":20138,"Ġutilized":20139,"Ġfeasibility":20140,"Ġcatering":20141,"Press":20142,"wayne":20143,"October":20144,"Ġfavors":20145,"Ġobsession":20146,"Ġmelt":20147,"Ġmug":20148,"ĠMK":20149,"Ġapples":20150,"Ġvine":20151,"cliffe":20152,"Ġgrat":20153,"Ġspells":20154,"ounced":20155,"Ġdecree":20156,"issy":20157,"Team":20158,"Ġdeploying":20159,"Feb":20160,"Ġmiserable":20161,"Ġwat":20162,"ĠBust":20163,"ĠNorris":20164,"ĠTimberwolves":20165,"Ġangered":20166,"ĠArn":20167,"oft":20168,"rome":20169,"Ġadvertisements":20170,"onal":20171,"Ġnun":20172,"Ġtorque":20173,"Ġslave":20174,"Ġnonsense":20175,"Ġcoy":20176,"Ġcites":20177,"Game":20178,"Ġarchitects":20179,"playing":20180,"Ġgener":20181,"Ġsocio":20182,"Ġmeditation":20183,"Ġforgive":20184,"Ġsmiled":20185,"%),":20186,"Ġpers":20187,"ĠSoph":20188,"Ġoccupy":20189,"atton":20190,"Ġwitnessing":20191,"Ġapologise":20192,"Ġpredecessors":20193,"ĠCassidy":20194,"Ġtallied":20195,"NER":20196,"Ġtract":20197,"ĠHolder":20198,"ĠPav":20199,"Ġjackets":20200,"Mel":20201,"raud":20202,"Ġexercising":20203,"ĠChung":20204,"ĠAmin":20205,"athi":20206,"ĠMem":20207,"Ġracked":20208,"Ġcarved":20209,"ĠMickey":20210,"ĠLafayette":20211,"Ġgrill":20212,"ĠINFORMATION":20213,"usc":20214,"ĠPromotion":20215,"yson":20216,"istry":20217,"Ġfulfilled":20218,"Ġrestraint":20219,"Ġpopping":20220,"ĠSlater":20221,"Ġmercy":20222,"aden":20223,"Ġsubmarine":20224,"ĠBowling":20225,"dogs":20226,"ĠSwe":20227,"Ġnoticeable":20228,"Ġbis":20229,"ĠPremiership":20230,"Ġspat":20231,"ĠTow":20232,"ĠWand":20233,"Ġmechanics":20234,"while":20235,"ĠBenson":20236,"Ġmolecules":20237,"Ġcrosses":20238,"Ġrecalling":20239,"ĠCertainly":20240,"HAM":20241,"Ġsever":20242,"ĠRudy":20243,"ĠDUI":20244,"OLD":20245,"ĠTobacco":20246,"Ġsubdued":20247,"Ġquota":20248,"TF":20249,"Ġflats":20250,"Ġemphasize":20251,"Ġbelts":20252,"ĠOpinion":20253,"Ġpiled":20254,"ĠSpark":20255,"ĠElias":20256,"Ġclassification":20257,"ĠHands":20258,"ĠCV":20259,"Ġtoast":20260,"Ġcandle":20261,"atching":20262,"short":20263,"ĠDup":20264,"Ġult":20265,"bats":20266,"Ġmarketers":20267,"ĠAvery":20268,"ĠColbert":20269,"ĠIk":20270,"ĠVac":20271,"ĠJackets":20272,"Ġmerits":20273,"eli":20274,"PORT":20275,"Ġelevator":20276,"irming":20277,"effective":20278,"Ġgroceries":20279,"Ġhi":20280,"ĠINTER":20281,"ĠSAP":20282,"ĠNYPD":20283,"ĠKY":20284,"Ġangel":20285,"Ġspectacle":20286,"ré":20287,"ĠRoche":20288,"Ġinsects":20289,"Ġcommenced":20290,"ĠFoley":20291,"Ġdarker":20292,"ĠUg":20293,"ĠMostly":20294,"Ġtermed":20295,"uci":20296,"ĠExec":20297,"ĠBrittany":20298,"Ġharmony":20299,"Ġadvocated":20300,"Ġparcel":20301,"ĠHots":20302,"Ġmonarch":20303,"ĠSiri":20304,"odge":20305,"ĠPag":20306,"Ġprogressing":20307,"grounds":20308,"Ġonstage":20309,"Ġwarmth":20310,"ĠWon":20311,"Ġviolates":20312,"ĠSaudis":20313,"Ġbumper":20314,"Ġpatrols":20315,"ĠBarron":20316,"Ġindoors":20317,"Ġtar":20318,"Each":20319,"Val":20320,"Ġapplicant":20321,"ĠCater":20322,"Ġclassics":20323,"ĠThreat":20324,"Ġwrapping":20325,"ĠIdlib":20326,"anking":20327,"Did":20328,"adia":20329,"ĠRig":20330,"ĠBram":20331,"ĠLaurie":20332,"ĠHair":20333,"ĠCannabis":20334,"Ġdaylight":20335,"ĠNorm":20336,"ĠRip":20337,"sin":20338,"unta":20339,"Pass":20340,"ĠAcad":20341,"ĠCummings":20342,"Ġtheirs":20343,"ĠDistribution":20344,"especially":20345,"Ġgrilled":20346,"Ġaffiliates":20347,"ĠVander":20348,"ĠCath":20349,"ĠProductions":20350,"ĠTrek":20351,"230":20352,"Ġcasinos":20353,"ĠCain":20354,"atu":20355,"idget":20356,"ĠWinds":20357,"Ġunanswered":20358,"Ġintercept":20359,"ĠMarty":20360,"Ġrefin":20361,"Ġlieutenant":20362,"cas":20363,"Chief":20364,"average":20365,"ilot":20366,"Ġscrimmage":20367,"ĠMud":20368,"speaking":20369,"ĠFranken":20370,"ĠTories":20371,"Ġabstract":20372,"awar":20373,"ĠTerms":20374,"dal":20375,"ĠFur":20376,"Ġhumour":20377,"rh":20378,"Ġsitu":20379,"aed":20380,"ĠFIN":20381,"Ġtranscripts":20382,"approved":20383,"ĠParsons":20384,"Ġpigs":20385,"Ġrepayment":20386,"ĠARM":20387,"ĠElliot":20388,"ĠLevine":20389,"Ġtagged":20390,"pun":20391,"ĠDwight":20392,"Ġconfiguration":20393,"sis":20394,"ĠAdult":20395,"Ġearthquakes":20396,"Ġcreature":20397,"ĠMRI":20398,"Ġmach":20399,"Ġprescriptions":20400,"cover":20401,"Ġministries":20402,"Ġinaccurate":20403,"ĠLabs":20404,"ĠMGM":20405,"Ġtomato":20406,"Ġeng":20407,"Ġopposes":20408,"owan":20409,"Ġmapping":20410,"Ġconsum":20411,"online":20412,"eters":20413,"code":20414,"Aug":20415,"Point":20416,"branded":20417,"pling":20418,"ĠCalder":20419,"Oper":20420,"ĠMiddles":20421,"Ġchampagne":20422,"ĠTues":20423,"Ġsampling":20424,"Ġenergetic":20425,"rano":20426,"ĠStyles":20427,"Ġneglected":20428,"ĠDamon":20429,"Ġendanger":20430,"Ġsouthwestern":20431,"ĠATM":20432,"ĠDuck":20433,"engers":20434,"Ġdan":20435,"yth":20436,"Ġbou":20437,"ĠDecl":20438,"Gold":20439,"Ġprojecting":20440,"Google":20441,"ĠHussein":20442,"Ġaccomplishment":20443,"itarian":20444,"Ġgossip":20445,"ĠRai":20446,"ril":20447,"ĠSke":20448,"Ġpsychiatric":20449,"ĠMacBook":20450,"ĠAdobe":20451,"ĠHodg":20452,"Ġaccompany":20453,"Ġadvertised":20454,"Ġreminiscent":20455,"Ġgeographical":20456,"Ġconvertible":20457,"IK":20458,"CTV":20459,"Ġcommunal":20460,"Ġchim":20461,"Ġselfish":20462,"Ġdrilled":20463,"Ġtortured":20464,"Ġblacks":20465,"noon":20466,"Ġmanifesto":20467,"ĠRichie":20468,"acco":20469,"Im":20470,"Ġdebit":20471,"ĠSNP":20472,"perfect":20473,"gard":20474,"ĠRatio":20475,"Ġstubborn":20476,"Ġaccumulation":20477,"Ġcongregation":20478,"Ġkissing":20479,"Ġkillers":20480,"ĠAbbey":20481,"von":20482,"ĠFuj":20483,"ĠIsabel":20484,"NB":20485,"ĠNish":20486,"ĠJulius":20487,"ĠZimmer":20488,"Ġuncover":20489,"dar":20490,"isle":20491,"ĠCompar":20492,"Ġcounselor":20493,"ĠSok":20494,"ĠCumm":20495,"ĠHip":20496,"Ġurgently":20497,"Ġrentals":20498,"Ġapproving":20499,"Ġirrigation":20500,"Ġprostate":20501,"ĠJudicial":20502,"ĠSubmit":20503,"ĠTanner":20504,"attack":20505,"emb":20506,"Ġreclaim":20507,"Ġec":20508,"Ġbrutality":20509,"Ġcommanding":20510,"Ġreasoning":20511,"Roy":20512,"ĠElect":20513,"ĠMobil":20514,"anding":20515,"Ġmirrors":20516,"Israel":20517,"Ġpavement":20518,"Ġoverdue":20519,"ĠMd":20520,"street":20521,"Ġthrill":20522,"pora":20523,"azon":20524,"Ġbrewing":20525,"enge":20526,"ĠDisaster":20527,"Ġbuilder":20528,"ods":20529,"utsch":20530,"Ġterminals":20531,"ĠBaird":20532,"enburg":20533,"Ġhast":20534,"Ġbrass":20535,"Ġparental":20536,"enture":20537,"ĠConduct":20538,"Ġexpands":20539,"luck":20540,"mur":20541,"ĠBj":20542,"Ġadministrations":20543,"ĠOlivier":20544,"oux":20545,"Ġnarrowed":20546,"winner":20547,"Ġmakeshift":20548,"ĠVAT":20549,"ĠJavier":20550,"-,":20551,"Ġsystematic":20552,"Ġenforcing":20553,"emin":20554,"ĠAudio":20555,"United":20556,"gener":20557,"ĠKara":20558,"ivas":20559,"ĠPretty":20560,"ĠLob":20561,"Ġpetitions":20562,"ĠMercer":20563,"ampa":20564,"product":20565,"Ġdistributing":20566,"Ġtunnels":20567,"Ġcondo":20568,"ĠRSS":20569,"ĠCarlo":20570,"Ġpumpkin":20571,"Ġsto":20572,"Ġassumes":20573,"oway":20574,"hiba":20575,"lection":20576,"Ġgam":20577,"ĠAires":20578,"Ġtransmitted":20579,"Ġtrousers":20580,"Ġcheers":20581,"ĠJensen":20582,"Ġemer":20583,"Ġsimpler":20584,"Ġcolored":20585,"ĠSustainable":20586,"Ġinstruct":20587,"Ġpoles":20588,"Ġsupervised":20589,"Ġinteg":20590,"ĠMoreno":20591,"boarding":20592,"igrant":20593,"ĠYoga":20594,"Ġenvironmentally":20595,"Ġsacrifices":20596,"Ġshores":20597,"Ġ127":20598,"Ġestranged":20599,"Ġintoxicated":20600,"Ġemergencies":20601,"ĠKosovo":20602,"yang":20603,"Ġfastball":20604,"Ġpackaged":20605,"LAN":20606,"Ġhurry":20607,"ĠManny":20608,"Ġporch":20609,"Ġcuriosity":20610,"ĠKend":20611,"thouse":20612,"ĠTou":20613,"mun":20614,"Ġwaving":20615,"Ġpasswords":20616,"ĠSwan":20617,"Ġprefers":20618,"ĠCorrections":20619,"aic":20620,"Ġejected":20621,"Ġdossier":20622,"ĠChal":20623,"Ġfacto":20624,"Ġspine":20625,"leck":20626,"Ġrestriction":20627,"Ġdisagreement":20628,"grown":20629,"ĠEdgar":20630,"Ġquantities":20631,"ĠRapid":20632,"Ġpals":20633,"Ġspared":20634,"Ġremarkably":20635,"ructure":20636,"Ġbackers":20637,"ĠGoals":20638,"cles":20639,"rolling":20640,"ĠBlasio":20641,"Ġorchestra":20642,"ologies":20643,"ĠRise":20644,"Power":20645,"Ġuptick":20646,"atha":20647,"ĠMob":20648,"Ġshotgun":20649,"downs":20650,"ĠBorg":20651,"Ġmorale":20652,"Call":20653,"wave":20654,"ĠDuc":20655,"Ġunwilling":20656,"oad":20657,"Ġbusinessmen":20658,"Ġrefriger":20659,"Ġgamers":20660,"Ġcele":20661,"Ġprecip":20662,"Ġrenegoti":20663,"OY":20664,"ĠPharm":20665,"Ġresponsive":20666,"Ġservant":20667,"eye":20668,"Ġraping":20669,"vas":20670,"Ġgroin":20671,"ĠMelvin":20672,"ĠKurds":20673,"Ġstricter":20674,"ĠMum":20675,"ients":20676,"Ġstandalone":20677,"Ġforums":20678,"Ġcommemorate":20679,"Far":20680,"ĠTelegram":20681,"Ġscreenings":20682,"ĠLeonardo":20683,"ighton":20684,"ĠDOWN":20685,"Ġmodule":20686,"Ġremedy":20687,"Ġ280":20688,"Su":20689,"ĠBecker":20690,"ĠGast":20691,"prem":20692,"ĠInto":20693,"oyle":20694,"114":20695,"Ġadhere":20696,"Report":20697,"ĠJaneiro":20698,"ĠKry":20699,"Pakistan":20700,"Ġrobotic":20701,"ande":20702,"Ġoverlooking":20703,"ĠTreaty":20704,"Ġrect":20705,"yne":20706,"Ġbattlefield":20707,"ĠGeoff":20708,"Ġearns":20709,"ĠMiner":20710,"Ġteased":20711,"Ġexemptions":20712,"Ġvacancy":20713,"oku":20714,"Ġvulnerabilities":20715,"ĠRou":20716,"Ġobserv":20717,"Ġoverlook":20718,"Ġcorrespond":20719,"Ġtheatrical":20720,"Ġrobotics":20721,"ĠCompl":20722,"ĠPasadena":20723,"laden":20724,"Ġvastly":20725,"olit":20726,"Ġjustification":20727,"Ġtampering":20728,"ĠSutherland":20729,"ĠMens":20730,"Ġinvisible":20731,"uren":20732,"ĠAshton":20733,"owl":20734,"Ġdisqual":20735,"ĠEva":20736,"Ġfriction":20737,"ĠIrvine":20738,"Ġaliens":20739,"ĠPension":20740,"ĠAssets":20741,"ĠBenedict":20742,"ittal":20743,"Ġsword":20744,"Ġunderwear":20745,"ĠFarmer":20746,"Ġtimber":20747,"Ġdependence":20748,"ĠTang":20749,"Ġ165":20750,"ĠNazis":20751,"Ġpunching":20752,"ĠGloria":20753,"usat":20754,"Ġluxurious":20755,"chuk":20756,"ĠCot":20757,"Ġregained":20758,"Ġreassure":20759,"Ġhello":20760,"Ġante":20761,"Ġnegotiators":20762,"Add":20763,"paced":20764,"ér":20765,"Ġdemolished":20766,"Ann":20767,"joy":20768,"ĠJenna":20769,"Apple":20770,"Ġdisturbance":20771,"Ġcommissions":20772,"ĠPolitico":20773,"along":20774,"Ġnem":20775,"Ġauctions":20776,"ruck":20777,"ĠOD":20778,"ofer":20779,"Play":20780,"Ġcarn":20781,"vez":20782,"Ġtents":20783,"Ġcongratulate":20784,"ĠLiquid":20785,"ĠCoyotes":20786,"uku":20787,"ĠAllah":20788,"Ġbend":20789,"Ġcanvas":20790,"ĠClifford":20791,"Ġvolunteered":20792,"Luc":20793,"bp":20794,"ĠCensus":20795,"ĠShot":20796,"Ġanonymously":20797,"ĠAnglo":20798,"ĠBayer":20799,"ĠAber":20800,"ĠCorrectional":20801,"Ġhardship":20802,"ĠBuenos":20803,"ĠDaw":20804,"Ġbaskets":20805,"Ġupstairs":20806,"Ġmindful":20807,"ĠLCD":20808,"ĠBlackburn":20809,"ĠHale":20810,"477":20811,"Ġcircus":20812,"ĠDragons":20813,"Ġrubble":20814,"rb":20815,"Ġheadaches":20816,"aunt":20817,"itus":20818,"Ġscaled":20819,"ĠComic":20820,"asio":20821,"ĠNordic":20822,"Per":20823,"Ġbombers":20824,"ilitation":20825,"Ġindirectly":20826,"ĠHod":20827,"andan":20828,"operation":20829,"Ġpuppy":20830,"ĠMats":20831,"Ġstewards":20832,"roup":20833,"Ġmemorandum":20834,"Ġpatio":20835,"const":20836,"ĠBold":20837,"ĠKaiser":20838,"Following":20839,"Ġcompat":20840,"Ġsidewalks":20841,"ĠFitzpatrick":20842,"Ġsunlight":20843,"ĠLever":20844,"ĠBecky":20845,"icles":20846,"ĠProbably":20847,"Ġgarner":20848,"ĠTomas":20849,"Ġblankets":20850,"uga":20851,"jiang":20852,"Ġrevel":20853,"ĠHutch":20854,"llers":20855,"Ġtrimmed":20856,"ĠSTR":20857,"ĠKR":20858,"ĠPike":20859,"ĠASS":20860,"Bay":20861,"Ġdiagnostic":20862,"ĠSteph":20863,"Ġtoured":20864,"ĠAvoid":20865,"vic":20866,"Without":20867,"ĠClinical":20868,"Ġblo":20869,"undo":20870,"ĠBoise":20871,"Ġspeculated":20872,"ĠProt":20873,"vention":20874,"Ġscholar":20875,"ĠSta":20876,"Featured":20877,"ĠPrev":20878,"Ġpenny":20879,"ĠHath":20880,"rawn":20881,"Ġrenovated":20882,"ĠFried":20883,"itol":20884,"uddle":20885,"Ġinquest":20886,"Ġmetropolitan":20887,"lights":20888,"Ġtempo":20889,"onom":20890,"ĠImport":20891,"Asia":20892,"Ġowes":20893,"Ġmagistrate":20894,"ĠFriedman":20895,"Ġcontacting":20896,"Ġstrains":20897,"Ġhomage":20898,"Ġlent":20899,"ception":20900,"git":20901,"Ġlively":20902,"Ġscra":20903,"WW":20904,"ön":20905,"rill":20906,"Jack":20907,"ĠShank":20908,"iani":20909,"Ġdecreasing":20910,"MON":20911,"ĠSupervisor":20912,"ĠCats":20913,"ĠFusion":20914,"Ġracially":20915,"ĠTara":20916,"ĠPurchase":20917,"ĠRally":20918,"ĠGraph":20919,"ĠHello":20920,"hest":20921,"ĠVarg":20922,"Ġdrowned":20923,"ĠThu":20924,"ĠWet":20925,"ĠEug":20926,"Ġrainbow":20927,"Ġtelev":20928,"ĠAmir":20929,"Based":20930,"Ġcookie":20931,"uding":20932,"Ġcontracting":20933,"Ġobjected":20934,"Ġfork":20935,"acent":20936,"ĠTil":20937,"ĠLilly":20938,"ĠEur":20939,"Ġhormone":20940,"Ġnails":20941,"ĠFischer":20942,"Ġpier":20943,"EMENT":20944,"Ġeruption":20945,"visory":20946,"Ġspeculate":20947,"apan":20948,"ĠJub":20949,"ĠHuckabee":20950,"string":20951,"stay":20952,"Ġsustaining":20953,"VM":20954,"Ġpriv":20955,"Ġclos":20956,"Ġdownloaded":20957,"ĠIv":20958,"Ġfinanced":20959,"ĠSao":20960,"ĠEverett":20961,"rene":20962,"ĠWo":20963,"ĠPiet":20964,"Ġengulfed":20965,"Ġexiting":20966,"uni":20967,"horn":20968,"Ġgrav":20969,"ection":20970,"Ġdrainage":20971,"Ġfuelled":20972,"Ġorganizational":20973,"bike":20974,"ĠAreas":20975,"Ġpoliceman":20976,"ĠFirm":20977,"ĠSlide":20978,"Ġrand":20979,"ĠJedi":20980,"Ge":20981,"really":20982,"Manchester":20983,"ĠWise":20984,"parent":20985,"Ġlad":20986,"Ġurine":20987,"ĠColombian":20988,"geon":20989,"Ġ1961":20990,"Mania":20991,"Ġgraph":20992,"Ġcod":20993,"fred":20994,"Ġeffic":20995,"ĠGateway":20996,"asket":20997,"Ġdiminished":20998,"Mass":20999,"Ġ205":21000,"Long":21001,"Ġgranddaughter":21002,"Ġshining":21003,"Semitic":21004,"Ġarising":21005,"Ġ330":21006,"ĠDU":21007,"ĠZah":21008,"Ġexclusion":21009,"ĠClaus":21010,"Ġven":21011,"oine":21012,"ĠAPI":21013,"reve":21014,"Ġmilitias":21015,"Ġfro":21016,"Ġwaved":21017,"ĠLuxembourg":21018,"Ġdiamonds":21019,"Ġstabilize":21020,"Ġqueue":21021,"ĠSponsor":21022,"Ġeldest":21023,"ĠLud":21024,"Ġwasting":21025,"Ġdimension":21026,"Ġmotorcycles":21027,"ucker":21028,"ĠTav":21029,"Ġsupremacy":21030,"Take":21031,"ĠCPU":21032,"cup":21033,"Ġdisregard":21034,"Ġenvelope":21035,"ĠCah":21036,"Ġproposes":21037,"ĠMaurice":21038,"Ġhobby":21039,"Ġharmon":21040,"Ġribbon":21041,"ĠOrigin":21042,"Ġbuilders":21043,"Ġconj":21044,"Ġcert":21045,"eat":21046,"ĠStern":21047,"ulia":21048,"vals":21049,"cling":21050,"Ġprovocative":21051,"Ġsofter":21052,"Ġ1948":21053,"Ġremod":21054,"ĠSob":21055,"Ġmaxim":21056,"Ġblueprint":21057,"oit":21058,"ĠGarner":21059,"Ġfibre":21060,"search":21061,"ĠWrite":21062,"270":21063,"Ġclergy":21064,"ĠPalo":21065,"obile":21066,"Mad":21067,"Ġclown":21068,"Ġtraced":21069,"280":21070,"ĠAlberto":21071,"Ġdrums":21072,"ĠFridays":21073,"ĠStrat":21074,"stated":21075,"ĠStevenson":21076,"Pr":21077,"Ġboasted":21078,"ĠBrees":21079,"ĠDonn":21080,"ĠMaya":21081,"Ġrelieve":21082,"Ġ1080":21083,"Ġcheapest":21084,"Ġuniquely":21085,"Ġjungle":21086,"Ġprevalence":21087,"Ġoutfield":21088,"ĠMaps":21089,"Ġaccustomed":21090,"pac":21091,"Ġcombinations":21092,"ĠSoros":21093,"stad":21094,"Ġket":21095,"Ġdisgusting":21096,"ĠOFF":21097,"irs":21098,"Ġbiased":21099,"Ġpaved":21100,"iked":21101,"utterstock":21102,"ocal":21103,"Ġsurround":21104,"ĠGuang":21105,"Ġspear":21106,"ĠBellev":21107,"ortun":21108,"Rec":21109,"acho":21110,"Ġfrightening":21111,"Ġtyres":21112,"normal":21113,"ĠYan":21114,"ĠWarsaw":21115,"ĠBod":21116,"ourse":21117,"199":21118,"Ver":21119,"erent":21120,"Ġsparkling":21121,"Ġchanting":21122,"Ġ1945":21123,"Ġturbo":21124,"Ġhazards":21125,"IRE":21126,"ĠRonnie":21127,"Ġsplitting":21128,"ĠMatte":21129,"roph":21130,"Ġtended":21131,"Ġvandalism":21132,"alis":21133,"SY":21134,"Ġoversaw":21135,"Happy":21136,"ĠTC":21137,"275":21138,"Ġeco":21139,"ĠKers":21140,"Ġextensions":21141,"ĠFlan":21142,"ĠCena":21143,"ĠDowns":21144,"Ġdrummer":21145,"Ġawaited":21146,"ĠACL":21147,"Ġlegends":21148,"ĠRollins":21149,"hend":21150,"Ġdeparting":21151,"Ġtha":21152,"Ġunre":21153,".(":21154,"Ġfaded":21155,"Ġretirees":21156,"vid":21157,"Ġentrants":21158,"ĠStella":21159,"arer":21160,"Ġteaspoon":21161,"ĠSheridan":21162,"irc":21163,"ĠRelief":21164,"ĠButt":21165,"Ġris":21166,"Ġundermined":21167,"Ġsunk":21168,"Sam":21169,"kamp":21170,"riot":21171,"rating":21172,"Ġclubhouse":21173,"Ġpeaked":21174,"ĠSki":21175,"Ġairstrikes":21176,"Ġconce":21177,"ĠCPR":21178,"Ġesp":21179,"ĠWave":21180,"ĠColiseum":21181,"outheastern":21182,"Ġtrou":21183,"Ġfeather":21184,"ĠSoy":21185,"ĠBihar":21186,"Ġintervened":21187,"mits":21188,"colored":21189,"330":21190,"Ġprocession":21191,"apeake":21192,"ité":21193,"riel":21194,"Ġmart":21195,"afer":21196,"ĠGuests":21197,"ĠPie":21198,"Ġshiny":21199,"ĠSixers":21200,"ĠRoads":21201,"Ġkicker":21202,"ĠCrimes":21203,"Ġfrontier":21204,"ansen":21205,"November":21206,"smith":21207,"ĠLaun":21208,"fried":21209,"weet":21210,"ĠGrass":21211,"Ġsanitation":21212,"ĠEat":21213,"ĠParts":21214,"ĠTun":21215,"amar":21216,"ĠJupiter":21217,"ĠFS":21218,"Ġunsc":21219,"ĠDone":21220,"Ġleveraging":21221,"Ġtucked":21222,"Ġineffective":21223,"Ġriots":21224,"wei":21225,"ĠAttend":21226,"Ġpertaining":21227,"amen":21228,"monds":21229,"Ġmism":21230,"serious":21231,"ĠViol":21232,"rous":21233,"Ġ129":21234,"uebl":21235,"umption":21236,"tri":21237,"ĠWedding":21238,"Ġtroopers":21239,"ĠTHR":21240,"olving":21241,"leys":21242,"Med":21243,"Ġseparatists":21244,"Ġimper":21245,"ĠFrontier":21246,"Ġwhit":21247,"ĠMutual":21248,"Ġrested":21249,"Ġunhealthy":21250,"gang":21251,"Ġresearching":21252,"ĠColonel":21253,"Ġaffordability":21254,"ĠRegarding":21255,"ĠWend":21256,"ĠMellon":21257,"Ġplots":21258,"Ġcanal":21259,"PER":21260,"ĠShopping":21261,"etry":21262,"Ġoccurrence":21263,"Ġgraves":21264,"BF":21265,"ĠKau":21266,"indust":21267,"Ġbeard":21268,"uate":21269,"ĠProdu":21270,"ĠSomali":21271,"ishers":21272,"ĠFell":21273,"ĠHutchinson":21274,"Ġhust":21275,"Ġillustration":21276,"Ġ//":21277,"Ġsharks":21278,"Ġcoincidence":21279,"Ġremake":21280,"Ġmural":21281,"course":21282,"ĠSultan":21283,"arse":21284,"Ġwhip":21285,"ĠPodcast":21286,"Ġtightened":21287,"Ġdenim":21288,"Ġlandfill":21289,"future":21290,"Ġsuperv":21291,"Hand":21292,"Ġpraising":21293,"ĠEly":21294,"ĠGust":21295,"ĠMayer":21296,"Ġorphan":21297,"Ġrepaired":21298,"ĠPir":21299,"Ġspiral":21300,"husband":21301,"ienne":21302,"iatric":21303,"Ġmarriages":21304,"Ġhorn":21305,"plain":21306,"ĠLum":21307,"ession":21308,"ĠFeatures":21309,"Ġbreakup":21310,"Ġentrepreneurship":21311,"rina":21312,"Ġembargo":21313,"Ġcapitalism":21314,"ĠMinor":21315,"Ġpromo":21316,"Ġexcel":21317,"Japan":21318,"Ġworsening":21319,"Ġstumbled":21320,"Ġpins":21321,"Ġswipe":21322,"Ġexile":21323,"Ġseparatist":21324,"ĠBian":21325,"Ġrelocation":21326,"Ġcommanders":21327,"Ġdowned":21328,"Ġblogger":21329,"packed":21330,"ĠSchn":21331,"Ġwaterfront":21332,"ĠYus":21333,"Ġnegotiator":21334,"Ġfavourable":21335,"Iran":21336,"oulder":21337,"Ġcance":21338,"Ġvind":21339,"angel":21340,"Ġauthenticity":21341,"Ġtowel":21342,"bul":21343,"ĠNeville":21344,"ĠBuddhist":21345,"fields":21346,"uly":21347,"Ġniece":21348,"Ġcorrections":21349,"Ġassignments":21350,"ĠSchl":21351,"Ġharmed":21352,"375":21353,"Ġwounding":21354,"ĠPosition":21355,"Ġsupermarkets":21356,"Ġdisclosures":21357,"Ġ185":21358,"esp":21359,"ĠMcCull":21360,"ĠMale":21361,"Ġsailors":21362,"mis":21363,"ĠSophia":21364,"Ġunfolded":21365,"owell":21366,"ĠScarborough":21367,"Ġentrepreneurial":21368,"118":21369,"ogy":21370,"ĠLikewise":21371,"Ġswung":21372,"Ġdrawings":21373,"Ġdrafting":21374,"ĠSimple":21375,"ĠFilip":21376,"arf":21377,"Ġfade":21378,"Ġmerged":21379,"ĠLeaf":21380,"sun":21381,"Ġflame":21382,"Ġindices":21383,"ĠCreate":21384,"ittle":21385,"ĠWer":21386,"ĠMond":21387,"Ġoz":21388,"ĠSmoke":21389,"Ġreplies":21390,"ĠDH":21391,"Ġjud":21392,"ĠFalk":21393,"Ġ---":21394,"Ġconstitutes":21395,"Ġtheat":21396,"119":21397,"Ġintermediate":21398,"vill":21399,"ĠGow":21400,"ĠHut":21401,"ł":21402,"155":21403,"ĠLocated":21404,"ĠDoor":21405,"Ġsliced":21406,"aru":21407,"Ġtearing":21408,"defense":21409,"oyer":21410,"Ġprodu":21411,"Ġseminar":21412,"asso":21413,"Ġpeaks":21414,"Ġconceal":21415,"Ġcrypto":21416,"Ġsetbacks":21417,"ĠAlicia":21418,"ĠFAA":21419,"Ġcontinuity":21420,"Ġcatastrophe":21421,"Ġbeg":21422,"Ġscales":21423,"apixel":21424,"Ġsalon":21425,"Ste":21426,"Ġlesbian":21427,"Ġanticip":21428,"Ġutilization":21429,"Ġchickens":21430,"Ġspinal":21431,"ĠJuliet":21432,"ĠFas":21433,"prising":21434,"ĠSalvation":21435,"Ġ138":21436,"Ġutilizing":21437,"âĢ¢":21438,"ĠMessenger":21439,"Ġrebellion":21440,"ĠAlexand":21441,"Ġinsect":21442,"Ġribs":21443,"ĠBild":21444,"Ġmonopoly":21445,"Queen":21446,"ĠNaples":21447,"Ġ133":21448,"Ġhourly":21449,"Ġego":21450,"Ġpencil":21451,"ĠPew":21452,"Ġdesirable":21453,"vant":21454,"ĠLAT":21455,"Ġperpet":21456,"lish":21457,"Ġ201":21458,"Ġdistances":21459,"Ġdistressed":21460,"Work":21461,"Ġtattoos":21462,"Ġstereotypes":21463,"istent":21464,"ĠCoral":21465,"fo":21466,"Ġpayable":21467,"Ġakin":21468,"ĠLis":21469,"ĠFinding":21470,"Ġsusceptible":21471,"ĠKiw":21472,"Ġforgiveness":21473,"ĠMoment":21474,"ĠDmitry":21475,"Ġrenov":21476,"Ġquint":21477,"ĠWaterloo":21478,"ĠReality":21479,"Ġstray":21480,"ĠBeaver":21481,"Ġbites":21482,"Ġelusive":21483,"Ġvirtue":21484,"Ġgadgets":21485,"Ġlandslide":21486,"ĠHealthy":21487,"Ġpits":21488,"Donnell":21489,"Ġirony":21490,"uct":21491,"Ġpractitioners":21492,"Ġreck":21493,"governmental":21494,"Ġatomic":21495,"Ġmotiv":21496,"Ġpolic":21497,"Ġcommunicated":21498,"ĠHS":21499,"Ġcriticize":21500,"Ġsynerg":21501,"Del":21502,"ĠRoe":21503,"Ġinspirational":21504,"ĠWarning":21505,"pel":21506,"Ġnevertheless":21507,"Ġdespair":21508,"Ġ(.":21509,"Ġfearing":21510,"Ġgrop":21511,"tree":21512,"Ġtrusts":21513,"Ġinterviewing":21514,"amic":21515,"Ġscor":21516,"ject":21517,"Another":21518,"pose":21519,"Ġdepicted":21520,"ĠPhotography":21521,"ĠLenovo":21522,"ĠEpic":21523,"ĠBoot":21524,"GI":21525,"enses":21526,"Class":21527,"arity":21528,"Ġservicing":21529,"ĠHann":21530,"Ġawe":21531,"Ġoverdoses":21532,"ĠFinnish":21533,"Ġpav":21534,"ĠPCs":21535,"SEC":21536,"ĠStro":21537,"Ġattracts":21538,"Ġapprehended":21539,"128":21540,"Ġunstable":21541,"ĠOutdoor":21542,"Ġcloth":21543,"ĠUlster":21544,"Ġvisually":21545,"Ġsculpt":21546,"Ġsufficiently":21547,"ĠKendrick":21548,"Ġengages":21549,"Ġknives":21550,"ĠGut":21551,"Ġarbit":21552,"osition":21553,"Ġemoji":21554,"Ġpinpoint":21555,"Ġremembering":21556,"rence":21557,"ĠVish":21558,"Ġimproperly":21559,"Ġranc":21560,"Ġupstream":21561,"Ġcheckpoint":21562,"Ġrash":21563,"eson":21564,"Ġtoes":21565,"260":21566,"Ġinvalid":21567,"Ġonions":21568,"Ġlashed":21569,"ĠDong":21570,"Ġprovisional":21571,"ĠFern":21572,"Ġirresponsible":21573,"actively":21574,"ĠKnown":21575,"Ġben":21576,"ĠBlank":21577,"Ġactresses":21578,"paying":21579,"Ġsyrup":21580,"isman":21581,"Ġeducating":21582,"Sunday":21583,"ifiable":21584,"Post":21585,"Ġcalculation":21586,"Ġhesitate":21587,"ĠIncreasing":21588,"Ġreeling":21589,"ĠDairy":21590,"ensing":21591,"Ġmaternity":21592,"Ø":21593,"./":21594,"ĠElm":21595,"Ġweddings":21596,"ĠYard":21597,"117":21598,"ĠRocket":21599,"OF":21600,"Ġtreasurer":21601,"Ġrattled":21602,"ĠDrop":21603,"arel":21604,"ĠFulton":21605,"ĠGiant":21606,"ĠFloor":21607,"Jet":21608,"ikk":21609,"ĠBucs":21610,"ostics":21611,"reme":21612,"ĠRouse":21613,"Ġdeliber":21614,"ĠEle":21615,"Ġconducts":21616,"ĠBlog":21617,"connected":21618,"Ġprayed":21619,"Ġcolourful":21620,"Ġaugmented":21621,"Ġbatted":21622,"Ġrelevance":21623,"ĠRomanian":21624,"acqu":21625,"ĠChel":21626,"ĠClo":21627,"ĠGraves":21628,"Ġchees":21629,"ĠGibbs":21630,"CLE":21631,"Ġfertility":21632,"Ġambul":21633,"Ġspecs":21634,"ĠIRA":21635,"ĠBooth":21636,"ithe":21637,"ĠPlayoff":21638,"ammed":21639,"Ġcollaborating":21640,"Ġlunar":21641,"Ġconfronting":21642,"Ġattribute":21643,"King":21644,"riz":21645,"Ġcasualty":21646,"acia":21647,"waters":21648,"Ġpaving":21649,"Ġcaregivers":21650,"nor":21651,"Ġreacting":21652,"ĠHash":21653,"Ġsqueezed":21654,"Ġexert":21655,"ĠMichele":21656,"ĠConc":21657,"ĠHep":21658,"Ġsewage":21659,"wart":21660,"GY":21661,"Ġdiscourage":21662,"ĠFir":21663,"Ġtextile":21664,"ĠSpice":21665,"ĠFah":21666,"Ġcomplainant":21667,"Ġinstinct":21668,"camp":21669,"ĠEdison":21670,"ĠVIDEOS":21671,"LM":21672,"ĠSands":21673,"About":21674,"Ġdisk":21675,"brid":21676,"Ġmuted":21677,"ACC":21678,"Ġwre":21679,"event":21680,"Ġicons":21681,"Express":21682,"udes":21683,"ĠBeatles":21684,"color":21685,"ĠHaas":21686,"ĠWolfe":21687,"ĠYOUR":21688,"Ġaccessibility":21689,"ĠCornwall":21690,"Ġing":21691,"Ġatrocities":21692,"weather":21693,"ĠDominion":21694,"ĠMIL":21695,"ĠLara":21696,"Ġunravel":21697,"Ġmaneuver":21698,"Ġfoam":21699,"ribe":21700,"CI":21701,"Ġcandles":21702,"acs":21703,")(":21704,"coon":21705,"ĠPurple":21706,"ĠGovernors":21707,"ĠKeystone":21708,"ĠYuk":21709,"file":21710,"Ġviol":21711,"gery":21712,"370":21713,"train":21714,"Ġgunshots":21715,"olin":21716,"Ġviruses":21717,"ĠTex":21718,"hours":21719,"Ġprev":21720,"ĠRid":21721,"ected":21722,"ĠVog":21723,"riers":21724,"Ġmurdering":21725,"ĠIz":21726,"Ġdeliberations":21727,"arming":21728,"unda":21729,"Ġrink":21730,"ĠDrugs":21731,"idered":21732,"Ġforge":21733,"Ġexpansive":21734,"VIEW":21735,"ĠBots":21736,"Ġswitches":21737,"KO":21738,"atten":21739,"Ġvariants":21740,"ĠVirtual":21741,"ĠCoch":21742,"yon":21743,"ĠKai":21744,"Ġbullied":21745,"iday":21746,"version":21747,"Ġlib":21748,"ĠCec":21749,"igated":21750,"ĠTRUMP":21751,"ĠPod":21752,"Ġtoppled":21753,"Ġeyeing":21754,"ĠPatients":21755,"techn":21756,"Ġhampered":21757,"Ġavert":21758,"ĠScheme":21759,"ĠCorm":21760,"Ġpony":21761,"Ġzoom":21762,"abo":21763,"Ġsleeves":21764,"lane":21765,"ĠLester":21766,"ĠDane":21767,"Ġcough":21768,"Ġsignings":21769,"HER":21770,"Ġsibling":21771,"Ġredemption":21772,"Ġstockp":21773,"ĠAlgeria":21774,"Ġpadd":21775,"ĠBrenda":21776,"uchi":21777,"Ġtransporting":21778,"Ġspeculative":21779,"ĠSek":21780,"abal":21781,"Ġshipment":21782,"oker":21783,"Ġwarranty":21784,"atan":21785,"Ġblister":21786,"ĠCelebration":21787,"Ġwal":21788,"Ġlac":21789,"Ġprioritize":21790,"ression":21791,"BP":21792,"Ġcollaborated":21793,"ĠNewsletter":21794,"ĠDamian":21795,"ĠResidential":21796,"Ġgra":21797,"Ġfeasible":21798,"ĠCrest":21799,"ĠBean":21800,"ĠSturgeon":21801,"ĠTale":21802,"ĠContin":21803,"ĠMush":21804,"Ġrocking":21805,"ĠMane":21806,"ĠHumane":21807,"resistant":21808,"ĠFra":21809,"highest":21810,"fts":21811,"Ġamassed":21812,"ĠPavilion":21813,"ĠSkin":21814,"Ġunfold":21815,"Ġresur":21816,"ĠPET":21817,"model":21818,"Ġemploying":21819,"Ġrude":21820,"Ġirrelevant":21821,"angu":21822,"Page":21823,"PN":21824,"igator":21825,"ĠReb":21826,"ĠArrest":21827,"ĠGund":21828,"Ġmalls":21829,"zhen":21830,"wed":21831,"Ġdaring":21832,"Ġfactual":21833,"ĠGent":21834,"Ġinforming":21835,"ĠStri":21836,"ĠLounge":21837,".]":21838,"ĠTribunal":21839,"ĠMoines":21840,"Ġshadows":21841,"generated":21842,"fulness":21843,"Ġheartfelt":21844,"ĠLivingston":21845,"ĠClerk":21846,"Ġnationalism":21847,"ĠMiche":21848,"balls":21849,"anos":21850,"agle":21851,"Ġprejudice":21852,"Ġevenly":21853,"Ġswearing":21854,"Ġexits":21855,"Ġcondemning":21856,"Ġvanilla":21857,"club":21858,"ĠFunding":21859,"ĠDover":21860,"Ġhots":21861,"Ġfres":21862,"Ġgoodness":21863,"ĠMcKay":21864,"Ġbulls":21865,"avia":21866,"129":21867,"Ġ1947":21868,"Ġdefamation":21869,"ĠMoran":21870,"irms":21871,"ĠFitz":21872,"ĠRossi":21873,"urated":21874,"Ġvariation":21875,"ĠBauer":21876,"ĠSchro":21877,"Ġcolony":21878,"ĠParliamentary":21879,"ikan":21880,"Ġstirring":21881,"ĠSheldon":21882,"Ġaccessory":21883,"ĠUtilities":21884,"Ġnab":21885,"Ġpract":21886,"Ġherein":21887,"ĠRole":21888,"ĠMant":21889,"Ġpharm":21890,"Ġ215":21891,"ĠNGO":21892,"ĠAnything":21893,"ĠMacedonia":21894,"Ġbree":21895,"ĠWTO":21896,"Chicago":21897,"ĠProtect":21898,"quarters":21899,"ĠGrassley":21900,"ĠInteractive":21901,"ĠInterview":21902,"Ġ550":21903,"Ġastronauts":21904,"Ġfreak":21905,"ĠIntegrated":21906,"Ġindict":21907,"Ġgenerators":21908,"acio":21909,"Kevin":21910,"Ġvaccination":21911,"Ġblockade":21912,"ĠSons":21913,"Ġcapita":21914,"ĠAnita":21915,"ĠExport":21916,"ĠNex":21917,"ĠAram":21918,"Ġzinc":21919,"Ġrevamped":21920,"Ġselective":21921,"Ġmanipulate":21922,"ĠBedford":21923,"ĠBattery":21924,"Ġqualifiers":21925,"lean":21926,"Ġscrew":21927,"film":21928,"ror":21929,"ĠEllison":21930,"ombo":21931,"ĠOst":21932,"165":21933,"Ġslaves":21934,"ĠPayton":21935,"Ġbarg":21936,"Ġrugged":21937,"ĠWinn":21938,"ĠHammer":21939,"ĠUPS":21940,"Euro":21941,"Ġunfamiliar":21942,"Ġdistract":21943,"Ġbuffer":21944,"ledge":21945,"Ġtrunk":21946,"Ġ320":21947,"122":21948,"Ġdilemma":21949,"Ġpra":21950,"Ġutmost":21951,"Ġcampaigners":21952,"icular":21953,"eful":21954,"�":21955,"ĠHQ":21956,"neau":21957,"Ġsir":21958,"test":21959,"Company":21960,"Ġrescind":21961,"ardon":21962,"MG":21963,"Gov":21964,"ĠRaz":21965,"Ġrod":21966,"fed":21967,"Ġpsych":21968,"Ġunin":21969,"ĠArbor":21970,"Ġnewcomer":21971,"ĠEdwin":21972,"raising":21973,"quist":21974,"Ġdiscoveries":21975,"Steve":21976,"Ġscramble":21977,"js":21978,"Ġacoustic":21979,"Ġdeterioration":21980,"Ġobserving":21981,"ĠWinning":21982,"ĠSaban":21983,"idy":21984,"Ġoverd":21985,"Ġscouting":21986,"Ġpunitive":21987,"ĠShelter":21988,"Ġmocked":21989,"Ġdreamed":21990,"Ġinvaluable":21991,"LP":21992,"standard":21993,"Ġrecounted":21994,"ĠSabres":21995,"points":21996,"Ġfringe":21997,"ĠBarker":21998,"alian":21999,"ĠPROV":22000,"Ġcartel":22001,"Ġovercrowd":22002,"tain":22003,"Year":22004,"ĠWelfare":22005,"ĠChr":22006,"Ġintroduces":22007,"ĠDoing":22008,"ĠGlover":22009,"Ġdeteriorating":22010,"Par":22011,"Ġattendant":22012,"ĠMold":22013,"ĠFlying":22014,"ovan":22015,"Ġoptimize":22016,"Ġchapters":22017,"Ġdull":22018,"gay":22019,"ĠATP":22020,"ĠKah":22021,"ainer":22022,"feet":22023,"Ġjoking":22024,"Ġdisadvantage":22025,"Rep":22026,"Ġtwisted":22027,"Ġslain":22028,"Ġcomprise":22029,"Ġrestricting":22030,"Ġdispos":22031,"Ġshaky":22032,"Ġembattled":22033,"owe":22034,"conscious":22035,"oken":22036,"Ġmistaken":22037,"ĠDra":22038,"Ġreservoir":22039,"Ġspate":22040,"Scott":22041,"avor":22042,"Ġqual":22043,"amel":22044,"hunt":22045,"ĠChevy":22046,"Ġclaw":22047,"Ġwitch":22048,"ĠZimmerman":22049,"arium":22050,"Ġrubbish":22051,"Ġstrings":22052,"Ġdoc":22053,"Ġplaque":22054,"ĠCyr":22055,"Ġflourish":22056,"Ġworthwhile":22057,"Ġbanners":22058,"ĠLemon":22059,"ĠRainbow":22060,"Ġconsisted":22061,"ĠHOW":22062,"Ñ":22063,"Ġblogs":22064,"CLUS":22065,"eely":22066,"Ġbeast":22067,"ĠMai":22068,"Ġhostility":22069,"eros":22070,"Ġforeseeable":22071,"ĠCorker":22072,"ĠWEEK":22073,"visors":22074,"ressive":22075,"ĠViktor":22076,"Ġbureaucracy":22077,"Ġ256":22078,"ĠFeel":22079,"ĠAdventure":22080,"Ġefficacy":22081,"ĠInstitution":22082,"ĠHarbaugh":22083,"ĠPractice":22084,"ĠChristianity":22085,"Thanks":22086,"Ġfridge":22087,"idel":22088,"Ġeff":22089,"Ġvein":22090,"terms":22091,"Ġignorance":22092,"Ġscream":22093,"Ġwit":22094,"ĠRousse":22095,"ĠWillow":22096,"Ġhallway":22097,"former":22098,"Ġshooters":22099,"ĠReporting":22100,"Ġgal":22101,"Ġsavvy":22102,"rand":22103,"Ġremed":22104,"ĠBaron":22105,"inar":22106,"Ġseizures":22107,"ĠThorn":22108,"ĠProtesters":22109,"ĠRevolutionary":22110,"think":22111,"ĠCabrera":22112,"Four":22113,"ĠRudd":22114,"Ġprost":22115,"ĠBottom":22116,"Port":22117,"nas":22118,"ifax":22119,"Wire":22120,"Ġtokens":22121,"antis":22122,"ĠSOU":22123,"ĠMilk":22124,"asters":22125,"Ġshrimp":22126,"Ġcakes":22127,"blue":22128,"ifty":22129,"View":22130,"adium":22131,"fen":22132,"zyk":22133,"ĠEmil":22134,"Ġdismay":22135,"Ġtilt":22136,"aska":22137,"Young":22138,"Ġpredators":22139,"Ġovershadowed":22140,"mitt":22141,"ĠSemin":22142,"ĠSchiff":22143,"ĠClarkson":22144,"212":22145,"210":22146,"Ġvanished":22147,"Ġmesh":22148,"ĠBurnett":22149,"ĠMent":22150,"ĠBlind":22151,"ĠPatriot":22152,"ĠVil":22153,"Ġflick":22154,"ĠTowns":22155,"ĠWhites":22156,"Ġspice":22157,"ĠMode":22158,"Ġnominate":22159,"Ġwrest":22160,"ĠAshes":22161,"Ġrows":22162,"ĠClint":22163,"Ġgentleman":22164,"utan":22165,"athlon":22166,"ĠIntermediate":22167,"hews":22168,"Ġoffended":22169,"ĠPaige":22170,"ĠFinch":22171,"ĠAboriginal":22172,"positive":22173,"Stop":22174,"Ġrenting":22175,"Ġ[â̦]":22176,"ĠHert":22177,"Ġvegetation":22178,"apes":22179,"ĠCanon":22180,"appa":22181,"Ġabst":22182,"ĠKatz":22183,"Ġsurfing":22184,"aghan":22185,"ĠPresidency":22186,"Ġscaling":22187,"ĠSas":22188,"Ġpeanut":22189,"Ġrecommending":22190,"cious":22191,"endez":22192,"eker":22193,"ĠKamp":22194,"Ġsitcom":22195,"Ġcrust":22196,"women":22197,"ĠJes":22198,"ĠWhe":22199,"ĠWarwick":22200,"Ġepit":22201,"ĠAlc":22202,"Ġdictate":22203,"ĠSPORTS":22204,"ĠLanguage":22205,"Ġindicative":22206,"ĠMacDonald":22207,"Ġreorgan":22208,"Ġ`":22209,"ARS":22210,"Ġliberation":22211,"Ġbless":22212,"Ġreflective":22213,"Ġà¤":22214,"Ġdesires":22215,"ĠHank":22216,"ĠLaunch":22217,"Ġrotating":22218,"ĠStones":22219,"Ġcoordinating":22220,"ĠZeit":22221,"Ġskepticism":22222,"ĠAlam":22223,"ĠTrout":22224,"ĠSMS":22225,"ĠCrescent":22226,"ĠTeacher":22227,"Ġfury":22228,"Ġeyebrows":22229,"onga":22230,"ĠPilot":22231,"ĠRutherford":22232,"Ġinterstate":22233,"established":22234,"Ġbaggage":22235,"Ġ131":22236,"riks":22237,"mil":22238,"Ġneon":22239,"Ġqueer":22240,"ourced":22241,"ĠKash":22242,"ĠEleven":22243,"illes":22244,"ĠOpportun":22245,"Ġstre":22246,"Washington":22247,"ĠDifferent":22248,"Ġexempl":22249,"Ġboarded":22250,"Ġrogue":22251,"ĠDNC":22252,"rone":22253,"Ġreversing":22254,"nine":22255,"ĠIvory":22256,"itating":22257,"uve":22258,"Ġfracture":22259,"255":22260,"ĠAssessment":22261,"Ġsubjective":22262,"Ġfluct":22263,"ĠJaguar":22264,"Ġstride":22265,"Ġreapp":22266,"ĠGrow":22267,"against":22268,"ĠMedina":22269,"scenes":22270,"ĠNieto":22271,"Ġsou":22272,"ĠFleming":22273,"Ġnarcotics":22274,"ĠBere":22275,"ĠBub":22276,"ĠAck":22277,"Ġvinyl":22278,"ĠCopy":22279,"ĠGarland":22280,"ĠDuty":22281,"Ġinn":22282,"Ġmerchant":22283,"Ġactivate":22284,"Ġglowing":22285,"ettle":22286,"ĠBran":22287,"Ġsilk":22288,"anco":22289,"TL":22290,"ĠFurn":22291,"Ġwithheld":22292,"Ġpulse":22293,"ĠGU":22294,"BUS":22295,"ĠHyper":22296,"Ġpicnic":22297,"Ġpositives":22298,"ĠParamount":22299,"Ġ737":22300,"Ġenlisted":22301,"ĠValerie":22302,"false":22303,"ĠChocolate":22304,"ĠSTAR":22305,"Ġdescended":22306,"Ġtasty":22307,"ĠDaesh":22308,"ĠNed":22309,"Ġcomplimentary":22310,"Ġdepicting":22311,"ĠHavana":22312,"college":22313,"Ġtraces":22314,"Ġundue":22315,"ĠSisters":22316,"aum":22317,"ĠCourier":22318,"ĠOng":22319,"ĠSparks":22320,"ongs":22321,"ĠYong":22322,"URR":22323,"los":22324,"Ġhorsepower":22325,"confidence":22326,"ĠPett":22327,"ĠMeasure":22328,"Ġmarches":22329,"zig":22330,"ĠTOR":22331,"Ġexported":22332,"ĠRak":22333,"ĠInvestigations":22334,"Ġterminate":22335,"ĠTian":22336,"Ġmasters":22337,"ĠDS":22338,"Ġoutraged":22339,"ĠCups":22340,"ĠWeir":22341,"exec":22342,"Ġjourneys":22343,"Ġabide":22344,"Ġavail":22345,"ĠStreets":22346,"Ġfixes":22347,"Ġcocoa":22348,"Ġabundant":22349,"Ġhubs":22350,"mort":22351,"Ġrobberies":22352,"ĠBark":22353,"Ġprecautions":22354,"Ġhammered":22355,"ometric":22356,"mith":22357,"ĠMcCann":22358,"ĠJaw":22359,"ĠQuest":22360,"ĠMcF":22361,"Ġlob":22362,"Ġlegalized":22363,"Ġquirky":22364,"Ġtrailers":22365,"ĠIndividual":22366,"Ġcumulative":22367,"Ġenlarge":22368,"Ġconvoy":22369,"olen":22370,"got":22371,"landers":22372,"Ġscanner":22373,"Ġscans":22374,"ĠEg":22375,"prof":22376,"Ġhosp":22377,"ĠColo":22378,"Ġerr":22379,"Ġdeval":22380,"ĠUsually":22381,"Ġbul":22382,"ummy":22383,"Ġtandem":22384,"occupied":22385,"Ġmandates":22386,"ĠSwim":22387,"121":22388,"ussed":22389,"EF":22390,"Ġfries":22391,"Until":22392,"rc":22393,"Ġbadge":22394,"Ġstrips":22395,"Ġmagnet":22396,"Ġarchive":22397,"stan":22398,"ĠDeadline":22399,"Ġdisposable":22400,"Ġbob":22401,"Ġnorthwestern":22402,"Jul":22403,"ĠSAL":22404,"Ġinfluencing":22405,"Ġdevil":22406,"ĠEllie":22407,"cms":22408,"ingo":22409,"888":22410,"Ġcosmetic":22411,"Also":22412,"Ġyacht":22413,"Ġlazy":22414,"Ġmerc":22415,"Ġabsorbed":22416,"harm":22417,"116":22418,"Ġsubpoena":22419,"Ġcounters":22420,"ĠLori":22421,"Ġrandomly":22422,"nea":22423,"waves":22424,"Ġrelie":22425,"ĠKiss":22426,"Ġchassis":22427,"Ġbakery":22428,"Images":22429,"ĠHolden":22430,"Ġamazed":22431,"Ġalignment":22432,"ĠPowers":22433,"Ġlabelled":22434,"Ġstaunch":22435,"Ġsignaling":22436,"Ġsenate":22437,"Ġunconventional":22438,"ĠAlternative":22439,"Ġambassadors":22440,"ĠVPN":22441,"atics":22442,"Ġmosquito":22443,"ĠScholarship":22444,"Ġhelpless":22445,"alone":22446,"ZA":22447,"chel":22448,"Ġconstituencies":22449,"ĠCafé":22450,"Ġhatch":22451,"ĠRupert":22452,"Ġrendering":22453,"Ġreinstated":22454,"Ġinterval":22455,"Texas":22456,"ĠAHL":22457,"February":22458,"review":22459,"Ġgle":22460,"Ġfals":22461,"Ġmarkers":22462,"Ġgovernmental":22463,"ĠPos":22464,"Ġarose":22465,"every":22466,"Ġrulings":22467,"obar":22468,"Govern":22469,"gren":22470,"isan":22471,"Ġmarketed":22472,"Click":22473,"Ġord":22474,"Ġballoons":22475,"asers":22476,"ĠHorton":22477,"pub":22478,"ĠAerospace":22479,"Ġflank":22480,"Ġmolecular":22481,"bour":22482,"nuts":22483,"Ġalliances":22484,"Ġbenchmarks":22485,"ocate":22486,"stadt":22487,"ĠGoodwin":22488,"lap":22489,"ĠFactors":22490,"Never":22491,"ĠNem":22492,"Ġroadside":22493,"orth":22494,"Ġexhibited":22495,"ĠPearce":22496,"ĠOlsen":22497,"Ġpostal":22498,"ĠLiberation":22499,"reen":22500,"mary":22501,"Ġropes":22502,"Ġlarg":22503,"Ġgob":22504,"boys":22505,"ĠSax":22506,"Ġreimbursement":22507,"ĠVie":22508,"ĠCatholics":22509,"ĠMartial":22510,"Ġpremiered":22511,"Ġawaits":22512,"ĠUnderstanding":22513,"ĠBelarus":22514,"ĠVor":22515,"ogi":22516,"iaz":22517,"Ġvictorious":22518,"Ġancestors":22519,"Ġwreckage":22520,"Ġoppression":22521,"ĠChildhood":22522,"Ġwidth":22523,"ĠPlymouth":22524,"ĠFifty":22525,"Ġoccupancy":22526,"etts":22527,"ĠFiscal":22528,"lifting":22529,"ĠTraditional":22530,"Ġnostalgia":22531,"Law":22532,"Ġlays":22533,"Ġarresting":22534,"Ġanticipating":22535,"Ġinsults":22536,"ĠExtension":22537,"Ġgenerator":22538,"ummer":22539,"Ġageing":22540,"Ġbouncing":22541,"ember":22542,"ĠWAR":22543,"ĠNico":22544,"ĠWow":22545,"ĠRaven":22546,"flower":22547,"ĠCrim":22548,"bh":22549,"Ġundo":22550,"Ġburgers":22551,"roud":22552,"ĠAtkinson":22553,"ĠYEAR":22554,"Ġpoorer":22555,"ICA":22556,"ĠSchedule":22557,"Ġstronghold":22558,"ĠMillennium":22559,"Ġ###":22560,"ilda":22561,"ĠGH":22562,"Ġupscale":22563,"aldi":22564,"ĠResolution":22565,"Ġswelling":22566,"Ġgrieving":22567,"ĠNile":22568,"ĠTig":22569,"ERY":22570,"ooth":22571,"BALL":22572,"Ġballet":22573,"Ġbucks":22574,"ĠUV":22575,"akin":22576,"Ġchilling":22577,"Ġdatabases":22578,"ĠGD":22579,"section":22580,"Ġhires":22581,"Ġmul":22582,"Ġsen":22583,"ĠTownsend":22584,"Ġinspected":22585,"ilic":22586,"Ġdiscriminatory":22587,"fol":22588,"Ġalcoholic":22589,"ĠHoff":22590,"Carl":22591,"Ġvicinity":22592,"lein":22593,"ĠEco":22594,"ĠGovern":22595,"Ġsecrecy":22596,"aned":22597,"ĠDUP":22598,"Ġ570":22599,"Ġsow":22600,"Ġstalls":22601,"Ġinsulting":22602,"ĠDT":22603,"Ġinforms":22604,"fitting":22605,"ĠDepending":22606,"ĠMelanie":22607,"ĠThom":22608,"path":22609,"Ġadmired":22610,"Peter":22611,"idents":22612,"ielding":22613,"ĠShanahan":22614,"TD":22615,"Things":22616,"sn":22617,"Ġconstituted":22618,"Ġ137":22619,"Ġderailed":22620,"ĠBonnie":22621,"Ġgraffiti":22622,"Ġearnest":22623,"Ġcompliant":22624,"blown":22625,"Ġalle":22626,"prise":22627,"Ġfocal":22628,"Ġgentlemen":22629,"ĠTalks":22630,"Ġpassports":22631,"Ġdeprived":22632,"Ġdude":22633,"ĠNath":22634,"Ġgoverned":22635,"Ġsac":22636,"Ġcastle":22637,"qv":22638,"Ġtolerated":22639,"ĠSci":22640,"close":22641,"ĠDynamics":22642,"Ġflashing":22643,"yk":22644,"ĠConsolid":22645,"Ġinherently":22646,"ĠForrest":22647,"Gene":22648,"Public":22649,"Ġloser":22650,"runners":22651,"Ġprudent":22652,"Ġpioneering":22653,"ĠHowe":22654,"ĠButter":22655,"ĠArabian":22656,"acha":22657,"ĠBBQ":22658,"ĠMineral":22659,"Ġdestiny":22660,"Ġretrieve":22661,"ĠBav":22662,"reth":22663,"oby":22664,"ĠGrid":22665,"Ġgrievances":22666,"ĠTips":22667,"Ġadamant":22668,"Ġdiets":22669,"Ġmilestones":22670,"Ġcollects":22671,"ĠLaboratories":22672,"ĠWC":22673,"Ġpostp":22674,"Ġdams":22675,"ĠOEM":22676,"Ġrumor":22677,"Ġlocking":22678,"Ġemission":22679,"Ġqueries":22680,"Jones":22681,"Ġlang":22682,"ĠAcqu":22683,"ĠMedium":22684,"ĠTreasurer":22685,"Sept":22686,"FB":22687,"Ġintegrating":22688,"Ġbolstered":22689,"Ġincorporating":22690,"encers":22691,"Ġirregularities":22692,"Ġnom":22693,"iod":22694,"ĠAi":22695,"Ġsor":22696,"anked":22697,"Ġrehears":22698,"fig":22699,"ĠBug":22700,"hoff":22701,"Ġtrooper":22702,"Ġgalaxy":22703,"amon":22704,"ĠAtlas":22705,"Ġsolicit":22706,"Ġsings":22707,"ĠInstructions":22708,"ĠMig":22709,"thinking":22710,"ĠCostco":22711,"Ġbreasts":22712,"Ġportraits":22713,"ĠCock":22714,"Ġsubscriptions":22715,"Ġpine":22716,"Ġhaunted":22717,"ĠMED":22718,"eer":22719,"ega":22720,"ĠZa":22721,"ENN":22722,"ĠWinners":22723,"aith":22724,"safe":22725,"Ġ143":22726,"ĠWeston":22727,"ĠLansing":22728,"ĠLaurel":22729,"ocrat":22730,"ograph":22731,"Ġmatchups":22732,"ĠFriend":22733,"Ġdigest":22734,"Ġdimensions":22735,"azing":22736,"Ġtipping":22737,"Ġenrich":22738,"gart":22739,"argo":22740,"Ġoutbreaks":22741,"Ġsalvage":22742,"ĠErica":22743,"Ġmodules":22744,"ĠPDF":22745,"ĠGoods":22746,"oots":22747,"2011":22748,"Ġinterrupt":22749,"Ġradi":22750,"ĠSimone":22751,"vell":22752,"ĠSV":22753,"extremely":22754,"Ġstadiums":22755,"ĠRox":22756,"Ġconflicting":22757,"Ġyouthful":22758,"ĠUM":22759,"series":22760,"Ġded":22761,"Ġfielding":22762,"Pre":22763,"itled":22764,"Ġstreamed":22765,"Ġapprentices":22766,"ĠAlec":22767,"ĠGap":22768,"ĠPrem":22769,"Ġleased":22770,"Ġdeepening":22771,"Ġbounds":22772,"Ġrethink":22773,"ĠVoting":22774,"ĠScha":22775,"blood":22776,"ĠReeves":22777,"Ġbells":22778,"Ġcollector":22779,"ĠCrimson":22780,"ĠWheat":22781,"207":22782,"ĠHB":22783,"ĠBCC":22784,"Ġsync":22785,"ĠAnders":22786,"Ġthanking":22787,"Ġlayoffs":22788,"Ġfoolish":22789,"Ġcustod":22790,"Ġelephants":22791,"Ġcorrelation":22792,"ĠHarding":22793,"ĠGPU":22794,"ĠBarnett":22795,"Ġol":22796,"Ġalarms":22797,"Ġfluctuations":22798,"shop":22799,"Ġcommentators":22800,"ĠAlpine":22801,"Ġmur":22802,"Ġbiotech":22803,"Ġunlocked":22804,"ouri":22805,"roe":22806,"ĠPayment":22807,"ĠPOL":22808,"ĠGuest":22809,"Ġphrases":22810,"ĠBuilt":22811,"erves":22812,"Ġnutritional":22813,"205":22814,"ourage":22815,"Related":22816,"Come":22817,"ĠSAT":22818,"Ġgatherings":22819,"Ġsquads":22820,"Ġorganising":22821,"Ġministerial":22822,"Ġkilomet":22823,"ĠJump":22824,"ĠStrength":22825,"ĠFerr":22826,"Ġillustrated":22827,"ĠOber":22828,"Ġextrad":22829,"Ġlimitation":22830,"idis":22831,"ĠMonths":22832,"ifts":22833,"Ġmotives":22834,"Ġmaternal":22835,"Ġbait":22836,"Ġadversity":22837,"Twitter":22838,"ĠUni":22839,"Ġgrappling":22840,"Ġbowls":22841,"ĠHib":22842,"ĠCopenhagen":22843,"Ġsergeant":22844,"Ġintro":22845,"Ġscrambled":22846,"ĠExc":22847,"Ġshowcases":22848,"Ġplotting":22849,"Ġsym":22850,"ĠNah":22851,"berries":22852,"itching":22853,"conn":22854,"istle":22855,"ĠBeginning":22856,"asley":22857,"ĠMeadow":22858,"ĠCra":22859,"Ġsupremacist":22860,"Ġsweats":22861,"production":22862,"innon":22863,"ovo":22864,"Ġscept":22865,"Ġdrowning":22866,"ĠEh":22867,"Ġdecorations":22868,"Ġsympathetic":22869,"raction":22870,"Ġ195":22871,"ripp":22872,"ĠNotice":22873,"charging":22874,"ĠDIY":22875,"ĠJin":22876,"Ġskinny":22877,"Ġmaj":22878,"Ġwhisk":22879,"Ġcongreg":22880,"RAL":22881,"Ġvolley":22882,"Ġestablishments":22883,"Ġcite":22884,"Miss":22885,"Int":22886,"iola":22887,"ĠBare":22888,"KING":22889,"ools":22890,"private":22891,"Ġflaw":22892,"Ġwires":22893,"Ġideals":22894,"oub":22895,"Ġ\"'":22896,"ĠCompet":22897,"ĠStatements":22898,"ĠHDR":22899,"rm":22900,"Ġbegging":22901,"uffs":22902,"Ġdispatch":22903,"Ġskipped":22904,"Ġlabs":22905,"hawks":22906,"Ġexpl":22907,"Ġpatriotic":22908,"ussions":22909,"Ġportrayal":22910,"ĠBudapest":22911,"ĠCod":22912,"Ġextingu":22913,"smart":22914,"Ġburdens":22915,"ĠDrama":22916,"Ġaltitude":22917,"Ġpursuant":22918,"à¥":22919,"atari":22920,"cot":22921,"Ġhotline":22922,"ooters":22923,"ĠRolls":22924,"Ġjeopardy":22925,"oids":22926,"Ġpageant":22927,"149":22928,"Ġdistinguish":22929,"support":22930,"ĠHighlands":22931,"ĠErnst":22932,"ĠHole":22933,"pering":22934,"ĠHasan":22935,"Ġrece":22936,"Ġirregular":22937,"Ġdisturbed":22938,"Ġcoupon":22939,"ĠElijah":22940,"oise":22941,"Ġfriendships":22942,"girlfriend":22943,"Ġrampage":22944,"arers":22945,"Ġdispens":22946,"assion":22947,"Ġtentative":22948,"ĠExploration":22949,"fashioned":22950,"ĠInstit":22951,"Ġthemed":22952,"ĠKurdistan":22953,"ĠCAL":22954,"ĠSweeney":22955,"Ġransom":22956,"Ġstamps":22957,"ĠSchwe":22958,"ĠLucia":22959,"124":22960,"omore":22961,"Ġmotivate":22962,"ĠWorcester":22963,"wald":22964,"CAR":22965,"iken":22966,"andro":22967,"ffic":22968,"ĠRehab":22969,"Ġgrou":22970,"Ġcontrollers":22971,"ĠHai":22972,"nz":22973,"Ġartillery":22974,"ĠMish":22975,"Ġregistry":22976,"Ġfrontman":22977,"ĠCharg":22978,"orneys":22979,"ĠPRESS":22980,"Ġperceptions":22981,"ĠMcGee":22982,"AU":22983,"mg":22984,"Off":22985,"ĠNGOs":22986,"chemical":22987,"Ġbrun":22988,"ĠHav":22989,"Ġlace":22990,"Ġ202":22991,"Ġdefer":22992,"Ġinjected":22993,"Ġgluten":22994,"ĠRin":22995,"ĠAvalanche":22996,"Ġcorpor":22997,"ĠPamela":22998,"Ġfills":22999,"ĠReve":23000,"ĠMonument":23001,"Ġnationalists":23002,"ĠIQ":23003,"adden":23004,"ĠLoop":23005,"Ġ134":23006,"Reg":23007,"click":23008,"bush":23009,"ĠKub":23010,"ipes":23011,"Ġtoggle":23012,"ĠRae":23013,"Ġburgl":23014,"Ġholistic":23015,"ronics":23016,"Ġprominence":23017,"jack":23018,"Ġfinan":23019,"icates":23020,"Ġvel":23021,"important":23022,"Thursday":23023,"chet":23024,"Ġrefunds":23025,"ĠElder":23026,"ĠOwner":23027,"Ġtakeaway":23028,"Pe":23029,"ĠToro":23030,"Tim":23031,"fix":23032,"before":23033,"ĠMotorola":23034,"Ġlev":23035,"Term":23036,"ĠSne":23037,"Ġmisinformation":23038,"ĠSinai":23039,"Ġnitrogen":23040,"Ġ203":23041,"Ġescaping":23042,"Ġjunction":23043,"ĠSantana":23044,"ĠYemeni":23045,"Ġwhipped":23046,"ĠStephenson":23047,"Ġattire":23048,"ĠBard":23049,"atically":23050,"ĠFaul":23051,"ĠSym":23052,"resh":23053,"ĠMG":23054,"Sub":23055,"ĠCarmen":23056,"Ġig":23057,"ĠSanford":23058,"ĠYa":23059,"cycle":23060,"Ġencryption":23061,"ĠScal":23062,"ĠChest":23063,"ĠMadonna":23064,"agin":23065,"ĠDHS":23066,"ĠCed":23067,"YR":23068,"Ġtruce":23069,"ĠBike":23070,"Ġfoes":23071,"ĠSlovakia":23072,"adal":23073,"Rain":23074,"OPE":23075,"Ġlockdown":23076,"Ġunilateral":23077,"Ġoverseen":23078,"Ġblames":23079,"Ġbarrage":23080,"aan":23081,"uds":23082,"ĠRust":23083,"ĠHC":23084,"cox":23085,"ĠAllied":23086,"ĠJosé":23087,"pected":23088,"Ġunp":23089,"Ġsomeday":23090,"Ġdeductions":23091,"icial":23092,"ĠPRO":23093,"ĠIntern":23094,"Ġhemp":23095,"Ġkilograms":23096,"Ġnets":23097,"ĠBACK":23098,"early":23099,"outed":23100,"Ġrelegated":23101,"Ġ1958":23102,"ĠMustang":23103,"Ġgamble":23104,"Ġprostitution":23105,"ĠPapa":23106,"Ġinexpensive":23107,"GHz":23108,"Ġjerseys":23109,"Ġmisery":23110,"VIS":23111,"ĠRAW":23112,"Ġthri":23113,"Ġaffiliation":23114,"small":23115,"Ġflashed":23116,"Ġcoastline":23117,"Ġgard":23118,"Ġsv":23119,"Ġwaits":23120,"itton":23121,"London":23122,"Ġaccus":23123,"ĠCharge":23124,"Ġincub":23125,"Ġwanna":23126,"ĠAwareness":23127,"abies":23128,"ĠUh":23129,"Ġpersuaded":23130,"ĠThames":23131,"Ġcurated":23132,"Ī":23133,"Ġbrutally":23134,"Ġrooftop":23135,"Ġoy":23136,"Ġ1900":23137,"bery":23138,"Ġuphill":23139,"Ġinteracting":23140,"Ġchilly":23141,"ERE":23142,"Ġcapsule":23143,"ĠSaul":23144,"ocker":23145,"Ġdeserving":23146,"ĠBowen":23147,"ĠReaders":23148,"ĠWriters":23149,"Ġartifacts":23150,"ĠRanger":23151,"reau":23152,"Ġimperson":23153,"Ġhears":23154,"ĠMaher":23155,"neg":23156,"Ġmantra":23157,"Ġmull":23158,"Ġelders":23159,"ĠAmtrak":23160,"Ġspouses":23161,"ĠHak":23162,"Ġopenness":23163,"Ġprevailed":23164,"Ġfortnight":23165,"Pal":23166,"ride":23167,"Ġillustrate":23168,"dominated":23169,"trust":23170,"ī":23171,"ĠFemale":23172,"ĠSlim":23173,"Ġdesc":23174,"ĠKathryn":23175,"Ġdeepen":23176,"TAIN":23177,"eredith":23178,"Ġchanted":23179,"ĠHector":23180,"bread":23181,"ĠIsa":23182,"Ġvolcanic":23183,"Ġah":23184,"owners":23185,"aquin":23186,"Ġmelting":23187,"Ġpreschool":23188,"ocus":23189,"ĠMast":23190,"ĠMyr":23191,"Ġsuppress":23192,"Ġversatility":23193,"ĠNEC":23194,"Ġhoax":23195,"Ġmutually":23196,"ĠNeb":23197,"ĠWheel":23198,"kit":23199,"abl":23200,"again":23201,"ĠSonny":23202,"rift":23203,"Ġsweater":23204,"Ġinund":23205,"ĠTaco":23206,"ĠBout":23207,"Ġnonprofits":23208,"Ġmodify":23209,"Ġprofessionalism":23210,"ĠGould":23211,"ĠGuerrero":23212,"Ġterribly":23213,"ĠBenz":23214,"Ġcountered":23215,"Ġbean":23216,"ĠPhelps":23217,"Ġprowess":23218,"bc":23219,"Ġfeast":23220,"Ġ5000":23221,"Ġrevisit":23222,"Ġchin":23223,"agent":23224,"Ġtones":23225,"Ġextraction":23226,"ĠPosts":23227,"oin":23228,"Ġattain":23229,"Ġgardening":23230,"earned":23231,"ĠOtto":23232,"player":23233,"Ġscams":23234,"ĠHonolulu":23235,"ĠAppro":23236,"ĠHIGH":23237,"Ġdwell":23238,"Islam":23239,"leaders":23240,"Ġlegisl":23241,"expl":23242,"ĠChoi":23243,"Ġfrenzy":23244,"Ġcommercially":23245,"Ġlbs":23246,"Ġgateway":23247,"ĠAndersen":23248,"emia":23249,"lez":23250,"Ġresidences":23251,"office":23252,"ĠHelsinki":23253,"olia":23254,"Ġwolf":23255,"Ġstyling":23256,"ĠJunction":23257,"ĠPeyton":23258,"udo":23259,"ĠDorothy":23260,"Ġfreshly":23261,"ĠJulio":23262,"ĠSunset":23263,"ĠMadden":23264,"Ġissu":23265,"Ġsounding":23266,"sports":23267,"Ġmassively":23268,"ĠRahman":23269,"Ġpresided":23270,"Instead":23271,"Ġ136":23272,"ĠHowell":23273,"beit":23274,"Ġprosperous":23275,"Ġwrongly":23276,"ĠRaqqa":23277,"ĠCes":23278,"Ġbuddy":23279,"Ġchatting":23280,"Ġfencing":23281,"Ġtant":23282,"ocated":23283,"ALK":23284,"Ġsnapping":23285,"euro":23286,"Ryan":23287,"ĠRecogn":23288,"ucked":23289,"Ġpurported":23290,"ĠCann":23291,"Ġintimidating":23292,"Ġrulers":23293,"ĠMarse":23294,"Art":23295,"ĠAadhaar":23296,"Ġvows":23297,"Ġhunter":23298,"ourmet":23299,"ĠVarious":23300,"2009":23301,"anie":23302,"Ġcompassionate":23303,"ĠParking":23304,"Ġmalaria":23305,"Ġamnesty":23306,"Ġworsened":23307,"ĠTitan":23308,"Ġcrossings":23309,"drug":23310,"Ġaddicted":23311,"Ġremorse":23312,"ĠDestiny":23313,"Dear":23314,"Ġhur":23315,"Ġimplicated":23316,"Ġplayful":23317,"Ġripe":23318,"Ġsizable":23319,"Ġcrab":23320,"Ġliqu":23321,"Ġdrib":23322,"Ġcontraction":23323,"cro":23324,"ĠGus":23325,"Ġdoomed":23326,"Ġmog":23327,"ĠMonitor":23328,"Count":23329,"Ġsadd":23330,"Ġwrestler":23331,"Ġrestraints":23332,"Ġraging":23333,"185":23334,"Ġtapes":23335,"Ġmitigation":23336,"ocratic":23337,"Ġvib":23338,"ĠSnowden":23339,"aldo":23340,"Ġweights":23341,"Ġ1959":23342,"ucc":23343,"ĠCoc":23344,"Log":23345,"ĠStev":23346,"Ġdealership":23347,"Ġtrademarks":23348,"iru":23349,"Ġbeneficiary":23350,"Ġlegislator":23351,"Ġdeadlines":23352,"Ġcosmetics":23353,"ĠTammy":23354,"ĠCombined":23355,"Ġeducator":23356,"athon":23357,"Ġcombo":23358,"fu":23359,"appropriate":23360,"nington":23361,"ĠLiberties":23362,"missions":23363,"opard":23364,"ĠMondays":23365,"Ġfetch":23366,"Ġhers":23367,"jon":23368,"ukes":23369,"zek":23370,"Ġvetting":23371,"yet":23372,"Ġfacilitating":23373,"ĠStras":23374,"character":23375,"ĠHeads":23376,"Ġclim":23377,"ĠAlbuquerque":23378,"Ġbind":23379,"Ġconcluding":23380,"ĠBasically":23381,"rail":23382,"ĠTCU":23383,"ĠDepression":23384,"Ġhem":23385,"ĠHue":23386,"Ġpand":23387,"Ġscoreboard":23388,"Av":23389,"Ġidol":23390,"compl":23391,"Ġredesign":23392,"ĠJarrett":23393,"Ġfavoured":23394,"ĠINS":23395,"Ġpropelled":23396,"Ġevasion":23397,"Ġwidened":23398,"Ġwastewater":23399,"nard":23400,"responsive":23401,"Ġdemographics":23402,"engine":23403,"ĠBrewer":23404,"ĠBaxter":23405,"ront":23406,"ĠColon":23407,"Ġpromoter":23408,"Ġgenres":23409,"ovsky":23410,"build":23411,"urate":23412,"ĠCohn":23413,"design":23414,"Ġturbulent":23415,"Ġcurtain":23416,"310":23417,"ĠLamp":23418,"ĠBonds":23419,"church":23420,"Ġdeterrent":23421,"Ġdictatorship":23422,"acement":23423,"haul":23424,"Ġspir":23425,"Ġconceived":23426,"Ġstern":23427,"sit":23428,"Ġsingular":23429,"ĠYog":23430,"Ġconditional":23431,"Ġide":23432,"lund":23433,"Ġautop":23434,"ĠBEST":23435,"ĠJed":23436,"Ġrationale":23437,"Ġalarmed":23438,"Ġshovel":23439,"ĠProb":23440,"ĠMao":23441,"ĠBurgess":23442,"Ġ1953":23443,"above":23444,"ĠManson":23445,"Ġdismal":23446,"ĠFrankie":23447,"Ġtempted":23448,"Ġunderdog":23449,"ribing":23450,"ENCY":23451,"ĠDele":23452,"Las":23453,"places":23454,"Ġnotoriously":23455,"ĠAkin":23456,"Ġglut":23457,"Ġseamlessly":23458,"Ġrecess":23459,"written":23460,"ĠTJ":23461,"occ":23462,"ĠTerritory":23463,"ĠAIR":23464,"ĠDiagn":23465,"Ġvacancies":23466,"Ġcultivation":23467,"ĠAless":23468,"Ġrenamed":23469,"ĠMahmoud":23470,"bright":23471,"Ġvisibly":23472,"Ġnas":23473,"erred":23474,"ĠCarn":23475,"Ġtriggers":23476,"Ġpunishing":23477,"Ġluc":23478,"ĠBett":23479,"Ġbeam":23480,"ĠCheng":23481,"aina":23482,"Ġdetermines":23483,"ĠGerry":23484,"Ġshocks":23485,"Ġstainless":23486,"Ġdefects":23487,"ĠCinem":23488,"Ġtorrent":23489,"Ġresurgence":23490,"Ġcoral":23491,"Ġblitz":23492,"ĠGel":23493,"Ġstemmed":23494,"gur":23495,"Ġlymph":23496,"zzo":23497,"Ġspearheaded":23498,"Ġlicences":23499,"';":23500,"Ġarbitrary":23501,"ĠUzbek":23502,"Ġthief":23503,"reaching":23504,"Ġcand":23505,"ĠEA":23506,"ĠParaly":23507,"ĠEmerson":23508,"ĠSergey":23509,"ĠScher":23510,"ĠWr":23511,"rowing":23512,"Ġ3000":23513,"Ġmighty":23514,"elight":23515,"mAh":23516,"Ġcelebr":23517,"ĠConclusion":23518,"ĠCathy":23519,"Ġpolished":23520,"uddled":23521,"ewski":23522,"Ġfucking":23523,"Ġinterfering":23524,"Ġlandscapes":23525,"Ġfearful":23526,"ĠDetention":23527,"%).":23528,"ĠTT":23529,"Ġbleak":23530,"Ġindebted":23531,"Ġcheat":23532,"Ġconsolation":23533,"ĠPace":23534,"raine":23535,"Ġhonorary":23536,"420":23537,"Ġtechnician":23538,"ĠComprehensive":23539,"Ġfences":23540,"Ġwearable":23541,"ĠMarilyn":23542,"stru":23543,"Ġdrained":23544,"ĠGibraltar":23545,"lag":23546,"Ġdisorderly":23547,"Ġproclaimed":23548,"Ġcapacities":23549,"Ġretains":23550,"ĠVid":23551,"oshi":23552,"ĠEid":23553,"Ġanalytical":23554,"ominium":23555,"ĠExaminer":23556,"ĠNAACP":23557,"ocol":23558,"rev":23559,"ĠRim":23560,"ĠWoody":23561,"ĠMcKenna":23562,"ĠLennon":23563,"ĠEmploy":23564,"Fort":23565,"psy":23566,"Ġsphere":23567,"oday":23568,"ĠChick":23569,"ĠCompared":23570,"ĠIranians":23571,"ĠAccountability":23572,"itchie":23573,"ĠDickinson":23574,"Ġflock":23575,"Ġeclips":23576,"Ġnat":23577,"anke":23578,"ĠNeighborhood":23579,"Ġ141":23580,"Ġscarce":23581,"Ġcreations":23582,"lists":23583,"Ġuseless":23584,"Ġcriticisms":23585,"Ġruler":23586,"ĠHick":23587,"arya":23588,"worker":23589,"alam":23590,"Angelo":23591,"otle":23592,"Ġnewsletters":23593,"Ġerected":23594,"Ġzip":23595,"ĠBirthday":23596,"Ġdogged":23597,"Ġdanced":23598,"Ġconfession":23599,"Ġvomiting":23600,"ickers":23601,"Ġfox":23602,"Ġdeduct":23603,"Ġstresses":23604,"poll":23605,"ĠRadar":23606,"Ġengagements":23607,"Ġexaminer":23608,"Ġopportun":23609,"Ġlongevity":23610,"Ġbanana":23611,"carbon":23612,"uo":23613,"ĠLT":23614,"Ġsynagogue":23615,"Ġblackmail":23616,"INK":23617,"Ġfle":23618,"ĠGutierrez":23619,"Ġracket":23620,"Ġevenings":23621,"Ġdietary":23622,"ĠKok":23623,"Ġfaulty":23624,"Ġabandoning":23625,"ĠFlow":23626,"quest":23627,"estead":23628,"Ġbir":23629,"Ġsuicidal":23630,"ĠGift":23631,"ĠMissing":23632,"ĠMazda":23633,"ĠRib":23634,"ĠJourney":23635,"Ġconcede":23636,"Ġbrushed":23637,"Tw":23638,"andowski":23639,"ĠYun":23640,"Bride":23641,"zai":23642,"awatts":23643,"Ġcha":23644,"Ġspans":23645,"SF":23646,"Ġshells":23647,"planned":23648,"ĠGeographic":23649,"ĠVent":23650,"Ġfav":23651,"Ġinterrogation":23652,"Ġvaries":23653,"ĠPlat":23654,"operative":23655,"avid":23656,"Ġgreatness":23657,"ĠStrait":23658,"ĠSelling":23659,"Ġlawful":23660,"Ġlyn":23661,"Ġfunnel":23662,"Ġpundits":23663,"ties":23664,"Ġpneumonia":23665,"Ġcommencement":23666,"Ġbrisk":23667,"fires":23668,"ĠHTML":23669,"ĠSevent":23670,"Ġhistor":23671,"Ġ147":23672,"olls":23673,"Ġpian":23674,"Little":23675,"Ġcommercials":23676,"Ġdeteriorated":23677,"Ġbasin":23678,"Ġprohibition":23679,"Ġrestrictive":23680,"Ġtom":23681,"ĠPulse":23682,"vale":23683,"Ġmim":23684,"ĠLyons":23685,"ĠTrinidad":23686,"data":23687,"195":23688,"ĠPain":23689,"vor":23690,"ĠDirectorate":23691,"Wow":23692,"essential":23693,"Ġemerges":23694,"ĠDoors":23695,"Ġunde":23696,"Ġarchives":23697,"ĠIX":23698,"ĠAman":23699,"oric":23700,"ĠOper":23701,"nothing":23702,"Ġ142":23703,"igr":23704,"rust":23705,"ĠBYU":23706,"ĠBom":23707,"Ġrift":23708,"ĠAbs":23709,"ĠJenn":23710,"Ġrookies":23711,"hoe":23712,"Ġunderage":23713,"eden":23714,"Ġroasted":23715,"Ġenrol":23716,"Ġerased":23717,"Ġfreeway":23718,"Sil":23719,"Ġplanner":23720,"Ġconfess":23721,"ĠDual":23722,"ĠHeadquarters":23723,"bottom":23724,"Ġstatistic":23725,"ĠPush":23726,"Ġanim":23727,"ITT":23728,"Ġexecutions":23729,"Hub":23730,"ĠStick":23731,"Ġobscure":23732,"oven":23733,"Ġcoats":23734,"unc":23735,"Morning":23736,"Ġnit":23737,"mie":23738,"Ġcurves":23739,"gew":23740,"ĠAnniversary":23741,"members":23742,"ĠAbsolutely":23743,"Ġapt":23744,"otional":23745,"ĠGin":23746,"izo":23747,"Ġpretending":23748,"arak":23749,"Ġorganise":23750,"Ġroyalties":23751,"ĠCamden":23752,"Ġsausage":23753,"Inst":23754,"Ġchalk":23755,"ĠSurf":23756,"ĠSunrise":23757,"Ġmoder":23758,"aido":23759,"loving":23760,"lus":23761,"Ġoblig":23762,"Ġmotions":23763,"Ġclarification":23764,"ĠOM":23765,"Ġbishop":23766,"Ġexhibitions":23767,"ĠRifle":23768,"ĠPhot":23769,"ĠHM":23770,"ATIONAL":23771,"Ġwid":23772,"Ġreside":23773,"ĠPV":23774,"OOK":23775,"ĠTue":23776,"Ġ1200":23777,"Ġ1957":23778,"Ġespionage":23779,"ĠAPPLIC":23780,"Ġblasts":23781,"fter":23782,"Ġimmensely":23783,"ĠLots":23784,"Ġinflammatory":23785,"anging":23786,"Ġtumultuous":23787,"identified":23788,"Ġstead":23789,"ĠAch":23790,"Ãī":23791,"Ġbub":23792,"hler":23793,"olution":23794,"Ġshun":23795,"Ġnull":23796,"Ġunused":23797,"ĠObs":23798,"Ġinsol":23799,"ĠAttack":23800,"ertain":23801,"Ġdefiant":23802,"Through":23803,"ĠArmour":23804,"Ġsimulation":23805,"UCK":23806,"Ġinfluenza":23807,"Ġonset":23808,"Ġbored":23809,"Ġsouls":23810,"Ġreferees":23811,"Ġcollaborations":23812,"ĠLer":23813,"Ġcreepy":23814,"Ġanaly":23815,"ĠEffect":23816,"orting":23817,"Card":23818,"Ġdice":23819,"Ġharvesting":23820,"235":23821,"sty":23822,"ĠMcCartney":23823,"Ġsalute":23824,"UMP":23825,"Ġherb":23826,"ĠAbuse":23827,"ĠRamadan":23828,"Ġsuck":23829,"trained":23830,"ĠPhysical":23831,"iren":23832,"anches":23833,"erie":23834,"Ġhangs":23835,"Ġcataly":23836,"Ġintuitive":23837,"assi":23838,"Ġtechn":23839,"Ġjugg":23840,"Ġgameplay":23841,"Ġapolog":23842,"Ġfifteen":23843,"Ġgalleries":23844,"Ġoutlines":23845,"patient":23846,"ĠPotential":23847,"Ġethnicity":23848,"Ġharbour":23849,"Ġoverthrow":23850,"ĠLung":23851,"Ġwarehouses":23852,"ĠMonitoring":23853,"Ġmentors":23854,"Ġsized":23855,"Ġenvisioned":23856,"Ġgin":23857,"DT":23858,"Ġpropel":23859,"ĠKul":23860,"ference":23861,"estic":23862,"ĠLego":23863,"Ġdinners":23864,"ĠMoe":23865,"designed":23866,"ĠSusp":23867,"ĠBrick":23868,"qua":23869,"IDS":23870,"ĠBam":23871,"athe":23872,"Ġslices":23873,"Ġbottled":23874,"thy":23875,"producing":23876,"ĠTerror":23877,"professional":23878,"ĠKis":23879,"erto":23880,"ĠVehicles":23881,"Ġbeforehand":23882,"Ġdetrimental":23883,"weights":23884,"Ġallowances":23885,"Williams":23886,"ĠSyrians":23887,"ĠSto":23888,"Ġcozy":23889,"reditation":23890,"ensen":23891,"ĠSard":23892,"Ġroy":23893,"ooting":23894,"ĠReserv":23895,"ominated":23896,"emate":23897,"ĠTot":23898,"ĠCarnegie":23899,"ĠThib":23900,"ĠMarshal":23901,"Ġ152":23902,"Ġmayors":23903,"inery":23904,"ĠFiona":23905,"ĠCadillac":23906,"ivated":23907,"Ġeagerly":23908,"ĠOffensive":23909,"Ġastronaut":23910,"ĠVital":23911,"Ġcane":23912,"Ġquitting":23913,"ĠLone":23914,"Ġcensorship":23915,"ĠWelch":23916,"ĠUd":23917,"Ġmarquee":23918,"ĠDip":23919,"Ġwhereby":23920,"Ġtiger":23921,"gem":23922,"Ġconserv":23923,"Ġpresumed":23924,"ĠEntry":23925,"ffer":23926,"ĠProceed":23927,"Ġbrawl":23928,"ĠJaime":23929,"Ġecho":23930,"Ġadvancements":23931,"Ġtransitional":23932,"erick":23933,"Ġbully":23934,"anan":23935,"Ġreinvent":23936,"ĠLetters":23937,"Ġbricks":23938,"ĠSmy":23939,"Ġtowering":23940,"gging":23941,"299":23942,"orian":23943,"dimensional":23944,"ĠForty":23945,"ĠSinn":23946,"ushi":23947,"ĠSurveillance":23948,"enabled":23949,"ĠMous":23950,"ĠVive":23951,"Marcus":23952,"Ġvom":23953,"Ġcreek":23954,"Ġlime":23955,"Ġseismic":23956,"ĠFork":23957,"Ġembroiled":23958,"marks":23959,"Ġherald":23960,"ĠSonia":23961,"â̦\"":23962,"wired":23963,"Ġobliged":23964,"ĠProjects":23965,"lde":23966,"ĠRiders":23967,"Ġovercoming":23968,"Mail":23969,"ĠLawn":23970,"ĠHawk":23971,"figure":23972,"ĠWritten":23973,"Ġens":23974,"Ġspacious":23975,"target":23976,"ĠRecep":23977,"ĠSAM":23978,"Ġentertained":23979,"Ġignited":23980,"ĠCENT":23981,"ogenic":23982,"Ġunatt":23983,"Ġexceeds":23984,"Ġ--------------------------------":23985,"Ġpillars":23986,"ĠBorders":23987,"ickey":23988,"Ġextinction":23989,"Ġviability":23990,"Ġtumors":23991,"ĠWilkinson":23992,"ĠKEY":23993,"Ġbins":23994,"ĠReported":23995,"Sm":23996,"ĠExclusive":23997,"ĠChilean":23998,"info":23999,"Ġwilderness":24000,"did":24001,"absolutely":24002,"pillar":24003,"Ġelites":24004,"ĠPreview":24005,"ixie":24006,"Mont":24007,"ribut":24008,"dream":24009,"Ġplanners":24010,"ĠSomerset":24011,"Ġenvis":24012,"ĠStall":24013,"Ġelevate":24014,"ographies":24015,"rama":24016,"Ha":24017,"Ġamidst":24018,"oho":24019,"Ġrejects":24020,"Jim":24021,"Ġmarginally":24022,"Ġusher":24023,"arez":24024,"ĠHawth":24025,"Ġsprink":24026,"ĠOffer":24027,"Ġanchored":24028,"ucking":24029,"ĠGarn":24030,"ĠConserv":24031,"Ġsocietal":24032,"Ġbrowsing":24033,"Ġbidder":24034,"burgh":24035,"ĠRunner":24036,"Ġtrendy":24037,"verts":24038,"imposed":24039,"ĠPatton":24040,"lements":24041,"Ġspicy":24042,"Ġswe":24043,"ĠStrike":24044,"Ġclam":24045,"ĠYankee":24046,"ĠKT":24047,"ĠGreenwood":24048,"ĠWays":24049,"Ġ2050":24050,"Ġattach":24051,"ĠShim":24052,"Ġmeltdown":24053,"Ġassemble":24054,"ĠUPDATE":24055,"Ġscout":24056,"Brown":24057,"ĠKobe":24058,"Ġpostpone":24059,"liness":24060,"allo":24061,"rief":24062,"ĠGerm":24063,"ĠFD":24064,"ĠReggie":24065,"ĠUnivers":24066,"ĠShepard":24067,"Ġcancell":24068,"ĠRomeo":24069,"ĠWarrior":24070,"ench":24071,"ifier":24072,"Ġprivileges":24073,"Ġsenses":24074,"Ġimpoverished":24075,"ĠPostal":24076,"encer":24077,"ĠConrad":24078,"Ġprinter":24079,"Ġinflicted":24080,"ĠGamble":24081,"ĠHeroes":24082,"132":24083,"Ġrevisions":24084,"Ġunsuccessfully":24085,"ĠHeisman":24086,"Ġstamped":24087,"inding":24088,"ĠLuna":24089,"Ġreinvest":24090,"ducers":24091,"ĠPassword":24092,"Leod":24093,"Ġcompounded":24094,"',\"":24095,"ogging":24096,"Ġprobing":24097,"ĠPBS":24098,"ĠMU":24099,"ĠWhenever":24100,"Ġsped":24101,"ĠCompetitive":24102,"isans":24103,"opa":24104,"Ġcleric":24105,"Ġvivid":24106,"à¸":24107,"126":24108,"Ġinconvenience":24109,"udi":24110,"Ġimmersive":24111,"Ġdiversion":24112,"Ġlogs":24113,"Ġspying":24114,"inct":24115,"Ġlitres":24116,"Ġmetallic":24117,"identally":24118,"FX":24119,"Ġloudly":24120,"Ġnursery":24121,"Ġcollectors":24122,"ĠKart":24123,"Ġescalate":24124,"Ġringing":24125,"Ġprocedural":24126,"Ġdisrupting":24127,"ĠEthiopian":24128,"ĠCFL":24129,"Ġillustrates":24130,"Ġperks":24131,"official":24132,"325":24133,"Ġmillennial":24134,"Ġbreadth":24135,"Ġmelted":24136,"Ġ850":24137,"ĠBake":24138,"donald":24139,"ĠGrac":24140,"Ġseeded":24141,"ĠDiscount":24142,"idates":24143,"Ġdrift":24144,"Ġcaptive":24145,"Ġseriousness":24146,"Ġrepercussions":24147,"Ġdisciplines":24148,"Ġthesis":24149,"Ġsleeve":24150,"ses":24151,"Monday":24152,"Ġthwart":24153,"ĠLic":24154,"Ġquadru":24155,"ĠPresbyterian":24156,"Ġreactors":24157,"ĠSuzanne":24158,"ewater":24159,"Ġlam":24160,"Ġbreastfeeding":24161,"Ġrats":24162,"ĠArtists":24163,"Ġdomestically":24164,"Ġdecom":24165,"ĠArms":24166,"basketball":24167,"Ġscrub":24168,"ĠTeddy":24169,"beh":24170,"ĠBetsy":24171,"ĠNursing":24172,"Ġdescriptions":24173,"127":24174,"gil":24175,"itional":24176,"Ġchampioned":24177,"ĠCalling":24178,"Ġrealization":24179,"ĠBuddy":24180,"hou":24181,"ĠDire":24182,"ĠHuff":24183,"Ġlipstick":24184,"Ray":24185,"Ġflare":24186,"belt":24187,"Ġbrightest":24188,"Ġmalfunction":24189,"ĠManor":24190,"Ġsaturated":24191,"rays":24192,"ĠDW":24193,"ixed":24194,"ĠSlovenia":24195,"seen":24196,"ĠCause":24197,"arios":24198,"ASE":24199,"Ġrend":24200,"ĠTBA":24201,"Ġlecturer":24202,"attering":24203,"Ġaffluent":24204,"CEO":24205,"Ġbreathtaking":24206,"ĠGiles":24207,"irth":24208,"ĠPhilips":24209,"Ġposture":24210,"ĠTSA":24211,"heit":24212,"Ġmenace":24213,"ricks":24214,"ĠAden":24215,"ĠReich":24216,"iggle":24217,"ĠShutterstock":24218,"Ġcourageous":24219,"edia":24220,"Staff":24221,"Ġdivert":24222,"ĠCir":24223,"Ġguessing":24224,"apers":24225,"ĠBritons":24226,"lé":24227,"Ġconvened":24228,"ĠSerbian":24229,"Ġricher":24230,"Ġcock":24231,"Ġdeposited":24232,"company":24233,"Ġdelic":24234,"sensitive":24235,"tank":24236,"ĠPatty":24237,"mia":24238,"onomous":24239,"cn":24240,"Ġclamp":24241,"ĠAcademic":24242,"Ġprosecuting":24243,"ĠTransparency":24244,"Ġdeflation":24245,"Ġdashboard":24246,"ĠDress":24247,"Ġlin":24248,"mu":24249,"ĠGoodell":24250,"Ġlav":24251,"ĠTwelve":24252,"Ġflavour":24253,"Ġfiercely":24254,"Ġbloom":24255,"ĠHaf":24256,"ĠGrad":24257,"LET":24258,"ĠSeeing":24259,"oxide":24260,"Ġmenus":24261,"char":24262,"adoes":24263,"combe":24264,"Street":24265,"ĠRidley":24266,"Ġdepicts":24267,"ĠPred":24268,"ÑĢ":24269,"British":24270,"Ġbumps":24271,"Ġlamp":24272,"ĠDesmond":24273,"ĠPB":24274,"Ġfrag":24275,"tin":24276,"ĠSharing":24277,"Ġdesperation":24278,"Ġcommuter":24279,"igrants":24280,"ĠShapiro":24281,"Ġkinda":24282,"Ġimpartial":24283,"ĠJewel":24284,"Ġcongratulations":24285,"Ġcompost":24286,"Ġadmiration":24287,"Ġpaycheck":24288,"ĠAnonymous":24289,"enger":24290,"Mer":24291,"ĠGospel":24292,"ĠEth":24293,"ĠMH":24294,"Ġfem":24295,"ĠTrial":24296,"Ġdepths":24297,"ĠApplied":24298,"Ġgrit":24299,"Ġerase":24300,"sid":24301,"comm":24302,"}":24303,"Ġretreated":24304,"Ġanalysed":24305,"ĠRegular":24306,"ĠPesh":24307,"ICAL":24308,"pei":24309,"ĠReilly":24310,"ĠTrib":24311,"Ġbooths":24312,"Ġdrank":24313,"Ġcoma":24314,"Ġharvested":24315,"ĠCHAR":24316,"Ġbutterfly":24317,"Ġsailed":24318,"ĠDrink":24319,"eping":24320,"ATCH":24321,"ĠLegends":24322,"Ġinsured":24323,"Ġwholes":24324,"ĠBis":24325,"ĠShea":24326,"ighter":24327,"Ġsnakes":24328,"ĠGunn":24329,"ĠPoss":24330,"Ġdispar":24331,"Ġbombshell":24332,"Ġscanning":24333,"340":24334,"choice":24335,"cool":24336,"\"âĢĶ":24337,"ĠTheo":24338,"rine":24339,"ĠJacques":24340,"Ġdisadvantaged":24341,"Ġparamount":24342,"igate":24343,"stat":24344,"anski":24345,"Ġoutsourcing":24346,"Ġpopulous":24347,"Ġbinge":24348,"ĠOrganic":24349,"urban":24350,"Ġyogurt":24351,"Ġretweet":24352,"osen":24353,"cially":24354,"215":24355,"Ġeditions":24356,"Ġburgeoning":24357,"efully":24358,"ĠThousand":24359,"Ġreplacements":24360,"ĠAmazing":24361,"rator":24362,"icy":24363,"Ġintensify":24364,"Sen":24365,"ĠQuincy":24366,"powers":24367,"ĠAur":24368,"ĠZion":24369,"stal":24370,"Ġpillar":24371,"ĠErit":24372,"ĠPerform":24373,"aston":24374,"Eric":24375,"Ġunh":24376,"IFF":24377,"950":24378,"ĠEngineer":24379,"ĠLands":24380,"Ġdubious":24381,"fy":24382,"ĠWI":24383,"ĠSv":24384,"ĠHendricks":24385,"ĠKod":24386,"Ġoutlining":24387,"ĠCorrespond":24388,"amus":24389,"worst":24390,"arter":24391,"coni":24392,"Ġhierarchy":24393,"ĠTHAT":24394,"Ġexce":24395,"Ġrailways":24396,"Ġmasked":24397,"lene":24398,"Ġoutset":24399,"Ġavalanche":24400,"Ġnicknamed":24401,"Ġ702":24402,"Lee":24403,"Ġ139":24404,"ĠSixth":24405,"365":24406,"nda":24407,"Ġaccountant":24408,"Ġobese":24409,"Ġgrape":24410,"Ġimpunity":24411,"ĠYorkers":24412,"Ġguardian":24413,"icity":24414,"Ġcentrist":24415,"Ġwaterways":24416,"ursed":24417,"Ġhopeless":24418,"header":24419,"Ġtack":24420,"Ġric":24421,"umn":24422,"Ġvalve":24423,"Ġtread":24424,"ĠCST":24425,"Ġhepatitis":24426,"ctor":24427,"ĠRED":24428,"Ġsolitary":24429,"NW":24430,"Ġceremonial":24431,"Ġfoe":24432,"Ġling":24433,"Jason":24434,"ĠLisbon":24435,"Ġ1955":24436,"ĠHeller":24437,"Ġkin":24438,"essen":24439,"Ġturbines":24440,"shi":24441,"Ġlodge":24442,"Ġveterinary":24443,"ĠBoll":24444,"ĠConfederation":24445,"ĠJournalists":24446,"Ġtug":24447,"ĠStarr":24448,"Ġpiles":24449,"Way":24450,"adel":24451,"orean":24452,"Ġoft":24453,"Ġshortcomings":24454,"ĠSheila":24455,"Ġbackbone":24456,"III":24457,"ĠDarwin":24458,"ĠTunis":24459,"Ġsuspicions":24460,"Ġdisagreements":24461,"Ġ247":24462,"illery":24463,"'\"":24464,"Ġsegregation":24465,"ohl":24466,"Ġinstincts":24467,"ĠPoo":24468,"nih":24469,"parency":24470,"uddy":24471,"esting":24472,"asses":24473,"ĠIntroduction":24474,"ĠSirius":24475,"Local":24476,"orous":24477,"Ġrehearsal":24478,"Ġdemol":24479,"Ġtraffickers":24480,"Ġupsetting":24481,"Ġheir":24482,"death":24483,"ĠMoments":24484,"Los":24485,"Ġatmospheric":24486,"aints":24487,"ĠDianne":24488,"Ġlikewise":24489,"ĠMing":24490,"auga":24491,"Ġfirsthand":24492,"Ġnarratives":24493,"ĠAstron":24494,"ĠExtreme":24495,"Ġhorns":24496,"ĠSana":24497,"Ġrecapt":24498,"ĠMist":24499,"ĠRandolph":24500,"connect":24501,"Ġindecent":24502,"Ġforty":24503,"Ġjihadists":24504,"azes":24505,"Ġdread":24506,"Ġgrapes":24507,"Ġremoves":24508,"Ġscreamed":24509,"ĠCrus":24510,"ikers":24511,"Ġsnapshot":24512,"ĠCalls":24513,"Cons":24514,"Ġlettuce":24515,"ĠPig":24516,"urable":24517,"jured":24518,"ILY":24519,"ĠJessie":24520,".).":24521,"Pay":24522,"Tra":24523,"----------------":24524,"ĠUnits":24525,"ĠPlayboy":24526,"Ġarthritis":24527,"Ġafforded":24528,"insk":24529,"ĠFake":24530,"ĠLies":24531,"ĠBaltic":24532,"oyal":24533,"ĠVest":24534,"Ġrusher":24535,"Ġincorporates":24536,"ĠMM":24537,"ĠDru":24538,"ĠWare":24539,"ĠSammy":24540,"ĠGob":24541,"ĠRuk":24542,"Ġ146":24543,"ĠCrowd":24544,"Ġduel":24545,"irts":24546,"Ġsourcing":24547,"hp":24548,"ĠJava":24549,"bred":24550,"ĠRefer":24551,"Ġuninsured":24552,"Ġslope":24553,"256":24554,"Ġregulating":24555,"Ġfundra":24556,"Ġinserted":24557,"ĠNickel":24558,"ĠConsumption":24559,"ĠRomo":24560,"Atlantic":24561,"Ġenclave":24562,"Ġpegged":24563,"Ġdirects":24564,"mbudsman":24565,"ĠDES":24566,"Ob":24567,"Ġlimbs":24568,"Ġbury":24569,"ILA":24570,"Ġstew":24571,"Ġbreeze":24572,"Ġabrupt":24573,"ĠGott":24574,"ĠClaude":24575,"Ġgenetically":24576,"Ġrigid":24577,"ĠDudley":24578,"ĠNer":24579,"registered":24580,"Ġentrenched":24581,"Ġextortion":24582,"ĠNurs":24583,"Ġcontingency":24584,"etter":24585,"Ġrejo":24586,"Ġprotagonist":24587,"Ġcounselling":24588,"ĠVit":24589,"aware":24590,"ĠMonsanto":24591,"GG":24592,"Ġincarcerated":24593,"Ġabduction":24594,"Ġreferencing":24595,"Germany":24596,"uates":24597,"reck":24598,"Ġtram":24599,"Ġchron":24600,"Ġmish":24601,"ĠVes":24602,"ĠTire":24603,"Ġvandal":24604,"ĠCrazy":24605,"ĠLifetime":24606,"ĠSpectrum":24607,"celer":24608,"Ġmotto":24609,"hang":24610,"Ġblade":24611,"gel":24612,"Ġbiography":24613,"Ġallegiance":24614,"hod":24615,"hap":24616,"ptic":24617,"acle":24618,"ĠBlade":24619,"ĠBoh":24620,"Ġ149":24621,"Ġchang":24622,"Ġcanned":24623,"Ġfacilitated":24624,"actor":24625,"iologist":24626,"Ġrebuilt":24627,"Ġawake":24628,"Ġmayoral":24629,"ĠEuros":24630,"Ġdangerously":24631,"MK":24632,"Ġreplica":24633,"Ġcoinc":24634,"blog":24635,"ĠEra":24636,"Ġrelinqu":24637,"quite":24638,"ondon":24639,"rosso":24640,"tun":24641,"Ġtouchscreen":24642,"Ġpops":24643,"ousing":24644,"efficient":24645,"Ġ148":24646,"Ġconced":24647,"although":24648,"Ġ1956":24649,"Ġmortar":24650,"ĠCave":24651,"ĠJung":24652,"urer":24653,"Ġillusion":24654,"ĠBerman":24655,"intend":24656,"Ġcoping":24657,"Dem":24658,"tion":24659,"estation":24660,"ĠSounds":24661,"Ġnavigating":24662,"Ġsperm":24663,"Ġreligions":24664,"Ġfol":24665,"Ġheroic":24666,"FD":24667,"Ġhesitant":24668,"asure":24669,"Ġredeem":24670,"Adam":24671,"Ġfireplace":24672,"vertis":24673,"ĠSung":24674,"290":24675,"iland":24676,"ĠUpdates":24677,"OTUS":24678,"ĠPTSD":24679,"Ġhelmets":24680,"\"?":24681,"Ġslashing":24682,"Ġscouts":24683,"Ġspelling":24684,"ĠInitial":24685,"draw":24686,"Ġchallengers":24687,"Ġsupremacists":24688,"Ġpilgrims":24689,"Ġasc":24690,"ĠFill":24691,"ĠPau":24692,"Ġjewel":24693,"ĠMalt":24694,"icip":24695,"Ġinhabitants":24696,"Ġmetre":24697,"ahar":24698,"Comp":24699,"atches":24700,"inv":24701,"Ġcyclist":24702,"ĠQC":24703,"Ġmanually":24704,"ĠAnchorage":24705,"Ġdiscarded":24706,"Ġconsolid":24707,"Ġnavig":24708,"ĠAnimals":24709,"ĠPole":24710,"esson":24711,"Ġ1954":24712,"Ġsorted":24713,"Ġmadness":24714,"ĠBrigade":24715,"ĠGenesis":24716,"Ġdismissing":24717,"ĠPanasonic":24718,"Ġdizz":24719,"ĠEducational":24720,"ĠKO":24721,"ĠPill":24722,"ĠGIF":24723,"Ġbol":24724,"Ġwards":24725,"Ġcontroversies":24726,"Chinese":24727,"Ġantics":24728,"Ġreliant":24729,"ĠMoff":24730,"Ġethanol":24731,"Ġtorch":24732,"rights":24733,"ĠHabit":24734,"arton":24735,"rera":24736,"ĠSasha":24737,"abella":24738,"Ġproliferation":24739,"Ġsincerely":24740,"communication":24741,"ĠNay":24742,"ĠChattanooga":24743,"ounces":24744,"ĠNXT":24745,"ĠEmir":24746,"Ġmanipulated":24747,"Ġharassing":24748,"wat":24749,"Ġbouts":24750,"Book":24751,"Ġhovering":24752,"ĠScan":24753,"ship":24754,"ĠAngola":24755,"ĠLC":24756,"Ġruins":24757,"Ġsexist":24758,"zar":24759,"Ġpledging":24760,"ober":24761,"Ġembold":24762,"Ġobjection":24763,"Ġboasting":24764,"MIN":24765,"Ġherbs":24766,"Ġgears":24767,"ĠIc":24768,"stre":24769,"him":24770,"Ġhomicides":24771,"cki":24772,"castle":24773,"counter":24774,"ĠCAS":24775,"ĠReasons":24776,"ĠDeclaration":24777,"Ġsimplify":24778,"Ġfared":24779,"Ġescort":24780,"Ġkidn":24781,"ĠHamm":24782,"Ġnailed":24783,"Ġaccommodations":24784,"Ġmodifications":24785,"rible":24786,"Ġwool":24787,"EDIT":24788,"2010":24789,"Ġauthentication":24790,"Ġgoat":24791,"hom":24792,"Ġfederally":24793,"ĠRath":24794,"Ġspiked":24795,"Ġmisrepresent":24796,"Ġavenue":24797,"Ġbroadcasts":24798,"ĠEstonia":24799,"ennes":24800,"ĠMare":24801,"ption":24802,"ĠKag":24803,"Ġcircumstance":24804,"orrow":24805,"isons":24806,"ĠCollabor":24807,"Ġstroll":24808,"ĠCPS":24809,"soft":24810,"iral":24811,"apo":24812,"usky":24813,"poke":24814,"Ġwoo":24815,"ĠElena":24816,"ĠLastly":24817,"Ġlinemen":24818,"Canadian":24819,"ĠAnyway":24820,"Ġsubstantive":24821,"ĠCurt":24822,"Ġard":24823,"ĠYosh":24824,"ĠBuchanan":24825,"Ġrevolving":24826,"Ġspecials":24827,"Ġshrine":24828,"Ġlumber":24829,"Ġorchestrated":24830,"kie":24831,"azy":24832,"Ġexpiration":24833,"ĠDaryl":24834,"ĠPatri":24835,"better":24836,"2020":24837,"ĠFav":24838,"ĠOP":24839,"OTT":24840,"Ġflush":24841,"ĠSikh":24842,"Ġecosystems":24843,"ĠBET":24844,"eared":24845,"audio":24846,"ĠFahrenheit":24847,"police":24848,"Ġincarceration":24849,"Ġerupt":24850,"ĠDamien":24851,"ĠHague":24852,"ulz":24853,"ĠAgents":24854,"ĠBanner":24855,"Ġconductor":24856,"ĠAjax":24857,"arson":24858,"Ġrests":24859,"Ġeurozone":24860,"Ġfelon":24861,"Ġcurator":24862,"morning":24863,"Ġevidenced":24864,"ĠNeh":24865,"Ġmattress":24866,"Ġtast":24867,"Ġfueling":24868,"ĠOccup":24869,"Ġbake":24870,"ĠZac":24871,"meaning":24872,"Ill":24873,"ĠHau":24874,"ĠLaden":24875,"Ġbald":24876,"Mary":24877,"oky":24878,"atri":24879,"Ġtracker":24880,"OTA":24881,"catching":24882,"ĠUnderground":24883,"ĠHuffPost":24884,"ĠAtkins":24885,"oglu":24886,"Ġauthorised":24887,"Ġroutines":24888,"ĠHof":24889,"veland":24890,"Ġlangu":24891,"Ġprot":24892,"ĠHyd":24893,"integ":24894,"Ġbravery":24895,"Ġviolin":24896,"Ġdelightful":24897,"Ġticks":24898,"iton":24899,"Ġreap":24900,"Ġoversized":24901,"ĠPitch":24902,"Ġprized":24903,"Ġfusion":24904,"fact":24905,"acting":24906,"Ġfullback":24907,"Ġpolite":24908,"Ġswear":24909,"Ġconfiscated":24910,"ĠStud":24911,"Ġfielded":24912,"rito":24913,"covered":24914,"financial":24915,"bill":24916,"HK":24917,"OTOS":24918,"loaded":24919,"Ġmarble":24920,"ĠDiplom":24921,".âĢĶ":24922,"Ġeats":24923,"Ġbackfield":24924,"Ġtimeframe":24925,"Ġvegetarian":24926,"Ġswaps":24927,"ĠMines":24928,"igor":24929,"ĠLenn":24930,"ĠDP":24931,"ordered":24932,"ĠShark":24933,"Ġquant":24934,"erence":24935,"Ġashes":24936,"ĠBuckley":24937,"ophobia":24938,"Ġwarranted":24939,"Rose":24940,"Ġunreasonable":24941,"ĠJav":24942,"Ġpalette":24943,"Ġjoints":24944,"Ġadvent":24945,"Ġnoteworthy":24946,"ĠNicol":24947,"ĠChristensen":24948,"Ġplummeted":24949,"ayers":24950,"Ġdefends":24951,"Ġcontended":24952,"ĠCongratulations":24953,"kish":24954,"ĠHannity":24955,"Ġgroundwater":24956,"ĠKramer":24957,"Ġerect":24958,"Ġappet":24959,"ĠKardash":24960,"Ġexacerbated":24961,"Ġexplanations":24962,"vious":24963,"eport":24964,"---":24965,"icism":24966,"ĠNatasha":24967,"ĠGeoffrey":24968,"estro":24969,"Article":24970,"Ġincidence":24971,"Ġprovoked":24972,"elf":24973,"Ġinsistence":24974,"ĠOUR":24975,"Ġfertilizer":24976,"Ġstickers":24977,"ĠGators":24978,"ĠLanding":24979,"ĠDON":24980,"sta":24981,"ĠRobbins":24982,"Ġpixels":24983,"ĠHoy":24984,"imated":24985,"ĠÃī":24986,"â":24987,"Ġsimpl":24988,"Other":24989,"245":24990,"Ġforcibly":24991,"'.\"":24992,"Ġsmashing":24993,"Ġmosquitoes":24994,"Ġpaints":24995,"Ġdebating":24996,"enty":24997,"ĠIB":24998,"leaf":24999,"ĠDah":25000,"Ġreferral":25001,"pired":25002,"Ġbrunch":25003,"gie":25004,"Ġvict":25005,"ribute":25006,"Ġbloggers":25007,"Ġgum":25008,"ĠAdmiral":25009,"France":25010,"ĠPK":25011,"ĠSaturn":25012,"Ġinflated":25013,"WAR":25014,"Ġscenic":25015,"usal":25016,"their":25017,"Ġcontends":25018,"Ġpathways":25019,"inis":25020,"Ġawarding":25021,"Ġmisled":25022,"Ġeternal":25023,"Ġexaminations":25024,"Ġpoker":25025,"Ġsafest":25026,"Ġchildcare":25027,"aday":25028,"Ġpreceding":25029,"ĠCollective":25030,"Ġrespectable":25031,"ographical":25032,"Ġoak":25033,"00000":25034,"ĠCorridor":25035,"oran":25036,"133":25037,"Ġmushrooms":25038,"gaard":25039,"ĠOmega":25040,"ĠNaturally":25041,"anim":25042,"Ġcaptains":25043,"Ġtang":25044,"Ġlobbyists":25045,"ĠSug":25046,"Ġsucc":25047,"249":25048,"ENG":25049,"134":25050,"Ġsolic":25051,"ĠAdded":25052,"ĠSuicide":25053,"ĠFULL":25054,"ĠStrauss":25055,"ĠDiesel":25056,"Ġtempting":25057,"acist":25058,"ĠDelivery":25059,"Ġquiz":25060,"ĠPARK":25061,"Ġcollisions":25062,"Ġrestrained":25063,"purpose":25064,"ĠChanges":25065,"Ġabsentee":25066,"Ġprobes":25067,"hib":25068,"Ġcul":25069,"Ġpetty":25070,"Ġnecess":25071,"Ġcues":25072,"OME":25073,"Ġinadvertently":25074,"urity":25075,"ĠStuff":25076,"FG":25077,"Ġwrestlers":25078,"Ġpaste":25079,"ĠRoku":25080,"Ġcardboard":25081,"aires":25082,"Ġvariables":25083,"ĠSaras":25084,"ĠFif":25085,"Ġinvests":25086,"ĠDiscover":25087,"ĠFix":25088,"Thomas":25089,"ĠLunch":25090,"lv":25091,"camera":25092,"Step":25093,"Ġresumes":25094,"ĠSacred":25095,"ĠShooting":25096,"Ġnoble":25097,"Ġslopes":25098,"Ġont":25099,"Ġtwists":25100,"Very":25101,"Ġbigotry":25102,"ĠTib":25103,"Ġmos":25104,"Ġwarrior":25105,"Ġbroadcasters":25106,"Ġubiquitous":25107,"ameda":25108,"Ġchess":25109,"Special":25110,"Ġconver":25111,"Ġdeleg":25112,"endant":25113,"Ġfoil":25114,"Ġlush":25115,"Ġtaxed":25116,"Mag":25117,"ahs":25118,"Ġtablespoons":25119,"scription":25120,"clamation":25121,"ĠCertain":25122,"ĠDiversity":25123,"Ġhairst":25124,"ĠBrewery":25125,"Ġshedding":25126,"Cla":25127,"Ġpenis":25128,"ĠMurder":25129,"Park":25130,"uner":25131,"iments":25132,"ĠOVER":25133,"hus":25134,"Ġtabloid":25135,"Chart":25136,"Ġvouchers":25137,"ĠCoord":25138,"Ġmethane":25139,"ĠFisheries":25140,"ĠKham":25141,"includes":25142,"ĠSuperman":25143,"ensed":25144,"isure":25145,"Amazon":25146,"Ġvacated":25147,"heet":25148,"Ġroast":25149,"Ġlegalize":25150,"ĠTut":25151,"Ġsignage":25152,"init":25153,"Ġthefts":25154,"202":25155,"Ġstatic":25156,"Ġchants":25157,"Bob":25158,"Ġdiscretionary":25159,"Ġendurance":25160,"Ġcollegiate":25161,"Ġcorridors":25162,"Ġslack":25163,"ĠLash":25164,"Az":25165,"Series":25166,"Ġnonpartisan":25167,"ĠMcGill":25168,"Ġuneven":25169,"ulsive":25170,"eu":25171,"Ġpil":25172,"Ġfisheries":25173,"Ġonslaught":25174,"fiction":25175,"holding":25176,"Ġcheated":25177,"Ġtraumat":25178,"lasting":25179,"Ġmultitude":25180,"ĠThr":25181,"ĠBreast":25182,"Ġ1600":25183,"ĠMatth":25184,"Ġdiminish":25185,"ĠFTC":25186,"Ġgram":25187,"ĠResident":25188,"Ġfading":25189,"Ġmarginalized":25190,"ĠLite":25191,"ĠCarlton":25192,"Ġerad":25193,"Welcome":25194,"ĠFaw":25195,"iddy":25196,"Ġparticip":25197,"Ġcz":25198,"Ġtexted":25199,"Ġsuites":25200,"ĠForever":25201,"Ġrendition":25202,"rait":25203,"ĠPrague":25204,"Ġsponsoring":25205,"Ġcompos":25206,"ĠBeacon":25207,"144":25208,"Ġpupil":25209,"Ġintricate":25210,"Ġathleticism":25211,"Ġoptimization":25212,"Ġloot":25213,"polit":25214,"ĠOtt":25215,"Whatever":25216,"uno":25217,"ĠConstable":25218,"esville":25219,"Ġlookout":25220,"ĠAircraft":25221,"Ġspo":25222,"Ġcorrobor":25223,"Ġhiatus":25224,"ĠKnowing":25225,"ĠHamp":25226,"Ġspe":25227,"Ġstoring":25228,"Ġshakes":25229,"uran":25230,"Ġsickness":25231,"Ġliber":25232,"ĠAdministrative":25233,"Ġpleasing":25234,"ĠEqual":25235,"ĠConversation":25236,"Ġalgae":25237,"Ġlobbyist":25238,"ĠHelena":25239,"ptions":25240,"Ġfaire":25241,"ĠGone":25242,"ĠWiggins":25243,"Robert":25244,"Ġlistens":25245,"ĠDaisy":25246,"Ġsticky":25247,"sale":25248,"ĠMarijuana":25249,"ĠSSD":25250,"ĠTool":25251,"once":25252,"ĠHarmon":25253,"mobile":25254,"Ġdetain":25255,"Money":25256,"Ġflawless":25257,"forced":25258,"Ġguru":25259,"Ġairspace":25260,"ĠArchie":25261,"ĠGender":25262,"ĠMeat":25263,"abilities":25264,"ĠBD":25265,"Open":25266,"Ġoutsider":25267,"issue":25268,"Ġlearns":25269,"natural":25270,"Ġvinegar":25271,"ĠSUB":25272,"ĠRecon":25273,"blers":25274,"Ġsniff":25275,"Ġsuppression":25276,"Ġsaf":25277,"urger":25278,"Ġbunker":25279,"asaki":25280,"ĠSpartan":25281,"ĠTok":25282,"Ġrav":25283,"Ġfoc":25284,"Sean":25285,"etric":25286,"Ġballpark":25287,"ĠHerb":25288,"ĠBM":25289,"ĠPublishing":25290,"Ġroadmap":25291,"pered":25292,"Ġpredator":25293,"ĠBlockchain":25294,"Ġvalidity":25295,"ĠGlou":25296,"ĠYamaha":25297,"Ġadop":25298,"Ġswamp":25299,"Ġcomplied":25300,"Ky":25301,"Greg":25302,"casts":25303,"john":25304,"ĠBosnia":25305,"Ġcinematic":25306,"ĠTavern":25307,"Ġfrustrations":25308,"eryl":25309,"Ġfairy":25310,"UNCH":25311,"ĠTus":25312,"Corp":25313,"ĠNug":25314,"closed":25315,"Ġexercised":25316,"urden":25317,"Ġdigitally":25318,"137":25319,"ĠVictims":25320,"Ġreluctance":25321,"ELL":25322,"ĠTribe":25323,"chall":25324,"Ġwhiskey":25325,"ogl":25326,"Ġmater":25327,"ĠBac":25328,"Ġapartheid":25329,"ĠMBA":25330,"mot":25331,"ĠIre":25332,"®,":25333,"ĠChic":25334,"Ġtimed":25335,"ĠDome":25336,"efer":25337,"Ġobserver":25338,"unky":25339,"ĠKant":25340,"Ġundrafted":25341,"Ġsimplicity":25342,"onds":25343,"Ġstoked":25344,"Ġ1949":25345,"Ġransomware":25346,"ĠPow":25347,"ĠAngelo":25348,"ĠAmbrose":25349,"adjusted":25350,"Guard":25351,"138":25352,"ĠKaplan":25353,"stri":25354,"Ġcries":25355,"NF":25356,"atro":25357,"Ġavocado":25358,"illian":25359,"Ġsculptures":25360,"Ġelevation":25361,"Ġinspires":25362,"Ġgenerals":25363,"arb":25364,"chell":25365,"ĠJournalism":25366,"ĠHybrid":25367,"ĠCaller":25368,"vec":25369,"Lu":25370,"Ġresemble":25371,"bys":25372,"erving":25373,"antz":25374,"Ġwiden":25375,"vised":25376,"Ev":25377,"Ġdiagn":25378,"ĠMakes":25379,"Ġcer":25380,"ĠPats":25381,"single":25382,"sche":25383,"struct":25384,"Ġdissolved":25385,"Ġtimeout":25386,"Ġenhancement":25387,"CF":25388,"Ġindust":25389,"ĠDed":25390,"ĠZo":25391,"CB":25392,"Ġpesticides":25393,"ĠRubin":25394,"George":25395,"opal":25396,"Ġmotel":25397,"critical":25398,"Ġcollapsing":25399,"ĠShal":25400,"tex":25401,"Ġcomplementary":25402,"Ġoust":25403,"ĠFlu":25404,"Ġexporting":25405,"Ġdifferential":25406,"north":25407,"ĠFG":25408,"Ġspoon":25409,"sha":25410,"Ġdismantle":25411,"elta":25412,"Ġjar":25413,"space":25414,"Smart":25415,"mere":25416,"Ð":25417,"ĠGillespie":25418,"Lo":25419,"ĠMead":25420,"capacity":25421,"ĠIssue":25422,"050":25423,"ĠVall":25424,"Ġdisgr":25425,"Ġmeme":25426,"Ġpard":25427,"Ġcompensated":25428,"ĠKet":25429,"major":25430,"ĠBren":25431,"Ġheed":25432,"131":25433,"Ġcm":25434,"Ġdazzling":25435,"ĠCheese":25436,"Ġmonumental":25437,"Ġyielding":25438,"Read":25439,"Ġgrinding":25440,"Ang":25441,"Ġdefiance":25442,"Ġintimidated":25443,"Ġ310":25444,"Ġoutsiders":25445,"houn":25446,"Ma":25447,"ĸ":25448,"ĠForget":25449,"ĠSans":25450,"Ġunfolding":25451,"ĠSap":25452,"ĠLak":25453,"Ġsectarian":25454,"ĠDaddy":25455,"oxy":25456,"hitting":25457,"Ġdetectors":25458,"ĠRee":25459,"Ġbroaden":25460,"Ġslaying":25461,"Ġsuspending":25462,"Ġinvestig":25463,"Tuesday":25464,"Ġantibiotic":25465,"ĠShiite":25466,"igi":25467,"ĠExternal":25468,"ĠPhotographer":25469,"Ġerratic":25470,"NJ":25471,"ĠDock":25472,"Ġoutweigh":25473,"rants":25474,"Ġlobster":25475,"Ġreactor":25476,"Ġunrealistic":25477,"ĠAudrey":25478,"ĠYor":25479,"Anyone":25480,"Ġfraught":25481,"е":25482,"ĠWester":25483,"fc":25484,"ĠDunham":25485,"ĠLug":25486,"allow":25487,"139":25488,"Ġparity":25489,"Ġhorizontal":25490,"ijuana":25491,"Ġcivilization":25492,"ĠGins":25493,"Ġsmokers":25494,"ĠDiabetes":25495,"Five":25496,"ĠDG":25497,"Ġunderscores":25498,"Ġelabor":25499,"ĠLub":25500,"ĠDevil":25501,"Ġ154":25502,"ĠGuarant":25503,"ĠPandora":25504,"Ġexcav":25505,"Ġaccuser":25506,"Ġrevolt":25507,"Ġinstructors":25508,"Ġire":25509,"ographic":25510,"ĠCLE":25511,"Ġexpedition":25512,"ould":25513,"Ġstriving":25514,"south":25515,"onis":25516,"ĠSwed":25517,"MY":25518,"ĠLevin":25519,"Ġcarp":25520,"ĠArchitects":25521,"Ġ{":25522,"Ġcovert":25523,"Ġcooled":25524,"ĠStaten":25525,"Ġspecializing":25526,"ĠHazel":25527,"Ġlen":25528,"ighty":25529,"Ġbrilliantly":25530,"Phil":25531,"Ġlament":25532,"Australia":25533,"203":25534,"Ġticking":25535,"Ġadjud":25536,"Ġroommate":25537,"ĠSheet":25538,"capital":25539,"167":25540,"Ġendeavor":25541,"Ġaver":25542,"Ġdues":25543,"ĠCycl":25544,"oried":25545,"Va":25546,"loading":25547,"Ġpremie":25548,"Ġregimes":25549,"ĠAly":25550,"Ġperennial":25551,"Ġconsoles":25552,"Ġironic":25553,"ichael":25554,"Ġvigorously":25555,"Ġtransmit":25556,"gary":25557,"eking":25558,"Ġjails":25559,"ĠEpiscopal":25560,"eddy":25561,"Ġidle":25562,"Ġsafeguards":25563,"Ġdwindling":25564,"NOR":25565,"torn":25566,"ĠEvangel":25567,"ĠPlastic":25568,"ĠTerm":25569,"Ġforwarded":25570,"avage":25571,"Ġrefrigerator":25572,"arna":25573,"ĠGuinness":25574,"ĠCandy":25575,"Ġbotched":25576,"seller":25577,"Ġpul":25578,"grades":25579,"oshenko":25580,"earth":25581,"nette":25582,"Ġtraps":25583,"Ġtarn":25584,"Ġmilitar":25585,"ĠAriel":25586,"Ġtubes":25587,"ulo":25588,"Water":25589,"edin":25590,"Ġmarvel":25591,"chenko":25592,"ĠElk":25593,"spect":25594,"coe":25595,"ĠIllustrated":25596,"Ġruthless":25597,"etermined":25598,"Ġdys":25599,"Ġbreaching":25600,"gee":25601,"Nick":25602,"Ġcruiser":25603,"Ġciv":25604,"Ġdou":25605,"Ġ;":25606,"deb":25607,"ĠAsheville":25608,"Ġbiting":25609,"Ġyo":25610,"Courtesy":25611,"Ġroses":25612,"ĠConsequently":25613,"Ġrevis":25614,"Ġconfinement":25615,"next":25616,"produced":25617,"Ġmoratorium":25618,"Ġkne":25619,"eties":25620,"Ġplethora":25621,"Ġceleb":25622,"FIN":25623,"Ġdepartures":25624,"ĠWynne":25625,"abilia":25626,"ĠCourts":25627,"olis":25628,"Ġcereal":25629,"Ġblended":25630,"333":25631,"ĠLun":25632,"Ġrepe":25633,"Ġmathematics":25634,"Ġpharmacies":25635,"Center":25636,"Ġwhist":25637,"pine":25638,"Ġperm":25639,"Ġcustomary":25640,"Ġhormones":25641,"Ġcleansing":25642,"Ġconfidentiality":25643,"Ġmascot":25644,"Ġslippery":25645,"Ġmediation":25646,"Ġpodcasts":25647,"Ġcoating":25648,"Ġconveyed":25649,"Ġgir":25650,"ĠNurse":25651,"DM":25652,"Ġlured":25653,"orted":25654,"Ġolig":25655,"ritz":25656,"ĠINF":25657,"Ġtirelessly":25658,"Ġdoorstep":25659,"Ġtomb":25660,"Ġwithholding":25661,"irling":25662,"Ġhog":25663,"Ġ156":25664,"Ġgau":25665,"chem":25666,"raid":25667,"Ġtrolls":25668,"Ġ182":25669,"ĠColumb":25670,"Ġtissues":25671,"Ġnaive":25672,"Ġlect":25673,"Central":25674,"Sign":25675,"168":25676,"Ġbribe":25677,"ĠDoll":25678,"ĠTripoli":25679,"Ġfunk":25680,"Ġplaza":25681,"Ġmechanic":25682,"mem":25683,"Ġmonkey":25684,"grid":25685,"Ġtainted":25686,"ĠNicaragua":25687,"pelling":25688,"ĠXia":25689,"ammers":25690,"Ġorth":25691,"ICAN":25692,"Ġrant":25693,"Ġdiary":25694,"ĠHarrington":25695,"Ġimply":25696,"Qaeda":25697,"Ġworsen":25698,"Ġcrafting":25699,"ĠShir":25700,"Ġcoincided":25701,"Ġsnatched":25702,"ileen":25703,"sei":25704,"Ġsurgeons":25705,"directed":25706,"Ġcompulsory":25707,"Ġnowadays":25708,"ĠLI":25709,"ĠRebel":25710,"Ġlions":25711,"ĠJR":25712,"scar":25713,"ĠRespons":25714,"Ġscroll":25715,"ĠErd":25716,"iety":25717,"\";":25718,"ĠBone":25719,"ĠRumble":25720,"ĠKS":25721,"ĠLaur":25722,"kell":25723,"ĠBirds":25724,"agic":25725,"Ġsimmer":25726,"Ġrunaway":25727,"Ġ162":25728,"auna":25729,"Ġdialog":25730,"Ġlouder":25731,"esque":25732,"RR":25733,"Ġbloss":25734,"Ġcaliber":25735,"nery":25736,"Ġhauled":25737,"Ġbacterial":25738,"ĠVanity":25739,"ĠPrograms":25740,"omew":25741,"ĠMama":25742,"Ġarr":25743,"Ġdod":25744,"ĠJarvis":25745,"ĠFIRST":25746,"Ġinjections":25747,"ĠBallard":25748,"Ġmedically":25749,"angan":25750,"ĠNewfoundland":25751,"Ġfracking":25752,"Ġbast":25753,"outing":25754,"Ġmercury":25755,"Ġwatershed":25756,"ĠAmateur":25757,"Ġ153":25758,"escal":25759,"Ġpainter":25760,"creat":25761,"Ġperceive":25762,"Ġgent":25763,"attacks":25764,"worked":25765,"Ġimporting":25766,"Indian":25767,"Ġconvict":25768,"clad":25769,"Ġbudding":25770,"Ġambient":25771,"ĠWitness":25772,"letes":25773,"Ġbuffet":25774,"Ġneedles":25775,"Ġcoding":25776,"Ġchoke":25777,"Ġcorrespondence":25778,"Ġgods":25779,"Ġdances":25780,"Ġsteadfast":25781,"cert":25782,"Ġroaming":25783,"between":25784,"weak":25785,"Jer":25786,"jandro":25787,"Ġdiscouraged":25788,"Ġfruition":25789,"ĠØ":25790,"ĠKop":25791,"ULL":25792,"efe":25793,"imble":25794,"obb":25795,"ulla":25796,"Ġaccredited":25797,"Ġlectures":25798,"bil":25799,"why":25800,"Ġgreeting":25801,"ĠBoost":25802,"Ġmailed":25803,"Ġtroop":25804,"Ġfrig":25805,"Ġrese":25806,"Ġscratched":25807,"Stars":25808,"ĠRailroad":25809,"ĠIdol":25810,"Ġsuccumbed":25811,"ĠWeeks":25812,"ffe":25813,"Ġjihadist":25814,"ITION":25815,"Ġthreads":25816,"ĠGenerally":25817,"Ġmedieval":25818,"Ġquotas":25819,"ĠFerry":25820,"rique":25821,"Ġprod":25822,"ĠEduc":25823,"rive":25824,"Ġensued":25825,"Cy":25826,"Ġinfring":25827,"Ġprank":25828,"Ġfrontline":25829,"Ġcompletes":25830,"upe":25831,"Ġmanageable":25832,"Ġpoems":25833,"otten":25834,"igne":25835,"threat":25836,"ĠDri":25837,"ĠLINK":25838,"Calif":25839,"ĠDos":25840,"ulent":25841,"Ġaids":25842,"Ġslips":25843,"umped":25844,"Ġstyled":25845,"Ġdisproportionately":25846,"ĠDish":25847,"ĠUncle":25848,"andel":25849,"Ġrecharge":25850,"rators":25851,"ĠSPR":25852,"Ġguarded":25853,"ĠGreatest":25854,"ĠSkills":25855,"ĠNob":25856,"ĠDesk":25857,"ĠCros":25858,"Ġwrit":25859,"Ġquery":25860,"ORTS":25861,"Ġbundled":25862,"Ġgib":25863,"Ġeth":25864,"iesta":25865,"Ġevade":25866,"dict":25867,"straight":25868,"Met":25869,"present":25870,"Ġdiff":25871,"Ġdere":25872,"ĠSpl":25873,"Ġrepr":25874,"ĠBeard":25875,"Ġvain":25876,"Ġappointing":25877,"ĠVisual":25878,"caps":25879,"gado":25880,"ĠRican":25881,"ĠPose":25882,"endor":25883,"Ġ222":25884,"ĠLear":25885,"Ġconstructing":25886,"Dan":25887,"ĠSpears":25888,"ĠTherapy":25889,"pta":25890,"Ġrehabilit":25891,"Ġrisked":25892,"ĠGuer":25893,"HF":25894,"Ġ301":25895,"Ġliking":25896,"Ġmodular":25897,"eree":25898,"ĠMAT":25899,"ĠHomeless":25900,"Ġstove":25901,"erd":25902,"hash":25903,"ĠAchilles":25904,"ĠBeta":25905,"Ġincl":25906,"Ġgunned":25907,"ĠCrab":25908,"ĠMara":25909,"Ġinvaded":25910,"ulatory":25911,"ATA":25912,"angering":25913,"onso":25914,"Ġallocate":25915,"Ġgarment":25916,"itudes":25917,"ĠHuang":25918,"Ġstaples":25919,"ĠAlban":25920,"Ġtrough":25921,"Ġupright":25922,"tie":25923,"Ġexploits":25924,"ĠVaughan":25925,"ĠDarrell":25926,"Ġassortment":25927,"ĠChill":25928,"Ġlearners":25929,"aqu":25930,"Ġexplode":25931,"ĠChong":25932,"bt":25933,"opl":25934,"Ġaltern":25935,"Ġ151":25936,"fur":25937,"ULT":25938,"HOU":25939,"ĠMemory":25940,"Ġboosts":25941,"ynes":25942,"priv":25943,"Ġtimeless":25944,"Ġcurtail":25945,"ĠCary":25946,"ĠHud":25947,"Ġexclus":25948,"Ġ275":25949,"Ġfry":25950,"ĠVera":25951,"Ġdefied":25952,"ĠDust":25953,"Ġenvision":25954,"ĠPhilipp":25955,"Ġenhancements":25956,"ĠLIB":25957,"ggy":25958,"ĠAzure":25959,"esis":25960,"Ġcharismatic":25961,"Ġcoincide":25962,"inged":25963,"ĠChoose":25964,"Ġsizeable":25965,"136":25966,"Ġpronounce":25967,"ĠPositive":25968,"Ġideally":25969,"Ġechoes":25970,"Ġcottage":25971,"Ġencrypted":25972,"Prime":25973,"Ġá":25974,"Ġflashes":25975,"Group":25976,"Ġ501":25977,"heat":25978,"atility":25979,"ĠTesting":25980,"pex":25981,"WT":25982,"154":25983,"annah":25984,"Ġcompromising":25985,"Ġinactive":25986,"Ġdisparity":25987,"Ġgruesome":25988,"ĠFeather":25989,"ĠMandal":25990,"Ġthereof":25991,"ĠProducer":25992,"Ġprofiling":25993,"Ġlogistical":25994,"Ġcornerstone":25995,"ĠClaudia":25996,"Congress":25997,"ĠDill":25998,"ophone":25999,"Ġcameo":26000,"ĠCutler":26001,"Ġcraz":26002,"throw":26003,"ĠKasich":26004,"Ġexploiting":26005,"ĠSeas":26006,"agles":26007,"ĠGeological":26008,"ĠStub":26009,"ĠUps":26010,"MER":26011,"Ġmem":26012,"itution":26013,"Ġunderstandably":26014,"Ġcontractual":26015,"warming":26016,"qi":26017,"Sky":26018,"whelming":26019,"Ġcurse":26020,"ĠAren":26021,"Ġ265":26022,"ĠGree":26023,"Ġpresiding":26024,"Works":26025,"stones":26026,"Ġappalling":26027,"plex":26028,"dj":26029,"aunting":26030,"Ġimag":26031,"Ġsexism":26032,"ĠVert":26033,"ĠRag":26034,"ĠBliss":26035,"posium":26036,"div":26037,"Ġexperimenting":26038,"Ass":26039,"Lago":26040,"worthiness":26041,"ĠBerk":26042,"ĠDisneyland":26043,"Ġexaggerated":26044,"iliation":26045,"ĠFP":26046,"Ġprincipals":26047,"Miami":26048,"ropri":26049,"PLE":26050,"iona":26051,"ĠPokemon":26052,"apse":26053,"Ġbubbles":26054,"INC":26055,"ĠCaps":26056,"ĠBrowne":26057,"sing":26058,"Ġcafé":26059,"Ġceilings":26060,"frame":26061,"ĠIrwin":26062,"ATS":26063,"dated":26064,"Ġprotester":26065,"Ġtaps":26066,"ĠOslo":26067,"Ù":26068,"Ġconcentrations":26069,"Ġdistributions":26070,"Ġglucose":26071,"ĠRudolph":26072,"Ġtowels":26073,"Ġâĸº":26074,"Ġneighbourhoods":26075,"Ġinduction":26076,"Ġglaring":26077,"Ġannexation":26078,"Ġunsustainable":26079,"ĠTend":26080,"Ġthumbs":26081,"iegel":26082,"cript":26083,"gor":26084,"closure":26085,"thought":26086,"Ġpaddle":26087,"Ġemulate":26088,"Ġdiameter":26089,"Ġtailor":26090,"ĠCorpor":26091,"icable":26092,"ĠPrin":26093,"Ġadminister":26094,"ĠJudd":26095,"ĠColleg":26096,"aund":26097,"ĠPond":26098,"ĠNOTE":26099,"Ġcombating":26100,"Ġinvention":26101,"ĠOculus":26102,"ĠRepl":26103,"iscal":26104,"Ġtrilogy":26105,"anian":26106,"ATT":26107,"ĠCoke":26108,"DL":26109,"ĠLup":26110,"living":26111,"Ġadvertise":26112,"ĠConnie":26113,"amping":26114,"Ġsung":26115,"ORY":26116,"ĠTet":26117,"Ġsplits":26118,"Ġreconnect":26119,"Ġlou":26120,"mut":26121,"ulator":26122,"Ġstrap":26123,"Ġswallow":26124,"rote":26125,"Ġexec":26126,"ffen":26127,"ĠCombine":26128,"ĠTreat":26129,"Ġsorrow":26130,"ĠNotably":26131,"ĠSever":26132,"rette":26133,"Ġwherein":26134,"Ġtransitioning":26135,"Ġtrout":26136,"Ġcockpit":26137,"Ġcrawl":26138,"Ġferv":26139,"Ġliquids":26140,"Ġtsp":26141,"atell":26142,"Ġmeasles":26143,"Ġjug":26144,"Ac":26145,"ĠKD":26146,"ĠMoose":26147,"Ġvans":26148,"chain":26149,"ĠPapua":26150,"plet":26151,"Wednesday":26152,"lynn":26153,"chery":26154,"budget":26155,"Tony":26156,"ĠBacon":26157,"Ġstirred":26158,"ĠSpecialist":26159,"Ġcounterfeit":26160,"а":26161,"Ġdifferentiate":26162,"Ġmuscular":26163,"ĠTheodore":26164,"Ġlooms":26165,"ĠXX":26166,"ottage":26167,"Ġbenches":26168,"ĠMunicip":26169,"Po":26170,"ĠHeck":26171,"Ġscars":26172,"ĠNim":26173,"ÙĬ":26174,"ĠIngredients":26175,"Ġecological":26176,"ĠAWS":26177,"Ġdispose":26178,"Ġmattered":26179,"Ġ720":26180,"Ġpatriotism":26181,"ĠGrind":26182,"Ġcurved":26183,"opia":26184,"ĠLiqu":26185,"Ġevangelical":26186,"tto":26187,"ĠMaterial":26188,"ĠShowtime":26189,"ĠBS":26190,"Ġcheckpoints":26191,"Ġcrippling":26192,"ĠBalance":26193,"stress":26194,"bearing":26195,"Ġ216":26196,"ĠGuards":26197,"Ġlinebackers":26198,"Ġoffending":26199,"Ġsands":26200,"umbnail":26201,"atorial":26202,"Ġliberties":26203,"ĠGW":26204,"ĠPulitzer":26205,"ĠAlvin":26206,"ĠFAC":26207,"ĠStrategies":26208,"Ġreiter":26209,"ĠRestaur":26210,"ĠLithuania":26211,"ĠSwanson":26212,"terror":26213,"ĠMaurit":26214,"Ġparadise":26215,"zzle":26216,"owment":26217,"ĠWP":26218,"Ġsodium":26219,"Ġfuturistic":26220,"Ġdots":26221,"Anthony":26222,"Though":26223,"Ġstripes":26224,"Ġorig":26225,"ultz":26226,"Ġ340":26227,"KK":26228,"umer":26229,"ivery":26230,"Ġplacebo":26231,"Ġdemocrat":26232,"Ġsubmerged":26233,"ĠHidden":26234,"pieces":26235,"Ġasteroid":26236,"ĠGraphic":26237,"Ġadvert":26238,"sil":26239,"Ġdreaming":26240,"Ġnationality":26241,"Ġfostering":26242,"daughter":26243,"ĠSavings":26244,"Ġmischief":26245,"ĠClair":26246,"ĠBundy":26247,"Ġblatant":26248,"Ġtabs":26249,"qa":26250,"severe":26251,"attered":26252,"Ġgreed":26253,"Ġresembles":26254,"Ġnominal":26255,"Ġineligible":26256,"wealth":26257,"fax":26258,"payers":26259,"Ġdisplacement":26260,"itute":26261,"Ġunpleasant":26262,"ĠPom":26263,"lif":26264,"edo":26265,"ĠNP":26266,"Inter":26267,"Ġcohort":26268,"ĠStacy":26269,"ĠDai":26270,"Ġhistories":26271,"alin":26272,"273":26273,"Ġdram":26274,"ĠKand":26275,"Ġexpectancy":26276,"ansson":26277,"Ġlimbo":26278,"ĠPolar":26279,"Ġdivine":26280,"oused":26281,"Ġshel":26282,"ĠProblem":26283,"achment":26284,"Ġâĸł":26285,"shoot":26286,"antam":26287,"ĠHerz":26288,"Ġ157":26289,"Ġpreventive":26290,"keye":26291,"Sing":26292,"Ġcharacteristic":26293,"Ġcasually":26294,"ĠTaiwanese":26295,"md":26296,"ĠHubbard":26297,"imon":26298,"Ġsect":26299,"148":26300,"Ġmartyr":26301,"stud":26302,"Ġcongrat":26303,"ĠSWAT":26304,"ĠTheory":26305,"INAL":26306,"opping":26307,"ply":26308,"ĠKindle":26309,"uu":26310,"ĠLith":26311,"kaya":26312,"ĠActivity":26313,"uously":26314,"ĠJeb":26315,"tell":26316,"ĠSpin":26317,"ĠExplorer":26318,"Ġfolded":26319,"ĠCanterbury":26320,"ĠStur":26321,"Ġminiature":26322,"Ġmultif":26323,"ĠPressure":26324,"angling":26325,"ĠOverse":26326,"Ġresides":26327,"Ġimpressions":26328,"Ġauthored":26329,"265":26330,"Ġallergies":26331,"143":26332,"ĠJi":26333,"Ġsticker":26334,"ĠAccord":26335,"Ġcaste":26336,"Ġseparates":26337,"ĠFein":26338,"Daily":26339,"179":26340,"ĠScores":26341,"ĠAuction":26342,"hea":26343,"Ġdisclosing":26344,"ĠTacoma":26345,"Ġverse":26346,"ĠBeg":26347,"Ġfabrics":26348,"aez":26349,"Ġattachment":26350,"isy":26351,"Christ":26352,"Ġaddictive":26353,"Ġvir":26354,"Week":26355,"ĠPlum":26356,"croft":26357,"itivity":26358,"ĠExhibition":26359,"Ġbruised":26360,"Ġmimic":26361,"rers":26362,"Ġanal":26363,"Ġunintended":26364,"Ġpall":26365,"atts":26366,"ĠWarn":26367,"Ġslows":26368,"WH":26369,"Ġembro":26370,"nec":26371,"Ġ168":26372,"285":26373,"ologic":26374,"Ġhob":26375,"ĠPeel":26376,"Mill":26377,"eps":26378,"Ġrobbers":26379,"ĠDahl":26380,"semble":26381,"omics":26382,"toe":26383,"ĠLoch":26384,"Ġreproduction":26385,"ĠCullen":26386,"Ġimplants":26387,"Ġwow":26388,"ĠSTATE":26389,"vt":26390,"Ġdepleted":26391,"Ġbreweries":26392,"Ġhateful":26393,"Ġgast":26394,"Ġhollow":26395,"Ġradically":26396,"ographed":26397,"ĠFog":26398,"onian":26399,"ĠSequ":26400,"Ġdisrespectful":26401,"Dis":26402,"ĠExper":26403,"pron":26404,"ĠAmelia":26405,"ĠSage":26406,"bath":26407,"Ġtransformative":26408,"Ġtremendously":26409,"Ġpillow":26410,"ĠNormal":26411,"Cont":26412,"ĠMedic":26413,"educated":26414,"Ġredesigned":26415,"Ġkneeling":26416,"Ġinh":26417,"Ġroofs":26418,"Ġhandmade":26419,"Ġprotracted":26420,"ĠIsn":26421,"ĠCapacity":26422,"Ġsquash":26423,"ĠVega":26424,"Ġfats":26425,"ĠCertified":26426,"ointed":26427,"Ġpricey":26428,"ĠBasil":26429,"Ġfreezer":26430,"Ġscent":26431,"Ġpizz":26432,"ĠArd":26433,"Ġdistractions":26434,"Ġviolently":26435,"ĠHess":26436,"Ġfunc":26437,"Ġundert":26438,"Ġrejuven":26439,"Ġdisbelief":26440,"cluded":26441,"named":26442,"ĠFailure":26443,"kus":26444,"Ġhostages":26445,"ĠSahara":26446,"Ġ1944":26447,"Leary":26448,"ĠPrel":26449,"enza":26450,"ĠAlly":26451,"ĠKak":26452,"Ġcounselors":26453,"ĠGale":26454,"ĠHok":26455,"ĠSold":26456,"Ġhacker":26457,"Ġhun":26458,"Ġbung":26459,"Ġdeclares":26460,"Ġinfringement":26461,"OOD":26462,"Ġdoub":26463,"jam":26464,"Ġallergy":26465,"ĠShipping":26466,"Ġmedic":26467,"Ġaccommod":26468,"Ġdocumenting":26469,"Ġcompanions":26470,"Ġmodelling":26471,"Ġcarriage":26472,"ĠCherokee":26473,"Ġtresp":26474,"Ġtaxable":26475,"ĠActivities":26476,"ĠCrane":26477,"bots":26478,"ĠRusso":26479,"Ġstocked":26480,"ervation":26481,"Ġcoffin":26482,"aign":26483,"guards":26484,"Ġonwards":26485,"Ġfrank":26486,".*":26487,"unic":26488,"Ġcens":26489,"enic":26490,"ruit":26491,"rained":26492,"Ġadapting":26493,"aments":26494,"Ġstagnant":26495,"azaar":26496,"ĠHarlem":26497,"Ġ158":26498,"ysis":26499,"Ġbraking":26500,"Ġdipping":26501,"Ġclan":26502,"ĠShu":26503,"Ġprops":26504,"qualified":26505,"Ġmistakenly":26506,"ĠStalin":26507,"Ġaddicts":26508,"ĠCALL":26509,"ropolis":26510,"aten":26511,"pec":26512,"ĠDro":26513,"ĠFellowship":26514,"ĠSupporting":26515,"loc":26516,"uben":26517,"499":26518,"Bro":26519,"Ġpots":26520,"Ġchunks":26521,"wr":26522,"ĠColonial":26523,"ĠArchitecture":26524,"Ġconstrained":26525,"Ġenvelop":26526,"ĠIronically":26527,"aban":26528,"Ġapparatus":26529,"Ġcue":26530,"Ġborne":26531,"ĠRoz":26532,"ilton":26533,"Ġtheoretical":26534,"ĠWatching":26535,"Ġfuck":26536,"ĠSilk":26537,"ĠSTE":26538,"bler":26539,"ĠPOST":26540,"ĠUpton":26541,"Ġsummons":26542,"ĠCum":26543,"ĠKL":26544,"Ġrelaxation":26545,"ĠDuff":26546,"Ġincumb":26547,"ĠRedd":26548,"Ġstature":26549,"Ġcanv":26550,"added":26551,"Ġremedies":26552,"ĠISO":26553,"ĠDecker":26554,"Ġafloat":26555,"Ġstartling":26556,"ĠBethlehem":26557,"Ġrealizes":26558,"find":26559,"ĠAra":26560,"Ġphased":26561,"arov":26562,"Ġhalting":26563,"ĠWindow":26564,"Ġdentist":26565,"Ġtumble":26566,"Ġvalidation":26567,"Ġcarve":26568,"ĠIPS":26569,"Ġirrit":26570,"ĠEssential":26571,"Ġfluids":26572,"rons":26573,"Ġimplant":26574,"Ġnuisance":26575,"ĠShelley":26576,"ĠGemini":26577,"Ġpharmac":26578,"iction":26579,"Ġtaped":26580,"ĠGovernments":26581,"ruly":26582,"Ġscant":26583,"Ġprominently":26584,"Ġreim":26585,"unning":26586,"arted":26587,"ĠMatters":26588,"Ġ1918":26589,"ĠPros":26590,"atel":26591,"ĠBattalion":26592,"onduct":26593,"talk":26594,"ĠTinder":26595,"ĠInstant":26596,"ĠKern":26597,"Ġbuckets":26598,"ĠGroups":26599,"Ġmetaphor":26600,"cloud":26601,"ĠString":26602,"Ohio":26603,"Ġcaffeine":26604,"Old":26605,"Ġdefinite":26606,"ĠNikola":26607,"ĠLords":26608,"icol":26609,")?":26610,"Ġenjoyment":26611,"Ġfamine":26612,"Ġdefinitions":26613,"ĠJem":26614,"Check":26615,"Ġaiding":26616,"ĠMé":26617,"Ġrenewables":26618,"Ġsightings":26619,"footed":26620,"Box":26621,"Ġgoats":26622,"Ġshack":26623,"AX":26624,"ĠMonk":26625,"ĠGraduate":26626,"Ġmeats":26627,"handle":26628,"147":26629,"rys":26630,"Ġunsub":26631,"Pont":26632,"uble":26633,"440":26634,"Ġeyel":26635,"thro":26636,"Ġcreep":26637,"^^^^":26638,"Ġpopcorn":26639,"Ġcompression":26640,"sal":26641,"ouf":26642,"Ġrepairing":26643,"Think":26644,"Ġdoubtful":26645,"ĠLooks":26646,"Ġtaller":26647,"Ġsul":26648,"sf":26649,"give":26650,"ĠGau":26651,"Ġrevered":26652,"EMBER":26653,"Ġsloppy":26654,"ersen":26655,"Ġvitamins":26656,"ĠImprovement":26657,"Ġprogresses":26658,"Ġdiploma":26659,"semb":26660,"ustain":26661,"Ġchant":26662,"Ġbumped":26663,"Ġsabotage":26664,"nant":26665,"Ġrabbit":26666,"Ġdividing":26667,"ĠDefender":26668,"Ġlik":26669,"Ġirrespective":26670,"cade":26671,"ĠSter":26672,"touch":26673,"EMA":26674,"Ġparted":26675,"ĠBAR":26676,"hung":26677,"Ġannoyed":26678,"Ġhinder":26679,"Ġexamines":26680,"oan":26681,"ĠBoe":26682,"Ġaggreg":26683,"ĠChu":26684,"ĠUCS":26685,"IGHTS":26686,"pez":26687,"ĠUNESCO":26688,"Ġwindshield":26689,"Martin":26690,"Ġwithhold":26691,"does":26692,"Ġbruising":26693,"Ġdeterior":26694,"bourg":26695,"ĠTowers":26696,"JD":26697,"England":26698,"Ġequivalents":26699,"Ġrazor":26700,"Ġreassuring":26701,"Ġident":26702,"Ġ208":26703,"reath":26704,"ceans":26705,"Ġpatrolling":26706,"eve":26707,"pots":26708,"itative":26709,"Ġsided":26710,"Ġsofa":26711,"Ġunborn":26712,"Ġaug":26713,"Ġperpetual":26714,"effect":26715,"represented":26716,"Ġrails":26717,"ĠSummers":26718,"ĠMOR":26719,"ĠSlow":26720,"ĠExpert":26721,"Ġshameful":26722,"Ġaudits":26723,"Sl":26724,"ĠBurr":26725,"adow":26726,"ĠWAY":26727,"anic":26728,"ĠIslamists":26729,"ĠStranger":26730,"pse":26731,"amaz":26732,"ĠPeggy":26733,"ĠSeventh":26734,"Ġscreenplay":26735,"ĠGriff":26736,"Ireland":26737,"142":26738,"Ġneural":26739,"ĠFernand":26740,"ainment":26741,"ĠMigration":26742,"ureen":26743,"ĠSCH":26744,"Sullivan":26745,"ĠWag":26746,"ĠREG":26747,"Ġ420":26748,"inky":26749,"ĠNewspaper":26750,"School":26751,"Ok":26752,"ĠKrishna":26753,"Ġ480":26754,"erald":26755,"Ġskipping":26756,"Ġharrowing":26757,"158":26758,"rogen":26759,"Ġbetrayal":26760,"Ġculmination":26761,"ĠCirc":26762,"Ġ211":26763,"stro":26764,"ĠTrace":26765,"Ġheaviest":26766,"td":26767,"ĠHenri":26768,"epend":26769,"RB":26770,"arella":26771,"umbai":26772,"Ġcrem":26773,"ĠDistribut":26774,"ruff":26775,"Ġscreams":26776,"Ġscathing":26777,"girls":26778,"Ġtiles":26779,"ĠEvil":26780,"usp":26781,"Ġknowledgeable":26782,"Ġrestitution":26783,"ĠWiFi":26784,"Ġitiner":26785,"exper":26786,"oris":26787,"ĠPokémon":26788,"iane":26789,"produ":26790,"ĠAchievement":26791,"Ġbrunt":26792,"ĠSurgery":26793,"Ġpragmatic":26794,"Ber":26795,"ĠKejriwal":26796,"cus":26797,"Ġconsensual":26798,"acet":26799,"ĠSecondly":26800,"Ġdivul":26801,"uca":26802,"Ġbusted":26803,"emies":26804,"ĠMou":26805,"Ġ217":26806,"Ġexcludes":26807,"ĠSamoa":26808,"Ġlofty":26809,"ĠSic":26810,"ĠRemem":26811,"dn":26812,"Ġeradicate":26813,"Ġpies":26814,"Ġscenery":26815,"ATTLE":26816,"ĠWAS":26817,"Ġinnovate":26818,"ĠEverest":26819,"Ġsynonymous":26820,"izen":26821,"Ġeuth":26822,"ĠFIA":26823,"ITIES":26824,"ĠSuddenly":26825,"Ġforay":26826,"pell":26827,"ÄŁ":26828,"licensed":26829,"Ġfra":26830,"Ġblasting":26831,"autical":26832,"ĠBlizzard":26833,"orer":26834,"Ġchili":26835,"ĠSylvia":26836,"except":26837,"tec":26838,"ĠResistance":26839,"young":26840,"usions":26841,"iotic":26842,"ĠDreams":26843,"ĠArchives":26844,"Ġunleash":26845,"ĠPract":26846,"Ġlikened":26847,"Ġga":26848,"Ġdisappearing":26849,"Ġunnoticed":26850,"Ġfrightened":26851,"arms":26852,"ĠCAD":26853,"Ġcoloured":26854,"ĠSigns":26855,"oing":26856,"Ġvodka":26857,"ruption":26858,"otions":26859,"isal":26860,"ĠBecome":26861,"Ġswoop":26862,"reating":26863,"Ġchoking":26864,"Ġunforgettable":26865,"258":26866,"packs":26867,"345":26868,"ĠAutumn":26869,"Ġther":26870,"399":26871,"ĠFaculty":26872,"Ġ1933":26873,"ĠNormally":26874,"orge":26875,"ĠTess":26876,"ĠChrom":26877,"Ġscripts":26878,"Ġbiking":26879,"Act":26880,"Ġgrazing":26881,"ĠLabrador":26882,"ĠLey":26883,"Ġwandering":26884,"Ġfend":26885,"ĠPolk":26886,"ĠKeane":26887,"ĠBeef":26888,"elope":26889,"ĠApproximately":26890,"Ġ1952":26891,"personal":26892,"Ġhistorians":26893,"ĠMcDonnell":26894,"must":26895,"LES":26896,"iking":26897,"Ġtherm":26898,"Ġhumane":26899,"Ġcrowdfunding":26900,"ĠBenefits":26901,"Land":26902,"Ġanalog":26903,"agency":26904,"ĠCrowley":26905,"Ġbirths":26906,"Ġobj":26907,"Ġfren":26908,"ĠSalmon":26909,"bies":26910,"Ġreve":26911,"216":26912,"Ġbetrayed":26913,"Ġinduced":26914,"acles":26915,"Ġtrad":26916,"Ġforgiven":26917,"Ġearners":26918,"208":26919,"Ġxen":26920,"Ġunle":26921,"Ġnecklace":26922,"Ġgravel":26923,"Ġsalads":26924,"Ġgrooming":26925,"California":26926,"Ġpossessed":26927,"Ġproclamation":26928,"Ġsequences":26929,"ream":26930,"FOX":26931,"arkin":26932,"ĠTRAN":26933,"Ġpurs":26934,"ĠLoans":26935,"Ġsacrificed":26936,"Ġiceberg":26937,"Phill":26938,"Ġgalvan":26939,"Ġsmugglers":26940,"formation":26941,"onson":26942,"ĠVaughn":26943,"Ġdoctrine":26944,"ĠEyes":26945,"Ġunmanned":26946,"states":26947,"Ġdetermin":26948,"almost":26949,"Ġeviction":26950,"Ġtid":26951,"ARR":26952,"Ġcooks":26953,"Bad":26954,"ĠCamb":26955,"Ġlinear":26956,"229":26957,"ĠCooke":26958,"ĠPurch":26959,"join":26960,"ĠCult":26961,"ĠRefugee":26962,"Ġslamming":26963,"ĠðŁij":26964,"Ġpedal":26965,"ĠVeronica":26966,"Ġlandowners":26967,"ĠYel":26968,"ĠWorkshop":26969,"antic":26970,"Ġdysfunction":26971,"Ġ229":26972,"Ġculturally":26973,"Ġinfuri":26974,"ĠEck":26975,"sem":26976,"Ġwired":26977,"ĠWerner":26978,"lov":26979,"ĠJasper":26980,"Ġvehemently":26981,"ĠSpy":26982,"lift":26983,"ĠNab":26984,"ĠPound":26985,"ĠHanna":26986,"Ġleveled":26987,"WOOD":26988,"tm":26989,"ĠKitt":26990,"Ġconve":26991,"nat":26992,"Ġjog":26993,"IVER":26994,"Ġmemes":26995,"Ġseaw":26996,"ector":26997,"Ġsprayed":26998,"Ġvaccinated":26999,"Europe":27000,"Ġmustard":27001,"ĠMahm":27002,"Ġ214":27003,"Research":27004,"iminary":27005,"Ġconcerted":27006,"Detroit":27007,"Ġkios":27008,"Ġplummet":27009,"Ġvisuals":27010,"247":27011,"Ġ228":27012,"development":27013,"ĠPascal":27014,"acial":27015,"ĠSeasons":27016,"ĠTL":27017,"480":27018,"ĠReader":27019,"Ġexpulsion":27020,"Ġchoked":27021,"Ġdevotion":27022,"ĠSTAT":27023,"urred":27024,"Ġfascinated":27025,"Ġstealth":27026,"NL":27027,"Ġbooster":27028,"Kat":27029,"ĠPriebus":27030,"Ġaux":27031,"ĠHate":27032,"ĠThing":27033,"Ġabnormal":27034,"Ġcalmly":27035,"Ġdedicate":27036,"cause":27037,"Ġisolate":27038,"ĠPai":27039,"Ġsuspensions":27040,"Ġpoisoned":27041,"ission":27042,"Ġprohibiting":27043,"353":27044,"banks":27045,"Ġkissed":27046,"ĠBegin":27047,"atis":27048,"LI":27049,"Ġshaft":27050,"ĠGuth":27051,"ĠBoo":27052,"Ġcinnamon":27053,"Ġverbally":27054,"ĠRabbi":27055,"Ġmonsters":27056,"done":27057,"ĠClyde":27058,"Ġspar":27059,"ĠCage":27060,"ĠPersons":27061,"305":27062,"ĠMons":27063,"Ġjealous":27064,"Ġswirling":27065,"know":27066,"Ġprote":27067,"Ġcruising":27068,"Ġduly":27069,"Ġchapel":27070,"Ġgroove":27071,"bps":27072,"ĠKelvin":27073,"iom":27074,"aer":27075,"bomb":27076,"Christian":27077,"Ġgigs":27078,"+.":27079,"ĠWei":27080,"Ġfarmland":27081,"otally":27082,"Ġequitable":27083,"ĠCBO":27084,"chool":27085,"amara":27086,"Ġwealthiest":27087,"ĠMeans":27088,"Ġ235":27089,"ĠUk":27090,"steps":27091,"raham":27092,"nerg":27093,"Ġclad":27094,"Ġsled":27095,"ĠMorrow":27096,"152":27097,"ĠRece":27098,"Ġplausible":27099,"Ġbisexual":27100,"artments":27101,"Ġveh":27102,"ĠLoft":27103,"bly":27104,"ĠCONC":27105,"automatic":27106,"Ġmasterpiece":27107,"ĠSpringer":27108,"Ġtendencies":27109,"Ro":27110,"Ġresentment":27111,"Ġadversely":27112,"Ġbandwidth":27113,"ĠDAV":27114,"Ġtun":27115,"Ġpuppies":27116,"ĠBundes":27117,"ĠHort":27118,"ĠGarfield":27119,"Ġenlist":27120,"Ġmont":27121,"gd":27122,"Ġrooting":27123,"Dream":27124,"Ġfulfillment":27125,"chal":27126,"182":27127,"prop":27128,"159":27129,"Ġcourtyard":27130,"iard":27131,"ĠSle":27132,"Ġoperative":27133,"Ġpublishes":27134,"ĠProposition":27135,"Ġcritique":27136,"Ġredist":27137,"wang":27138,"ĠNep":27139,"DD":27140,"Ġbonding":27141,"141":27142,"ĠAssault":27143,"-'":27144,"Ġlodging":27145,"itters":27146,"cigarettes":27147,"Ġ__":27148,"ĠLaf":27149,"GF":27150,"ĠAnat":27151,"ĠStephan":27152,"214":27153,"ĠKass":27154,"Ġviz":27155,"Ġpiling":27156,"Ġfugitive":27157,"ĠCurrency":27158,"ĠCrypto":27159,"Ġfaux":27160,"ĠPing":27161,"ĠLia":27162,"igl":27163,"Ġadversaries":27164,"ĠYPG":27165,"ĠComb":27166,"ĠYar":27167,"heny":27168,"Ġoverhe":27169,"Fest":27170,"emy":27171,"Ever":27172,"Ġ370":27173,"Ġsecretive":27174,"ĠSEN":27175,"ĠMEM":27176,"PRESS":27177,"ĠBirth":27178,"kos":27179,"Ġprecarious":27180,"irting":27181,"ĠUI":27182,"Ġoccupying":27183,"olute":27184,"Ġperiodic":27185,"eon":27186,"iens":27187,"ĠRH":27188,"Win":27189,"Ġplaybook":27190,"Ġexodus":27191,"ĠSkinner":27192,"Ġorderly":27193,"ĠVed":27194,"ouses":27195,"Ġescal":27196,"Ġbenign":27197,"Ġbots":27198,"ĠWhis":27199,"Ġappra":27200,"FOR":27201,"ĠChromebook":27202,"_____":27203,"990":27204,"athed":27205,"Ġspirited":27206,"illi":27207,"Ġbicycles":27208,"orse":27209,"ifestyle":27210,"orno":27211,"ĠDept":27212,"JA":27213,"Ġnausea":27214,"Ġpervasive":27215,"velop":27216,"commun":27217,"ĠUniversities":27218,"Ġremnants":27219,"Ġdisarm":27220,"ĠBoots":27221,"Ġprin":27222,"...\"":27223,"quila":27224,"Ġcautiously":27225,"uper":27226,"onto":27227,"din":27228,"Ġvelocity":27229,"Ġconspiring":27230,"ĠMX":27231,"Ġemphasizing":27232,"Ġâĸ":27233,"ĠStam":27234,"Ġspices":27235,"Ġairplanes":27236,"uty":27237,"culture":27238,"ĠPetr":27239,"Ġglor":27240,"ĠExcel":27241,"ĠSpeech":27242,"Ġharmless":27243,"ĠPend":27244,"ĠCrossing":27245,"ĠDocument":27246,"Ġramifications":27247,"ĠCroatian":27248,"ĠKiller":27249,"Ġmultim":27250,"Ġdiscontinued":27251,"Ġcherished":27252,"ĠMaker":27253,"aspers":27254,"ĠBlooming":27255,"ĠMata":27256,"offic":27257,"Ġsettlers":27258,"ĠPlenty":27259,"ĠInstitutes":27260,"ĠArpaio":27261,"Pool":27262,"ĠSubst":27263,"Ġ380":27264,"Ġdecidedly":27265,"ollah":27266,"Den":27267,"ĠJiang":27268,"ĠAmos":27269,"Grand":27270,"ĠTurns":27271,"meyer":27272,"Ġconducive":27273,"Ġpoignant":27274,"abortion":27275,"Ġnotebook":27276,"Ġshelling":27277,"common":27278,"ĠPavel":27279,"Ġhumid":27280,"Ġinappropriately":27281,"????":27282,"Ġsoar":27283,"Ġdynasty":27284,"Ġresearched":27285,"ĠYon":27286,"Ġmaple":27287,"Ġwedge":27288,"mass":27289,"ĠTM":27290,"USE":27291,"eln":27292,"Ġgloss":27293,"rigan":27294,"steen":27295,"ĠDeV":27296,"Ġdebacle":27297,"Christmas":27298,"Ġtweaks":27299,"grab":27300,"Ġprofoundly":27301,"Ġcampaigner":27302,"ĠSeal":27303,"Ġiteration":27304,"Ġsigh":27305,"Ġunfounded":27306,"Ġframing":27307,"Ġrecognizable":27308,"Ġseizing":27309,"legal":27310,"Ġproportions":27311,"omers":27312,"rek":27313,"Ġscreenshot":27314,"itsu":27315,"ĠOG":27316,"ĠYing":27317,"ĠMississ":27318,"295":27319,"Ġlandsl":27320,"Ġpsychiatrist":27321,"sov":27322,"arine":27323,"Ju":27324,"Ġflo":27325,"apple":27326,"hof":27327,"wig":27328,"ĠENT":27329,"Ġenthusiast":27330,"Such":27331,"ĠArtificial":27332,"happy":27333,"oton":27334,"ĠFram":27335,"ĠRemove":27336,"Ġsmear":27337,"Ġjer":27338,"Ġtopp":27339,"Ġimbalance":27340,"ĠWords":27341,"Ġcoffers":27342,"olina":27343,"Ġrigged":27344,"uction":27345,"idding":27346,"Ġdispensaries":27347,"Ġdermat":27348,"Ġshutter":27349,"idental":27350,"Ġcontinu":27351,"Ġhumility":27352,"Ġbulbs":27353,"Ġ207":27354,"lass":27355,"ĠBeirut":27356,"ĠUlt":27357,"urry":27358,"NEWS":27359,"Ġfeminine":27360,"Ġsimulated":27361,"Ġcharger":27362,"mom":27363,"ĠCreed":27364,"Ġwolves":27365,"essions":27366,"created":27367,"ifiers":27368,"Ġdissemin":27369,"ĠDarling":27370,"umann":27371,"Ġmarrying":27372,"Ġshred":27373,"avin":27374,"Ġbudgetary":27375,"Ġmedicinal":27376,"ulin":27377,"seys":27378,"agues":27379,"Ġextracted":27380,"ĠFlower":27381,"Ġcontinents":27382,"ĠWish":27383,"Ġdivides":27384,"ĠDing":27385,"Ġinsulation":27386,"respect":27387,"ĠABS":27388,"Ġreconcile":27389,"keep":27390,"ILD":27391,"Ġgenome":27392,"Ġ410":27393,"ĠSweep":27394,"Ġharass":27395,"Ġfrantic":27396,"ĠEE":27397,"dad":27398,"Ġaperture":27399,"rought":27400,"Ġhugs":27401,"Ġdrying":27402,"Ġoverrun":27403,"Space":27404,"Ġperiodically":27405,"Ġbrightness":27406,"atched":27407,"kee":27408,"ĠITS":27409,"ĠSpokane":27410,"ĠSeaf":27411,"Ġdesks":27412,"ĠEisen":27413,"ĠOPS":27414,"Ġcider":27415,"Ġacceler":27416,"ĠAthlet":27417,"2008":27418,"ĠGuid":27419,"ĠManip":27420,"Ġmould":27421,"Ġmisguided":27422,"Ġbrow":27423,"Ġmanagerial":27424,"Ġhugged":27425,"Ġfurnish":27426,"ĠHarmony":27427,"ĠHebrew":27428,"Ġtyph":27429,"Ġdecreases":27430,"Ġimpetus":27431,"Ġcontagious":27432,"Ġunch":27433,"209":27434,"Ġswell":27435,"ĠHuffington":27436,"Ġpubs":27437,"Ġadequ":27438,"amoto":27439,"rir":27440,"Ġpristine":27441,"Ġanx":27442,"ĠSecure":27443,"Ġenrichment":27444,"ĠVAL":27445,"Ġsummed":27446,"Ġconfidently":27447,"ĠProfit":27448,"ĠFrog":27449,"ĠLena":27450,"ĠFUN":27451,"Ġbruises":27452,"Ġuproar":27453,"coll":27454,"ĠImpro":27455,"Ġflair":27456,"146":27457,"ĠBrend":27458,"Ġ166":27459,"Ġenhances":27460,"ĠDent":27461,"Ġdegener":27462,"Ġproponents":27463,"ĠInspired":27464,"Ġramps":27465,"Ġwisely":27466,"Western":27467,"Ġtart":27468,"Ġsteered":27469,"Ġtreason":27470,"dropping":27471,"Ġtransc":27472,"ĠScarlett":27473,"ĠEzekiel":27474,"Ġpivot":27475,"esame":27476,"Show":27477,"Ġdiscontent":27478,"ĠJudith":27479,"ĠPutting":27480,"Ġblessings":27481,"Ġhardcore":27482,"Ġtray":27483,"Ġdiscern":27484,"oley":27485,"ouk":27486,"Ġwil":27487,"Ġintolerance":27488,"157":27489,"ĠRelative":27490,"ĠLynd":27491,"Ġwhistleblower":27492,"Ġincon":27493,"ĠTao":27494,"Ġindefinite":27495,"Ġguardians":27496,"Ġagon":27497,"ĠInstruments":27498,"Ġexistential":27499,"AAF":27500,"vind":27501,"Ġbrazen":27502,"condition":27503,"Ġratified":27504,"fam":27505,"ĠHin":27506,"ĠMichaels":27507,"204":27508,"ĠKats":27509,"ITS":27510,"ISON":27511,"prone":27512,"Ġboiling":27513,"Ġprolong":27514,"Ġnoticing":27515,"resident":27516,"brance":27517,"ĠFolk":27518,"Ġdesserts":27519,"uton":27520,"Web":27521,"ĠLongh":27522,"ĠReef":27523,"Going":27524,"ĠCarb":27525,"Sur":27526,"complete":27527,"ĠSloan":27528,"ĠClubs":27529,"ĠSadd":27530,"Ġshrugged":27531,"Ġedible":27532,"ĠTyp":27533,"thal":27534,"ĠRocks":27535,"ĠClive":27536,"Ġkidding":27537,"ĠCrom":27538,"ĠTurks":27539,"ĠWak":27540,"Ġeyewitness":27541,"ĠHass":27542,"collar":27543,"Ġsucceeding":27544,"Ġinsert":27545,"Ġ224":27546,"ĠBret":27547,"Ġneurological":27548,"Ġrewrite":27549,"imil":27550,"ultimate":27551,"ĠJeremiah":27552,"Ġliaison":27553,"Ġpedd":27554,"direct":27555,"ĠYi":27556,"ĠMAD":27557,"ĠOrion":27558,"oyd":27559,"ĠLOC":27560,"release":27561,"Ġinvestigates":27562,"ĠApache":27563,"û":27564,"ĠVend":27565,"Ġcynical":27566,"ĠHelm":27567,"ĠMovies":27568,"tops":27569,"Ġsinister":27570,"Ġunparalleled":27571,"Ġspikes":27572,"Ġoverlap":27573,"enstein":27574,"Ġhypocrisy":27575,"Plus":27576,"Ġexpansions":27577,"Ġvow":27578,"Ġdetonated":27579,"Ġfellowship":27580,"Ġsolicitor":27581,"ĠNewtown":27582,"mony":27583,"ĠLod":27584,"ĠDevelopers":27585,"ateg":27586,"ibus":27587,"Ġcrumbling":27588,"ĠWein":27589,"ĠKlan":27590,"gio":27591,"ĠPhys":27592,"ĠAntarctica":27593,"368":27594,"Ġseam":27595,"Ġautomobiles":27596,"ĠTEAM":27597,"bern":27598,"Ġmanic":27599,"Ġsanct":27600,"Ġequals":27601,"Est":27602,"Ġincentiv":27603,"ĠHawking":27604,"nin":27605,"Ġresonate":27606,"bid":27607,"Ġtelescope":27608,"endon":27609,"ĠVacc":27610,"Ġregretted":27611,"Ġ1300":27612,"ĠForestry":27613,"BOOK":27614,"Ġgroundwork":27615,"Ġessays":27616,"ĠIndo":27617,"Pierre":27618,"ĠChau":27619,"Ġapologies":27620,"killers":27621,"ĠMoroccan":27622,"0001":27623,"336":27624,"Ra":27625,"Ġparcels":27626,"Ġleaned":27627,"Ġthankfully":27628,"ĠSplit":27629,"Ġlobbied":27630,"ĠDegree":27631,"Ġrisking":27632,"assy":27633,"Ġsupplemental":27634,"little":27635,"Ġeclectic":27636,"Ġ206":27637,"ealing":27638,"206":27639,"Ġrepo":27640,"Ġhose":27641,"ayn":27642,"lux":27643,"Ġbeliever":27644,"')":27645,"ĠHide":27646,"vance":27647,"ĠEinstein":27648,"Ġdepos":27649,"Ġfray":27650,"Ġki":27651,"Ġinternship":27652,"ĠHou":27653,"Vis":27654,"Ġstare":27655,"ĠBreed":27656,"option":27657,"Ġvisionary":27658,"Ġmins":27659,"Ġbitten":27660,"ancies":27661,"ĠShake":27662,"Ġtemplate":27663,"Ġliner":27664,"Ġmuster":27665,"appro":27666,"ĠMubarak":27667,"esty":27668,"mong":27669,"actory":27670,"Ġheadphone":27671,"ĠPrec":27672,"Ġwaive":27673,"Ron":27674,"ĠHearing":27675,"Ġimperfect":27676,"Ġsealing":27677,"Ġlocating":27678,"Ġculminated":27679,"chio":27680,"channel":27681,"lust":27682,"ĠLowell":27683,"woods":27684,"Ġsoak":27685,"Ġforbidden":27686,"Ġdetached":27687,"unct":27688,"ĠHunger":27689,"ĠPatient":27690,"ĠPolo":27691,"Saharan":27692,"Jon":27693,"athered":27694,"ĠSignal":27695,"Six":27696,"Ġstatistically":27697,"ITH":27698,"artment":27699,"ĠCU":27700,"Ġhates":27701,"qual":27702,"Ġcapitalist":27703,"ATES":27704,"ĠDesc":27705,"Ġhandcuffed":27706,"Ġindulge":27707,"ĠReligious":27708,"German":27709,"housing":27710,"Ġdismantling":27711,"Ġconventions":27712,"dain":27713,"chairs":27714,"Ġloos":27715,"Ġknowingly":27716,"Var":27717,"Ġhusbands":27718,"eez":27719,"asion":27720,"ĠIssa":27721,"Ġswollen":27722,"Ġ1946":27723,"Ġheadlined":27724,"Chelsea":27725,"Ġignorant":27726,"Ġperipheral":27727,"Note":27728,"Ġaxe":27729,"Ġnicotine":27730,"ĠSanctuary":27731,"Ġ1917":27732,"Ġwithdrawals":27733,"uits":27734,"Hot":27735,"Ġreimburse":27736,"probably":27737,"ĠAdapt":27738,"industrial":27739,"answer":27740,"orus":27741,"ĠMell":27742,"Talk":27743,"Ġcontemplating":27744,"omas":27745,"Ġtaxis":27746,"Ġencompasses":27747,"rations":27748,"ĠLatvia":27749,"Ġhumiliating":27750,"Ġloft":27751,"tight":27752,"rium":27753,"Ġlogin":27754,"ĠBulletin":27755,"Ġturtles":27756,"EAR":27757,"349":27758,"Radio":27759,"ĠBord":27760,"151":27761,"kk":27762,"pocket":27763,"Ġdove":27764,"348":27765,"Ġtemptation":27766,"ĠCoy":27767,"those":27768,"ĠDest":27769,"ishly":27770,"rn":27771,"Ġmammals":27772,"ĠTub":27773,"arial":27774,"ĠPersian":27775,"Ġdaddy":27776,"Zen":27777,"Ġps":27778,"Ġ]":27779,"Field":27780,"adiq":27781,"Ġmeaningless":27782,"Ġprimer":27783,"Ġ1942":27784,"Ġ!":27785,"625":27786,"Ġfashionable":27787,"ĠTheft":27788,"ĠHAVE":27789,"christ":27790,"Ġperil":27791,"Ġrepealing":27792,"Ġbuff":27793,"Ġodor":27794,"Ġstalking":27795,"ĠDems":27796,"iences":27797,"Ġunilaterally":27798,"odies":27799,"ĠQuite":27800,"Ġbloodshed":27801,"Ġinfect":27802,"Ġreminders":27803,"Ġchop":27804,"Ġevapor":27805,"877":27806,"Ġhorrified":27807,"ĠFruit":27808,"rams":27809,"Ġinsecure":27810,"cester":27811,"ĠNationwide":27812,"Ġmocking":27813,"Ret":27814,"Ġcomplying":27815,"sav":27816,"Ġali":27817,"Family":27818,"Ĩ":27819,"Ġdishonest":27820,"Ġincorrectly":27821,"LOAD":27822,"ĠGand":27823,"ourcing":27824,"obby":27825,"ĠPetersen":27826,"Something":27827,"Ġravaged":27828,"limited":27829,"Ġrituals":27830,"ĠKnowledge":27831,"ĠUtility":27832,"Ġdoom":27833,"Ġsheds":27834,"ĠGael":27835,"ĠMillennials":27836,"ĠMonthly":27837,"Ġdomination":27838,"Ġrapport":27839,"spot":27840,"ĠPrest":27841,"ĠHA":27842,"ushes":27843,"Ġtact":27844,"Richard":27845,"Ġgritty":27846,"Does":27847,"ĠTNT":27848,"Ġdownfall":27849,"Wood":27850,"ĠPrediction":27851,"ĠPour":27852,"ĠFraud":27853,"ĠSyndrome":27854,"166":27855,"Ġliteral":27856,"Ġaddict":27857,"ĠLoud":27858,"hens":27859,"ĠAccounts":27860,"distance":27861,"Ġclassmate":27862,"Ġsalv":27863,"Ġunlucky":27864,"Ġpartying":27865,"ĠKou":27866,"ĠSNAP":27867,"%-":27868,"Ġdelegate":27869,"Ġstrikers":27870,"ĠSlate":27871,"Ġarticulate":27872,"390":27873,"Ġinqu":27874,"Ġdiscredit":27875,"ĠPriv":27876,"ploy":27877,"ĠMarketplace":27878,"ĠTune":27879,"visor":27880,"Ġwrestle":27881,"Ġkindly":27882,"ĠCollect":27883,"Ġcirc":27884,"ĠRemain":27885,"Ġ192":27886,"contin":27887,"Ġ325":27888,"Ġsevered":27889,"isations":27890,"Ġmuddy":27891,"Ġtaxing":27892,"ĠRepresent":27893,"ĠSty":27894,"rology":27895,"ĠJudges":27896,"ĠBronze":27897,"ĠApplic":27898,"Ġarrow":27899,"consuming":27900,"ĠFeaturing":27901,"Ġspies":27902,"Ġnoises":27903,"ĠColony":27904,"lost":27905,"Ġopp":27906,"Ġdeem":27907,"ĠGarc":27908,"icent":27909,"ptroller":27910,"liest":27911,"Ġoutward":27912,"ĠUser":27913,"Ġintimidate":27914,"156":27915,"Ġjab":27916,"ANGE":27917,"Jay":27918,"ĠPoverty":27919,"ACA":27920,"Ġrife":27921,"Ġfaint":27922,"ĠAcceler":27923,"tall":27924,"ĠUNITED":27925,"ĠFighter":27926,"ĠGilmore":27927,"Ġsod":27928,"amura":27929,"Ġpredictive":27930,"Ġpolish":27931,"ĠDD":27932,"Ġfabricated":27933,"ĠDag":27934,"Ġfatty":27935,"Ġplague":27936,"Ġexhib":27937,"ĠAdvent":27938,"Ġ1941":27939,"ERSON":27940,"initely":27941,"Ġloneliness":27942,"ĠEquality":27943,"Ġuntrue":27944,"Ġonlook":27945,"Ġfragmented":27946,"ruce":27947,"Ġdistrust":27948,"Ġscal":27949,"ĠCors":27950,"Ġrobbing":27951,"cultural":27952,"clusion":27953,"ĠObi":27954,"sels":27955,"ĠEvidence":27956,"ĠSac":27957,"Ġfragments":27958,"Ġflipping":27959,"ĠRabbit":27960,"Ġdisproportionate":27961,"ĠCreat":27962,"Ġlabeling":27963,"ĠGri":27964,"Ġ161":27965,"ĠEditors":27966,"holm":27967,"adr":27968,"Ĭ":27969,"tailed":27970,"Ġrenters":27971,"Ġnoodles":27972,"Ġcompetence":27973,"Ġpanc":27974,"uration":27975,"Ġacids":27976,"Ġconfid":27977,"rival":27978,"AAA":27979,"kson":27980,"Ġrecreate":27981,"153":27982,"Ġ164":27983,"ĠOlympia":27984,"ĠUnlimited":27985,"ĠShock":27986,"ĠTeaching":27987,"ĠHouses":27988,"resso":27989,"ĠMaw":27990,"Ġreplen":27991,"Ġprotestors":27992,"bey":27993,"Ġsurve":27994,"Ġemphasizes":27995,"223":27996,"ĠEsther":27997,"ĠNikol":27998,"Ġprosecutions":27999,"ĠFreed":28000,"Ġposs":28001,"OTE":28002,"ĠPrayer":28003,"Ġsquarely":28004,"Ġtir":28005,"adv":28006,"Ġbogus":28007,"Ġwrongful":28008,"Ġembell":28009,"Ġseldom":28010,"Ġpossesses":28011,"Er":28012,"ĠAlternatively":28013,"Ġinstituted":28014,"rr":28015,"Ġvocational":28016,"eval":28017,"ĠComics":28018,"Ġstumbling":28019,"335":28020,"Ġdragon":28021,"vine":28022,"services":28023,"Ġcrit":28024,"irens":28025,"Ġlayered":28026,"orb":28027,"Ġdominates":28028,"ĠMarx":28029,"period":28030,"avering":28031,"Ġbrigade":28032,"Ġchem":28033,"ĠEvolution":28034,"ĠSuk":28035,"Ġ209":28036,"ĠMalk":28037,"Ġtallest":28038,"recogn":28039,"ĠCraw":28040,"Ġell":28041,"ĠCaesar":28042,"php":28043,"ĠSurvivors":28044,"sd":28045,"itsch":28046,"ambo":28047,"Ġashore":28048,"acular":28049,"rost":28050,"Ġmurderer":28051,"Ġcasts":28052,"ĠEconomist":28053,"ĠWeapons":28054,"Ġnostalgic":28055,"Skip":28056,"REAM":28057,"Pa":28058,"Ġjournals":28059,"ĠSitting":28060,"Union":28061,"Att":28062,"ĠMaxim":28063,"Ġpurportedly":28064,"Ġrespecting":28065,"ĠMAX":28066,"seed":28067,"Ġjuicy":28068,"ĠGallup":28069,"Ġmileage":28070,"adier":28071,"Ġbod":28072,"DER":28073,"Ġsummers":28074,"icult":28075,"ipl":28076,"ĠDeng":28077,"Ġsmells":28078,"Ġivory":28079,"Ġ255":28080,"Id":28081,"DEN":28082,"Ġ159":28083,"Due":28084,"ĠLighting":28085,"ĠSurely":28086,"Ġsund":28087,"ĠKessler":28088,"immigrant":28089,"Ġtragedies":28090,"ĠOxy":28091,"ĠFixed":28092,"ĠBalk":28093,"Ġoriented":28094,"pher":28095,"Ġkitchens":28096,"Ġhips":28097,"Ġtweak":28098,"Ġtuna":28099,"ĠCla":28100,"Ġdislike":28101,"ussy":28102,"Ġoutnumbered":28103,"Ġplumbing":28104,"Ġcogn":28105,"ĠThrow":28106,"ĠTER":28107,"urally":28108,"ĠMurd":28109,"Ġcreamy":28110,"Ġresiding":28111,"otics":28112,"Ġfingerprints":28113,"!,":28114,"Ġpaused":28115,"ĠMilo":28116,"Ġhomosexuality":28117,"Ġresponsibly":28118,"iop":28119,"UCT":28120,"Ġsucceeds":28121,"ĠCRE":28122,"ĠThatcher":28123,"Ġcurrents":28124,"Ġarises":28125,"Ġwaterproof":28126,"Ġamp":28127,"ĠClaims":28128,"177":28129,"Ġsubpoen":28130,"Ġvig":28131,"ĠNeuro":28132,"Ġblur":28133,"ĠPaint":28134,"campus":28135,"Ġtoughness":28136,"ĠButton":28137,"Neal":28138,"ĠDEN":28139,"ĠNir":28140,"ĠAxel":28141,"EEP":28142,"Ġpint":28143,"Ġagile":28144,"odor":28145,"Ġessentials":28146,"ĠMov":28147,"ĠVenezuel":28148,"Ġexchanging":28149,"ĠNegative":28150,"Mil":28151,"Key":28152,"Ġbuzzing":28153,"ĠStew":28154,"Ġrebuke":28155,"Ġdepl":28156,"ĠKoz":28157,"Ġ163":28158,"Ġshines":28159,"NZ":28160,"Ġcarnage":28161,"cases":28162,"Ġwarmed":28163,"ĠGreenwich":28164,"College":28165,"Ġneedy":28166,"301":28167,"ĠMü":28168,"culation":28169,"Ġ440":28170,"425":28171,"atories":28172,"Ġsatisfactory":28173,"ĠFib":28174,"ĠElim":28175,"developed":28176,"Ġvacations":28177,"Ġpeculiar":28178,"Ġvets":28179,"onest":28180,"ĠPug":28181,"Ġlifestyles":28182,"zzi":28183,"Ġprovoke":28184,"bah":28185,"arger":28186,"ĠVirt":28187,"Sales":28188,"annel":28189,"ĠMeth":28190,"ivating":28191,"Ġrevoke":28192,"ĠAgenda":28193,"ĠIch":28194,"Ġsensit":28195,"ĠAzerbai":28196,"ĠBombay":28197,"Ġuncon":28198,"river":28199,"Ġapr":28200,"actic":28201,"ĠSubaru":28202,"Ġbanquet":28203,"Ġcontradict":28204,"tek":28205,"Football":28206,"igent":28207,"Ġreintrodu":28208,"ĠInsight":28209,"Ġsystematically":28210,"Ġboun":28211,"ĠFishing":28212,"Ġstri":28213,"ĠOB":28214,"Ġstair":28215,"Wall":28216,"ĠAllow":28217,"Ġcaramel":28218,"169":28219,"Ġcafes":28220,"Ġcalcium":28221,"Ġ169":28222,"Ġportraying":28223,"Ġdiscriminate":28224,"Ġunrestricted":28225,"Ġmant":28226,"Ġscarcity":28227,"Ġfeminism":28228,"ĠJJ":28229,"ĠOversight":28230,"ĠCue":28231,"Ġinexperienced":28232,"Ġdrafts":28233,"Ġ1939":28234,"nm":28235,"forest":28236,"ĠHonour":28237,"Ġceramic":28238,"Ġdownstairs":28239,"Ġboon":28240,"Ġmorality":28241,"Ġhorrifying":28242,"Rad":28243,"justice":28244,"Ġmosques":28245,"Ġcurfew":28246,"Ġsurrogate":28247,"Ġreimb":28248,"enth":28249,"pressure":28250,"beam":28251,"Ġwhirlwind":28252,"ĠRecession":28253,"ĠTours":28254,"Ġclusters":28255,"ĠQuant":28256,"Jonathan":28257,"project":28258,"Ġ777":28259,"ĠNOAA":28260,"abis":28261,"Ġdeficiencies":28262,"Ġsuicides":28263,"Ġfoothold":28264,"ĠYah":28265,"imeter":28266,"URN":28267,"Ġcultivate":28268,"Ġnoisy":28269,"Ġ1951":28270,"Ġpressuring":28271,"ĠDeals":28272,"ĠProphet":28273,"ĠWikipedia":28274,"INESS":28275,"ĠShine":28276,"ĠCalled":28277,"ĠSole":28278,"ĠZhou":28279,"Ġasphalt":28280,"armac":28281,"ĠScorp":28282,"ĠUnknown":28283,"ĠPAT":28284,"Heart":28285,"Ġguessed":28286,"Ġsushi":28287,"Ġheartbeat":28288,"Ġconcent":28289,"eret":28290,"plin":28291,"Ġweeds":28292,"Ġbombed":28293,"ĠTerrorism":28294,"Rich":28295,"Ġblades":28296,"Ġhaunt":28297,"Ġstorefront":28298,"Ġthwarted":28299,"access":28300,"ĠLydia":28301,"LINE":28302,"Ġpregnancies":28303,"Ġripping":28304,"ĠBelieve":28305,"spoken":28306,"inian":28307,"sed":28308,"ĠBrass":28309,"econom":28310,"current":28311,"Ġvoc":28312,"Ġmodeled":28313,"Ġpeppers":28314,"otech":28315,"ĠOption":28316,"Connell":28317,"isel":28318,"Ġcompel":28319,"Ġjuveniles":28320,"ĠNET":28321,"ĠEXP":28322,"Ġparadigm":28323,"Des":28324,"Ġ204":28325,"employed":28326,"Ġdurability":28327,"Ġ245":28328,"Ġbillionaires":28329,"violent":28330,"ĠCooperative":28331,"TOP":28332,"ĠGarry":28333,"ĠSoldiers":28334,"Ġdared":28335,"Ġvoucher":28336,"Ġblends":28337,"gue":28338,"Ġadventurous":28339,"Ġorganisms":28340,"Ġgaze":28341,"Ġcrap":28342,"Coach":28343,"omon":28344,"ĠWheels":28345,"ĠGrayson":28346,"Ġrecy":28347,"grave":28348,"Ġallergic":28349,"Ġreef":28350,"Ġbeginnings":28351,"ĠRuff":28352,"Ġclout":28353,"structed":28354,"315":28355,"ĠGeorgian":28356,"say":28357,"Ġsprings":28358,"ĠAsus":28359,"Ġrepaid":28360,"ĠGuys":28361,"ticket":28362,"Ġunb":28363,"ĠCertificate":28364,"ĠSTORY":28365,"cin":28366,"Ġpassions":28367,"Ġmediocre":28368,"Ġlackluster":28369,"vernight":28370,"kids":28371,"ĠWife":28372,"politics":28373,"ĠHimal":28374,"oddy":28375,"ensus":28376,"ĠGustav":28377,"binding":28378,"ĠIndividuals":28379,"Ġmaize":28380,"Ġhoop":28381,"ĠChanging":28382,"Ġlessen":28383,"Ġarranging":28384,"ĠFukushima":28385,"ĠTrying":28386,"ĠMage":28387,"Ġskeleton":28388,"ĠTec":28389,"289":28390,"Ġrecl":28391,"ĠFIL":28392,"Gs":28393,"ĠOdyssey":28394,"ĠProcessing":28395,"ilion":28396,"Ġsubsidized":28397,"Ġabdomen":28398,"Ġanalyse":28399,"music":28400,"clean":28401,"Ġunfinished":28402,"Ġdownloads":28403,"Ġmorally":28404,"Ġ218":28405,"Ġtrib":28406,"Keep":28407,"ĠSER":28408,"FY":28409,"Ġaust":28410,"Ġdiscovers":28411,"ĠGROUP":28412,"ĠMachines":28413,"Ġeroded":28414,"Ġominous":28415,"Ġbrightly":28416,"IME":28417,"Ġwicked":28418,"ĠTrou":28419,"Ġvisions":28420,"Kay":28421,"reported":28422,"Ġbog":28423,"ĠQuin":28424,"ĠSigma":28425,"urned":28426,"ixon":28427,"Ġharming":28428,"Ġcheckout":28429,"inet":28430,"much":28431,"Ġcherish":28432,"ĠByrd":28433,"ĠSamson":28434,"WP":28435,"orders":28436,"boa":28437,"Ġbron":28438,"oki":28439,"ĠRR":28440,"Ġsuitcase":28441,"Ġfeathers":28442,"ĠChristy":28443,"Islamic":28444,"Ġamusement":28445,"ĠISS":28446,"intensive":28447,"Qaida":28448,"Ġneurons":28449,"Ġwagon":28450,"ĠTek":28451,"Ġdolls":28452,"ĠShoot":28453,"Ġunderestimate":28454,"Ġstreamlined":28455,"Ġfractures":28456,"Ġcathedral":28457,"Ġeliminates":28458,"helle":28459,"Ġcitrus":28460,"risis":28461,"Ġimpecc":28462,"istries":28463,"ĠHog":28464,"vote":28465,"pas":28466,"Ġassign":28467,"ĠSongs":28468,"ĠMiracle":28469,"kas":28470,"zynski":28471,"Ġcrane":28472,"Ġadulthood":28473,"ĠBenefit":28474,"ĠGrimes":28475,"Ġpayday":28476,"ablished":28477,"Ġcenterpiece":28478,"Ġhassle":28479,"ĠAppalachian":28480,"follow":28481,"Ġ290":28482,"ĠRL":28483,"ĠDoe":28484,"Ġacclaim":28485,"Ġlevied":28486,"Ġtossing":28487,"Ġcarrots":28488,"ĠDarius":28489,"161":28490,"Ġoffspring":28491,"ĠJury":28492,"ĠTPP":28493,"CAP":28494,"Ġenvironmentalists":28495,"Ġrays":28496,"267":28497,"Ser":28498,"Ġcaptivity":28499,"Ġappellate":28500,"ĠElectricity":28501,"ĠEnough":28502,"232":28503,"Ġfisher":28504,"Ġbrilliance":28505,"Ġpraises":28506,"aunch":28507,"Ġsolicitation":28508,"Ġadolescent":28509,"Ġinferior":28510,"checks":28511,"Set":28512,"Ġmutations":28513,"ĠLatinos":28514,"ĠLicense":28515,"ĠAme":28516,"hirt":28517,"ĠChun":28518,"Ġdeeds":28519,"ldon":28520,"Ġmammoth":28521,"Ġturtle":28522,"rule":28523,"Ken":28524,"Ġvoyage":28525,"gram":28526,"Ġconquer":28527,"Ġretaliate":28528,"ĠPJ":28529,"ĠViking":28530,"Ġsafegu":28531,"ordinary":28532,"ĠArbit":28533,"ĠDigest":28534,"Die":28535,"Ġbureaucratic":28536,"Ġhonorable":28537,"Ġcafeteria":28538,"ĠRAF":28539,"ĠPlaces":28540,"ĠKlu":28541,"Cam":28542,"ĠBiology":28543,"ĠCycling":28544,"imore":28545,"Ġstripping":28546,"Ġwarriors":28547,"Ġbursting":28548,"Ġlapse":28549,"Ġversa":28550,"Ġclicked":28551,"ogh":28552,"Ġ\"â̦":28553,"Ġdiligently":28554,"ĠMiy":28555,"ĠCorpus":28556,"Ġredef":28557,"Ġ176":28558,"ĠInstrument":28559,"ĠOECD":28560,"Ġstro":28561,"Ġmicrowave":28562,"Santa":28563,"Ġpars":28564,"Social":28565,"iffe":28566,"itability":28567,"Equ":28568,"Ġnud":28569,"legged":28570,"ĠTud":28571,"lav":28572,"Ġinterpreter":28573,"alcohol":28574,"Ġimposition":28575,"Ġdwelling":28576,"Ġ1400":28577,"].\"":28578,"ĠIw":28579,"RM":28580,"Ġ555":28581,"Ġparalyzed":28582,"mind":28583,"rans":28584,"adin":28585,"French":28586,"Ġliar":28587,"Represent":28588,"Ġstrapped":28589,"orate":28590,"Ġrigging":28591,"Ġinterrog":28592,"Ġsparse":28593,"ento":28594,"ĠThem":28595,"Ġbaseless":28596,"Ġbuildup":28597,"Ġundecided":28598,"isms":28599,"Ġabduct":28600,"Ġflowed":28601,"Ġprestige":28602,"Ġhacks":28603,"Ġpanicked":28604,"Cast":28605,"ĠKrish":28606,"umat":28607,"Ġantique":28608,"Ġbitters":28609,"Ġentitlement":28610,"Ġstandby":28611,"Ten":28612,"said":28613,"ĠConditions":28614,"events":28615,"Ġobey":28616,"Ġshortest":28617,"etting":28618,"Ġconcentrating":28619,"ĠNeeds":28620,"234":28621,"Ġintrigued":28622,"enting":28623,"ĠXen":28624,"ĠAlger":28625,"seekers":28626,"anish":28627,"Ġ172":28628,"âĢij":28629,"Ġsilicon":28630,"Ġstandardized":28631,"ĠFountain":28632,"essel":28633,"Ġapproves":28634,"Ġsucked":28635,"gone":28636,"ĠBriggs":28637,"brother":28638,"Ġartisan":28639,"ĠContinuing":28640,"vir":28641,"Ġsubmarines":28642,"ĠInk":28643,"program":28644,"ĠNexus":28645,"ĠCoco":28646,"Ġconceptual":28647,"Ġmatt":28648,"aughters":28649,"Ġbaths":28650,"Ġbeaut":28651,"ĠEmerald":28652,"ĠParties":28653,"248":28654,"completely":28655,"esan":28656,"Ġdiarrhea":28657,"Ġ1100":28658,"borg":28659,"ĠBroken":28660,"Ġreiterate":28661,"Ġsorting":28662,"ONS":28663,"Ġ177":28664,"Ġadmin":28665,"ĠMandatory":28666,"Ġsymptom":28667,"Ġpaced":28668,"Remember":28669,"Ġabdominal":28670,"Ġswapped":28671,"Ġtransitions":28672,"IFA":28673,"pretty":28674,"ĠJC":28675,"Ġallotted":28676,"ĠShows":28677,"Arthur":28678,"Ġsoften":28679,"dozen":28680,"Mah":28681,"Ġextinguished":28682,"Ġreelection":28683,"Ġdeployments":28684,"Ġsturdy":28685,"Ġdownright":28686,"Ġjams":28687,"ĠOptim":28688,"Ġhumiliation":28689,"cd":28690,"Ġbunk":28691,"sie":28692,"NAT":28693,"ilies":28694,"Ġimplying":28695,"Ġ<":28696,"Ġhomepage":28697,"242":28698,"Ġey":28699,"Ġdict":28700,"Ġslender":28701,"Ġforehead":28702,"ĠCecil":28703,"Ġshrunk":28704,"ĠExit":28705,"Ġexpressly":28706,"Ġseals":28707,"ĠThiel":28708,"umni":28709,"Ġdamning":28710,"ĠVS":28711,"ulum":28712,"BBC":28713,"URES":28714,"Ġinhal":28715,"Ġfont":28716,"Ġworkplaces":28717,"ĠPUBLIC":28718,"ĠHorror":28719,"Bs":28720,"arta":28721,"ĠBread":28722,"Ġstret":28723,"Ġethos":28724,"Ġstabilized":28725,"Ġconvers":28726,"ĠInqu":28727,"Ġjudgments":28728,"ĠContemporary":28729,"221":28730,"Ġzombie":28731,"VD":28732,"Ġmisunderstanding":28733,"Ġspam":28734,"ĠPapers":28735,"Ġcrocod":28736,"ENA":28737,"ĠJuven":28738,"ĠAbram":28739,"Ġbursts":28740,"atto":28741,"Ġturbulence":28742,"tty":28743,"sexual":28744,"Ġwaning":28745,"community":28746,"Government":28747,"Ġtranspl":28748,"??":28749,"Getting":28750,"ĠRare":28751,"prime":28752,"Ġlooting":28753,"Ġvalidate":28754,"ĠCreating":28755,"ĠCorruption":28756,"Ġspit":28757,"ĠFavorite":28758,"Kar":28759,"Ġadaptive":28760,"ĠART":28761,"Ġtorso":28762,"ĠIdent":28763,"Ġsubdivision":28764,"azo":28765,"Ġconsequently":28766,"Ġrotate":28767,"ĠWit":28768,"Ġestab":28769,"managed":28770,"ĠBound":28771,"Ġskim":28772,"198":28773,"ĠCorona":28774,"ĠâĿ":28775,"Ġwording":28776,"buck":28777,"iph":28778,"patrick":28779,"Help":28780,"flying":28781,"Ġracer":28782,"Ġfisherman":28783,"____":28784,"ackers":28785,"Ġpersisted":28786,"Ġmyths":28787,"Ġgarn":28788,"ologue":28789,"ĠApprentice":28790,"Ġhereby":28791,"Ġvulgar":28792,"ĠGinger":28793,"Ġtrait":28794,"ĠIdea":28795,"Ġfigur":28796,"ĠSchwarzenegger":28797,"ĠSafari":28798,"178":28799,"ĠAsians":28800,"775":28801,"ĠTriangle":28802,"Ġdemons":28803,"ĠOv":28804,"Ġanime":28805,"Broad":28806,"Ġmolecule":28807,"Ġdeposition":28808,"Ġbiodiversity":28809,"modern":28810,"Ġwallets":28811,"NH":28812,"planes":28813,"rats":28814,"ĠSeed":28815,"Ġ174":28816,"umed":28817,"Ġtouting":28818,"gre":28819,"ĠSEAL":28820,"Ġperpetrator":28821,"ĠGerrard":28822,"Ġallocations":28823,"Ġworsh":28824,"payment":28825,"bett":28826,"ĠIssues":28827,"ennis":28828,"eering":28829,"ĠMV":28830,"yi":28831,"hak":28832,"Ġ167":28833,"Ġorchestr":28834,"224":28835,"Ġsup":28836,"Ġleukemia":28837,"osures":28838,"575":28839,"Ġnoticeably":28840,"Ġparamilitary":28841,"ĠTHERE":28842,"Ġwaged":28843,"igrated":28844,"Ġdocumentaries":28845,"Ġsenseless":28846,"Ġbark":28847,"Ġgenetics":28848,"ĠAlbania":28849,"ĠCrypt":28850,"ĠSEO":28851,"Ġnightly":28852,"Ġfaults":28853,"279":28854,"ĠFerdinand":28855,"ĠSylv":28856,"Ġcalam":28857,"ĠMuller":28858,"ĠSpielberg":28859,"Boy":28860,"ĠUrs":28861,"Ġrug":28862,"Ġcolonies":28863,"ĠFunk":28864,"Ġlyric":28865,"ĠATT":28866,"anni":28867,"ĠNB":28868,"Ġthorn":28869,"Ġpertinent":28870,"188":28871,"Ġpartic":28872,"Head":28873,"Pad":28874,"Palestinian":28875,"ĠBarg":28876,"anical":28877,"beaut":28878,"onge":28879,"Ġgigantic":28880,"travel":28881,"Ġdownloading":28882,"Contin":28883,"whe":28884,"plane":28885,"Wil":28886,"IDA":28887,"Ele":28888,"ĠPAL":28889,"Ġbeams":28890,"ĠProud":28891,"ramer":28892,"Ġindependents":28893,"Ġtranslator":28894,"ĠBrah":28895,"ĠTrooper":28896,"aylor":28897,"pson":28898,"Ġguise":28899,"Ġdiffering":28900,"Ġtopple":28901,"ichen":28902,"ĠSeymour":28903,"deg":28904,"ĠMixed":28905,"Ġinvoluntary":28906,"Ġcountdown":28907,"ĠNarc":28908,"ĠAdults":28909,"Ġcoaster":28910,"Ġ342":28911,"ĠAcquisition":28912,"mone":28913,"Ġpenchant":28914,"Brian":28915,"Gh":28916,"Pres":28917,"enei":28918,"Ġreefs":28919,"ĠMaver":28920,"Ġdevised":28921,"ĠIMP":28922,"vict":28923,"Ġagility":28924,"ĠPayments":28925,"respected":28926,"Ġtuning":28927,"ĠFACE":28928,"actions":28929,"Ġyell":28930,"ĠLeaving":28931,"Ġsnowy":28932,"Saudi":28933,"Ġformations":28934,"Ġairborne":28935,"Ġdeed":28936,"ooks":28937,"Ġnamesake":28938,"Ġpunishable":28939,"Ġagg":28940,"oths":28941,"ĠFamous":28942,"ĠDeposit":28943,"Ġinduce":28944,"189":28945,"Ġhesitation":28946,"ĠBrowse":28947,"ople":28948,"reys":28949,"henko":28950,"Ġsecretaries":28951,"Ġintersections":28952,"Ġdiminishing":28953,"ints":28954,"Ġ1934":28955,"ĠInvestigative":28956,"ĠMexicans":28957,"ĠMahar":28958,"ibur":28959,"Ġstocking":28960,"gross":28961,"Ġasbestos":28962,"Ġagitation":28963,"ĠBST":28964,"Overall":28965,"Ġheats":28966,"ĠSpan":28967,"Ġimped":28968,"Ġtrusting":28969,"Pet":28970,"Ġegregious":28971,"Ġcomedians":28972,"zin":28973,"WIN":28974,"Ġchats":28975,"Ġexploding":28976,"ĠTort":28977,"Ġembraces":28978,"Ġneut":28979,"verson":28980,"ouncing":28981,"ĠFiber":28982,"Ġbaker":28983,"Ġunstoppable":28984,"ĠDial":28985,"cars":28986,"Marc":28987,"164":28988,"volt":28989,"Ġceased":28990,"EFF":28991,"Ġpromoters":28992,"Ġcircuits":28993,"Ġexcise":28994,"Ġseminars":28995,"ĠTiny":28996,"ĠImportant":28997,"ĠTup":28998,"Ġoutburst":28999,"ĠSOC":29000,"ĠWWII":29001,"Ġmerging":29002,"highly":29003,"ĠGmail":29004,"ozy":29005,"ĠKB":29006,"Ġlaboratories":29007,"knit":29008,"ĠClosed":29009,"Ġsurrounds":29010,"ĠVet":29011,"Ġcere":29012,"vard":29013,"ĠDeadpool":29014,"text":29015,"Ġinfusion":29016,"Ġcuc":29017,"ĠAtl":29018,"Ġbustling":29019,"ĠSettings":29020,"Ġ193":29021,"ryan":29022,"184":29023,"186":29024,"Ġswat":29025,"rane":29026,"Ġepidem":29027,"lando":29028,"Ġtestifying":29029,"Ġmoistur":29030,"ĠTens":29031,"Ġexemplary":29032,"ĠPump":29033,"Ġforcefully":29034,"ĠFare":29035,"Ġcomplicate":29036,"Fe":29037,"Di":29038,"ĠThy":29039,"Ġcompartment":29040,"ĠFiesta":29041,"Would":29042,"fitted":29043,"Ġcull":29044,"Ġcomedic":29045,"cyl":29046,"Ġwhichever":29047,"stic":29048,"Ġ213":29049,"Ġspills":29050,"Ġplasma":29051,"Ġdisguise":29052,"ĠCompass":29053,"ĠImmun":29054,"Ġscarf":29055,"Ġdisperse":29056,"Ġreckon":29057,"ĠTaste":29058,"root":29059,"ĠGAME":29060,"xx":29061,"Ġhomophobic":29062,"Ġdimin":29063,"/#":29064,"Ġ178":29065,"Ġgems":29066,"lio":29067,"informed":29068,"ample":29069,"XT":29070,"Ġrepression":29071,"ĠTakes":29072,"Ġhabitats":29073,"Ġmountainous":29074,"ĠMcH":29075,"ENC":29076,"Mobil":29077,"Ġreel":29078,"ĠTI":29079,"Ġauthorize":29080,"ĠAccept":29081,"ĠMetall":29082,"CCC":29083,"Ġwetlands":29084,"ĠWitch":29085,"heading":29086,"Ġintervals":29087,"ĠWitt":29088,"hene":29089,"Ġcomforting":29090,"ollen":29091,"ERN":29092,"ooky":29093,"etch":29094,"Ġassailant":29095,"announced":29096,"elin":29097,"plate":29098,"920":29099,"eating":29100,"induced":29101,"ĠIgor":29102,"ĠAmph":29103,"Ġpatented":29104,"posing":29105,"Ġextraordinarily":29106,"Ġfearless":29107,"mortem":29108,"ĠDraw":29109,"ĠRend":29110,"Son":29111,"ridden":29112,"ĠAdvantage":29113,"Ġ305":29114,"Ġroared":29115,"Str":29116,"Ġradioactive":29117,"Ġslur":29118,"ĠRear":29119,"affles":29120,"ĠPon":29121,"Ġost":29122,"umbs":29123,"ĠSlack":29124,"athom":29125,"baby":29126,"213":29127,"ĠSpending":29128,"ĠAccordingly":29129,"Ġclocks":29130,"archs":29131,"Ġsmugg":29132,"Ġmastermind":29133,"ĠKlaus":29134,"alpha":29135,"Ġspoiled":29136,"264":29137,"Pod":29138,"Ġflared":29139,"Ġcomposure":29140,"ĠCAM":29141,"Ġrestruct":29142,"Ġtasted":29143,"ĠKimber":29144,"Ġupheaval":29145,"CHAR":29146,"ĠGeo":29147,"itations":29148,"Ġbegged":29149,"UX":29150,"Authorities":29151,"ĠEngel":29152,"ĠHOME":29153,"Ġratt":29154,"Ġquickest":29155,"475":29156,"ĠSting":29157,"ĠICO":29158,"yu":29159,"Ġdefy":29160,"Prince":29161,"cards":29162,"Ġovertake":29163,"Ġretrieved":29164,"ĠNavajo":29165,"Ġpastry":29166,"ĠLange":29167,"Ġentrusted":29168,"ĠCull":29169,"aler":29170,"Ġdinosaurs":29171,"Ġbragging":29172,"ĠAlley":29173,"meier":29174,"ĠAssuming":29175,"Ġana":29176,"omatic":29177,"Brend":29178,"acted":29179,"Ġexhaustive":29180,"Ġunfit":29181,"Several":29182,"gap":29183,"Ġtet":29184,"228":29185,"Sk":29186,"302":29187,"Ġdeflect":29188,"Ġ179":29189,"226":29190,"Ġadorned":29191,"ĠSpread":29192,"Ġthirds":29193,"ĠSemi":29194,"Ġdescend":29195,"Ġaccumulate":29196,"Ġflavours":29197,"Ġinvoked":29198,"ĠAnge":29199,"Ġprofess":29200,"unks":29201,"ĠKickstarter":29202,"ENTS":29203,"ĠRw":29204,"Ġchatter":29205,"ĠPOS":29206,"Ġcollaborators":29207,"ĠEW":29208,"ĠMarkus":29209,"Ġimpair":29210,"Ġbolt":29211,"Ġglue":29212,"Ġloosely":29213,"ĠSUM":29214,"Ġhydraulic":29215,"Ġpredatory":29216,"Charles":29217,"cond":29218,"Ġspawned":29219,"Fr":29220,"174":29221,"Ġtame":29222,"Ġaggrav":29223,"Ġchrist":29224,"true":29225,"ivable":29226,"Ġhen":29227,"ĠKut":29228,"Ġskyrocket":29229,"Ġeg":29230,"Ġveterinarian":29231,"ĠStats":29232,"Kit":29233,"Ġbiologist":29234,"Spe":29235,"Ġantenna":29236,"Ġsust":29237,"fill":29238,"Ġpayload":29239,"227":29240,"Ġlivestream":29241,"ORN":29242,"ĠAbel":29243,"Ġdeception":29244,"ussen":29245,"Britain":29246,"partisan":29247,"Ġbrowse":29248,"Ġmelan":29249,"172":29250,"ĠNumerous":29251,"ĠMansion":29252,"Ġassailants":29253,"£":29254,"olerance":29255,"Ġdirectives":29256,"ĠInteg":29257,"zers":29258,"Ġduct":29259,"ĠHonestly":29260,"ĠImmediately":29261,"ixty":29262,"Ġdiagnose":29263,"Ġimplication":29264,"ĠiPads":29265,"testers":29266,"riots":29267,"Ġrespons":29268,"XP":29269,"pes":29270,"875":29271,"Ġ199":29272,"ĠPoe":29273,"303":29274,"Ġailments":29275,"ĠCarrier":29276,"Ġeject":29277,"Ġrestroom":29278,"Drive":29279,"manufact":29280,"Ġcompens":29281,"Ġglossy":29282,"Ġrecovers":29283,"Ġthinner":29284,"Ġdescendants":29285,"antle":29286,"Beaut":29287,"competitive":29288,"ĠRobotics":29289,"Ġpretext":29290,"233":29291,"Ġflanked":29292,"ĠâĻ":29293,"Ġguts":29294,"Ġwee":29295,"Ġaccents":29296,"mc":29297,"Ġgrapp":29298,"ĠNathaniel":29299,"ĠMikhail":29300,"Ġobligated":29301,"Ġmanoeuv":29302,"Ġechoing":29303,"Ġ189":29304,"ĠDevice":29305,"isd":29306,"Ġloopholes":29307,"Ġbehold":29308,"ĠMerry":29309,"Ġfunn":29310,"Ġnuanced":29311,"667":29312,"ELY":29313,"ĠTasmania":29314,"ĠSaddam":29315,"Ġquizz":29316,"military":29317,"cient":29318,"Ġoutlaw":29319,"ĠAudit":29320,"ĠBoom":29321,"Ġcrim":29322,"asured":29323,"ĠApps":29324,"ĠKush":29325,"onica":29326,"Ġamput":29327,"signed":29328,"ĠMEN":29329,"ĠRosenberg":29330,"Ġvide":29331,"ĠDirection":29332,"Ġfountain":29333,"TW":29334,"ĠCARE":29335,"Ġreassured":29336,"Food":29337,"Ġdepressing":29338,"ĠWhilst":29339,"reatment":29340,"Ġspelled":29341,"Ġhipp":29342,"ĠPeach":29343,"hound":29344,"Harry":29345,"Ġcatalogue":29346,"ĠCommun":29347,"Ġnurture":29348,"rush":29349,"ĠPopulation":29350,"ĠNTS":29351,"ĠElectrical":29352,"rounded":29353,"Ġblending":29354,"Ġ223":29355,"alities":29356,"ilation":29357,"eas":29358,"estate":29359,"Ġnarrowing":29360,"ĠTreasure":29361,"192":29362,"Ġwhims":29363,"Ġrobber":29364,"Ġsoaked":29365,"nian":29366,"Ġcongest":29367,"ĠYosemite":29368,"notes":29369,"icer":29370,"ĠGuardians":29371,"ĠFrozen":29372,"Ġ187":29373,"Ġhandcuffs":29374,"Someone":29375,"Ġenshr":29376,"gency":29377,"ĠCube":29378,"Ġprinters":29379,"Ġundercut":29380,"ĠSolution":29381,"rosis":29382,"ĠHumanity":29383,"Ġsucks":29384,"ĠSick":29385,"Tax":29386,"Ġtablespoon":29387,"ĠTrin":29388,"ĠArchive":29389,"Mom":29390,"ĠSAY":29391,"Ġdrifting":29392,"ĠFarage":29393,"Ġforging":29394,"WM":29395,"ĠEleanor":29396,"USH":29397,"Ġemph":29398,"Ġcareless":29399,"Ġspew":29400,"Ġinsensitive":29401,"Ġawhile":29402,"Ġcit":29403,"opened":29404,"ĠFem":29405,"Ġvapor":29406,"Ġdownt":29407,"ylene":29408,"Ġclut":29409,"Ġculp":29410,"1990":29411,"Ġdisgruntled":29412,"Students":29413,"uttering":29414,"gyn":29415,"vre":29416,"Ġrapes":29417,"division":29418,"ĠCalendar":29419,"tal":29420,"icts":29421,"caliber":29422,"ĠFighters":29423,"ĠUnc":29424,"163":29425,"ĠRogue":29426,"Ġregistrations":29427,"Ġundermines":29428,"ĠPunch":29429,"Ġdramas":29430,"176":29431,"Ġslider":29432,"ĠFlore":29433,"ر":29434,"Ġbru":29435,"inelli":29436,"Ġdisparities":29437,"ا":29438,"Ġreferrals":29439,"ĠCharges":29440,"Ġbreeds":29441,"ĠMEP":29442,"288":29443,"Ġmouths":29444,"Ġsideways":29445,"Ġbelievers":29446,"ppard":29447,"Ġhotter":29448,"Ġunderestimated":29449,"Ġjelly":29450,"525":29451,"ĠCMS":29452,"ĠWeiner":29453,"Ġguarding":29454,"Ġampl":29455,"ĠKidd":29456,"UF":29457,"orient":29458,"max":29459,"Ash":29460,"Ġwander":29461,"Ġ..........":29462,"ĠDempsey":29463,"ĠToken":29464,"chat":29465,"Justin":29466,"equipped":29467,"ĠBI":29468,"Ġsins":29469,"Ġnond":29470,"ursion":29471,"Ġcoc":29472,"Ġmailing":29473,"ĠArchitect":29474,"Ġhaunting":29475,"Ġpont":29476,"Ġascertain":29477,"Ġwig":29478,"Ġskysc":29479,"Ġarg":29480,"ĠItalians":29481,"/?":29482,"Ġ----------------------------------------------------------------":29483,"ĠPrecision":29484,"EPA":29485,"Ġhotly":29486,"Ġcircumvent":29487,"ĠEcc":29488,"Ġmerch":29489,"akov":29490,"Ġunab":29491,"heres":29492,"Ġsubcommittee":29493,"ĠDiscuss":29494,"ĠChallenger":29495,"crafted":29496,"Ġcanine":29497,"osphere":29498,"Ġspider":29499,"Ġteachings":29500,"atos":29501,"Ġuniversally":29502,"Ġturbine":29503,"ĠLO":29504,"ĠMAG":29505,"Ġpassers":29506,"Ġroundup":29507,"Ġdenounce":29508,"ĠSpiegel":29509,"until":29510,"Ġshaved":29511,"Ġdisdain":29512,"Nazi":29513,"Ġnewfound":29514,"Ġspontaneous":29515,"Ġmash":29516,"ĠDispatch":29517,"Ġsunrise":29518,"ogged":29519,"Ġfuss":29520,"Ġeas":29521,"acci":29522,"ĠTarg":29523,"Ġhash":29524,"lict":29525,"Ġmisc":29526,"ĠSched":29527,"guy":29528,"linger":29529,"warm":29530,"ipel":29531,"ĠGork":29532,"Ġdispatcher":29533,"Ġ315":29534,"Ġfinely":29535,"Ġreliably":29536,"Ġrupt":29537,"Ġnegligent":29538,"Ġendorsements":29539,"ĠOrient":29540,"Ġelectro":29541,"haired":29542,"Ġphysique":29543,"wine":29544,"Ġadolescents":29545,"Ġ184":29546,"alth":29547,"Ġvalidated":29548,"izzard":29549,"ĠPeck":29550,"Ġemblem":29551,"status":29552,"ĠJungle":29553,"orius":29554,"Ġeccentric":29555,"Ġfolding":29556,"poor":29557,"ĠTHC":29558,"appers":29559,"Ġscripted":29560,"239":29561,"ĠPreferred":29562,"digital":29563,"Ġsharper":29564,"Ġportrays":29565,"rative":29566,"238":29567,"Ġ183":29568,"Ġuneasy":29569,"ĠRI":29570,"Ġvil":29571,"171":29572,"Ġspoil":29573,"ĠPricing":29574,"ĠHardware":29575,"Ġ188":29576,"Ġhorrendous":29577,"Ġostensibly":29578,"nah":29579,"Ġgadget":29580,"ADS":29581,"coat":29582,"Ġexhausting":29583,"Ġdraining":29584,"arate":29585,"ĠBulgarian":29586,"emo":29587,"Ġhier":29588,"Ġguitars":29589,"ieties":29590,"assed":29591,"ĠYaz":29592,"Ġaggress":29593,"ĠBG":29594,"vik":29595,"Ġneatly":29596,"Ġpixel":29597,"Ġintimacy":29598,"ĠRug":29599,"Ġ512":29600,"Ġnarrated":29601,"Ġmast":29602,"ĠNos":29603,"ĠHung":29604,"reciation":29605,"ĠChandra":29606,"Ġbios":29607,"ĠEnded":29608,"lique":29609,"ĠCambod":29610,"Ġworrisome":29611,"ĠEQ":29612,"Ġnovelist":29613,"ĠDynamic":29614,"ĠMIC":29615,"Ġdisposed":29616,"Ġbrackets":29617,"Ġhaircut":29618,"ĠLana":29619,"Ġlull":29620,"Ġbillboard":29621,"ĠReverend":29622,"ĠNAV":29623,"borgh":29624,"Ġadrenaline":29625,"Ġseeming":29626,"ĠPCB":29627,"ĠBridgewater":29628,"Ġsquirrel":29629,"262":29630,"write":29631,"Ġstabilization":29632,"wild":29633,"Ġsecession":29634,"Ġpacket":29635,"AMES":29636,"licted":29637,"Ġmalnutrition":29638,"claimed":29639,"Ġcharred":29640,"Ġtragically":29641,"Published":29642,"Ġrepealed":29643,"ĠSawyer":29644,"ĠMormon":29645,"resolution":29646,"ĠSaud":29647,"Henry":29648,"Ġdiscontin":29649,"Ġsnag":29650,"danger":29651,"Ġmixes":29652,"Ġupbringing":29653,"Ġlimb":29654,"ĠFantastic":29655,"Sim":29656,"ĠAugustine":29657,"ĠGreeks":29658,"cod":29659,"ĠHistorically":29660,"mire":29661,"register":29662,"ĠKund":29663,"Ġdebilitating":29664,"Chat":29665,"ĠTau":29666,"ï":29667,"lower":29668,"pie":29669,"Ġ430":29670,"Ġnascent":29671,"Ġ375":29672,"Ġbum":29673,"WI":29674,"Netflix":29675,"whether":29676,"Ġdearly":29677,"eff":29678,"PRES":29679,"Ġlandmarks":29680,"Ġculminating":29681,"Ġmigrate":29682,"balanced":29683,"Ġregulars":29684,"Ġmodification":29685,"Ġdips":29686,"ĠRedmond":29687,"ationally":29688,"atsu":29689,"Ġphilosophical":29690,"Ġtyping":29691,"Ġunreal":29692,"Ġboiled":29693,"Ġblight":29694,"Ġdru":29695,"ĠGaddafi":29696,"Ġnour":29697,"Ġsequential":29698,"Ġaugment":29699,"ĠEuras":29700,"ĠWiley":29701,"endar":29702,"Ġacronym":29703,"esteem":29704,"ĠMajesty":29705,"Ġgrips":29706,"Ġobsolete":29707,"nos":29708,"Made":29709,"ogie":29710,"ĠLiver":29711,"ĠDonetsk":29712,"Ġdynam":29713,"tel":29714,"bring":29715,"Ġknit":29716,"Ġfirepower":29717,"Ġprepaid":29718,"ĠRaphael":29719,"Ġsensing":29720,"720":29721,"WN":29722,"Nor":29723,"puted":29724,"Ġbureaucrats":29725,"ĠAdjust":29726,"Ġintensely":29727,"Ġsunscreen":29728,"Ho":29729,"ĠYelp":29730,"ĠPU":29731,"ĠSerge":29732,"ĠCyp":29733,"ELF":29734,"ĠGuns":29735,"Ġteamwork":29736,"ĠBib":29737,"ĠMaintenance":29738,"perate":29739,"Ġwiping":29740,"Ġcharcoal":29741,"ordan":29742,"International":29743,"Ġbehaving":29744,"Ġsoftened":29745,"ĠIncreased":29746,"Ġunfl":29747,"470":29748,"Ġinformative":29749,"Ġnovelty":29750,"Ġavoidance":29751,"Ġteasing":29752,"matic":29753,"Ġmaid":29754,"ĠPell":29755,"Ġcounterterrorism":29756,"ĠGabe":29757,"ications":29758,"ĠConnection":29759,"ĠInquiry":29760,"isin":29761,"orama":29762,"Ġcorpse":29763,"Ġpractitioner":29764,"itto":29765,"UA":29766,"Ġforestry":29767,"Ġlic":29768,"Ġrevolves":29769,"Ġcalculating":29770,"Ġpuppet":29771,"ulously":29772,"ĠPebble":29773,"Dep":29774,"Ġupholding":29775,"Ġcarving":29776,"Ġwartime":29777,"Ġenvy":29778,"Ġencro":29779,"ĠPunk":29780,"ĠAdminist":29781,"ucha":29782,"Ġbattleground":29783,"Ġlol":29784,"uable":29785,"Ġunheard":29786,"ĠSpur":29787,"phony":29788,"Ġcarc":29789,"ĠSut":29790,"Ġpollutants":29791,"Cr":29792,"Ġvigorous":29793,"355":29794,"ĠMarriage":29795,"Ġstaffed":29796,"fecture":29797,"ĠArabs":29798,"supported":29799,"Ġmanpower":29800,"ĠSatellite":29801,"None":29802,"Ġqueues":29803,"Ġinsightful":29804,"Ġinterchange":29805,"Rel":29806,"Ġsolemn":29807,"Ġsmuggled":29808,"upt":29809,"Ġ171":29810,"Ġparallels":29811,"intelligence":29812,"punk":29813,"Ġrecycle":29814,"Ġdecorative":29815,"Ġshar":29816,"arrell":29817,"iances":29818,"ĠBolivia":29819,"Ġstrengthens":29820,"430":29821,"Ġhardships":29822,"Ġsignalling":29823,"Ġunthinkable":29824,"READ":29825,"Ġtad":29826,"picked":29827,"Ġarmor":29828,"Ġcores":29829,"ĠMatrix":29830,"Ġdj":29831,"Ġevolutionary":29832,"ĠBermuda":29833,"OE":29834,"organized":29835,"Ġrelentlessly":29836,"sol":29837,"ĠMamm":29838,"Ġpounding":29839,"Weather":29840,"Ġrab":29841,"Ġsweets":29842,"funding":29843,"ĠHUD":29844,"ĠSoldier":29845,"reed":29846,"released":29847,"Ġcontainment":29848,"alid":29849,"ĠNikon":29850,"Ġcervical":29851,"Ġign":29852,"Ġalias":29853,"Ġoptimized":29854,"Ġasserting":29855,"ĠAFTER":29856,"Ġflatt":29857,"Ġdinosaur":29858,"ĠRefugees":29859,"ĠAnch":29860,"Ġadjustable":29861,"Ġroaring":29862,"Ġpilgrimage":29863,"Ġcowboy":29864,"Ġentails":29865,"ractions":29866,"EY":29867,"undy":29868,"ĠKuh":29869,"inges":29870,"ĠTerra":29871,"ĠEscape":29872,"Ġrundown":29873,"Ġstriped":29874,"KN":29875,"ocations":29876,"IDENT":29877,"IGH":29878,"Ġavoids":29879,"Moh":29880,"ĠLS":29881,"lbs":29882,"ĠAttempt":29883,"Ġtriangle":29884,"Ġclimax":29885,"Ġhp":29886,"Ġallot":29887,"learning":29888,"ĠJFK":29889,"Justice":29890,"OUT":29891,"ĠHER":29892,"ĠLect":29893,"Ġtrench":29894,"edar":29895,"Ġreservoirs":29896,"uid":29897,"rf":29898,"162":29899,"Ġinterfered":29900,"Ġemit":29901,"these":29902,"444":29903,"ĠLeather":29904,"essing":29905,"ĠEighth":29906,"uckle":29907,"Breaking":29908,"Ġunresolved":29909,"Ġgoose":29910,"252":29911,"platform":29912,"atus":29913,"Ġcomplexion":29914,"ĠBUS":29915,"Ġstruct":29916,"middle":29917,"Sat":29918,"ĠWHERE":29919,"LB":29920,"redible":29921,"vered":29922,"Louis":29923,"ĠBaz":29924,"Eye":29925,"safety":29926,"Ġhypothetical":29927,"Ġbowel":29928,"Ġuntouched":29929,"312":29930,"ĠPric":29931,"Ġastounding":29932,"meet":29933,"Aaron":29934,"ĠWoo":29935,"236":29936,"ĠShape":29937,"Ġdrifted":29938,"Ġtile":29939,"ĠGrim":29940,"Ġundeniable":29941,"Ġ..":29942,"Ġradius":29943,"Ġovarian":29944,"ĠSeriously":29945,"verning":29946,"Ġassertions":29947,"oxic":29948,"231":29949,"ĠViz":29950,"Jackson":29951,"ĠSno":29952,"Ġboycot":29953,"okingly":29954,"ousse":29955,"proclaimed":29956,"Ġblazing":29957,"Ġinefficient":29958,"Ġfig":29959,"Ġbooze":29960,"259":29961,"agus":29962,"statement":29963,"Ġlocom":29964,"Ġtacos":29965,"Ġmemos":29966,"gender":29967,"ĠOrt":29968,"263":29969,"Ġintervening":29970,"Soc":29971,"University":29972,"ĠPis":29973,"ĠReturns":29974,"ĠPAN":29975,"Ġultrasound":29976,"Ġcoherent":29977,"tracking":29978,"rieved":29979,"383":29980,"Ġqualitative":29981,"uld":29982,"ĠGiovanni":29983,"Ġstorylines":29984,"Ġdarkest":29985,"Ġvelvet":29986,"RIP":29987,"Ġcompatibility":29988,"Ġtroll":29989,"CN":29990,"Found":29991,"ĠOu":29992,"Ġtease":29993,"Ġvested":29994,"Ġprovocation":29995,"Ġimprovised":29996,"Ġactivation":29997,"unte":29998,"ĠMonteneg":29999,"ĠJOHN":30000,"ĠReact":30001,"Ġpolluted":30002,"217":30003,"Ġmushroom":30004,"Ġdisconnected":30005,"ĠVoices":30006,"asu":30007,"Ġsensory":30008,"REE":30009,"Ġmonarchy":30010,"Ġ173":30011,"doing":30012,"involved":30013,"ĠJonah":30014,"Ġtoxins":30015,"Ġtv":30016,"Ġacademia":30017,"IQ":30018,"Mor":30019,"ĠStraight":30020,"ĠRN":30021,"ĠâĹı":30022,"Ġpear":30023,"187":30024,"Ġendeavors":30025,"ĠTurbo":30026,"Ġducks":30027,"ĠRamsay":30028,"Ġoutpatient":30029,"Ġcomprehend":30030,"UNE":30031,"Ġbriefings":30032,"total":30033,"Ġmigr":30034,"always":30035,"Ġmoot":30036,"ĠRider":30037,"Ġbiblical":30038,"Form":30039,"Ġcurry":30040,"Ġexquisite":30041,"385":30042,"244":30043,"Ġattendants":30044,"Ġcabinets":30045,"nton":30046,"Baby":30047,"Honestly":30048,"ĠFIRE":30049,"211":30050,"itech":30051,"ĠProsper":30052,"Ġchops":30053,"odic":30054,"Rod":30055,"job":30056,"orset":30057,"ĠAry":30058,"obic":30059,"ĠNil":30060,"isable":30061,"Ġorche":30062,"Ġtrivial":30063,"ĠZy":30064,"ĠXP":30065,"Ġendorsing":30066,"ĠLIM":30067,"adish":30068,"237":30069,"ĠLaws":30070,"heid":30071,"ĠSignature":30072,"ĠVern":30073,"ĠBland":30074,"ansk":30075,"Ġrepository":30076,"ĠPetra":30077,"Enter":30078,"Ġtruths":30079,"Ġbordering":30080,"Ġpenn":30081,"Ġsimplified":30082,"zn":30083,"ĠCree":30084,"Ġ181":30085,"Hi":30086,"ĠGreenberg":30087,"Ġprematurely":30088,"ĠSass":30089,"Ġwrecked":30090,"Ġheinous":30091,"415":30092,"Turn":30093,"zl":30094,"amental":30095,"ĠBraz":30096,"fing":30097,"ĠAngle":30098,"ĠPhantom":30099,"agra":30100,"ĠShack":30101,"Ġhomegrown":30102,"Ġalright":30103,"AME":30104,"ĠKN":30105,"Ġclicks":30106,"Ġmanned":30107,"ĠScope":30108,"Ġextras":30109,"Ġclinicians":30110,"321":30111,"African":30112,"Ġjuices":30113,"Ġrefere":30114,"****":30115,"ambling":30116,"since":30117,"Ġvoic":30118,"QB":30119,"ĠAtmospheric":30120,"Mat":30121,"Ġperpetrated":30122,"ĠSteps":30123,"Fit":30124,"Ġsilenced":30125,"Ġbonded":30126,"Ġquantify":30127,"Houston":30128,"ocracy":30129,"Ġfreeing":30130,"pipe":30131,"corn":30132,"rones":30133,"ooked":30134,"ĠSuz":30135,"Ġunaccount":30136,"196":30137,"Ġlogos":30138,"ĠFurious":30139,"ĠSpart":30140,"urst":30141,"itri":30142,"ĠZub":30143,"ĠActual":30144,"Ġslee":30145,"Ġgag":30146,"Ġmetabolism":30147,"ĠDesigned":30148,"Ġpedigree":30149,"Ġcoolest":30150,"âĿ":30151,"iuses":30152,"ĠYellowstone":30153,"Ġinformant":30154,"Ġushered":30155,"ĠGarg":30156,"thel":30157,"Hop":30158,"Ġrepetitive":30159,"flag":30160,"Ġunmarked":30161,"ĠBrave":30162,"Ġincur":30163,"reading":30164,"ppel":30165,"lah":30166,"ateurs":30167,"286":30168,"ĠAtomic":30169,"Ġappliance":30170,")'":30171,"traditional":30172,"Ġdads":30173,"Ġregimen":30174,"Ġinfrared":30175,"Ġdotted":30176,"Ġtails":30177,"Ġhorrors":30178,"uments":30179,"Ġdub":30180,"lighting":30181,"Ġunearthed":30182,"assisted":30183,"ĠSpiel":30184,"trial":30185,"Ġpersever":30186,"MAX":30187,"Ġicing":30188,"Energy":30189,"Ġ1943":30190,"move":30191,"Error":30192,"Ġliter":30193,"ĠCly":30194,"Ari":30195,"Ġgranite":30196,"Ġcropped":30197,"ĠRD":30198,"ĠREM":30199,"TX":30200,"Ġdispleasure":30201,"ĠComfort":30202,"Ġunsettling":30203,"Ġscratching":30204,"866":30205,"eton":30206,"560":30207,"Ġcommonplace":30208,"Ġreproduced":30209,"ggie":30210,"Ġschooling":30211,"Ġreprim":30212,"Ġdarling":30213,"huge":30214,"ĠDante":30215,"cp":30216,"heastern":30217,"Ġeduc":30218,"Digital":30219,"Ġwrath":30220,"Ġwatering":30221,"ĠTail":30222,"Ġdegradation":30223,"530":30224,"usive":30225,"ĠXu":30226,"ĠAH":30227,"Ġclassy":30228,"ĠSET":30229,"Ġcriminally":30230,"dependent":30231,"ĠAlps":30232,"Ġnotwithstanding":30233,"Ġfamiliarity":30234,"ĠAPP":30235,"aurus":30236,"gments":30237,"Mid":30238,"Ġepilepsy":30239,"Ġresemblance":30240,"brush":30241,"Ġ333":30242,"Ġliberated":30243,"ĠBeng":30244,"ĠLans":30245,"Ġtraff":30246,"ihu":30247,"establish":30248,"Ġcort":30249,"Rick":30250,"Ġplugged":30251,"onement":30252,"ĠAccounting":30253,"Ġreconstruct":30254,"Pop":30255,"Ġincapable":30256,"aho":30257,"ĠDexter":30258,"Ġpitted":30259,"Ġbathing":30260,"Ġdun":30261,"Ġexplor":30262,"ĠMidnight":30263,"Ġactiv":30264,"iann":30265,"likely":30266,"acons":30267,"owicz":30268,"Ġnegativity":30269,"Ġfreel":30270,"ewitness":30271,"Ġinj":30272,"Stephen":30273,"Ġshredded":30274,"Ġprepar":30275,"Script":30276,"Ġcorrectional":30277,"Ġcommits":30278,"hai":30279,"activity":30280,"Imp":30281,"Ġstumble":30282,"Ġcache":30283,"ĠPromise":30284,"Ġprecinct":30285,"Ġmulticultural":30286,"Ġsubstitutes":30287,"Ġshortened":30288,"ovable":30289,"Ġfasting":30290,"Ġinfused":30291,"Ġbulldo":30292,"alm":30293,"Ġadjoining":30294,"Ġmultiplayer":30295,"ĠAlien":30296,"Ġpund":30297,"ethyl":30298,"Ġbliss":30299,"ĠDecision":30300,"Ġbab":30301,"Ġangrily":30302,"another":30303,"oled":30304,"ainted":30305,"ĠPriest":30306,"Ġdraped":30307,"ĠPersonally":30308,"Ġstomp":30309,"ĠWolfgang":30310,"Ġoste":30311,"itches":30312,"Ġhoops":30313,"ĠJO":30314,"Ġsche":30315,"ĠZan":30316,"Ġcleans":30317,"Ġclimbs":30318,"Ġelectronically":30319,"243":30320,"ocy":30321,"gall":30322,"ĠREAL":30323,"Ġmurky":30324,"Ġmodernization":30325,"tub":30326,"Really":30327,"Ġlax":30328,"Ġdoubted":30329,"yden":30330,"ĠPrevent":30331,"UTERS":30332,"Ġoverride":30333,"ĠSAF":30334,"Ġcoun":30335,"Ġexcerpts":30336,"Ġmotivations":30337,"Ġdecency":30338,"Ġastronomers":30339,"orical":30340,"Ġaltering":30341,"Ġ232":30342,"described":30343,"omic":30344,"Ġexh":30345,"Ġknocks":30346,"ĠRiot":30347,"ĠPurs":30348,"equal":30349,"pleting":30350,"llan":30351,"ĠSOL":30352,"iator":30353,"ILE":30354,"ĠWM":30355,"Ġdefences":30356,"Ġforearm":30357,"Toronto":30358,"526":30359,"Ġacne":30360,"Ġthirteen":30361,"itiz":30362,"akable":30363,"charges":30364,"Ġinaction":30365,"Ġbred":30366,"Ġdeficiency":30367,"Ġintrigue":30368,"opoly":30369,"ĠCamer":30370,"ĠMelt":30371,"Ġunlawfully":30372,"Ġpenetrate":30373,"ĠUsed":30374,"ĠDirty":30375,"Ġexcerpt":30376,"ĠYen":30377,"ĠCARD":30378,"Ġcher":30379,"ĠChallenges":30380,"ieves":30381,"Ġambush":30382,"Data":30383,"eeks":30384,"Ġgiveaway":30385,"Ġpawn":30386,"Ġtransf":30387,"renched":30388,"Ġmoderately":30389,"Ġnumbered":30390,"ĠIntegrity":30391,"ĠHOU":30392,"ĠHDMI":30393,"Royal":30394,"LT":30395,"ĠDirk":30396,"izon":30397,"Ġ227":30398,"Ġdisagrees":30399,"ĠNinth":30400,"Ġincrement":30401,"ĠGlory":30402,"suff":30403,"Ġartery":30404,"ĠEmployee":30405,"bum":30406,"ĠEditorial":30407,"Kh":30408,"ĠPremiere":30409,"ĠWeld":30410,"ĠIncluded":30411,"Ġmathematical":30412,"Ġexponentially":30413,"Ġhandwritten":30414,"ĠMAS":30415,"Ġindiscrim":30416,"Ġnutrient":30417,"ĠSelection":30418,"Ġ219":30419,"hyd":30420,"Ġdeton":30421,"æ":30422,"dark":30423,"ĠFidel":30424,"Ġmonkeys":30425,"Ġnutritious":30426,"Ġheadlights":30427,"oller":30428,"piring":30429,"ĠDefenders":30430,"Ġdrown":30431,"elong":30432,"Ġfloats":30433,"graduate":30434,"Ġprosper":30435,"ĠNamed":30436,"ĠEating":30437,"ECK":30438,"establishment":30439,"XM":30440,"Ġsoaking":30441,"278":30442,"Ġlistener":30443,"Ġsimultaneous":30444,"olutions":30445,"payer":30446,"Ġcustomize":30447,"ĠROCK":30448,"Ġaltar":30449,"ĠExercise":30450,"anky":30451,"ĠProfession":30452,"sever":30453,"ĠMerchant":30454,"RF":30455,"ĠCombat":30456,"Ġlegality":30457,"fledged":30458,"Ġdiapers":30459,"lves":30460,"Ġlur":30461,"Ġignores":30462,"ĠProtocol":30463,"Ġrepresentations":30464,"ĠBlumenthal":30465,"ĠLime":30466,"romptu":30467,"Ġbesieged":30468,"dl":30469,"Ġsighting":30470,"ĠParm":30471,"ĠServer":30472,"ĠBenghazi":30473,"estival":30474,"Ġplaylist":30475,"ĠUng":30476,"ĠQuantum":30477,"Ġcompromises":30478,"ĠSurvivor":30479,"ĠMobility":30480,"Ġbounty":30481,"ophers":30482,"ISA":30483,"need":30484,"uese":30485,"Ġorn":30486,"218":30487,"Ġ530":30488,"Ġbuddies":30489,"Ġagendas":30490,"ĠFeldman":30491,"ĠÃĸ":30492,"ĠBMC":30493,"ĠServe":30494,"Ent":30495,"ĠKH":30496,"ĠINT":30497,"Ġlittered":30498,"Ġvisitation":30499,"mist":30500,"Ġdupl":30501,"Ġrouted":30502,"ĠAmount":30503,"Dev":30504,"ĠConv":30505,"Ġslams":30506,"ĠVeterinary":30507,"bold":30508,"Ġ186":30509,"ĠDOT":30510,"builder":30511,"Ġdecay":30512,"ĠHemp":30513,"pelled":30514,"Ġmankind":30515,"Tonight":30516,"Ġeffortlessly":30517,"ĠBUT":30518,"Ġhostilities":30519,"formerly":30520,"alon":30521,"ĠCrash":30522,"humane":30523,"Ġmayhem":30524,"ĠBudd":30525,"Ġdisinformation":30526,"Ġ226":30527,"Ġprototypes":30528,"__":30529,"IVERS":30530,"izzy":30531,"ĠMight":30532,"ĠPip":30533,"pour":30534,"INO":30535,"ĠLL":30536,"Ġwiret":30537,"Ġresorted":30538,"ĠTanaka":30539,"ĠDOES":30540,"Earlier":30541,"HO":30542,"Ġmoniker":30543,"ĠFang":30544,"ĠHua":30545,"bered":30546,"adding":30547,"194":30548,"STR":30549,".\")":30550,"cop":30551,"ĠFlags":30552,"ĠColleges":30553,"ĠUz":30554,"Ġsparks":30555,"Ġparadox":30556,"Marie":30557,"Strong":30558,"Ġstrawberry":30559,"Ġnurturing":30560,"Ġfax":30561,"Tor":30562,"killer":30563,"burse":30564,"Ġattachments":30565,"Ġpup":30566,"Ġexhaustion":30567,"Ġwhisky":30568,"isu":30569,"ologically":30570,"iership":30571,"Ġlamps":30572,"Ġshuff":30573,"Ġcentralized":30574,"ĠNeedless":30575,"Ġgrenade":30576,"Ġrouter":30577,"Ġoptics":30578,"ivering":30579,"Ġpioneers":30580,"ĠHug":30581,"Ġhandguns":30582,"010":30583,"Ġbailed":30584,"uana":30585,"197":30586,"Ġdistorted":30587,"ĠEssentially":30588,"ĠSilent":30589,"Ġcomparative":30590,"Music":30591,"ĠMUS":30592,"Bur":30593,"ĠComet":30594,"ĠWinchester":30595,"IGN":30596,"Mod":30597,"ĠCandidate":30598,"Ġdysfunctional":30599,"ĠCeleb":30600,"Ġhitch":30601,"api":30602,"Ġidiot":30603,"Ġunsupported":30604,"gat":30605,"inker":30606,"Ġredevelop":30607,"Ġdwind":30608,"Ġforgetting":30609,"ĠRost":30610,"Ġremembrance":30611,"Na":30612,"mopolitan":30613,"Ġberries":30614,"Ġmarital":30615,"Vol":30616,"ĠClosing":30617,"ĠHindus":30618,"itism":30619,"Ġrover":30620,"Ġmysteries":30621,"ĠNig":30622,"ucing":30623,"Ġfabrication":30624,"Ġgarments":30625,"Ġwield":30626,"ĠCompton":30627,"357":30628,"Ġoxide":30629,"chron":30630,"ĠThought":30631,"Ġcomed":30632,"ĠEpstein":30633,"ĠBART":30634,"orative":30635,"ĠKahn":30636,"adan":30637,"APH":30638,"cum":30639,"Ġloophole":30640,"ĠGoPro":30641,"osit":30642,"Ġspecification":30643,"ĠAPR":30644,"Ġdrains":30645,"Ġconserve":30646,"ĠMorse":30647,"Ġcalorie":30648,"ĠCheney":30649,"station":30650,"Ġevangel":30651,"Ġspraying":30652,"lections":30653,"Ġenclosure":30654,"Ġcommanded":30655,"ĠOrganizations":30656,"Ġimb":30657,"mins":30658,"ĠTobias":30659,"Ve":30660,"ĠNau":30661,"183":30662,"ĠGuantanamo":30663,"173":30664,"Ġrequisite":30665,"Ġderivative":30666,"Ġpopulism":30667,"Ġcultivated":30668,"lord":30669,"uler":30670,"ĠDEA":30671,"inally":30672,"Ġdemonstr":30673,"trip":30674,"ĠFirefox":30675,"246":30676,"confirmed":30677,"Anne":30678,"Ġtamp":30679,"ĠHousehold":30680,"amous":30681,"Meet":30682,"Ġdashed":30683,"pire":30684,"Ġinex":30685,"Ġloosen":30686,"272":30687,"famous":30688,"ĠHeard":30689,"Ġhindsight":30690,"Ġdepot":30691,"ĠCutting":30692,"ĠMouse":30693,"Ġgeological":30694,"number":30695,"OUN":30696,".,\"":30697,"Ġmoderation":30698,"ĠUNHCR":30699,"Ġdomains":30700,"eco":30701,"Ġcrater":30702,"Ġ510":30703,"kid":30704,"Ġcylinders":30705,"ĠClasses":30706,"Kn":30707,"Ġcarcin":30708,"ĠHunting":30709,"irit":30710,"ARP":30711,"anting":30712,"ĠMarino":30713,"ĠRESP":30714,"ifle":30715,"Ġ239":30716,"fman":30717,"Ġtheoretically":30718,"Ġdistraught":30719,"Ġstaircase":30720,"Ġexpel":30721,"Ġlord":30722,"Ġbehaviours":30723,"Ġprescribing":30724,"ographs":30725,"ĠNewly":30726,"Ġpatiently":30727,"Ġskyline":30728,"udos":30729,"Ġrepertoire":30730,"Ġhover":30731,"mint":30732,"Ġclears":30733,"Ġkale":30734,"ĠSco":30735,"ĠCoulter":30736,"Ġpancreat":30737,"pu":30738,"995":30739,"Ġincompetent":30740,"2007":30741,"Ġgripping":30742,"enable":30743,"Ġreinforcing":30744,"ĠFee":30745,"education":30746,"ĠKuro":30747,"Ġbowed":30748,"Ġshave":30749,"ĠMean":30750,"xi":30751,"Ġinciting":30752,"atters":30753,"Ġecstatic":30754,"hog":30755,"Ġclauses":30756,"Ġsubt":30757,"Ġbehaved":30758,"tains":30759,"Liverpool":30760,"Ġstrives":30761,"ĠKev":30762,"ĠFramework":30763,"defined":30764,"Ġrecounts":30765,"array":30766,"tips":30767,"Ġartificially":30768,"fits":30769,"Clearly":30770,"mediate":30771,"Ġunseen":30772,"Ġthugs":30773,"ĠLent":30774,"Ġ1938":30775,"Ġgenital":30776,"ĠSonic":30777,"ĠWarehouse":30778,"pler":30779,"Ġunm":30780,"Ġpackets":30781,"ĠMET":30782,"ealous":30783,"ographers":30784,"Ġlabou":30785,"Core":30786,"+,":30787,"parable":30788,"Ġstrat":30789,"Ġinvitations":30790,"Ġsouven":30791,"Ġbillboards":30792,"ĠRegulations":30793,"Ġdwarf":30794,"Ġtoler":30795,"Ġprose":30796,"Ġestates":30797,"Ġmetabolic":30798,"ĠSuff":30799,"ĠFirstly":30800,"Ġpolio":30801,"Ġchick":30802,"ĠDaughter":30803,"Ġsubstant":30804,"ĠIdentity":30805,"umbers":30806,"ĠFacts":30807,"Ġfrust":30808,"Ġdissip":30809,"ĠDeck":30810,"Hy":30811,"ĠBirch":30812,"Ġhurled":30813,"democracy":30814,"nered":30815,"eper":30816,"Ġcerebral":30817,"181":30818,"Ġhalves":30819,"abit":30820,"balance":30821,"ĠTibet":30822,"Ġhandheld":30823,"ĠDough":30824,"Ġprogrammed":30825,"hw":30826,"Ġoutlawed":30827,"ĠSerious":30828,"Ġironically":30829,"Ġmanipulating":30830,")\"":30831,"juries":30832,"Ġfragrance":30833,"crete":30834,"ĠHHS":30835,"cience":30836,"Ġcosmic":30837,"Ġforeclosure":30838,"Ġpercentages":30839,"Bus":30840,"Ġenticing":30841,"extra":30842,"ĠShy":30843,"ĠÂ¥":30844,"Ġheadsets":30845,"imensional":30846,"Ġlux":30847,"Ġresidual":30848,"Ġmantle":30849,"ĠSJ":30850,"ĠPeaks":30851,"ĠFinger":30852,"Ġunfolds":30853,"anity":30854,"Ġresettlement":30855,"ĠWeak":30856,"ĠBeen":30857,"Ġ198":30858,"Ġangels":30859,"ĠFarn":30860,"peace":30861,"Ġcapac":30862,"Ġhue":30863,"Ġlust":30864,"traumatic":30865,"laun":30866,"Ġstrawberries":30867,"Ġherbal":30868,"Ġconversions":30869,"ĠHeld":30870,"Ġprescribe":30871,"Its":30872,"ĠDartmouth":30873,"Ġfashioned":30874,"460":30875,"BLE":30876,"international":30877,"Ġlumin":30878,"Ġplantation":30879,"ilde":30880,"490":30881,"Ġeuph":30882,"Ġdisgust":30883,"Ġaspire":30884,"medical":30885,"Ġsocialism":30886,"Ġdissolve":30887,"Wal":30888,"Ġadmittedly":30889,"Ġsewing":30890,"ĠAcer":30891,"Ġtul":30892,"Ġfacilit":30893,"Ġgrandma":30894,"ĠFeeling":30895,"Ġobst":30896,"ĠFranz":30897,"ĠPalin":30898,"ĠIncrease":30899,"gets":30900,"ĠImam":30901,"âĢİ":30902,"Ġcoincides":30903,"urrence":30904,"Ġlifes":30905,"Lab":30906,"Ham":30907,"angelo":30908,"Wild":30909,"Ġvetoed":30910,"Ġventilation":30911,"olid":30912,"Summer":30913,"Ġfacade":30914,"neys":30915,"ĠWOM":30916,"ĠBenny":30917,"ĠMarried":30918,"squ":30919,"ĠReflect":30920,"return":30921,"elia":30922,"olding":30923,"Ġrefine":30924,"ĠMadness":30925,"innacle":30926,"posts":30927,"287":30928,"fruit":30929,"274":30930,"icator":30931,"ĠVoy":30932,"Ġunsett":30933,"Ġfant":30934,"Ġtreaties":30935,"Ġcrystals":30936,"Ġhijacked":30937,"words":30938,"ĠReleased":30939,"Save":30940,"Ġcannon":30941,"Ġanomaly":30942,"Ġbeacon":30943,"Ġcrippled":30944,"Ġbundles":30945,"Ġuntreated":30946,"Ġhappiest":30947,"Ġgalaxies":30948,"Ġoccupational":30949,"416":30950,"Dar":30951,"Ġcrank":30952,"Ġappropriation":30953,"asking":30954,"mens":30955,"Ġdetector":30956,"Ġskewed":30957,"Ġpoke":30958,"254":30959,"Ġhypertension":30960,"apolog":30961,"Ġevaluations":30962,"blocks":30963,"Ġpow":30964,"GEN":30965,"Ġscalp":30966,"Ġarrogant":30967,"AIDS":30968,"ority":30969,"Ġredirect":30970,"Ġderogatory":30971,"Ġlateral":30972,"495":30973,"rolley":30974,"brew":30975,"Ġbabys":30976,"Ġmuff":30977,"ĠRequ":30978,"Ġdime":30979,"Ġwonderfully":30980,"Ġtreasures":30981,"ĠNES":30982,"Ġponds":30983,"Ġimpulse":30984,"Ġdetecting":30985,"Ġgrin":30986,"Ġbrid":30987,"Ġshoved":30988,"Ġpurge":30989,"irteen":30990,"OTHER":30991,"ÙĦ":30992,"irsch":30993,"ĠOcc":30994,"193":30995,"Ġfodder":30996,"wrote":30997,"meric":30998,"posal":30999,"Ġwinters":31000,"ĠJuice":31001,"hub":31002,"Ġcontrasting":31003,"Brazil":31004,"Ġflashy":31005,"uffer":31006,"technology":31007,"Children":31008,"Ġcatapult":31009,"owsky":31010,"ĠEclipse":31011,"abeth":31012,"ĠParticip":31013,"Ġlaud":31014,"ĠQuiet":31015,"Ġsimulations":31016,"Ġsacrificing":31017,"Ġpreaching":31018,"Ġvoicing":31019,"itizen":31020,"Ġgn":31021,"Ġsans":31022,"Ġ285":31023,"ĠRobot":31024,"Ġ1936":31025,"Ġsham":31026,"ĠKislyak":31027,"ĠGCC":31028,"tale":31029,"ĠShades":31030,"Ġsediment":31031,"Ġconveniently":31032,"Give":31033,"mounted":31034,"Ġpeel":31035,"Jun":31036,"ĠEisenhower":31037,"Ġdiplom":31038,"ĠPreservation":31039,"Ġaffirm":31040,"Ġtaboo":31041,"ĠGarr":31042,"ĠApply":31043,"prim":31044,"Ġausp":31045,"Ġtextbook":31046,"Ġforfeit":31047,"icides":31048,"Ġundis":31049,"DJ":31050,"Ġ\"...":31051,"ĠXperia":31052,"Ġfurry":31053,"Australian":31054,"Ġpreach":31055,"Ġparamed":31056,"Ġ196":31057,"agos":31058,"ĠRIP":31059,"Ġ408":31060,"ĠQuarterly":31061,"ĠQuentin":31062,"Ġdeft":31063,"ĠVlad":31064,"massive":31065,"apore":31066,"Ġquestionnaire":31067,"secution":31068,"ĠTunnel":31069,"ĠAssist":31070,"BILITY":31071,"everything":31072,"vich":31073,"Ġcomparatively":31074,"heng":31075,"ETH":31076,"ĠiPod":31077,"Ġinsurgent":31078,"Ġtestosterone":31079,"191":31080,"Ġmoons":31081,"Ġgripped":31082,"Ġstrang":31083,"pects":31084,"ĠSERVICE":31085,"Ġnumb":31086,"Ġmeasurable":31087,"Ġdismantled":31088,"Ġdepict":31089,"Ġretake":31090,"Light":31091,"Ġaquatic":31092,"useum":31093,"judicial":31094,"Ġ****":31095,"Ġrosters":31096,"certain":31097,"Ġhypothesis":31098,"2002":31099,"Snow":31100,"Ġpounded":31101,"ĠZel":31102,"ĠTrem":31103,"iversity":31104,"219":31105,"Jen":31106,"ĠAdventures":31107,"Ġcylinder":31108,"Ġbanging":31109,"Ġbalk":31110,"analy":31111,"ĠHust":31112,"ookie":31113,"ĠReturning":31114,"Ġpods":31115,"analysis":31116,"ĠTruman":31117,"Ġorg":31118,"Ġsar":31119,"Ġdred":31120,"ĠTelecommunications":31121,"ĠSven":31122,"carry":31123,"ĠLOVE":31124,"Ġparting":31125,"asar":31126,"utations":31127,"itic":31128,"Ġactu":31129,"Ġbananas":31130,"ĠNights":31131,"410":31132,"Still":31133,"Ġtweaked":31134,"went":31135,"Ġtoddlers":31136,"irted":31137,"Ġpaed":31138,"ĠWink":31139,"Ġviewpoint":31140,"ĠHelic":31141,"Ġhandshake":31142,"Ġpoaching":31143,"Ġrounding":31144,"268":31145,"ĠNVIDIA":31146,"Ġsquat":31147,"Ġtowed":31148,"Ġhandler":31149,"Ġconspir":31150,"Ġadditionally":31151,"CENT":31152,"ĠÃľ":31153,"article":31154,"ĠTough":31155,"NM":31156,"Rem":31157,"Ġstunts":31158,"ILS":31159,"ĠLM":31160,"Connect":31161,"ĠParagu":31162,"Ġcomplexities":31163,"Ġhugging":31164,"Ġabolish":31165,"ricting":31166,"ĠItems":31167,"Ġtemples":31168,"ĠSeat":31169,"ĠRubber":31170,"Ġindic":31171,"ĠVitamin":31172,"Ġcitations":31173,"Ġarmored":31174,"---------------":31175,"ĠNeo":31176,"ippy":31177,"Que":31178,"Ġrag":31179,"Ġlov":31180,"630":31181,"Ġadept":31182,"orbit":31183,"253":31184,"412":31185,"Ġbutterflies":31186,"Ġoutl":31187,"ĠCycle":31188,"Ġaesthetics":31189,"ĠTwitch":31190,"405":31191,"factor":31192,"ðŁij":31193,"ĠCircus":31194,"Posted":31195,"Ġintroductory":31196,"ĠStack":31197,"atoes":31198,"Ġfurn":31199,"ĠHond":31200,"Ġbipolar":31201,"ĠAging":31202,"inches":31203,"Ġincompetence":31204,"Ġaloud":31205,"Imagine":31206,"Ġsepar":31207,"Ġmanip":31208,"ophobic":31209,"inion":31210,"bek":31211,"Ġquer":31212,"ĠArmen":31213,"Ġhumorous":31214,"Ġmundane":31215,"Ġapologizing":31216,"Ġpioneered":31217,"Ġ303":31218,"282":31219,"Ġcalming":31220,"orious":31221,"760":31222,"Ġstitches":31223,"Ġthrottle":31224,"Ġspinach":31225,"urities":31226,"ĠCologne":31227,"Ġripple":31228,"Cs":31229,"Cent":31230,"Should":31231,"Ġaffinity":31232,"amount":31233,"ĠMISS":31234,"Ġsage":31235,"Ġamusing":31236,"Ġsnatch":31237,"clair":31238,"ĠGuess":31239,"bench":31240,"ĠMoj":31241,"nuclear":31242,"Ġfid":31243,"ĠVM":31244,"ĠGN":31245,"brainer":31246,"Ġcurled":31247,"Ġbushes":31248,"icably":31249,"Ġcreeping":31250,"Ġveil":31251,"ĠALS":31252,"ESPN":31253,"ulsion":31254,"ĠGTX":31255,"ĠANN":31256,"Ġcomplicit":31257,"assault":31258,"IOR":31259,"Ġpolymer":31260,"Ġestimating":31261,"277":31262,"alog":31263,"Ġglimps":31264,"Ġreinforces":31265,"Ġtextbooks":31266,"Ġdictated":31267,"ĠReyn":31268,"latable":31269,"ĠOrth":31270,"520":31271,"Ġtrickle":31272,"ĠWrong":31273,".[":31274,"ĠDesigner":31275,"304":31276,"ĠInner":31277,"Ġrave":31278,"ppa":31279,"ĠGim":31280,"Ġswath":31281,"Ġcarts":31282,"atlantic":31283,"Ġpersists":31284,"ĠDeveloper":31285,"Ġgoodies":31286,"isive":31287,"Inf":31288,"ĠSaving":31289,"loop":31290,"tions":31291,"Ġabusers":31292,"Ġclot":31293,"Ġmesmer":31294,"Ġdeg":31295,"Ġskirts":31296,"257":31297,"Ġunreliable":31298,"ĠCOMM":31299,"Ġ194":31300,"Ġfledgling":31301,"administ":31302,"Israeli":31303,"ĠBarbie":31304,"ĠJeanne":31305,"Ġgenerously":31306,"ĠStruct":31307,"ĠZap":31308,"Ġvetted":31309,"ĠViolet":31310,"Ġ),":31311,"Ġembarrass":31312,"bang":31313,"ĠProvider":31314,"getting":31315,"alg":31316,"Ġunconditional":31317,"ĠHulk":31318,"ĠWad":31319,"utation":31320,"Ġpointless":31321,"Ġdeprivation":31322,"Ġstarving":31323,"ĠImpossible":31324,"ĠStir":31325,"Ġknack":31326,"anse":31327,"Ġsecurely":31328,"Ġply":31329,"395":31330,"Pack":31331,"liv":31332,"Ġridden":31333,"alks":31334,"308":31335,"male":31336,"Ġbitterly":31337,"Ġirrational":31338,"Members":31339,"ported":31340,"qq":31341,"ractor":31342,"Ġinflict":31343,"ĠBoehner":31344,"Ġthickness":31345,"Ġdome":31346,"ĠInflu":31347,"Ġheap":31348,"Ġmirrored":31349,"Ġconstituent":31350,"Ġfertile":31351,"Ġvaping":31352,"266":31353,"riages":31354,"Ġembassies":31355,"Ġpersu":31356,"ĠMacArthur":31357,"issions":31358,"Main":31359,"aths":31360,"onne":31361,"circ":31362,"Ġsweating":31363,"quartered":31364,"Ġsax":31365,"Ġ540":31366,"Ġreputable":31367,"Ġsatire":31368,"Ġpastors":31369,"ventional":31370,"Mic":31371,"female":31372,"Ġpity":31373,"appropri":31374,"voc":31375,"hei":31376,"Ġimperial":31377,"Ġcorrective":31378,"Ġresent":31379,"Ġtempered":31380,"Ġdiffers":31381,"Hamilton":31382,"Ġsaddle":31383,"Ġgrenades":31384,"ĠQuart":31385,"onymous":31386,"til":31387,"Ġdepiction":31388,"Ġdisreg":31389,"Ġpetitioner":31390,"Ġfret":31391,"ĠEns":31392,"Emer":31393,"540":31394,"opathy":31395,"vertisements":31396,"Ġsketches":31397,"venth":31398,"Ġautomate":31399,"Ġjihad":31400,"iping":31401,"Ġtert":31402,"ĠSop":31403,"ships":31404,"Ġdeceptive":31405,"ĠPryor":31406,"ĠGorge":31407,"ĠMeridian":31408,"rero":31409,"affected":31410,"Ġlame":31411,"660":31412,"rub":31413,"Hello":31414,"ĠNumbers":31415,"269":31416,"Ġmarg":31417,"Fran":31418,"640":31419,"Ġcath":31420,"winter":31421,"ĠMosque":31422,"Ġreckoning":31423,"ĠImaging":31424,"Ġmutation":31425,"ĠMild":31426,"Ġkidnap":31427,"Ġnav":31428,"Ġferocious":31429,"Ġdusty":31430,"Cele":31431,"ĠFoss":31432,"Ġregrett":31433,"lymp":31434,"Ġcoli":31435,"Ġstereo":31436,"Ġforesee":31437,"alties":31438,"Ġresusc":31439,"Full":31440,"wash":31441,"ĠINST":31442,"ĠPars":31443,"Ġcoated":31444,"ĠHT":31445,"Ġdiscord":31446,"Ġreforming":31447,"CAN":31448,"Ġblink":31449,"Ġlubric":31450,"Ġmishand":31451,"ensible":31452,"existent":31453,"secondary":31454,"ĠDoesn":31455,"terrorist":31456,"Ġriff":31457,"custom":31458,"ĠDET":31459,"Ġreusable":31460,"ĠCRA":31461,"ĠScalia":31462,"Ġaccelerator":31463,"Ġpropag":31464,"ĠMID":31465,"ework":31466,"Ġlooted":31467,"oscope":31468,"eners":31469,"ruction":31470,"Ġbarr":31471,"Ġviewership":31472,"Ġlends":31473,"obil":31474,"ĠRoots":31475,"ĠCame":31476,"ibel":31477,"Ġglobalization":31478,"lab":31479,"information":31480,"Ġcoordin":31481,"Ġglitch":31482,"Ġworms":31483,"Ġslurs":31484,"Ġcontemplated":31485,"ĠPenal":31486,"Ġ191":31487,"Ġ221":31488,"Ġexposes":31489,"Ġ248":31490,"ĠASP":31491,"Ġdependency":31492,"urga":31493,"pdf":31494,"Ġvibr":31495,"clone":31496,"ossible":31497,"ĠUtt":31498,"serv":31499,"ĠLevant":31500,"maybe":31501,"MU":31502,"ĠLunar":31503,"Ġbystanders":31504,"Ġcapitals":31505,"Ġpreacher":31506,"thin":31507,"Ġunderscore":31508,"Ġ('":31509,"Ġmedd":31510,"Ġautobiography":31511,"Ġpersistence":31512,"Ġarming":31513,"Ġappalled":31514,"Ġcontradictory":31515,"Ġreciproc":31516,"Ġtakedown":31517,"tan":31518,"Ġnecessities":31519,"itans":31520,"ĠAlas":31521,"Ġsegregated":31522,"ĠResponsibility":31523,"ĠSHOW":31524,"ISIS":31525,"Ġpengu":31526,"Ġumb":31527,"ĠHO":31528,"HB":31529,"ĠChou":31530,"Ġalluded":31531,"Ġharms":31532,"bara":31533,"ĠWOR":31534,"Sorry":31535,"Ġstarvation":31536,"Ġspilling":31537,"Ġcarb":31538,"annis":31539,"ĠGarrison":31540,"Ġmillionaire":31541,"ifling":31542,"ĠCancel":31543,"Ġimprint":31544,"Ġborrower":31545,"455":31546,"ĠCic":31547,"Ġexposures":31548,"dest":31549,"Ġunn":31550,"Ġ802":31551,"Ġadherence":31552,"prints":31553,"Ġweary":31554,"Ġwaging":31555,"Ġ1937":31556,"ĠKepler":31557,"%;":31558,"Ġdefective":31559,"ĠReps":31560,"ĠGranted":31561,"Ġdisco":31562,"ĠRanking":31563,"erno":31564,"Ġarchaeological":31565,"sq":31566,"Ġcapit":31567,"Ġfleets":31568,"Ġinventor":31569,"iffin":31570,"Ġspotting":31571,"ĠSHARES":31572,"309":31573,"Hard":31574,"save":31575,"241":31576,"ĠThinking":31577,"XY":31578,"Ġhavens":31579,"Ġmessed":31580,"crop":31581,"Ġperme":31582,"Ġtimelines":31583,"ĠGarage":31584,"Ġplateau":31585,"together":31586,"fox":31587,"Ġfailings":31588,"ĠTight":31589,"ĠPhysics":31590,"ĠScholars":31591,"Ġpans":31592,"Fall":31593,"Ġhull":31594,"GER":31595,"Ġbourbon":31596,"ceived":31597,"Ġsteroids":31598,"Ġhamb":31599,"Ġinterpretations":31600,"Ġcush":31601,"Chair":31602,"Ġinformational":31603,"aryn":31604,"Ġwoven":31605,"Ġamen":31606,"Bre":31607,"Ġrefreshed":31608,"York":31609,"ĠBlast":31610,"Editor":31611,"Ġmotivating":31612,"ĠReason":31613,"Florida":31614,"Ġdreaded":31615,"Ġstationary":31616,"Ġbil":31617,"doors":31618,"Ġslightest":31619,"Ġcombustion":31620,"Ġfascination":31621,"Ġstraps":31622,"scribed":31623,"Ġexhibiting":31624,"Ġsimplest":31625,"Gar":31626,"Ġprogressives":31627,"claim":31628,"ocket":31629,"Ġexoner":31630,"ĠNETWORK":31631,"Brad":31632,"Ġ197":31633,"Ġnightmares":31634,"Ġillust":31635,"among":31636,"ĠGreenpeace":31637,"Ġoval":31638,"Ġblocker":31639,"3000":31640,"ĠMemor":31641,"Ġmids":31642,"Ġconfuse":31643,"YN":31644,"cow":31645,"Ġdispensary":31646,"telling":31647,"Ġentail":31648,"Ġneurolog":31649,"Ġbroth":31650,"Ġpron":31651,"ĠAnswer":31652,"thank":31653,"Ġintersect":31654,"Ġclinging":31655,"ĠKilling":31656,"Ġcohesion":31657,"Ġcategorized":31658,"Ġtangled":31659,"ĠASC":31660,"Arsenal":31661,"ĠAutomatic":31662,"580":31663,"sac":31664,"Ġshady":31665,"consumer":31666,"hetically":31667,"NV":31668,"Ġoverl":31669,"holes":31670,"ĠDonation":31671,"tera":31672,"score":31673,"library":31674,"Ġsmoother":31675,"Ġcoasts":31676,"Ġintercourse":31677,"Ġunfavorable":31678,"erb":31679,"Hel":31680,"Ġbiases":31681,"Ġinheritance":31682,"Ġsuppressed":31683,"ĠRecommend":31684,"iculture":31685,"ighting":31686,"inguished":31687,"idences":31688,"operated":31689,"Ġhors":31690,"Ġshrug":31691,"aila":31692,"ĠConsortium":31693,"Ġveins":31694,"uria":31695,"ĠSmithsonian":31696,"ĠAX":31697,")âĢĶ":31698,"given":31699,"JC":31700,"Ġreneg":31701,"Ġprincip":31702,"Ġextinct":31703,"Golden":31704,"ASON":31705,"Ġstatutes":31706,"292":31707,"ĠGOOD":31708,"ĠGreenland":31709,"ĠRasmussen":31710,"ATHER":31711,"Ġdeserted":31712,"ĠHitchcock":31713,"Ġqualifies":31714,"Ġdreadful":31715,"Ġsupers":31716,"Ġtendon":31717,"oter":31718,"ĠFate":31719,"Ġrestrooms":31720,"igating":31721,"Sher":31722,"Name":31723,"orph":31724,"ĠCritical":31725,"rox":31726,"Ġdefunct":31727,"Ġcanoe":31728,"Ġbiscuits":31729,"Ġwomb":31730,"808":31731,"istar":31732,"Ġroar":31733,"aundering":31734,"iewicz":31735,"ĠNM":31736,"ĠChamberlain":31737,"Ġ233":31738,"ĠCoat":31739,"Ġ999":31740,"aft":31741,"Ġlurking":31742,"ĠPist":31743,"Ġfollower":31744,"Ġcareg":31745,"ÙĨ":31746,"ĠThin":31747,"ZZ":31748,"ĠGI":31749,"ĠVintage":31750,"Ġpainstaking":31751,"Ġgloom":31752,"Ġtbsp":31753,"Ġwhim":31754,"ĠMask":31755,"rugged":31756,"Ġwritings":31757,"stantial":31758,"luence":31759,"ordable":31760,"akia":31761,"Ġassassinated":31762,"Wind":31763,"Ġdemeanor":31764,"Night":31765,"rape":31766,"ĠBringing":31767,"Ġshields":31768,"ĠAntarctic":31769,"Ġfruitful":31770,"ĠBuster":31771,"ĠLois":31772,"Ġ302":31773,"Style":31774,"ĠRIS":31775,"Ġdissatisfaction":31776,"ulp":31777,"ĠLaser":31778,"Ġdisposition":31779,"ĠAnk":31780,"Ġabsorbing":31781,"276":31782,"Ġvolcan":31783,"Ġleftover":31784,"yah":31785,"ĠVaj":31786,"Ġunsolved":31787,"oland":31788,"Ġstained":31789,"Ġpathetic":31790,"ylan":31791,"Ġknots":31792,"immigration":31793,"ieving":31794,"Coming":31795,"Commerce":31796,"ĠHurt":31797,"drawn":31798,"Ġaxis":31799,"Ġdye":31800,"ĠNora":31801,"ĠPortal":31802,"Ġsuspense":31803,"ĠExactly":31804,"Ġpowering":31805,"ĠClock":31806,"Ġdrawer":31807,"ĠSpike":31808,"Ġhallmark":31809,"aber":31810,"ĠTrainer":31811,"UV":31812,"Ġredundant":31813,"Tour":31814,"Ġdesignate":31815,"Ġredress":31816,"ĠUb":31817,"cake":31818,"oded":31819,"Ġkings":31820,"iates":31821,"Ġcoupons":31822,"Ġextremes":31823,"Elect":31824,"Ġcitation":31825,"Ġdirectory":31826,"Ġtranspired":31827,"cele":31828,"gence":31829,"5000":31830,"ostic":31831,"Ġraining":31832,"ĠSight":31833,"videos":31834,"phthal":31835,"llor":31836,"Ġappraisal":31837,"Ġdetox":31838,"Ġelecting":31839,"Ġordinances":31840,"Ġlifespan":31841,"Ref":31842,"Ġilluminated":31843,"Ġforfe":31844,"Making":31845,"ĠWorst":31846,"ĠTP":31847,"Ġfullest":31848,"ĠISIL":31849,"ĠRates":31850,"Ġyeast":31851,"sett":31852,"ĠYok":31853,"innie":31854,"edition":31855,"ĠGoldstein":31856,"Ġunaff":31857,"god":31858,"Ġzo":31859,"rums":31860,"Ġopaque":31861,"ĠHist":31862,"Yesterday":31863,"AMS":31864,"aband":31865,"005":31866,"illary":31867,"ĠSplash":31868,"Ġaccrued":31869,"Ell":31870,"Ġnominating":31871,"ĠBroadcast":31872,"ĠWhip":31873,"ARM":31874,"Ġunnecessarily":31875,"brown":31876,"429":31877,"ansky":31878,"Ġextravagant":31879,"Malley":31880,"wage":31881,"Ġexempted":31882,"Ġtypo":31883,"Ġesports":31884,"ĠStru":31885,"ĠPython":31886,"Ġsaint":31887,"ĠCSI":31888,"ĠPowder":31889,"Ġdisguised":31890,"ĠSubway":31891,"Ġprecursor":31892,"ĠWizard":31893,"Johnson":31894,"icas":31895,"Ġdefaults":31896,"!).":31897,"ebra":31898,"jected":31899,"Ġunaccompanied":31900,"HH":31901,"Ġproced":31902,"clinical":31903,"Ġmitigating":31904,"ĠSoup":31905,"ĠFunny":31906,"344":31907,"Hall":31908,"Ġscalable":31909,"Ġshimmer":31910,"Ġunderstatement":31911,"zeb":31912,"icus":31913,"Ġretract":31914,"IDER":31915,"ieft":31916,"iii":31917,"ĠEmperor":31918,"Ġvoltage":31919,"343":31920,"Rest":31921,"ĠButcher":31922,"Ġlaced":31923,"Ġsalty":31924,"Ġfourteen":31925,"Ġoxy":31926,"Ġraged":31927,"Ġforg":31928,"Ġcaveat":31929,"Ġponder":31930,"process":31931,"Ġghosts":31932,"ĠGoose":31933,"didn":31934,"stood":31935,"amation":31936,"Ġvillains":31937,"contract":31938,"Ġbooted":31939,"ĠDidn":31940,"ĠSalon":31941,"Ġlewd":31942,"ĠFritz":31943,"Ġorganis":31944,"Ġpuzzles":31945,"ĠRX":31946,"Ġcurtains":31947,"ĠPackage":31948,"Ġrebate":31949,"Ġspokes":31950,"Ġoccupant":31951,"Ġfooled":31952,"appy":31953,"Ġyourselves":31954,"Ġmaths":31955,"Ġ630":31956,"bos":31957,"ĠHeb":31958,"APS":31959,"Ġbulletin":31960,"Ġpests":31961,"Ġlum":31962,"ĠHAS":31963,"users":31964,"idated":31965,"Ġpalpable":31966,"ĠFeature":31967,"ĠPKK":31968,"Ġdetriment":31969,"Ġbamboo":31970,"Ġimmersed":31971,"ĠDud":31972,"Ġion":31973,"icc":31974,"ĠIris":31975,"ĠBeats":31976,"Ġimprobable":31977,"Ġfuner":31978,"Ġsprung":31979,"ĠLieberman":31980,"ĠSTA":31981,"venge":31982,"Ġtreacherous":31983,"Ġpreced":31984,"Ġsniper":31985,"ĠGOLD":31986,"ĠSUR":31987,"Nic":31988,"ĠROB":31989,"Camp":31990,"Ġhooks":31991,"oling":31992,"Ġbolst":31993,"339":31994,"heter":31995,"Ġbracelet":31996,"Ġbreat":31997,"307":31998,"ĠTrader":31999,"ĠPixar":32000,"hist":32001,"Ġmenacing":32002,"Ġgrizz":32003,"294":32004,"Ġillustrious":32005,"Ġtransact":32006,"Ġspoiler":32007,"ĠWORK":32008,"Road":32009,"Ġblackout":32010,"Ġencomp":32011,"proven":32012,"ĠFriendship":32013,"Ġentrances":32014,"Ġprofessions":32015,"Ġinsin":32016,"Ġrecorder":32017,"Ġformulation":32018,"govern":32019,"Ġpainfully":32020,"ĠRepe":32021,"eeds":32022,"cru":32023,"ĠDir":32024,"Ġtriumphant":32025,"Ġignition":32026,"xy":32027,"Ġintrusion":32028,"ĠEAR":32029,"RES":32030,"Ġration":32031,"ĠTaken":32032,"Ġcages":32033,"Ġpeg":32034,"Ġcommem":32035,"680":32036,"ĠRite":32037,"Ġfolder":32038,"Ġvertically":32039,"Ġcheeks":32040,"pick":32041,"Ġcrispy":32042,"Ġsqueezing":32043,"ĠBene":32044,"ĠTrailer":32045,"ĠKM":32046,"acceptable":32047,"ĠSetting":32048,"Ġsupernatural":32049,"ĠEz":32050,"Ġvenom":32051,"ĠFrey":32052,"Ġpulp":32053,"Had":32054,"centered":32055,"metics":32056,"Kent":32057,"ĠDOI":32058,"kr":32059,"ĠWHEN":32060,"Ġtakeoff":32061,"isf":32062,"uko":32063,"Ġquasi":32064,"Ġveggies":32065,"Ġpesticide":32066,"Ġstimulating":32067,"Ġacknowledgement":32068,"Ġattained":32069,"ĠBackground":32070,"281":32071,"317":32072,"ĠTrees":32073,"Ġdetractors":32074,"Ġannouncer":32075,"Ġjoyful":32076,"ĠElf":32077,"istration":32078,"phi":32079,"Ġprogressively":32080,"mini":32081,"Ġcontraception":32082,"asca":32083,"ishops":32084,"Ġmisunderstood":32085,"Ġinitiating":32086,"ĠConversely":32087,"338":32088,"080":32089,"idation":32090,"ĠGoes":32091,"Ġimprov":32092,"Ġswapping":32093,"Vict":32094,"Ġdevoid":32095,"fighter":32096,"ĠMori":32097,"Ġvoy":32098,"ĠElev":32099,"ĠAim":32100,"Ġtrustworthy":32101,"Leg":32102,"675":32103,"ĠPossible":32104,"Crunch":32105,"ĠRings":32106,"Ġphony":32107,"Ġbladder":32108,"ĠChall":32109,"Spot":32110,"oak":32111,"Was":32112,"ĠFAM":32113,"ĠAGA":32114,"ĠFifa":32115,"Ġenclosed":32116,"Ġanthrop":32117,"faith":32118,"ĠAux":32119,"Ġgracious":32120,"roller":32121,"Ġdowntime":32122,"swing":32123,"Ġcamouflage":32124,"ĠCosts":32125,"Ġliv":32126,"ricular":32127,"ĠUran":32128,"Ġdisapproval":32129,"Ġpropriet":32130,"bits":32131,"Ġmafia":32132,"ĠSCHOOL":32133,"ĠPrepar":32134,"button":32135,"Almost":32136,"Ġpastoral":32137,"ĠDove":32138,"Hol":32139,"Ġimposes":32140,"ĠDram":32141,"lys":32142,"ĠSAS":32143,"Ġwiring":32144,"271":32145,"ĠModels":32146,"Ġoutpost":32147,"etics":32148,"Ġinsulted":32149,"ĠMongolia":32150,"Ġoverth":32151,"Haw":32152,"ĠHomer":32153,"itta":32154,"raining":32155,"Ġevidently":32156,"raphic":32157,"impact":32158,"Ġfranch":32159,"Ġ2100":32160,"Ġapproximate":32161,"Ġcartoons":32162,"Ġbackups":32163,"umbing":32164,"Ġforceful":32165,"ĠShad":32166,"Ġsurges":32167,"Ġperf":32168,"Ġdele":32169,"Ġquieter":32170,"ĠHorowitz":32171,"ĠDX":32172,"anners":32173,"ĠNinja":32174,"ĠScript":32175,"ĠElise":32176,"collect":32177,"Ġgrading":32178,"ĠBethesda":32179,"Kids":32180,"ĠTelephone":32181,"Ġpreferring":32182,"Ġreconcil":32183,"Ġmango":32184,"ĠHail":32185,"ĠCitizenship":32186,"Master":32187,"cular":32188,"Ġstuffing":32189,"ĠAlive":32190,"ALLY":32191,"Ġchi":32192,"ĠDynam":32193,"ĠRosenthal":32194,"Ġpurity":32195,"Ġtemp":32196,"ĠHAL":32197,"employ":32198,"Ġplentiful":32199,"ĠComed":32200,"Ġstacks":32201,"ĠHuge":32202,"ĠOlder":32203,"Ġsclerosis":32204,"ONY":32205,"Ġfilmmaking":32206,"chance":32207,"Cry":32208,"Ġworkflow":32209,"ĠPersonnel":32210,"awed":32211,"ĠColumn":32212,"Ġuncomp":32213,"Ġdiscriminated":32214,"Ġpts":32215,"Ġallev":32216,"ĠKinn":32217,"meal":32218,"Ġnovice":32219,"Ġcrest":32220,"Ġhearty":32221,"Ġlowers":32222,"inqu":32223,"ĠPlayoffs":32224,"ĠHyp":32225,"Ġautos":32226,"Ġindec":32227,"Ġnighttime":32228,"Ġreflex":32229,"306":32230,"disciplinary":32231,"ophe":32232,"contact":32233,"Ġachievable":32234,"Ġslab":32235,"ĠMessage":32236,"ĠVMware":32237,"ĠDia":32238,"REG":32239,"Ġconfisc":32240,"ĠMechan":32241,"Ġphenomena":32242,"Ġsequencing":32243,"Ġshaming":32244,"Ġcompilation":32245,"ĠAges":32246,"Ġmastered":32247,"Ġagony":32248,"Ġrestrain":32249,"ĠLyme":32250,"Which":32251,"ĠBarney":32252,"ĠConcept":32253,"Ġsuperheroes":32254,"ĠPsychology":32255,"Ġreminis":32256,"violence":32257,"Lead":32258,"Da":32259,"VEN":32260,"ERC":32261,"ĠVoter":32262,"Ġbetray":32263,"Ġsavage":32264,"driver":32265,"IFT":32266,"Chain":32267,"angler":32268,"'-":32269,"lain":32270,"ĠRatt":32271,"bis":32272,"iverse":32273,"Ġdensely":32274,"Ġuncom":32275,"Ġunsuspecting":32276,"Ġstimulation":32277,"diff":32278,"Ġskins":32279,"ĠRiding":32280,"ategic":32281,"ĠUnderstand":32282,"occup":32283,"ĠCooking":32284,"Ġschizophrenia":32285,"ĠKoen":32286,"Ġcomrades":32287,"HY":32288,"Ġfab":32289,"ĠRowling":32290,"Allen":32291,"ĠJUL":32292,"Ġembryos":32293,"UU":32294,"ĠCAT":32295,"Ġtidy":32296,"finger":32297,"ĠCake":32298,"Ġrightfully":32299,"religious":32300,"Ġ407":32301,"Gal":32302,"408":32303,"Ġgrievance":32304,"Ġswallowed":32305,"251":32306,"283":32307,"ĠBarcl":32308,"opter":32309,"Ġpedoph":32310,"Ġcured":32311,"Ġestablishes":32312,"increasing":32313,"tics":32314,"articles":32315,"Ġunethical":32316,"authored":32317,"Ġanchors":32318,"ĠContra":32319,"Ġventured":32320,"ĠCoh":32321,"Ġpuff":32322,"heddar":32323,"Ġomission":32324,"Ġdich":32325,"ceed":32326,"Ġscares":32327,"Ġdoctoral":32328,"293":32329,"ĠUnt":32330,"Ġdop":32331,"ĠInjury":32332,"ificantly":32333,"ĠRift":32334,"ĠOrders":32335,"Ġmobilize":32336,"particularly":32337,"Ġchilled":32338,"Reports":32339,"redibly":32340,"ĠGuru":32341,"Ġvalleys":32342,"Ġtextures":32343,"Ġreuse":32344,"roit":32345,"unts":32346,"Ġirreversible":32347,"Ġwarships":32348,"Ġpus":32349,"Ġpeeled":32350,"Ġthirst":32351,"Ġgrapple":32352,"busters":32353,"Ġnort":32354,"ĠDates":32355,"Safe":32356,"Ġbirthplace":32357,"hemoth":32358,"Ġvile":32359,"Ġ306":32360,"Ram":32361,"activated":32362,"ĠAero":32363,"Ġbutcher":32364,"ĠKnock":32365,"Ġdisturb":32366,"Ġtotality":32367,"tted":32368,"Ġlegit":32369,"cking":32370,"nikov":32371,"Ġfavoring":32372,"lang":32373,"Ġrightful":32374,"orum":32375,"!!!!":32376,"ĠMinute":32377,"Ġpostings":32378,"Java":32379,"510":32380,"Ġmicrobes":32381,"Ġsixteen":32382,"entimes":32383,"Ġbulb":32384,"Ġgoalt":32385,"Ġhumiliated":32386,"ansom":32387,"roach":32388,"Ġgrouping":32389,"hari":32390,"Ġcler":32391,"Ġstared":32392,"ĠSymptoms":32393,"Ġbasil":32394,"Whenever":32395,"ĠWhoever":32396,"Oil":32397,"ĠJericho":32398,"ĠAlm":32399,"Pol":32400,"Hur":32401,"Ġupro":32402,"ĠSpo":32403,"hammer":32404,"Mur":32405,"ĠTorch":32406,"Ġfrequencies":32407,"ĠExpansion":32408,"Ġparalysis":32409,"igon":32410,"ĠSail":32411,"Ġsilently":32412,"Ġrevolver":32413,"Ġstockpile":32414,"Ġpessimistic":32415,"ESA":32416,"Ġdisclaim":32417,"Ġdemocracies":32418,"ĠTales":32419,"ĠAngry":32420,"ĠWhitman":32421,"ĠOri":32422,"Ġtransitioned":32423,"behind":32424,"ĠLAN":32425,"Ġcav":32426,"ĠJazeera":32427,"KC":32428,"ĠInspect":32429,"irty":32430,"ĠAin":32431,"ĠOrig":32432,"Ġobscene":32433,"Ġdormant":32434,"Ġharb":32435,"ĠWiz":32436,"ĠAdolf":32437,"Ġvic":32438,"Ġdenouncing":32439,"Ġye":32440,"aques":32441,"Ġomn":32442,"Ġassemblies":32443,"nosis":32444,"Ġadmon":32445,"Ġanguish":32446,"Ġvag":32447,"YE":32448,"ĠMacro":32449,"Ġrubbing":32450,"Ġreplicated":32451,"Moon":32452,"ĠGuitar":32453,"Ġcentimeters":32454,"amily":32455,"ĠAmes":32456,"Ġchlorine":32457,"Perhaps":32458,"Ġpartisans":32459,"soc":32460,"Ġvagina":32461,"Ġtrove":32462,"ĠYES":32463,"Ġtherapists":32464,"Ġnods":32465,"Ġhanged":32466,"Ġridge":32467,"Ġhaz":32468,"ĠmacOS":32469,"Ġske":32470,"ĠShia":32471,"Ġsteril":32472,"Ġalmond":32473,"ĠRockefeller":32474,"Ġintrinsic":32475,"Certainly":32476,"Ġsublime":32477,"Earn":32478,"abet":32479,"Ġframeworks":32480,"ogical":32481,"ilst":32482,"ipal":32483,"Ġrescuing":32484,"ĠWatergate":32485,"Ġ231":32486,"ĠNano":32487,"ighthouse":32488,"olph":32489,"Ġ312":32490,"Ġhealed":32491,"ĠTomb":32492,"Ġsubst":32493,"Ġsulph":32494,"ĠNewsp":32495,"ĠLama":32496,"venue":32497,"387":32498,"productive":32499,"ĠNEED":32500,"minus":32501,"ĠPages":32502,"cand":32503,"ĠClover":32504,"ĠForensic":32505,"ryn":32506,"ogle":32507,"ocr":32508,"Ġvaccinations":32509,"cies":32510,"ĠMek":32511,"Ġunaffected":32512,"Ġfetal":32513,"ĠDino":32514,"Ġhemisphere":32515,"Ġfroze":32516,"ĠPeg":32517,"Ġmicroscope":32518,"Ġmoderates":32519,"ĠGEN":32520,"ĠHawai":32521,"Ġstagn":32522,"Absolutely":32523,"practice":32524,"IBLE":32525,"cture":32526,"ĠAshe":32527,"Ġcondoms":32528,"Ġpoked":32529,"training":32530,"Ġintermedi":32531,"347":32532,"Ġcardinal":32533,"ĠSpoon":32534,"Ġsupp":32535,"Ġpreviews":32536,"Service":32537,"ĠBeam":32538,"Ġtranscend":32539,"Fresh":32540,"Sure":32541,"Ġ4000":32542,"idential":32543,"ĠCoinbase":32544,"Ġworkings":32545,"ĠPI":32546,"Ġpassionately":32547,"Ġdecisively":32548,"ĠInspection":32549,"Ġinvoke":32550,"Ġstain":32551,"Ġcleaners":32552,"Ġregulates":32553,"Ġshone":32554,"ĠEVERY":32555,"istance":32556,"map":32557,"Ġredu":32558,"Ġoccupies":32559,"Ġprocure":32560,"acket":32561,"roman":32562,"Ġilleg":32563,"Ġleaps":32564,"yond":32565,"Ġyarn":32566,"ĠLTD":32567,"ĠCONTR":32568,"ĠRestoration":32569,"ĠCDs":32570,"Ġdrinkers":32571,"ĠJordanian":32572,"Ġabl":32573,"Ġdisparate":32574,"Ġprimed":32575,"ĠFirearms":32576,"artz":32577,"Ġindispensable":32578,"Ter":32579,"Ġfright":32580,"Ġmarkedly":32581,"Ġroam":32582,"ĠJurassic":32583,"Ġfeder":32584,"Ġpepp":32585,"ĠDV":32586,"Ġpancakes":32587,"sweet":32588,"Ġunmatched":32589,"Ġassembling":32590,"Ultimately":32591,"Ġendeavour":32592,"Ġluckily":32593,"Ġbitch":32594,"Ġelegance":32595,"eers":32596,"drop":32597,"credit":32598,"Ġscourge":32599,"ĠMinimum":32600,"Ġimpatient":32601,"Ġhunted":32602,"ĠGoddard":32603,"Kal":32604,"Ġmined":32605,"Ġcalves":32606,"Ġ234":32607,"Ġplank":32608,"Ġinjecting":32609,"ĠKaufman":32610,"ĠCompliance":32611,"tone":32612,"Ġ345":32613,"Ġdazz":32614,"ĠClarks":32615,"Ġcomprehens":32616,"Ġpist":32617,"Ġrhythms":32618,"Ġreserv":32619,"337":32620,"ĠIDF":32621,"Ġshouts":32622,"midt":32623,"323":32624,"Ġsoothing":32625,"Ġadministr":32626,"Ġgloomy":32627,"Ġfutile":32628,"ĠProhibition":32629,"upon":32630,"ĠAnglic":32631,"seeking":32632,"Ġdodge":32633,"Ds":32634,"ĠGrants":32635,"editor":32636,"ĠInquis":32637,"Ġ1929":32638,"decl":32639,"ĠPorts":32640,"ĠCure":32641,"ĠDPRK":32642,"oct":32643,"Ġvocabulary":32644,"Ġcling":32645,"298":32646,"Ġpeac":32647,"Ġantibodies":32648,"dor":32649,"ĠWorse":32650,"Ġsmelled":32651,"Ġleash":32652,"MED":32653,"Ġdisinteg":32654,"Ġtruthful":32655,"Ġsalesman":32656,"Ġsquares":32657,"susp":32658,"Ġcraving":32659,"Ġwizard":32660,"moral":32661,"ĠQué":32662,"Anything":32663,"Ġfalsehood":32664,"ARI":32665,"Ġcoworkers":32666,"Ġthy":32667,"outher":32668,"Ġbrushing":32669,"ĠProtest":32670,"ĠMF":32671,"abba":32672,"lead":32673,"ĠExhibit":32674,"Ga":32675,"ĠFranks":32676,"Ġdictates":32677,"illegal":32678,"Ġrelayed":32679,"Ġploy":32680,"ĠاÙĦ":32681,"ĠDocuments":32682,"Ġtint":32683,"ĠYuan":32684,"Ġdepended":32685,"Mir":32686,"ĠIntrodu":32687,"Ġrecourse":32688,"oqu":32689,"ĠTED":32690,"Ġdifferentiated":32691,"ĠWalls":32692,"Ġsentimental":32693,"Ġantis":32694,"retion":32695,"comes":32696,"ĠWORLD":32697,"Ġcoax":32698,"ĠTatt":32699,"ĠGingrich":32700,"2006":32701,"ĠBrut":32702,"Second":32703,"posed":32704,"shots":32705,"Ġ313":32706,"idian":32707,"alking":32708,"Ġdens":32709,"Ġgif":32710,"akings":32711,"Ġkeywords":32712,"Ġchast":32713,"Ġadversary":32714,"Ġnick":32715,"iasis":32716,"ĠLegisl":32717,"Ġcoff":32718,"ĠOriental":32719,"ĠMorg":32720,"ĠHAR":32721,"Ġlegalizing":32722,"Ġbanter":32723,"ĠTart":32724,"ĠTRI":32725,"Ġantagon":32726,"ĠGF":32727,"oler":32728,"ĠUFO":32729,"Therefore":32730,"ĠOsama":32731,"ĠStructure":32732,"apps":32733,"Ġpee":32734,"ĠSomehow":32735,"ĠOverwatch":32736,"ĠCasual":32737,"Ġdishon":32738,"SEE":32739,"ctive":32740,"andering":32741,"ĠTransformation":32742,"Andy":32743,"ĠFever":32744,"Ġspectator":32745,"Ġlash":32746,"Ġprotector":32747,"apy":32748,"Ġexhilar":32749,"aroo":32750,"Ġmamm":32751,"Ġbystand":32752,"acky":32753,"Ġdigestive":32754,"Ġamplified":32755,"Ġalpha":32756,"continue":32757,"Low":32758,"Ġdisgusted":32759,"356":32760,"script":32761,"Ġgenerational":32762,"ĠPassenger":32763,"sight":32764,"Ġcout":32765,"Ġhone":32766,"ulse":32767,"Ġignite":32768,"284":32769,"gow":32770,"Ġbinary":32771,"Ġincess":32772,"Review":32773,"607":32774,"ĠSurprise":32775,"Ġirritation":32776,"ĠBarth":32777,"ĠGum":32778,"Ġvideot":32779,"ĠFres":32780,"asons":32781,"Ġcollaborator":32782,"fal":32783,"ĠGon":32784,"Ġsettles":32785,"regular":32786,"Ġmiscarriage":32787,"cube":32788,"Ġsubord":32789,"ĠRegistered":32790,"Ġnotions":32791,"zzy":32792,"Ġrevert":32793,"OFF":32794,"Ġhasht":32795,"ĠPNG":32796,"Ġunimaginable":32797,"builders":32798,"Taylor":32799,"ĠPAY":32800,"Ġ).":32801,"Ġ238":32802,"ĠLAST":32803,"MAS":32804,"Ġillustrations":32805,"Ġparody":32806,"Ġdispersed":32807,"ĠRoses":32808,"Ġestimation":32809,"ĠGets":32810,"Patrick":32811,"CHA":32812,"Ġmisdem":32813,"agate":32814,"alter":32815,"Ġgeo":32816,"Ġenormously":32817,"Ġarrogance":32818,"Ġpert":32819,"Ġmeta":32820,"ĠJuno":32821,"iov":32822,"imov":32823,"Ġchores":32824,"acan":32825,"Paris":32826,"313":32827,"Lewis":32828,"Ġwillingly":32829,"ERA":32830,"Ġencaps":32831,"ilk":32832,"Ġnodes":32833,"Ġenzyme":32834,"want":32835,"Ġtolerant":32836,"Ġcondos":32837,"Ġasserts":32838,"Ġcanon":32839,"Ġscanned":32840,"bishop":32841,"Ġperched":32842,"util":32843,"ĠBonus":32844,"create":32845,"ĠFuk":32846,"Ġmotif":32847,"Ġcontemplate":32848,"ĠBEN":32849,"imir":32850,"Ġacadem":32851,"uvian":32852,"ĠIdeas":32853,"ĠCY":32854,"Ġants":32855,"Ġprostitutes":32856,"2005":32857,"Spring":32858,"ĠBarrel":32859,"ĠAunt":32860,"ĠLudwig":32861,"ĠHerm":32862,"PRO":32863,"obiles":32864,"rack":32865,"STER":32866,"ucket":32867,"Ġmun":32868,"Ġ419":32869,"ICES":32870,"Ġcardio":32871,"Ġtrenches":32872,"Nation":32873,"yahoo":32874,"Ġburd":32875,"Ġnost":32876,"Ġappropriations":32877,"ĠChili":32878,"Josh":32879,"GW":32880,"Ġoppressed":32881,"ĠBEFORE":32882,"Ġmurderous":32883,"Pen":32884,"achable":32885,"Ġrive":32886,"Ġculmin":32887,"Ġdefin":32888,"ĠMord":32889,"idate":32890,"ĠChim":32891,"ource":32892,"ĠElectro":32893,"orthy":32894,"Ġcalendars":32895,"regation":32896,"Ġretrospect":32897,"ĠTribal":32898,"ĠHes":32899,"Ġcran":32900,"Ġcreditor":32901,"Ġfibers":32902,"note":32903,"idays":32904,"ĠSebast":32905,"ĠKitty":32906,"Ġplainly":32907,"ĠLAPD":32908,"Ġtrumpet":32909,"ĠAppropriations":32910,"Hill":32911,"ĠVeget":32912,"296":32913,"lated":32914,"othes":32915,"ibrarian":32916,"Listen":32917,"nex":32918,"WHO":32919,"Ġshampoo":32920,"Ġclaimants":32921,"Ġisol":32922,"Ġunchecked":32923,"Ġmov":32924,"umo":32925,"ĠLens":32926,"Ġdiscreet":32927,"Ġrespectfully":32928,"Ġreclaimed":32929,"ĠHatt":32930,"thus":32931,"ĠFlo":32932,"Ġsumm":32933,"phas":32934,"ĠHaitian":32935,"Ġstrife":32936,"Ġabound":32937,"verted":32938,"Ġpatronage":32939,"449":32940,"Ġprelim":32941,"ĠZhu":32942,"ĠRevel":32943,"adic":32944,"Ġminded":32945,"ĠStability":32946,"Ġresembling":32947,"Ġvending":32948,"ischer":32949,"Ġkisses":32950,"Ġsuperiority":32951,"Ġinfinite":32952,"ISC":32953,"880":32954,"Ġappease":32955,"VO":32956,"404":32957,"ECH":32958,"gam":32959,"River":32960,"metal":32961,"determination":32962,"Cook":32963,"Ġbuds":32964,"Ġ(%)":32965,"ĠCreated":32966,"Ġstrut":32967,"Ġ425":32968,"Ġverte":32969,"ĠOrb":32970,"Ġweaving":32971,"261":32972,"Ġflyers":32973,"spons":32974,"ĠCovenant":32975,"570":32976,"Ġintangible":32977,"ĠBJ":32978,"ĠStead":32979,"ĠBrune":32980,"pain":32981,"independent":32982,"Ball":32983,"witch":32984,"ĠIon":32985,"Ġpupp":32986,"Cash":32987,"ĠConvert":32988,"Ġimpede":32989,"broad":32990,"onew":32991,"Ġsynergy":32992,"Ġcoined":32993,"620":32994,"ivalent":32995,"ĠInfect":32996,"ĠAqua":32997,"Together":32998,"ĠChemistry":32999,"ĠURL":33000,"ampion":33001,"Ġdeclarations":33002,"Ġaffirmative":33003,"umper":33004,"ĠTarant":33005,"Ġstereotype":33006,"Ġbookstore":33007,"incre":33008,"Ġchipset":33009,"Ġangst":33010,"Jose":33011,"laus":33012,"Ġheater":33013,"ipers":33014,"Ġeminent":33015,"hook":33016,"sticks":33017,"ĠCoul":33018,"Ġmildly":33019,"SG":33020,"Ġworm":33021,"Ġdisable":33022,"Ġperfume":33023,"ISTER":33024,"Ġgathers":33025,"ĠLotus":33026,"hyp":33027,"actus":33028,"Ġdistinctly":33029,"fifth":33030,"!),":33031,"ĠCrunch":33032,"Ġcohesive":33033,"Ġfortunately":33034,"Ġninety":33035,"Ġcartels":33036,"empl":33037,"Direct":33038,"Ġcommuting":33039,"ĠSX":33040,"ractive":33041,"Ġtranslating":33042,"ĠAQ":33043,"Ġslay":33044,"abuse":33045,"ĠProc":33046,"ĠCantor":33047,"ĠTas":33048,"Sir":33049,"Thom":33050,"ĠCHRIST":33051,"Ġreceptive":33052,"ĠCornel":33053,"Arab":33054,"Ġgrammar":33055,"Ġhandlers":33056,"Ġalloy":33057,"Ġthinly":33058,"adem":33059,"Ġproponent":33060,"ĠPVC":33061,"Ġstump":33062,"tom":33063,"rets":33064,"iciency":33065,"780":33066,"Ġ311":33067,"ĠClapper":33068,"ITAL":33069,"Ùħ":33070,"Ġnarrator":33071,"Ġblond":33072,"Ġintermittent":33073,"Ġcollabor":33074,"646":33075,"Ġmetast":33076,"Ġregeneration":33077,"ĠLegendary":33078,"Ġgenitals":33079,"Ġbartender":33080,"atson":33081,"Okay":33082,"Ġpassages":33083,"Ġsubstituted":33084,"orr":33085,"ALTH":33086,"Ġartic":33087,"Ġascent":33088,"Ġmatured":33089,"Ġterminology":33090,"served":33091,"ĠDeliver":33092,"Ġattic":33093,"anges":33094,"Ġrenaissance":33095,"Ġbleed":33096,"claimer":33097,"onse":33098,"Sec":33099,"Ġparticle":33100,"aneous":33101,"ateur":33102,"Ġzeal":33103,"ĠPets":33104,"Working":33105,"ĠRespect":33106,"Ġsermon":33107,"ĠProvided":33108,"Ġfilibuster":33109,"Ġabolished":33110,"reviewed":33111,"cription":33112,"Ġrevers":33113,"atered":33114,"435":33115,"Ġwhe":33116,"ometown":33117,"UFC":33118,"products":33119,"Winter":33120,"Ġ304":33121,"Ġsporadic":33122,"orough":33123,"EB":33124,"ĠAgric":33125,"ĠMTA":33126,"wic":33127,"Ġpowerless":33128,"Ġcarrot":33129,"ww":33130,"Ġabsorption":33131,"ĠTyphoon":33132,"Turkey":33133,"Ġproclaim":33134,"Ġhikers":33135,"Ġpractise":33136,"/$":33137,"Ġfingertips":33138,"Ġbaff":33139,"vu":33140,"Ġans":33141,"plug":33142,"Ġacquaintance":33143,"itement":33144,"ihar":33145,"Ġreluctantly":33146,"Ġforc":33147,"Ġguarant":33148,"ĠWanted":33149,"Walk":33150,"addle":33151,"unders":33152,"Fred":33153,"Ġtides":33154,"ĠBai":33155,"Ġcountering":33156,"raper":33157,"ursions":33158,"ĠFlav":33159,"pared":33160,"raised":33161,"Ñı":33162,"ĠDiff":33163,"Ġreload":33164,"ourses":33165,"ĠBurning":33166,"Ġwand":33167,"Ġledger":33168,"Ġcoughing":33169,"ĠLoren":33170,"Nazis":33171,"Ġcompile":33172,"Eight":33173,"icultural":33174,"yy":33175,"Ġ1932":33176,"Run":33177,"AIN":33178,"Ġattractiveness":33179,"ĠOmn":33180,"Ġconfer":33181,"compliance":33182,"Ġembed":33183,"Steven":33184,"2001":33185,"Ġdecre":33186,"Ġprompts":33187,"ĠHare":33188,"Ġleaping":33189,"Ġslaughtered":33190,"Ġforfeiture":33191,"342":33192,"Charl":33193,"CDC":33194,"ographically":33195,"Ġduplicate":33196,"Ġdistracting":33197,"examination":33198,"Ġpeas":33199,"Ġcatchy":33200,"Ġdives":33201,"ĠAda":33202,"Hay":33203,"Ġenthusiastically":33204,"Ġfunky":33205,"kay":33206,"EVA":33207,"Ġpsychologists":33208,"Ġancestry":33209,"iyah":33210,"ifter":33211,"nob":33212,"518":33213,"rouse":33214,"Ġchord":33215,"Ġcone":33216,"Ġbarracks":33217,"ĠRoyale":33218,"ĠIntegration":33219,"Ġtrolling":33220,"ĠSynt":33221,"andals":33222,"ĠGrain":33223,"ĠNeck":33224,"618":33225,"Ġrapist":33226,"pins":33227,"Ġwitty":33228,"Ġdehydration":33229,"arlane":33230,"Ġimmoral":33231,"Ġaccum":33232,"ĠMcAuliffe":33233,"slow":33234,"Ġinjust":33235,"Ġ1700":33236,"Ġcarbs":33237,"Ġintel":33238,"Non":33239,"isks":33240,"Tre":33241,"Ġinterviewer":33242,"sam":33243,"Ġdelve":33244,"Ġadmirable":33245,"ĠROM":33246,"ĠHispanics":33247,"Ġimpart":33248,"Ġunderrated":33249,"Ġvictimized":33250,"ĠPsych":33251,"ppings":33252,"Ġ610":33253,"pole":33254,"Ġdiner":33255,"ĠScale":33256,"Ġunforeseen":33257,"surprisingly":33258,"opus":33259,"ĠCOURT":33260,"Ġjuggling":33261,"ĠFacilities":33262,"Aid":33263,"ĠHPV":33264,"Ġcrawling":33265,"flu":33266,"etary":33267,"ĠHarriet":33268,"329":33269,"ĠSod":33270,"ĠBiological":33271,"birth":33272,"ribed":33273,"Ġpulses":33274,"396":33275,"eways":33276,"ĠAlma":33277,"nov":33278,"015":33279,"ricane":33280,"agna":33281,"Ak":33282,"ĠClaim":33283,"Ġpref":33284,"Ġinterfaces":33285,"ĠADHD":33286,"604":33287,"ZE":33288,"venture":33289,"Ġascend":33290,"ĠGou":33291,"Ġpriceless":33292,"redo":33293,"kw":33294,"Conf":33295,"Ġmah":33296,"Ġpoets":33297,"Ġstalk":33298,"Ġencamp":33299,"Ġhopped":33300,"Ġmelody":33301,"JECT":33302,"eming":33303,"Ġbewild":33304,"aternal":33305,"uchs":33306,"dit":33307,"ĠTransmission":33308,"Lake":33309,"Ġatoms":33310,"ĠThoughts":33311,"ilts":33312,"volume":33313,"Ġsocioeconomic":33314,"atisf":33315,"Ġnarr":33316,"zinski":33317,"ymes":33318,"episode":33319,"Ġinherit":33320,"Ġintending":33321,"Ġarenas":33322,"uras":33323,"burning":33324,"334":33325,"teenth":33326,"Ġsophistication":33327,"Ġscreenshots":33328,"Ġautistic":33329,"lip":33330,"paper":33331,"Ġmonopol":33332,"799":33333,"forms":33334,"ocrats":33335,"Ġpineapple":33336,"Ġbegs":33337,"Ġpersecuted":33338,"Ġsubscribed":33339,"Ġelic":33340,"ĠPRESIDENT":33341,"297":33342,"Ġpreferential":33343,"Ġpyramid":33344,"Ġconvergence":33345,"Ġwob":33346,"Project":33347,"ĠAluminum":33348,"ĠJPM":33349,"ĠBAT":33350,"Ġdolphins":33351,"018":33352,"healthy":33353,"ĠCG":33354,"ĠEffective":33355,"worm":33356,"ĠEas":33357,"olicited":33358,"ĠUSE":33359,"ĠCaval":33360,"Ġswirl":33361,"Ġspaghetti":33362,"Ġinward":33363,"Republican":33364,"Ġpublicized":33365,"Ġeconomical":33366,"Ġsalsa":33367,"ĠTitanic":33368,"dot":33369,"Ġcontro":33370,"ĠBangl":33371,"iban":33372,"ĠKlux":33373,"Ġhinges":33374,"610":33375,"Ġvalves":33376,"profits":33377,"Wonder":33378,"Ġorient":33379,"Ġsque":33380,"Ġprivatization":33381,"Obama":33382,"Thousands":33383,"ĠTasman":33384,"Ġmaze":33385,"eem":33386,"Ġsurvives":33387,"istant":33388,"Ġenriched":33389,"Ġencl":33390,"Ġcompliments":33391,"ĠShoes":33392,"Ġinsanity":33393,"consider":33394,"agog":33395,"Ġbaffled":33396,"Ġ°":33397,"ĠWordPress":33398,"qus":33399,"usual":33400,"stall":33401,"Deb":33402,"ĠRothschild":33403,"Ġesche":33404,"Ġsoph":33405,"Ġambiguous":33406,"negative":33407,"Ġdiscouraging":33408,"Alexander":33409,"319":33410,"Ġsummon":33411,"ipation":33412,"000000":33413,"Ġminimalist":33414,"Ġenraged":33415,"777":33416,"Ġplanetary":33417,"Ġthroughput":33418,"Ġtemperament":33419,"ĠNIC":33420,"ileged":33421,"minster":33422,"ĠPLEASE":33423,"Ġexagger":33424,"ĠDescription":33425,"Ġagitated":33426,"Ġimmortal":33427,"Ġrenders":33428,"Ġcharisma":33429,"sequ":33430,"Ġmajorities":33431,"Ġfreaking":33432,"ĠAdvice":33433,"Ġembodies":33434,"stable":33435,"Ġcustomization":33436,"started":33437,"ĠAutism":33438,"Ġparticipates":33439,"ĠUTC":33440,"Marco":33441,"Ġoddly":33442,"Ġantiqu":33443,"ĠPear":33444,"ĠFey":33445,"Ġcertify":33446,"Ġdisillusion":33447,"ĠPhysicians":33448,"obl":33449,"855":33450,"Ġelim":33451,"Ġ335":33452,"Ol":33453,"ĠSear":33454,"Ġnuances":33455,"past":33456,"Sa":33457,"ĠSlov":33458,"Ġfiltered":33459,"Ġanalogy":33460,"Ġformulate":33461,"Ġarmies":33462,"Ġpuls":33463,"fters":33464,"ilipp":33465,"ĠHOT":33466,"485":33467,"ĠAfghans":33468,"Ġtopical":33469,"ĠBunny":33470,"seeing":33471,"Ġeloqu":33472,"Ġkidneys":33473,"ĠDEM":33474,"pent":33475,"Ġhus":33476,"stores":33477,"ĠProtestant":33478,"Comm":33479,"label":33480,"Kings":33481,"ĠPurpose":33482,"â̦..":33483,"Ġaccumulating":33484,"calling":33485,"Ġgiveaways":33486,"Ġpredicament":33487,"Ġtyp":33488,"Ġtraveler":33489,"003":33490,"impro":33491,"fac":33492,"Ġmapped":33493,"itious":33494,"Ġmasculinity":33495,"Ġtantal":33496,"ĠDJs":33497,"Ġviewpoints":33498,"Burn":33499,"ĠWii":33500,"pak":33501,"ĠEB":33502,"Ġhinge":33503,"Ġfacets":33504,"Ġphotographic":33505,"Ġcompiling":33506,"Ġdecks":33507,"Ġarticulated":33508,"Federal":33509,"crim":33510,"llah":33511,"Ġfiasco":33512,"ĠLIST":33513,"oute":33514,"ĠDraper":33515,"ĠLaos":33516,"Ġclimbers":33517,"raph":33518,"ĠDek":33519,"WAY":33520,"Ġgreets":33521,"Ġoppressive":33522,"otor":33523,"otiation":33524,"\":[":33525,"Record":33526,"mining":33527,"Town":33528,"Ġfavorably":33529,"ĠYoutube":33530,"William":33531,"Ġlan":33532,"â̲":33533,"ĠSpec":33534,"Ġtranquil":33535,"ĠClient":33536,"oln":33537,"celona":33538,"Ġrealistically":33539,"Ġmisplaced":33540,"ĠBie":33541,"bye":33542,"Yo":33543,"465":33544,"ĠMadagascar":33545,"oplan":33546,"arist":33547,"Ġconfines":33548,"Ġï":33549,"awks":33550,"Ġpiracy":33551,"Ġunwelcome":33552,"Intel":33553,"Ġparanoid":33554,"CLAIM":33555,"Ġblush":33556,"united":33557,"Ġmotivational":33558,"ĠVII":33559,"Ġdiabetic":33560,"Ġantiv":33561,"Ġdissect":33562,"Ġbestselling":33563,"Ġfluffy":33564,"ĠRemote":33565,"Ġvert":33566,"Correct":33567,"Ġcolossal":33568,"Ġcontrasts":33569,"Ġcirca":33570,"ĠDamage":33571,"Ġunrel":33572,"Ġdiscrepancy":33573,"ĠCIS":33574,"ĠCLASS":33575,"ilty":33576,"Ġsynopsis":33577,"emed":33578,"cakes":33579,"ibal":33580,"inea":33581,"ienced":33582,"Ġimplicit":33583,"ĠLOOK":33584,"Ġsilhouette":33585,"affiliated":33586,"ĠHalo":33587,"377":33588,"Ġlyr":33589,"ĠVide":33590,"herent":33591,"Ġbadges":33592,"plays":33593,"orea":33594,"Ġjammed":33595,"cancer":33596,"ĠYep":33597,"racted":33598,"ĠDisability":33599,"Ġfooth":33600,"friends":33601,"Ġbloated":33602,"Bet":33603,"ĠAntioch":33604,"Ġintrodu":33605,"Ġannexed":33606,"ivism":33607,"ĠFlickr":33608,"pants":33609,"Ġinterruption":33610,"645":33611,"ĠIly":33612,"ĠOss":33613,"ĠAMA":33614,"Ġpolitely":33615,"Ġnatives":33616,"Ġrushes":33617,"enges":33618,"ĠHarm":33619,"Ġdestroyer":33620,"ĠEstimates":33621,"Ġtransforms":33622,"Ġinvariably":33623,"Ġcac":33624,"iency":33625,"599":33626,"Ġconstitutionally":33627,"Ġrappers":33628,"ĠSettlement":33629,"icz":33630,"Ġhardened":33631,"citizens":33632,"Ġcircling":33633,"Ġtrapping":33634,"Ġguaranteeing":33635,"690":33636,"agher":33637,"Ġarcade":33638,"Ġfanc":33639,"Ġslapping":33640,"OPS":33641,"Ġmasse":33642,"Ġpudding":33643,"Jac":33644,"ĠGraphics":33645,"Ġuptake":33646,"?,":33647,"Fair":33648,"ĠSatan":33649,"uffy":33650,"ĠGuatem":33651,"ĠTransaction":33652,"Ġunlocking":33653,"ĠLINE":33654,"Ġapprehens":33655,"Ġglean":33656,"291":33657,"Ġexacerbate":33658,"ĠTrave":33659,"ĠTrop":33660,"Supp":33661,"Ġqueens":33662,"cart":33663,"Ġscrolling":33664,"Ġox":33665,"cone":33666,"Matthew":33667,"ĠDIRECT":33668,"Ġbacker":33669,"Ġthyroid":33670,"Sarah":33671,"ĠEDIT":33672,"ĠActivision":33673,"352":33674,"Ġreinforcements":33675,"Ġding":33676,"Ġplush":33677,"Ġpeanuts":33678,"ĠFant":33679,"ĠPediatrics":33680,"Ġaccommodating":33681,"ĠPractices":33682,"Answer":33683,"racial":33684,"ĠConstant":33685,"740":33686,"strength":33687,"apist":33688,"Ġsynthes":33689,"ĠLeap":33690,"ĠFabric":33691,"Ġbrainstorm":33692,"obia":33693,"Ġconception":33694,"Ġtuberculosis":33695,"Ġmajestic":33696,"ĠTitus":33697,"ĠTee":33698,"Ġlikeness":33699,"ĠSEA":33700,"lite":33701,"Ġ950":33702,"sufficient":33703,"Ġtrem":33704,"Ġharshly":33705,"Ġredacted":33706,"Ġwelding":33707,"Ġperplex":33708,"Ġpoetic":33709,"Ġinsignificant":33710,"Ġware":33711,"Ġwandered":33712,"Ġmete":33713,"ĠSTART":33714,"Ġweaponry":33715,"opsy":33716,"shadow":33717,"Ġobsc":33718,"hare":33719,"ĠOPEN":33720,"Ġdiligent":33721,"Girls":33722,"Ġinitials":33723,"Start":33724,"ĠBrookings":33725,"ombs":33726,"Ġlashes":33727,"essor":33728,"Ġgravy":33729,"ĠUbuntu":33730,"Tree":33731,"Ġ435":33732,"Ġcellar":33733,"Ġaquarium":33734,"ĠPodesta":33735,"361":33736,"ĠController":33737,"Ġeru":33738,"reasonable":33739,"Ġpermissions":33740,"725":33741,"Ġadministering":33742,"Ġflirt":33743,"Ġfleeting":33744,"asive":33745,"Ġsubcontract":33746,"Ġfascist":33747,"Ġcabbage":33748,"science":33749,"Ġboiler":33750,"ioned":33751,"Ġintegrates":33752,"Ġresidue":33753,"KEY":33754,"Ġwi":33755,"Ġsquared":33756,"Unless":33757,"Ġmute":33758,"ĠTuc":33759,"Ġverb":33760,"Gary":33761,"Ġexperimentation":33762,"fee":33763,"chini":33764,"Ġmarrow":33765,"ĠBalt":33766,"Ġnodded":33767,"tn":33768,"Ġmissionary":33769,"OTO":33770,"Ġoptimum":33771,"555":33772,"Ġwhipping":33773,"aunts":33774,"ĠScene":33775,"Ġcharacterize":33776,"Ġretrospective":33777,"Ġutilizes":33778,"Ġhastily":33779,"older":33780,"ĠPW":33781,"Ġsleepy":33782,"020":33783,"ĠAcid":33784,"Ġridiculously":33785,"Ġgigg":33786,"649":33787,"Ġcrus":33788,"ĠShame":33789,"ĠTorn":33790,"finding":33791,"IPS":33792,"Ġplat":33793,"ometers":33794,"Ġamphib":33795,"ellow":33796,"ĠSpecies":33797,"commercial":33798,"Ġvirgin":33799,"Ġdarn":33800,"Ġsorely":33801,"Ġrespondent":33802,"Ġray":33803,"ĠCONS":33804,"Ġunequivocally":33805,"server":33806,"Ġdrip":33807,"ĠRazor":33808,"Ban":33809,"ĠHMS":33810,"Ġhijab":33811,"ĠMuss":33812,"Ġsandy":33813,"Ġaversion":33814,"Ġoverarching":33815,"Ġultr":33816,"ĠIraqis":33817,"Ġuninterrupted":33818,"Ġrouting":33819,"Ġundone":33820,"independence":33821,"gra":33822,"ysics":33823,"inflammatory":33824,"cussion":33825,"ĠDefinitely":33826,"Ġelastic":33827,"peer":33828,"ĠGiov":33829,"ĠMandarin":33830,"Ġscratches":33831,"Ġphysicist":33832,"Ġbestowed":33833,"usually":33834,"OULD":33835,"igration":33836,"Human":33837,"Dead":33838,"osph":33839,"bott":33840,"doctoral":33841,"Ġbending":33842,"Ġconfigurations":33843,"psych":33844,"db":33845,"ĠUD":33846,"Ġarteries":33847,"orically":33848,"Ġblasphemy":33849,"jj":33850,"checking":33851,"adian":33852,"IRD":33853,"ĠDialogue":33854,"Ġshielded":33855,"ĠVox":33856,"Dave":33857,"Ġturb":33858,"ĠMassive":33859,"ĠBMI":33860,"ĠNF":33861,"uced":33862,"ickle":33863,"ishable":33864,"Ġembody":33865,"ÙĪ":33866,"Senior":33867,"ĠResult":33868,"try":33869,"egu":33870,"401":33871,"ĠLoyal":33872,"Ġperilous":33873,"Ġdissu":33874,"Ġmythology":33875,"ĠWax":33876,"Jesus":33877,"ĠMotorsport":33878,"Ġadvis":33879,"ĠAki":33880,"ISM":33881,"tested":33882,"Ġplag":33883,"Ġriches":33884,"ĠOCT":33885,"ĠLocke":33886,"BG":33887,"Ġ460":33888,"rawl":33889,"ĠTermin":33890,"Ġ295":33891,"Ġchopping":33892,"KT":33893,"Ġconverts":33894,"Ask":33895,"alse":33896,"ĠKeynes":33897,"Ġrefuted":33898,"Ġrabbits":33899,"Ġbilingual":33900,"urse":33901,"ĠSalad":33902,"odiac":33903,"Ġsolidly":33904,"Dam":33905,"Ġpp":33906,"rities":33907,"Rah":33908,"itness":33909,"Ġsixty":33910,"332":33911,"cold":33912,"Ġhindered":33913,"Ġclipped":33914,"Ġreceptor":33915,"ĠHoms":33916,"Ġdusk":33917,"Ġarchae":33918,"LR":33919,"Ġrods":33920,"Ġ257":33921,"ĠSith":33922,"ĠPumpkin":33923,"ellation":33924,"ĠWD":33925,"Ġdecriminal":33926,"Ġusable":33927,"Ġcheerful":33928,"ĠInform":33929,"Ġbrushes":33930,"vier":33931,"ĠBrush":33932,"590":33933,"boost":33934,"guided":33935,"ĠMJ":33936,"Ġsatirical":33937,"ortion":33938,"efficiency":33939,"Ġstrands":33940,"ĠWilde":33941,"Ġreproduce":33942,"verage":33943,"Ġlug":33944,"Ġhist":33945,"offer":33946,"Ġcollapses":33947,"Ġclerks":33948,"Ġairstrike":33949,"IPP":33950,"iscover":33951,"Ġnefarious":33952,"Ġstripe":33953,"Ġbona":33954,"ocon":33955,"Ġpunishments":33956,"ITED":33957,"ĠAltern":33958,"testing":33959,"Ġeerie":33960,"erous":33961,"Ġcaves":33962,"Ġcondemns":33963,"ĠDropbox":33964,"inese":33965,"axis":33966,"ĠRegistry":33967,"ĠMong":33968,"Ġbullies":33969,"Ġdocks":33970,"ĠAlter":33971,"rella":33972,"446":33973,"ĠDare":33974,"Ġvirtues":33975,"Ġdont":33976,"Value":33977,"ENE":33978,"received":33979,"Ġseaf":33980,"476":33981,"ilon":33982,"ĠKits":33983,"Ġrarity":33984,"Ġnurt":33985,"skin":33986,"ĠUL":33987,"ĠRegiment":33988,"terior":33989,"hate":33990,"ĠEstimated":33991,"ĠSilence":33992,"Ġorganism":33993,"ĠSigned":33994,"ĠIA":33995,"bite":33996,"Ġthicker":33997,"Ġeyeb":33998,"Ġjournalistic":33999,"ĠDisp":34000,"margin":34001,"Dri":34002,"Ġcomplexes":34003,"Ġimaginary":34004,"Ġrefuel":34005,"Ġmeticulous":34006,"Dub":34007,"Ġhaze":34008,"860":34009,"Ġproverbial":34010,"Ġozone":34011,"cale":34012,"resent":34013,"Ġdiscrete":34014,"boats":34015,"Ġ343":34016,"ĠRET":34017,"Ġsailor":34018,"hair":34019,"gear":34020,"Ġmalt":34021,"Ġpeach":34022,"ĠRabb":34023,"699":34024,"318":34025,"ĠVerge":34026,"Fin":34027,"ĠMighty":34028,"ierce":34029,"403":34030,"Ġdisenfranch":34031,"bass":34032,"nice":34033,"Ġsinks":34034,"ĠLaugh":34035,"367":34036,"ĠZur":34037,"Ġtravers":34038,"ĠMystery":34039,"onsense":34040,"ĠMonarch":34041,"Ġleapt":34042,"ergy":34043,"porate":34044,"display":34045,"ilet":34046,"Ġendemic":34047,"Bern":34048,"Ġpulmonary":34049,"Ġbroch":34050,"ĠManziel":34051,"Lyn":34052,"Repe":34053,"lda":34054,"hands":34055,"Ġtroublesome":34056,"Jordan":34057,"UTION":34058,"ĠALP":34059,"ĠLEG":34060,"Ġreconnaissance":34061,"ĠRNA":34062,"letters":34063,"ĠYounger":34064,"ĠLW":34065,"ĠSensor":34066,"388":34067,"Ġwielding":34068,"spr":34069,"Ġancestral":34070,"331":34071,"OTH":34072,"ĠAxis":34073,"irement":34074,"ĠCompact":34075,"voice":34076,"Ġpercussion":34077,"Ġendeav":34078,"Kate":34079,"ĠJACK":34080,"ĠMagnus":34081,"Ġinterconnected":34082,"ĠTraff":34083,"demon":34084,"Ġardent":34085,"ĠSomers":34086,"andum":34087,"346":34088,"heartedly":34089,"ayne":34090,"Design":34091,"melon":34092,"ĠCarib":34093,"Ġ1935":34094,"intention":34095,"cape":34096,"cend":34097,"organic":34098,"373":34099,"ĠRevival":34100,"ĠBLACK":34101,"Ġaspiration":34102,"yellow":34103,"bodied":34104,"Ġcrave":34105,"ĠIntelligent":34106,"ĠUnique":34107,"tab":34108,"386":34109,"ĠNess":34110,"Official":34111,"Stay":34112,"Ġcreat":34113,"iliary":34114,"rified":34115,"ĠPok":34116,"Ġabolition":34117,"Ka":34118,"ĠCourage":34119,"ĠDickens":34120,"rophic":34121,"ĠFAR":34122,"Ġfurnished":34123,".âĢĵ":34124,"rete":34125,"Ġvaginal":34126,"hner":34127,"ĠLONG":34128,"imates":34129,"ĠLiter":34130,"ĠMeasures":34131,"ĠBelg":34132,"\"-":34133,"ĠRaider":34134,"enario":34135,"rification":34136,"ĠFISA":34137,"ĠStab":34138,"Ġnar":34139,"mund":34140,"Tenn":34141,"Ġwakes":34142,"Ġcharg":34143,"okers":34144,"assment":34145,"Ġsiph":34146,"Ġludicrous":34147,"670":34148,"Ġcompositions":34149,"Ġpinnacle":34150,"ĠRankings":34151,"ĠTelescope":34152,"secure":34153,"Ġib":34154,"Ġaptly":34155,"paste":34156,"ĠJUST":34157,"RD":34158,"herry":34159,"sung":34160,"Ġmig":34161,"naires":34162,"Ġmigrated":34163,"Base":34164,"Ġamazingly":34165,"Ġunregulated":34166,"published":34167,"ĠPIT":34168,"ĠMissile":34169,"extreme":34170,"ĠAlone":34171,"skilled":34172,"ĠRamp":34173,"Ġcamer":34174,"Ġflyer":34175,"Ġbrewers":34176,"ĠReference":34177,"ĠMOV":34178,"ĠLep":34179,"Ġentitle":34180,"ivals":34181,"ĠPIN":34182,"Ġbatches":34183,"Ġunexplained":34184,"Ġenergies":34185,"Ġblurred":34186,"enged":34187,"orig":34188,"WF":34189,"olves":34190,"ĠPicks":34191,"ĠTwice":34192,"arranted":34193,"Ġmembrane":34194,"ĠMoonlight":34195,"Ġsulfur":34196,"Ġpurposely":34197,"Ġfumes":34198,"Ġ(#":34199,"onics":34200,"ivities":34201,"rollers":34202,"Ġflattering":34203,"felt":34204,"Ġintoxication":34205,"Bridge":34206,"ĠFallout":34207,"Ġcreatively":34208,"Ġpsychologically":34209,"Ġdespicable":34210,"gae":34211,"820":34212,"VERS":34213,"Ġtidal":34214,"Ġcarbohydrates":34215,"strip":34216,"Ġgravitational":34217,"Ġfeds":34218,"ĠZhao":34219,"legates":34220,"Ġ307":34221,"String":34222,"ĠRepair":34223,"Ġ1928":34224,"orses":34225,"atography":34226,"Boston":34227,"Ġasymm":34228,"ĠSomebody":34229,"Van":34230,"ĠSovereign":34231,"Ġnotoriety":34232,"Ġsimulate":34233,"ĠDiscussion":34234,"ĠTransition":34235,"Ġcopying":34236,"antage":34237,"ĠRodrig":34238,"Ġindifference":34239,"Ġ580":34240,"Ġastronomical":34241,"Ġscrews":34242,"840":34243,"inates":34244,"ĠStreaming":34245,"Ġentit":34246,"ĠLiterature":34247,"369":34248,"805":34249,"OTS":34250,"о":34251,"img":34252,"inness":34253,"Ġreverber":34254,"Ġpartition":34255,"Short":34256,"Ġmoist":34257,"Ġspoof":34258,"ĠDesire":34259,"orce":34260,"Ġcrammed":34261,"Ġunfor":34262,"Pan":34263,"ingen":34264,"Ġrelat":34265,"Mother":34266,"ĠGn":34267,"altern":34268,"Ġresurg":34269,"Ġcramped":34270,"ĠCitadel":34271,"Ġlaureate":34272,"Ġanalys":34273,"Ġnuns":34274,"ĠTie":34275,"activ":34276,"ĠSurprisingly":34277,"ĠProtective":34278,"ĠRedemption":34279,"Ġendlessly":34280,"Ġfists":34281,"spl":34282,"ĠKron":34283,"ĠExamples":34284,"Especially":34285,"Ġprejud":34286,"ĠSchwar":34287,"Ġ237":34288,"ĠPlants":34289,"ĠUNDER":34290,"Ġlasers":34291,"Ġsher":34292,"Ġgoddess":34293,"Ġwipes":34294,"409":34295,"ĠGTA":34296,"Ġhybrids":34297,"rowd":34298,"ĠMILL":34299,"ĠNUM":34300,"ĠGeek":34301,"ĠTWO":34302,"ĠTimbers":34303,"Ġresembled":34304,"ĠGRE":34305,"Bring":34306,"Ġcompressed":34307,"ĠOral":34308,"379":34309,"Ġwrench":34310,"LCS":34311,"Ġhomosexual":34312,"Kelly":34313,"Ġhump":34314,"ĠSicily":34315,"Ġperished":34316,"aos":34317,"doesn":34318,"scrib":34319,"Charlie":34320,"Ġshuffle":34321,"372":34322,"cedented":34323,"402":34324,"Ġtiers":34325,"Ġinteracted":34326,"ĠHG":34327,"ĠJere":34328,"ĠBRA":34329,"ĠDOC":34330,"things":34331,"Ġfaiths":34332,"Ġgirlfriends":34333,"Ġfortified":34334,"develop":34335,"ĠKus":34336,"iability":34337,"rase":34338,"iotics":34339,"ĠChern":34340,"boxes":34341,"abol":34342,"idan":34343,"emon":34344,"ĠJudaism":34345,"ĠSituation":34346,"ĠGrimm":34347,"Ġgou":34348,"ĠVictim":34349,"backer":34350,"Ġanimosity":34351,"ĠHorizons":34352,"ĠKazakh":34353,"Ġgrossly":34354,"ĠTac":34355,"yg":34356,"366":34357,"Ġcheaply":34358,"Ġformulated":34359,"ĠDangerous":34360,"offensive":34361,"Ġsauces":34362,"Ġkeyboards":34363,"666":34364,"Ġcanopy":34365,"Inc":34366,"astered":34367,"iesel":34368,"Ġadv":34369,"currency":34370,"Ġscapego":34371,"plings":34372,"ĠBDS":34373,"Ġstrangely":34374,"today":34375,"ĠEgyptians":34376,"Ġcoron":34377,"often":34378,"ĠTransformers":34379,"ĠAfterwards":34380,"reated":34381,"Ġpoisonous":34382,"Ġgeographically":34383,"Ġmell":34384,"Cross":34385,"Ġdeductible":34386,"ĠZionist":34387,"Ġcutter":34388,"ĠRP":34389,"ĠImag":34390,"Ġoverflow":34391,"358":34392,"ĠADD":34393,"bones":34394,"Ġflattened":34395,"ĠGREEN":34396,"Ġlaure":34397,"haps":34398,"ĠCellular":34399,"kens":34400,"363":34401,"ĠSmash":34402,"ĠSpeak":34403,"ĠMaiden":34404,"Ġgreedy":34405,"ĠManit":34406,"Ġfacet":34407,"ĠGPA":34408,"Ġracks":34409,"popular":34410,"322":34411,"ĠBars":34412,"avement":34413,"359":34414,"Ġpomp":34415,"Ġregisters":34416,"Fs":34417,"ĠLoving":34418,"ĠTaxi":34419,"concert":34420,"ĠArchae":34421,"Ġcurls":34422,"ĠSpit":34423,"ĠLIFE":34424,"Ġinvade":34425,"rolog":34426,"wreck":34427,"Ġconflicted":34428,"Ġ970":34429,"Ġexiled":34430,"Ġchew":34431,"udging":34432,"Ġexper":34433,"ĠFt":34434,"rius":34435,"ĠXer":34436,"~":34437,"Ġbandwagon":34438,"Fore":34439,"Cat":34440,"Ġoverflowing":34441,"Ġradios":34442,"Much":34443,"Ġfacilitates":34444,"ĠCaf":34445,"ĠQing":34446,"Use":34447,"Ġmang":34448,"Ġpissed":34449,"ĠOuter":34450,"within":34451,"ĠSchr":34452,"ĠSherlock":34453,"Ġ336":34454,"Ġcasc":34455,"chens":34456,"incent":34457,"Ġcultivating":34458,"ampions":34459,"Ġwasteful":34460,"adays":34461,"sets":34462,"ĠLF":34463,"watching":34464,"Ġabandonment":34465,"ĠJesuit":34466,"Ġlegislatures":34467,"regnancy":34468,"ĠColt":34469,"Ġinterns":34470,"Ġundertook":34471,"ĠIPA":34472,"ĠInstall":34473,"nsics":34474,"washer":34475,"Ġbeginners":34476,"ĠDiseases":34477,"Ġlimp":34478,"ĠESA":34479,"Basically":34480,"Ġprud":34481,"LED":34482,"Ġgrease":34483,"ousel":34484,"Ġrotten":34485,"ĠCele":34486,"facts":34487,"ĠLouie":34488,"ĠISI":34489,"481":34490,"Ġsett":34491,"Ġtoug":34492,"ĠReck":34493,"OUNT":34494,"ĠFou":34495,"Ġinhibitor":34496,"gru":34497,"bane":34498,"1980":34499,"ĠPanc":34500,"Ġsuperficial":34501,"Ġauthoritative":34502,"ĠVOL":34503,"790":34504,"Ġcrusade":34505,"airy":34506,"Ġemphatically":34507,"Ġflourishing":34508,"Ġ416":34509,"Ġheroine":34510,"inx":34511,"Ġanch":34512,"stretched":34513,"ĠRegener":34514,"ĠAncient":34515,"evaluate":34516,"Ġantibody":34517,"ĠEston":34518,"ĠAeg":34519,"Ġboldly":34520,"TN":34521,"ĠPercentage":34522,"Ġ747":34523,"Ġrapt":34524,"ĠEdited":34525,"Earth":34526,"phal":34527,"ĠXXX":34528,"arling":34529,"ĠReligion":34530,"Ġ503":34531,"forces":34532,"Ġendpoint":34533,"Miller":34534,"Ba":34535,"Ġdisappears":34536,"andre":34537,"Ġconnector":34538,"407":34539,"ĠTOUR":34540,"aura":34541,"ĠRazer":34542,"UPDATE":34543,"Ġcalib":34544,"original":34545,"ĠMonkey":34546,"Ir":34547,"Ġexacerb":34548,"killing":34549,"Ġforb":34550,"native":34551,"Ġpoking":34552,"Ġveiled":34553,"mails":34554,"Ġalphabet":34555,"Ġawkwardly":34556,"ĠNames":34557,"Ġspiders":34558,"ĠParam":34559,"ĠColour":34560,"Ġunification":34561,"ĠPione":34562,"Ġoffend":34563,"Ġscoff":34564,"ĠSAR":34565,"ĠBuildings":34566,"edes":34567,"ĠAke":34568,"Ġfirmware":34569,"Madison":34570,"policy":34571,"ĠComputing":34572,"ĠRW":34573,"Ġfluent":34574,"Ġdece":34575,"Ġswore":34576,"Ġrestaur":34577,"Ġpresses":34578,"ophon":34579,"Ġphilosopher":34580,"ften":34581,"Ġintruder":34582,"Ġleng":34583,"ĠCowboy":34584,"cled":34585,"Ġmeticulously":34586,"ĠPair":34587,"ĠEND":34588,"Ġcapsules":34589,"Ġauxiliary":34590,"Ġverses":34591,"Ġsheltered":34592,"Ġexplorer":34593,"ĠWolverine":34594,"auts":34595,"Ġinhibitors":34596,"ĠPeng":34597,"ĠValve":34598,"imar":34599,"Ġchuck":34600,"ĠRecording":34601,"Ġardu":34602,"Test":34603,"Ġinterven":34604,"Ġchrome":34605,"months":34606,"tap":34607,"ĠManz":34608,"format":34609,"ĠBalkans":34610,"Ġannex":34611,"uder":34612,"ĠAAC":34613,"Ġdisturbances":34614,"354":34615,"asms":34616,"ĠTad":34617,"puting":34618,"Ġfateful":34619,"imen":34620,"Ġaudi":34621,"ĠNewsweek":34622,"Around":34623,"Ġretribution":34624,"Ġsugars":34625,"Ġescapes":34626,"Ġlegitim":34627,"ĠProof":34628,"Ġmisogyn":34629,"cit":34630,"Ġclutching":34631,"exist":34632,"Ġrevol":34633,"Ġdiscs":34634,"discrimination":34635,"Ġstout":34636,"aline":34637,"ĠRandom":34638,"364":34639,"Ġapprehension":34640,"Ġmockery":34641,"Ġfossils":34642,"ĠStress":34643,"Ġbenefic":34644,"exc":34645,"lude":34646,"Small":34647,"Ġgh":34648,"Ġobserves":34649,"ĠSUP":34650,"Ġbrewer":34651,"ĠESP":34652,"Ġomitted":34653,"multiple":34654,"Ġminimizing":34655,"Ġtaco":34656,"Ġindifferent":34657,"medi":34658,"available":34659,"Ġ252":34660,"Ġsanity":34661,"ĠCookie":34662,"mostly":34663,"near":34664,"NASA":34665,"Ġlowly":34666,"seless":34667,"Ġobsess":34668,"itous":34669,"Dispatch":34670,"Ġcanyon":34671,"Ġbriefs":34672,"Say":34673,"ĠNato":34674,"ĠSpend":34675,"Ġ242":34676,"ĠEthernet":34677,"Ġmatte":34678,"ĠStim":34679,"hetics":34680,"Ġflourished":34681,"389":34682,"ĠMcA":34683,"695":34684,"Ġoverr":34685,"Ġtorment":34686,"Ġpirate":34687,"ĠJohann":34688,"roversial":34689,"ĠUnemployment":34690,"breakers":34691,"ĠMessages":34692,"tones":34693,"Ġtagging":34694,"Ġfrog":34695,"Jewish":34696,"Ġmessenger":34697,"Ġexasper":34698,"ernaut":34699,"Ġnarrower":34700,"ĠCatalyst":34701,"ĠSecrets":34702,"Ġadj":34703,"ĠFug":34704,"Ġaura":34705,"Ġtherape":34706,"mber":34707,"Ġcaliphate":34708,"Ġretreating":34709,"ĠComput":34710,"Ġburying":34711,"Ġail":34712,"Ġgriev":34713,"lins":34714,"825":34715,"tten":34716,"ifully":34717,"ĠTrials":34718,"igma":34719,"Ġ1914":34720,"Ġcoordinates":34721,"ocusing":34722,"ĠFeng":34723,"ĠWhale":34724,"Ġshorten":34725,"Ġcorrectness":34726,"evil":34727,"network":34728,"Ġreactive":34729,"assuming":34730,"ĠLaksh":34731,"games":34732,"Ġruining":34733,"excluding":34734,"annels":34735,"º":34736,"Ġrubbed":34737,"aleb":34738,"flex":34739,"iped":34740,"ĠLimit":34741,"allowed":34742,"ĠDMV":34743,"ĠLD":34744,"Ġstamina":34745,"conduct":34746,"Ġmislead":34747,"lib":34748,"ĠEminem":34749,"Ġpayoff":34750,"Ġkernel":34751,"Ġsweeps":34752,"Ġsonic":34753,"ĠKodi":34754,"unique":34755,"Ġsurrog":34756,"Michigan":34757,"Ġattest":34758,"Ġdummy":34759,"ĠStellar":34760,"ĠSquadron":34761,"ĠHait":34762,"ĠSpirits":34763,"605":34764,"ĠHemisphere":34765,"legram":34766,"ĠRack":34767,"opol":34768,"Ġfreshwater":34769,"cession":34770,"Ġabort":34771,"ĠLOG":34772,"Ġfuzzy":34773,"Ġcrystall":34774,"illation":34775,"ĠFreddy":34776,"Ġsalvation":34777,"Ġjuxtap":34778,"weekly":34779,"usha":34780,"456":34781,"Ġ660":34782,"ĠGlacier":34783,"Ġnegatives":34784,"Ġillegitimate":34785,"ĠProtein":34786,"Moore":34787,"Der":34788,"Ġinfancy":34789,"Again":34790,"ALD":34791,"Leon":34792,"ĠIdeally":34793,"fresh":34794,"730":34795,"Ġgamb":34796,"Ġscrewed":34797,"wow":34798,"Ġembodied":34799,"ĠCinderella":34800,"341":34801,"ĠPiano":34802,"Ġbroccoli":34803,"Ġmats":34804,"ĠZheng":34805,"cream":34806,"anut":34807,"ĠZig":34808,"Columb":34809,"ĠTibetan":34810,"Death":34811,"Ġstren":34812,"ĠVertical":34813,"Ġratification":34814,"Ġprincipally":34815,"ELD":34816,"Ġforbid":34817,"Ġamalg":34818,"blind":34819,"auri":34820,"stery":34821,"Ġbarley":34822,"FBI":34823,"ĠHex":34824,"925":34825,"Domin":34826,"oat":34827,"Ġswayed":34828,"ĠKKK":34829,"ĠTaxes":34830,"Ġker":34831,"eeper":34832,"ĠAwakens":34833,"ĠPix":34834,"ĠKING":34835,"dc":34836,"Ren":34837,"Ġlegitimately":34838,"ĠTriumph":34839,"ĠSites":34840,"ĠSai":34841,"tl":34842,"painted":34843,"ĠWaiting":34844,"starting":34845,"parents":34846,"ĠDuo":34847,"eele":34848,"upper":34849,"ĠInvestig":34850,"Ġeighteen":34851,"Ġcorrelated":34852,"ĠCascade":34853,"acca":34854,"ĠAlph":34855,"ĠPolic":34856,"ĠEVs":34857,"Ġworthless":34858,"ĠIndust":34859,"auld":34860,"ĠYiannopoulos":34861,"ĠEzra":34862,"Ġmorphed":34863,"Ġoriginating":34864,"mania":34865,"Ġsparing":34866,"Ġextrem":34867,"cre":34868,"ults":34869,"mare":34870,"classified":34871,"Ġparachute":34872,"Ġmistrust":34873,"ONT":34874,"Mind":34875,"Ġthru":34876,"707":34877,"ĠTwain":34878,"Ġmelodies":34879,"ĠDanger":34880,"ĠDPS":34881,"Ġderive":34882,"Ġdissolution":34883,"Ġchildbirth":34884,"Ġ415":34885,"fork":34886,"solid":34887,"loads":34888,"ĠCGI":34889,"378":34890,"ĠShed":34891,"Face":34892,"Ġcomet":34893,"iceps":34894,"ĠReduction":34895,"Fly":34896,"jp":34897,"ĠAnimation":34898,"Luke":34899,"Ġabiding":34900,"Ġdevise":34901,"ĠAe":34902,"Ġflux":34903,"Ġbras":34904,"Ġfracturing":34905,"Ġinventive":34906,"ĠGranger":34907,"Ġsap":34908,"inducing":34909,"Ġreviewers":34910,"Officers":34911,"ĠWHY":34912,"Ġamplify":34913,"Ġentr":34914,"Ġslit":34915,"457":34916,"Ġreformed":34917,"ĠPhi":34918,"Ġtempt":34919,"Ġcontradiction":34920,"585":34921,"ĠMaced":34922,"371":34923,"kinson":34924,"robe":34925,"ĠHunters":34926,"astern":34927,"criminal":34928,"jew":34929,"Ġdecentralized":34930,"bands":34931,"Ġavatar":34932,"ĠBarrier":34933,"Ġcharacterization":34934,"student":34935,"Ġgays":34936,"Ġspecialize":34937,"ĠJudging":34938,"Ġinitiation":34939,"Ġshove":34940,"Ġpirates":34941,"Ġfictitious":34942,"ĠPoker":34943,"ĠElsa":34944,"ĠTECH":34945,"handedly":34946,"Ġglued":34947,"Ġclinically":34948,"Ġinaccessible":34949,"Ġderegulation":34950,"Ġprohib":34951,"Ġdangling":34952,"Ġnoses":34953,"Ġstash":34954,"اØ":34955,"ESH":34956,"Ġmonstrous":34957,"Ġcrept":34958,"ĠCharm":34959,"Ġbeh":34960,"Ġshuts":34961,"Ġ236":34962,"imedia":34963,"445":34964,"Du":34965,"Ġafar":34966,"ĠRout":34967,"Ġflares":34968,"Utah":34969,"Ġ808":34970,"Ġjewels":34971,"2004":34972,"Ġrecal":34973,"Gas":34974,"ĠExcellent":34975,"Ġpitfalls":34976,"ĠDrawing":34977,"viously":34978,"angered":34979,"changes":34980,"Ġpasture":34981,"talking":34982,"Ġinequ":34983,"Ġbicycl":34984,"Cost":34985,"423":34986,"bard":34987,"Ġanterior":34988,"ecast":34989,"CHR":34990,"397":34991,"masters":34992,"706":34993,"ĠFinish":34994,"Yet":34995,"study":34996,"ĠCogn":34997,"Ġloaf":34998,"Ġspatial":34999,"ĠParad":35000,"batch":35001,"Ġvents":35002,"Ġspins":35003,"ĠAddiction":35004,"Ġcondone":35005,"Ġproble":35006,"English":35007,"ĠRomans":35008,"ĠSaying":35009,"ĠKling":35010,"Universal":35011,"ivist":35012,"Ġskirm":35013,"Ġ2500":35014,"Ġ263":35015,"aired":35016,"ĠMartian":35017,"ĠCompensation":35018,"lation":35019,"ĠSalam":35020,"LGBT":35021,"ĠDart":35022,"strike":35023,"vasive":35024,"ILLE":35025,"Ġimaginative":35026,"ĠEuph":35027,"Financial":35028,"Ġholog":35029,"orah":35030,"crit":35031,"ĠOswald":35032,"512":35033,"ĠUri":35034,"Ġdiscrepancies":35035,"Ġbeads":35036,"ĠShots":35037,"Mem":35038,"Ġhunts":35039,"Ġsubtly":35040,"Ġ470":35041,"ĠVigil":35042,"Ġsew":35043,"ĠBurma":35044,"igm":35045,"ighed":35046,"swe":35047,"Ġ251":35048,"Ġdeceit":35049,"Ġphysi":35050,"iflower":35051,"ĠCert":35052,"Ġchewing":35053,"rax":35054,"ĠMER":35055,"icient":35056,"Les":35057,"Ġ390":35058,"Ġperjury":35059,"Ġfiltering":35060,"770":35061,"Ġpoppy":35062,"Ġbland":35063,"ĠNasa":35064,"Ġorbiting":35065,"ĠRipple":35066,"otal":35067,"ĠRyu":35068,"ĠShap":35069,"ĠJian":35070,"Ġpiv":35071,"ĠNeptune":35072,"rary":35073,"Ġunavoidable":35074,"Ġguideline":35075,"Ġwaterfall":35076,"inators":35077,"ĠLogic":35078,"ĠPlug":35079,"role":35080,"Ġalterations":35081,"ĠSett":35082,"ĠFeld":35083,"Ġfreezes":35084,"Ġbedrock":35085,"ĠVIEW":35086,"ovation":35087,"Ġneedless":35088,"ĠIU":35089,"ignant":35090,"ĠConfeder":35091,"316":35092,"fine":35093,"Ġjars":35094,"gotten":35095,"Bron":35096,"Ġmindfulness":35097,"imating":35098,"Ġhysteria":35099,"Ġhurried":35100,"Ġinfantry":35101,"ĠNYU":35102,"tags":35103,"Penn":35104,"Ġtracing":35105,"ĠSwing":35106,"ĠIo":35107,"Ġreckoned":35108,"ĠRecall":35109,"ĠVersion":35110,"314":35111,"Ġecology":35112,"Ġarmoured":35113,"Ġresonance":35114,"970":35115,"Ġvigilance":35116,"Ġrede":35117,"ĠBohem":35118,"Ġchau":35119,"ĠDevi":35120,"Ġtru":35121,"))":35122,"Put":35123,"Ġflavored":35124,"ĠClown":35125,"Senate":35126,"ĠScandinavian":35127,"mable":35128,"Residents":35129,"ĠFranchise":35130,"Ġprecincts":35131,"Prem":35132,"ĠNeutral":35133,"coal":35134,"Ġdelinqu":35135,"Mus":35136,"UME":35137,"Ġtedious":35138,"roots":35139,"ĠCondition":35140,"ĠIntercept":35141,"017":35142,"itives":35143,"Ġdefinitively":35144,"Ġobliter":35145,"Ġclandestine":35146,"Ġstagnation":35147,"Ġblindness":35148,"abiding":35149,"Ġremix":35150,"feeding":35151,"Ġunrecogn":35152,"2003":35153,"960":35154,"381":35155,"Ġbulky":35156,"xia":35157,"ivered":35158,"inic":35159,"ĠSoci":35160,"ĠYards":35161,"Ġhides":35162,"Film":35163,"Ġtestim":35164,"Ġblacklist":35165,"Deep":35166,"Standard":35167,"ĠClash":35168,"Ġriddled":35169,"Ġdiseng":35170,"ĠTRE":35171,"ĠIDs":35172,"Ġmigrating":35173,"protect":35174,"Ġgraded":35175,"Ġvaguely":35176,"ĠCharacter":35177,"382":35178,"ĠMOD":35179,"Eng":35180,"Ġmobilized":35181,"Ġsincerity":35182,"Ġ317":35183,"sighted":35184,"ownt":35185,"ĠâĢİ":35186,"umpy":35187,"Ġitching":35188,"ĠVerd":35189,"cook":35190,"Ġsimulator":35191,"players":35192,"Early":35193,"infeld":35194,"Ġmaximizing":35195,"Philipp":35196,"ĠPhotoshop":35197,"Ġdestroys":35198,"Ġbefriend":35199,"Ġfilthy":35200,"ĠIncident":35201,"gha":35202,"Ġcomplicity":35203,"Ġmessing":35204,"YA":35205,"ĠNegro":35206,"adows":35207,"374":35208,"Ġpip":35209,"cean":35210,"Ġ1924":35211,"Sent":35212,"represent":35213,"Ġdeems":35214,"ĠRue":35215,"Ġtitanium":35216,"Ġmanners":35217,"â̦â̦":35218,"bare":35219,"Ġusur":35220,"mma":35221,"ĠPanda":35222,"ulus":35223,"ĠSlav":35224,"324":35225,"ĠMole":35226,"^":35227,"micro":35228,"foreign":35229,"lest":35230,"ocular":35231,"ĠUniv":35232,"ĠFrag":35233,"Ġshepherd":35234,"Ġelectron":35235,"ĠFSA":35236,"Ġunl":35237,"dose":35238,"Ġimmersion":35239,"ĠDeL":35240,"Ġbiomedical":35241,"Anna":35242,"Ġskillet":35243,"Ġrecre":35244,"Ġtrillions":35245,"voy":35246,"Ġnormalized":35247,"radio":35248,"cue":35249,"urbed":35250,"Ġthinkers":35251,"328":35252,"327":35253,"ĠForge":35254,"505":35255,"Ġunbearable":35256,"olini":35257,"Ġdisinfect":35258,"Ġshaving":35259,"Ġtoxicity":35260,"453":35261,"Ġheterosexual":35262,"Baltimore":35263,"Ġstool":35264,"lr":35265,"ĠMk":35266,"Ġantidote":35267,"Dark":35268,"810":35269,"Ġirritated":35270,"ĠSUPPORT":35271,"Chance":35272,"bent":35273,"ĠZelda":35274,"ĠPenguin":35275,"ifled":35276,"Ġarte":35277,"705":35278,"Ġcondol":35279,"izza":35280,"ĠCK":35281,"Ġprojector":35282,"ravings":35283,"Ġ1919":35284,"Ġburner":35285,"ĠSchwarz":35286,"Oregon":35287,"Ġridicule":35288,"Ġinstructional":35289,"Ġ\"#":35290,"ĠDign":35291,"Ġkitten":35292,"Ġconstit":35293,"iration":35294,"Speed":35295,"ecycle":35296,"ĠFalse":35297,"ĠDealer":35298,"Could":35299,"655":35300,"outside":35301,"Ġworldview":35302,"Ġ246":35303,"Ġspitting":35304,"595":35305,"MN":35306,"ĠComes":35307,"ingu":35308,"Ġenzymes":35309,"Ġcompass":35310,"Ġexclaimed":35311,"ĠMalays":35312,"Ġ1916":35313,"Ġcoloring":35314,"Ġrepeats":35315,"Ġsoils":35316,"Ġtrivia":35317,"ĠIsles":35318,"Const":35319,"ĠFiction":35320,"665":35321,"Ġcriminality":35322,"ĠZi":35323,"384":35324,"ĠWilderness":35325,"ĠCanary":35326,"ĠVs":35327,"и":35328,"ĠAPIs":35329,"Ġbehest":35330,"Ġeb":35331,"ĠHipp":35332,"Ġpreempt":35333,"Ġevoke":35334,"Ġinept":35335,"tele":35336,"447":35337,"ĠGarmin":35338,"Ġpursuits":35339,"351":35340,"Ġcliché":35341,"ĠJihad":35342,"Ġ308":35343,"ĠSnake":35344,"ĠAnnounce":35345,"Nearly":35346,"!'\"":35347,"Ġ1927":35348,"saw":35349,"Ġabhor":35350,"Plan":35351,"rawled":35352,"ĠRiy":35353,"ensor":35354,"Fal":35355,"quick":35356,"odynamic":35357,"Ġsubstitution":35358,"Ġprovoking":35359,"Operation":35360,"rupulous":35361,"Ġsweetness":35362,"folk":35363,"ĠDefault":35364,"Ġstarved":35365,"ĠPrinting":35366,"urious":35367,"ĠTracker":35368,"them":35369,"Ġleth":35370,"Ġemptied":35371,"Ġfootprints":35372,"ilian":35373,"Ġbattalion":35374,"Ġprophet":35375,"Ġrailing":35376,"Ġhect":35377,"rouch":35378,"lees":35379,"Ġideologies":35380,"Ġ254":35381,"ĠGods":35382,"ĠAvalon":35383,"Ġfrontrunner":35384,"ĠPork":35385,"ĠPipe":35386,"Ġscaven":35387,"Ġming":35388,"Ġerg":35389,"Ġ520":35390,"Ġhatched":35391,"asant":35392,"ĠHI":35393,"Ġpend":35394,"Ġ288":35395,"Prom":35396,"achev":35397,"ĠEcology":35398,"enforcement":35399,"467":35400,"dule":35401,"Ġrealism":35402,"ĠTypes":35403,"USB":35404,"utra":35405,"ĠHiroshima":35406,"Ġcontradicted":35407,"393":35408,"ĠDSL":35409,"Ġtherein":35410,"ĠReconstruction":35411,"Ġ243":35412,"irled":35413,"479":35414,"ĠWhats":35415,"Currently":35416,"ĠPOWER":35417,"ĠHiro":35418,"ĠBreath":35419,"ĠYourself":35420,"Ġlantern":35421,"376":35422,"É":35423,"ĠHumans":35424,"Lady":35425,"Ġdissemination":35426,"ecake":35427,"ĠChao":35428,"flat":35429,"Ġinspecting":35430,"stration":35431,"Ġidentifiable":35432,"CV":35433,"ĠLobby":35434,"function":35435,"Roll":35436,"DIV":35437,"Tell":35438,"Ġfasc":35439,"ĠAOL":35440,"HM":35441,"Keefe":35442,"Ġporous":35443,"Ġsmoot":35444,"existence":35445,"ĠDeg":35446,"Ġdivor":35447,"isner":35448,"allas":35449,"Bloomberg":35450,"Ġdictators":35451,"ĠGeh":35452,"Ġsilicone":35453,"Ġdab":35454,"Ġmashed":35455,"Ġpric":35456,"might":35457,"ĠBLM":35458,"Ġpatriarch":35459,"Microsoft":35460,"ĠAds":35461,"Ġcoronary":35462,"ĠContrary":35463,"Ġdra":35464,"ĠStarted":35465,"Ġbuckle":35466,"lear":35467,"accept":35468,"Within":35469,"bd":35470,"interested":35471,"bia":35472,"POR":35473,"motion":35474,"ĠFounders":35475,"ĠCassandra":35476,"ĠPassion":35477,"Ġbehavioural":35478,"ĠHealing":35479,"Ġmarkings":35480,"Ġsnowball":35481,"Ġridiculed":35482,"phase":35483,"Ġunto":35484,"aque":35485,"uggets":35486,"Ġfrantically":35487,"Ġcoward":35488,"Ġinconvenient":35489,"Taking":35490,"Afee":35491,"Ġtwisting":35492,"930":35493,"ĠSieg":35494,"ĠGit":35495,"Ġcurs":35496,"ĠGlas":35497,"ĠSignificant":35498,"Ġachieves":35499,"Ġpreferably":35500,"Ġcondensed":35501,"Ġfetus":35502,"Ġunivers":35503,"Ġpse":35504,"Access":35505,"Ġintertwined":35506,"been":35507,"quit":35508,"ĠLEGO":35509,"Ġimagining":35510,"454":35511,"Ġplains":35512,"sequently":35513,"pull":35514,"Fast":35515,"Pot":35516,"yles":35517,"AIR":35518,"Ġblatantly":35519,"eki":35520,"ilated":35521,"ĠMembership":35522,"Ġ262":35523,"Ġ}":35524,"Ġexcavation":35525,"Ġethn":35526,"addin":35527,"Ġfoundational":35528,"ceptions":35529,"ĠViet":35530,"exempt":35531,"Ġmicrophones":35532,"Ġ244":35533,"778":35534,"Ġdwar":35535,"attery":35536,"502":35537,"ĠKik":35538,"Ġinspir":35539,"ĠMaximum":35540,"Ġvengeance":35541,"Ġetched":35542,"outine":35543,"552":35544,"Ġunicorn":35545,"gged":35546,".�":35547,"ĠBlackwell":35548,"ĠStatue":35549,"Ġdissidents":35550,"ĠKaine":35551,"Ġdeforestation":35552,"ĠScholar":35553,"Ġpleasantly":35554,"ÑĤ":35555,"398":35556,"ĠRUN":35557,"arent":35558,"Ġundeniably":35559,"Ġtechnologically":35560,"Ġconsciously":35561,"ĠEther":35562,"Ġproportional":35563,"Ġlaund":35564,"ĠRye":35565,"Ġambiguity":35566,"Ġunmist":35567,"Terror":35568,"ciplinary":35569,"ĠImproved":35570,"hesis":35571,"Ġcooker":35572,"elsen":35573,"Ġguerrilla":35574,"opped":35575,"ATURE":35576,"Ġrequ":35577,"Ġunprepared":35578,"Ġcamel":35579,"Ġfitt":35580,"Sex":35581,"edged":35582,"Ġrecurrent":35583,"ctuary":35584,"ĠCompare":35585,"ĠServing":35586,"Tri":35587,"Ġtransient":35588,"ĠBees":35589,"Ġcovenant":35590,"Ġfantasies":35591,"Ġespresso":35592,"draft":35593,"baugh":35594,"Ġdemocratically":35595,"ĠBans":35596,"ĠManual":35597,"ĠTurtle":35598,"ennett":35599,"achy":35600,"ĠClim":35601,"Ġdescending":35602,"Ġprow":35603,"Ġinconsistencies":35604,"Player":35605,"Ġoblivious":35606,"ĠWonderland":35607,"nav":35608,"aughter":35609,"Ġlod":35610,"Ġ403":35611,"ĠPolaris":35612,"ĠLeia":35613,"ĠInfantry":35614,"Sy":35615,"ĠMeter":35616,"Ġautoimmune":35617,"Ġdiagnoses":35618,"Ġtrespass":35619,"011":35620,"wrong":35621,"ĠGREAT":35622,"Ġtelescopes":35623,"shows":35624,"Pac":35625,"olation":35626,"Ġclerics":35627,"Ġdissenting":35628,"406":35629,"Ġetiquette":35630,"Ġdeterrence":35631,"765":35632,"Ġove":35633,"Has":35634,"Pak":35635,"ा":35636,"ĠNec":35637,"Ġsociology":35638,"witz":35639,"Ġkittens":35640,"Ġcontinual":35641,"Ġoverlapping":35642,"Ġmonks":35643,"ĠMechanical":35644,"Captain":35645,"ocial":35646,"ĠFalling":35647,"ĠCorrection":35648,"ĠTrouble":35649,"Ġslog":35650,"Ġ253":35651,"Ġemanating":35652,"Ġwidest":35653,"PROV":35654,"Japanese":35655,"urat":35656,"Ġboxed":35657,"ĠCases":35658,"Ġjarring":35659,"Fix":35660,"'?":35661,"ĠStrateg":35662,"Republic":35663,"ovy":35664,"362":35665,"ĠMothers":35666,"Ġstreaks":35667,"Ġlocalized":35668,"ĠONLY":35669,"Ġeh":35670,"ĠObject":35671,"Ġstub":35672,"Fre":35673,"ĠScarlet":35674,"Ġmultip":35675,"ĠMaul":35676,"ĠProblems":35677,"cest":35678,"Ġmortal":35679,"Ġarche":35680,"ulet":35681,"Ġfuller":35682,"ĠGER":35683,"Si":35684,"mr":35685,"ĠPowerful":35686,"boxing":35687,"ĠPeer":35688,"Jean":35689,"ĠTF":35690,"Ġplural":35691,"optim":35692,"Jimmy":35693,"ĠFriendly":35694,"Mex":35695,"Ġdepri":35696,"PK":35697,"Ġwaitress":35698,"eph":35699,"arrass":35700,"ikawa":35701,"feel":35702,"Finally":35703,"fourth":35704,"394":35705,"conom":35706,"VT":35707,"Ġeleg":35708,"ivot":35709,"Ġharsher":35710,"ĠPepe":35711,"ĠImpl":35712,"Ġankles":35713,"idity":35714,"ĠPrepare":35715,"Rather":35716,"Ġconservatism":35717,"Ġunquestion":35718,"ribution":35719,"ĠPatent":35720,"ĠDeluxe":35721,"ĠAE":35722,"007":35723,"Ġprag":35724,"bg":35725,"Ġpalate":35726,"Ġintric":35727,"ossom":35728,"Ġspac":35729,"ĠSpotlight":35730,"Seven":35731,"amacare":35732,"ĠGotham":35733,"Ġencompass":35734,"Ġnicer":35735,"ĠLauder":35736,"Ġscaff":35737,"worn":35738,"442":35739,"Ġpropri":35740,"443":35741,"ĠCompos":35742,"ĠIniti":35743,"inth":35744,"Ġrehe":35745,"Prov":35746,"Ġgri":35747,"ossip":35748,"ĠModest":35749,"quiet":35750,"Ġwealthier":35751,"Ġ241":35752,"icum":35753,"Ġcommunism":35754,"Ġhelpers":35755,"Ġbellig":35756,"Ġ405":35757,"uttered":35758,"Ġbitterness":35759,"nl":35760,"474":35761,"Ġvitality":35762,"blank":35763,"ĠLeth":35764,"PAC":35765,"326":35766,"ĠNapoleon":35767,"Ġ299":35768,"ĠReviews":35769,"ĠSect":35770,"Ġstrongh":35771,"ĠTube":35772,"Ġwoodland":35773,"Ġhumming":35774,"411":35775,"Alpha":35776,"Ġundet":35777,"Ġmounts":35778,"Officials":35779,"igning":35780,"830":35781,"ĠStamp":35782,"ubby":35783,"424":35784,"Ġoutlandish":35785,"Ġjerk":35786,"Ġradiant":35787,"Ġcubes":35788,"Director":35789,"Ġatro":35790,"vous":35791,"Sab":35792,"Ġpretended":35793,"Ġ620":35794,"975":35795,"Sham":35796,"Ġpotassium":35797,"ĠAttention":35798,"gly":35799,"opens":35800,"ĠWorker":35801,"porter":35802,"Ġsplendid":35803,"embed":35804,"Je":35805,"ĠMeal":35806,"Ġsurname":35807,"Usually":35808,"Ġtimer":35809,"Ġweave":35810,"irin":35811,"ĠGenetics":35812,"ensual":35813,"Ġmerry":35814,"Ġapprehend":35815,"utsche":35816,"strate":35817,"Ġsupplementary":35818,"ĠRoundup":35819,"upid":35820,"Ġmiraculous":35821,"ĠHUN":35822,"Ġglaciers":35823,"weed":35824,"ĠSuggest":35825,"XL":35826,"authors":35827,"Ġbarking":35828,"ĠUKIP":35829,"leased":35830,"ĠRAD":35831,"Ġfide":35832,"Ġphen":35833,"Ġscanners":35834,"Parents":35835,"ĠBlaze":35836,"Ġtweaking":35837,"Ġelaborated":35838,"Ġsusp":35839,"iscovered":35840,"Ġthighs":35841,"Ġradicals":35842,"ULTS":35843,"aggressive":35844,"endants":35845,"Hon":35846,"Ġcorrecting":35847,"391":35848,"pps":35849,"ĠTerritories":35850,"Ġconferred":35851,"crazy":35852,"utor":35853,"ĠSurvival":35854,"Ġbrowsers":35855,"ĠConflict":35856,"pn":35857,"Ġdeprive":35858,"riage":35859,"ilan":35860,"à¦":35861,"949":35862,"Congratulations":35863,"radical":35864,"ĠHits":35865,"powerful":35866,"Ġcrypt":35867,"745":35868,"ĠRegistrar":35869,"ophile":35870,"ĠElement":35871,"cooked":35872,"ĠTwilight":35873,"Ġdemos":35874,"IER":35875,"Ġstricken":35876,"Magic":35877,"abby":35878,"ĠSack":35879,"ĠShrine":35880,"Nev":35881,"Probably":35882,"ĠWisdom":35883,"ulpt":35884,"opher":35885,"Ġcolonel":35886,"atl":35887,"Tem":35888,"kun":35889,"ĠIndie":35890,"Putin":35891,"jection":35892,"areth":35893,"ĠBullet":35894,"Ġsmartest":35895,"ĠEsper":35896,"Ġproficiency":35897,"Ġcessation":35898,"Ġmars":35899,"ĠDATA":35900,"sup":35901,"Ġostr":35902,"Jane":35903,"Ġpathogens":35904,"hd":35905,"ĠNK":35906,"Ġhorribly":35907,"regulated":35908,"Ġesteemed":35909,"ĠChinatown":35910,"Ġvibration":35911,"Ġoverboard":35912,"ĠRhod":35913,"Ġfeces":35914,"otation":35915,"Ġcryptic":35916,"Bal":35917,"OPER":35918,"Ġaffirmation":35919,"Ġmenstrual":35920,"Ġuntold":35921,"Ġanecdotes":35922,"ĠHOUSE":35923,"Ġcape":35924,"311":35925,"ittance":35926,"ĠRemy":35927,"ĠWaves":35928,"ĠCOVER":35929,"ordinate":35930,"Ġrestricts":35931,"Samsung":35932,"Ġplantations":35933,"olver":35934,"Better":35935,"ĠExplos":35936,"Ġnasal":35937,"ĠSyri":35938,"ĠPerl":35939,"Ġlatency":35940,"othermal":35941,"Sweet":35942,"ĠRyzen":35943,"ĠYuri":35944,"Ġsmack":35945,"Ġcrow":35946,"aniel":35947,"iological":35948,"Ġmonk":35949,"Ġtutorial":35950,"ĠAure":35951,"Ġcliffs":35952,"ameron":35953,"umers":35954,"ĠMour":35955,"Ġunorthodox":35956,"Ġgulf":35957,"Ġintrusive":35958,"ĠVIII":35959,"ĠFF":35960,"Ġenlarged":35961,"Ġspheres":35962,"ĠCheap":35963,"ĠAmend":35964,"Ġ::":35965,"Ġpacing":35966,"ĠStartup":35967,"ĠDating":35968,"racist":35969,"ĠDivine":35970,"Ġpollen":35971,"ĠMeaning":35972,"ĠLei":35973,"ĠMOT":35974,"ĠARC":35975,"legate":35976,"Ġbrav":35977,"Ross":35978,"redit":35979,"414":35980,"ringe":35981,"perhaps":35982,"SPA":35983,"Southern":35984,"Front":35985,"undrum":35986,"Ġassorted":35987,"ĠDawkins":35988,"ĠWrap":35989,"Ġconsequential":35990,"ĠFuji":35991,"458":35992,"Ġunst":35993,"Bon":35994,"acter":35995,"Trade":35996,"ingers":35997,"ĠClin":35998,"Ġstimul":35999,"arah":36000,"inois":36001,"urdy":36002,"Ġobsessive":36003,"Zone":36004,"Ġprimitive":36005,"unctions":36006,"Ġadapter":36007,"Ġassures":36008,"Daddy":36009,"Ġunsatisf":36010,"441":36011,"Ġ1910":36012,"Ġsecondly":36013,"truth":36014,"RED":36015,"040":36016,"Pope":36017,"venants":36018,"Ġestim":36019,"Ġhemorrh":36020,"Ġexcruciating":36021,"459":36022,"Ġboils":36023,"ieved":36024,"Storm":36025,"Ġmanifestation":36026,"Ġinsulated":36027,"fb":36028,"Ġclassify":36029,"Mbps":36030,"Ġinclination":36031,"Ġaur":36032,"Ġpolarized":36033,"Ġoccupations":36034,"Secretary":36035,"Ġcustomizable":36036,"scribe":36037,"Ġadjunct":36038,"Ġ1922":36039,"rived":36040,"ocative":36041,"Friends":36042,"Oak":36043,"Ġpsyche":36044,"Ġwrinkles":36045,"anthrop":36046,"Ġcoercion":36047,"enos":36048,"Ġvariability":36049,"hma":36050,"phot":36051,"ĠXander":36052,"ĠDiss":36053,"Ġtigers":36054,"ahoo":36055,"focus":36056,"rical":36057,"grow":36058,"Ġseminal":36059,"Ġdisciples":36060,"Cas":36061,"Hundreds":36062,"Ġscissors":36063,"correct":36064,"Ġfascism":36065,"imoto":36066,"Ġnudity":36067,"charg":36068,"Ġrusty":36069,"ĠLyndon":36070,"Ġanomalies":36071,"onial":36072,"ĠiCloud":36073,"Ġannoy":36074,"Ġdistortion":36075,"Lou":36076,"ĠGiul":36077,"eyes":36078,"870":36079,"uum":36080,"ĠUltr":36081,"Action":36082,"cigarette":36083,"igators":36084,"kj":36085,"Ġ323":36086,"uine":36087,"Score":36088,"Ġmans":36089,"Security":36090,"Ġarom":36091,"ĠBoards":36092,"Ġwrists":36093,"602":36094,"Ġastronomy":36095,"Ġresin":36096,"width":36097,")/":36098,"Ġconcurrent":36099,"unless":36100,"606":36101,"ĠMagnet":36102,"Ġauthorizing":36103,"ĠJunk":36104,"atical":36105,"Ġauthent":36106,"zac":36107,"413":36108,"ĠGrape":36109,"Ġcircled":36110,"Ġooz":36111,"Ġvisceral":36112,"ointment":36113,"Ġincendiary":36114,"ĠBourbon":36115,"Ġgimmick":36116,"vette":36117,"Stan":36118,"Ġdetachment":36119,"488":36120,"Ġmisogyny":36121,"Ġenlight":36122,"utic":36123,"Ġinquire":36124,"ĠBEL":36125,"ascular":36126,"ĠWasserman":36127,"Dallas":36128,"Ġconstellation":36129,"Ġdystopian":36130,"504":36131,"ĠOptical":36132,"Ġsilhou":36133,"Girl":36134,"ĠGong":36135,"ĠHighest":36136,"????????":36137,"Sav":36138,"ocity":36139,"leted":36140,"Ġattrition":36141,"ĠExpedition":36142,"ĠKilled":36143,"501":36144,"ONES":36145,"dat":36146,"Ġglyphosate":36147,"Ġplugs":36148,"Ġlact":36149,"Fla":36150,"fps":36151,"riger":36152,"Ġparagraphs":36153,"Ġinnate":36154,"ĠFoo":36155,"aternity":36156,"ĠGry":36157,"Ġoneself":36158,"642":36159,"Iowa":36160,"oodle":36161,"ĠCoconut":36162,"ĠChess":36163,"ommel":36164,"Ġmagnesium":36165,"Ġairliner":36166,"Ġexceedingly":36167,"ĠCreator":36168,"YouTube":36169,"Ġsleeper":36170,"Ġlonging":36171,"ĠPercy":36172,"Ġmatrix":36173,"Ġâľ":36174,"Ġbarren":36175,"Mrs":36176,"Ġinvading":36177,"Ġincom":36178,"Ġemperor":36179,"Ġip":36180,"irie":36181,"Ġpredictably":36182,"ĠBless":36183,"Ġsuperpower":36184,":-":36185,"Ġpropensity":36186,"easy":36187,"educ":36188,"ĠPolly":36189,"Ġcumbersome":36190,"Ġcollide":36191,"016":36192,"Ġtransports":36193,"Ġscraps":36194,"below":36195,"Ġhairs":36196,"mentation":36197,"Ġevolves":36198,"ĠFallen":36199,"Ġunsurprisingly":36200,"Ġcuff":36201,"Ġ249":36202,"mental":36203,"ĠCamel":36204,"Ġ337":36205,"Clinton":36206,"Ġdecad":36207,"ĠSTEP":36208,"ĠTestament":36209,"Ġirresistible":36210,"ĠACE":36211,"Ġhamm":36212,"ĠTerr":36213,"Ġcaul":36214,"iggins":36215,"Ġproficient":36216,"resp":36217,"Ġheirs":36218,"Ġ321":36219,"dress":36220,"ĠClothing":36221,"Ġ560":36222,"Ġ264":36223,"ĠRobb":36224,"Ġfrail":36225,"Ġoptimizing":36226,"615":36227,"ĠRefuge":36228,"rowth":36229,"washing":36230,"Ġgenders":36231,"indu":36232,"ĠNAT":36233,"Ġleans":36234,"Ġeyed":36235,"Ġhilar":36236,"vice":36237,"wolf":36238,"Ġfatig":36239,"ococ":36240,"ĠCarry":36241,"Community":36242,"Clark":36243,"itably":36244,"sv":36245,"448":36246,"Ġnumer":36247,"Ġ1925":36248,"ĠBehavioral":36249,"ĠScream":36250,"Ġgeek":36251,"rake":36252,"ĠTTC":36253,"Ġadditives":36254,"ĠBye":36255,"ylon":36256,"Ġfoliage":36257,"ateral":36258,"rapnel":36259,"Science":36260,"Ġrecollection":36261,"thening":36262,"ĠUbisoft":36263,"ĠLur":36264,"ĠOkinawa":36265,"ĠProvision":36266,"ferred":36267,"ĠGrounds":36268,"Ġhops":36269,"aterial":36270,"Ġacad":36271,"Ġengulf":36272,"ĠApex":36273,"frequency":36274,"relations":36275,"ĠCorvette":36276,"ĠRepeat":36277,"Ġanew":36278,"Ġhes":36279,"ĠLair":36280,"ĠPSP":36281,"foundation":36282,"Band":36283,"ĠPublisher":36284,"Ġreciprocal":36285,"Ġ287":36286,"Ġpir":36287,"Adams":36288,"Ġprostitute":36289,"ĠMecca":36290,"ectomy":36291,"Ġskew":36292,"ĠLol":36293,"Voice":36294,"ĠCalais":36295,"ISION":36296,"rue":36297,"Ġgaping":36298,"prot":36299,"Ġ6000":36300,"Ġtilted":36301,"Ġgoofy":36302,"Stand":36303,"Ġfellows":36304,"Ġcurly":36305,"ĠPOW":36306,"Ġlore":36307,"Ġinhabited":36308,"ĠIdentification":36309,"Metro":36310,"Ġdispel":36311,"Ġinvoking":36312,"Ġdeleting":36313,"Ġstigmat":36314,"ĠDalai":36315,"Ġequate":36316,"Ġmascara":36317,"endered":36318,"ĠNYT":36319,"ĠCommittees":36320,"rians":36321,"ĠOlympus":36322,"ĠQR":36323,"ĠDrinking":36324,"Ġbatt":36325,"andr":36326,"computer":36327,"Senator":36328,"ĠTwist":36329,"ĠNoise":36330,"Ġcheesy":36331,"Ġ1931":36332,"Ġtyranny":36333,"Ġnegligible":36334,"ĠBok":36335,"Ġwebpage":36336,"ĠHEAD":36337,"ĠNovel":36338,"Ġquarry":36339,"Ġexpressive":36340,"Ġforgiving":36341,"Among":36342,"asin":36343,"ĠSuc":36344,"Democrats":36345,"795":36346,"Ġaback":36347,"¨":36348,"ĠNeon":36349,"392":36350,"ĠRNC":36351,"ĠPROC":36352,"sein":36353,"Ros":36354,"Ġemot":36355,"ĠASA":36356,"ĠSeb":36357,"ĠExtended":36358,"atern":36359,"Ġpsychedelic":36360,"Fil":36361,"ĠOrwell":36362,"ĠSOS":36363,"Ġconceive":36364,"Ġhobbies":36365,"Ġspecimens":36366,"ĠTEXT":36367,"sometimes":36368,"Mario":36369,"orpor":36370,"ĠTemporary":36371,"Ġapocalypse":36372,"Ġcounterproductive":36373,"ĠQUEST":36374,"ĠCargo":36375,"Amb":36376,"Ġoptic":36377,"groups":36378,"Ġparanoia":36379,".?":36380,"sounding":36381,"mediately":36382,"System":36383,"ubi":36384,"Ġuttered":36385,"Ġgraphs":36386,"âĢĭâĢĭ":36387,"Ġscientifically":36388,"Ġbluntly":36389,"Ġhopping":36390,"Fun":36391,"ĠSUPER":36392,"Ġrobe":36393,"VB":36394,"ĠQuote":36395,"Ġincarnation":36396,"Ġtreadmill":36397,"Ġ1915":36398,"Ġbart":36399,"669":36400,"Ġhoc":36401,"Ġ309":36402,"Ġimprovis":36403,"Ġhut":36404,"Ġmixer":36405,"ĠCt":36406,"span":36407,"Ġwatered":36408,"Ġpatriot":36409,"Ġdehyd":36410,"laughs":36411,"ĠFancy":36412,"ĠVoc":36413,"Ġintellect":36414,"ĠTid":36415,"Ġnesting":36416,"Tel":36417,"Ġ()":36418,"letter":36419,"ĠSeems":36420,"Ops":36421,"ĠContents":36422,"ript":36423,"hani":36424,"Ġrecru":36425,"Ġpickups":36426,"repair":36427,"Throughout":36428,"bear":36429,"Ġconquered":36430,"656":36431,"Ġmalf":36432,"Ġordained":36433,"755":36434,"ĠReprodu":36435,"brain":36436,"ĠOuts":36437,"ĠWage":36438,"Ru":36439,"________":36440,"ĠLAW":36441,"ĠWass":36442,"Ġcomplication":36443,"Fri":36444,"Ġregener":36445,"Wait":36446,"577":36447,"Ġmisconception":36448,"Ġbombardment":36449,"Ġunloaded":36450,"Ġdictionary":36451,"IU":36452,"025":36453,"etically":36454,"ĠNarr":36455,"repe":36456,"Ġassigning":36457,"Rail":36458,"Ġnotebooks":36459,"Ġingest":36460,"Ġrpm":36461,"Ġalienated":36462,"ĠCredits":36463,"Ġindis":36464,"ĠGathering":36465,"aration":36466,"-+-+-+-+":36467,"Ġori":36468,"Ġsr":36469,"ndra":36470,"Ġlibertarian":36471,"Ġcoerced":36472,"ording":36473,"Ġtranqu":36474,"Ġelbows":36475,"549":36476,"Ġping":36477,"ĠRELE":36478,"ĠYanuk":36479,"Ġmaneuvers":36480,"ĠTrojan":36481,"IFIED":36482,"ĠViolent":36483,"è":36484,"Ġlest":36485,"Ġarrows":36486,"frog":36487,"anty":36488,"WB":36489,"ĠSeen":36490,"648":36491,"Ġclutter":36492,"ĠBender":36493,"Ġpessim":36494,"ĠTeg":36495,"Asian":36496,"IFIC":36497,"Ġexponential":36498,"Ġsponge":36499,"rite":36500,"ĠDAM":36501,"Ġtacit":36502,"ĠZoom":36503,"Ġolds":36504,"Ġonward":36505,"ĠSandwich":36506,"missible":36507,"isol":36508,"940":36509,"Ġinciner":36510,"ĠTrick":36511,"Ġawakening":36512,"Ġdart":36513,"ĠCouch":36514,"respons":36515,"ĠElephant":36516,"ĠPluto":36517,"ĠTags":36518,"itcher":36519,"644":36520,"702":36521,"Ġelectrons":36522,"ĠMyth":36523,"ĠAad":36524,"Danny":36525,"Ġcraw":36526,"ĠCertification":36527,"Ġtending":36528,"Ġpellets":36529,"Ġamused":36530,"ĠAuschwitz":36531,"ĠAppl":36532,"iris":36533,"ashion":36534,"walking":36535,"Ġabnorm":36536,"Cro":36537,"?:":36538,"ĠIcelandic":36539,"ĠAvailability":36540,"Ġcann":36541,"Opt":36542,"buster":36543,"ĠQuartz":36544,"Executive":36545,"tracks":36546,"igel":36547,"MIT":36548,"ĠTracking":36549,"Ġconditioned":36550,"Ġsampled":36551,"ĠGenius":36552,"Ġsubstit":36553,"ĠSiberia":36554,"Ġfrequ":36555,"historic":36556,"okin":36557,"OWS":36558,"1500":36559,"warts":36560,"ĠEtsy":36561,"licks":36562,"ĠSmooth":36563,"unity":36564,"515":36565,"Ġperk":36566,"aida":36567,"forts":36568,"ĠUA":36569,"RIC":36570,"Spain":36571,"ĠWired":36572,"cuts":36573,"Ġfurnace":36574,"ĠTOTAL":36575,"ĠTables":36576,"662":36577,"Fab":36578,"Ġquaint":36579,"ĠWorlds":36580,"ĠCabin":36581,"atche":36582,"List":36583,"ĠVO":36584,"Ġkeyword":36585,"Ġ258":36586,"Farm":36587,"timer":36588,"ĠVolt":36589,"Build":36590,"pressed":36591,"*,":36592,"Ġ324":36593,"aiman":36594,"TING":36595,"Ġsneaking":36596,"cery":36597,"Ġcrib":36598,"ĠIllust":36599,"later":36600,"Ġcompar":36601,"Ġpropulsion":36602,"647":36603,"ĠTrails":36604,"Ġperiphery":36605,"steel":36606,"Ġvividly":36607,"ĠConver":36608,"eatured":36609,"427":36610,"463":36611,"Ġapprox":36612,"spin":36613,"Ġconfigured":36614,"inside":36615,"razy":36616,"account":36617,"anye":36618,"riend":36619,"Ġbows":36620,"809":36621,"ĠDEF":36622,"ĠRez":36623,"Fans":36624,"ĠDF":36625,"Ġstains":36626,"ĠAtom":36627,"ĠConce":36628,"ĠTOM":36629,"ĠELECT":36630,"Ġdisappro":36631,"019":36632,"afia":36633,"ĠTemperature":36634,"Ġextracts":36635,"fab":36636,"Ġunsur":36637,"Ġseasoning":36638,"Ty":36639,"KB":36640,"Ġposit":36641,"Ġlocality":36642,"1200":36643,"cour":36644,"izons":36645,"hh":36646,"506":36647,"ĠDLC":36648,"iago":36649,"Ġcorpses":36650,"iddling":36651,"Mayor":36652,"Ġsimplistic":36653,"Ġlibel":36654,"Ġalmonds":36655,"Ġswast":36656,"Change":36657,"ĠJoker":36658,"MAR":36659,"ĠScully":36660,"Ġmailbox":36661,"VIDEO":36662,"ĠKyoto":36663,"esley":36664,"ĠIncredible":36665,"youtube":36666,"Ġinequalities":36667,"Ġbolts":36668,"Ġbothering":36669,"Ġattentive":36670,"ĠSparrow":36671,"Ġdiaper":36672,"Ġfanbase":36673,"Ġuncont":36674,"Ap":36675,"ĠQi":36676,"Price":36677,"471":36678,"Ġpearl":36679,"wid":36680,"899":36681,"ĠPony":36682,"casting":36683,"Ġinhabit":36684,"Ġunve":36685,"Ġinsur":36686,"ĠWee":36687,"658":36688,"Ġeffected":36689,"gger":36690,"Ġinstallments":36691,"imilar":36692,"FU":36693,"Ġinfertility":36694,"climate":36695,"HEAD":36696,"fashion":36697,"ĠTHEY":36698,"jc":36699,"Ġsatisf":36700,"ĠGuidelines":36701,"Ġinsure":36702,"ĠRSA":36703,"Ġvirt":36704,"Ġinterpre":36705,"Joshua":36706,"ĠShut":36707,"Ġtestimonies":36708,"Ñģ":36709,"untary":36710,"417":36711,"Ġbeck":36712,"ĠMilky":36713,"ç":36714,"Ġsequels":36715,"Ġ281":36716,"ĠRibbon":36717,"Ġroomm":36718,"Ġsynchron":36719,"452":36720,"Ġ1926":36721,"Ġhawk":36722,"ĠDisorder":36723,"Ġbackstory":36724,"ĠNum":36725,"Ġoverheard":36726,"technical":36727,"Jud":36728,"aii":36729,"Ġdecon":36730,"ĠRape":36731,"ĠWarrant":36732,"Ġpoop":36733,"spir":36734,"Country":36735,"Ġweld":36736,"Ġabuser":36737,"Ġ------":36738,"material":36739,"Ġpreserves":36740,"spring":36741,"Ġpuzzled":36742,"ĠDebate":36743,"Joseph":36744,"Ġ272":36745,"Blood":36746,"antry":36747,"Ġconverge":36748,"Ġimaginable":36749,"oward":36750,"545":36751,"Ġfug":36752,"Vision":36753,"075":36754,"Ġadoptive":36755,"Ġunknow":36756,"Stream":36757,"Ġaffili":36758,"ĠPUR":36759,"ĠWally":36760,"Ġgamer":36761,"Ġfart":36762,"stice":36763,"Ġcongen":36764,"н":36765,"685":36766,"orst":36767,"ĠATF":36768,"Ġml":36769,"ĠMozilla":36770,"Ġcalmed":36771,"bage":36772,"ĠVault":36773,"arkable":36774,"ĠGuan":36775,"Ġclueless":36776,"umatic":36777,"Ġshameless":36778,"Ġpreached":36779,"Ġmisconceptions":36780,"Ġanthology":36781,"Ġbiomass":36782,"ĠPs":36783,"tails":36784,"Ġexcessively":36785,"Ġextr":36786,"Davis":36787,"Ġgrounding":36788,"Ġshortcuts":36789,"ĠShift":36790,"ĠRew":36791,"ĠIllum":36792,"Ġincite":36793,"sense":36794,"ĠScouting":36795,"otos":36796,"respond":36797,"Ġbeware":36798,"gran":36799,"ĠXV":36800,"JM":36801,"ĠSounders":36802,"Ġ276":36803,"Ġshockingly":36804,"Ġgastrointestinal":36805,"erences":36806,"df":36807,"ĠNG":36808,"Ġdiscredited":36809,"Ġdemoral":36810,"Ġgladly":36811,"Tal":36812,"ĠPredator":36813,"708":36814,"Ġdoi":36815,"Ġdecentral":36816,"illin":36817,"printed":36818,"Ġinflicting":36819,"ribes":36820,"Ġsupper":36821,"abc":36822,"Ġgraz":36823,"980":36824,"Bull":36825,"Ġmillionaires":36826,"Ġvanity":36827,"imony":36828,"Ġbiologists":36829,"Ġalternating":36830,"Ġsleeps":36831,"Force":36832,"ĠPrinc":36833,"ĠTransgender":36834,"Ġ314":36835,"ĠProvide":36836,"enthal":36837,"Ġplum":36838,"Ġresurrect":36839,"CW":36840,"Ġinjure":36841,"ĠPerspective":36842,"ĠBei":36843,"Ġrestless":36844,"aciously":36845,"Ġchlor":36846,"catch":36847,"ĠLuigi":36848,"Ġinconsistency":36849,"Ġwhiff":36850,"Arizona":36851,"ustration":36852,"ĠRaid":36853,"ĠDemons":36854,"ĠVita":36855,":\"":36856,"Ġmigraine":36857,"ĠHamb":36858,"Ġwidget":36859,"451":36860,"Ġrandomized":36861,"etchup":36862,"ĠParticularly":36863,"Ġdiced":36864,"Ġperfected":36865,"roid":36866,"710":36867,"Ġreflections":36868,"Ġantioxidants":36869,"ĠLabel":36870,"Ġ326":36871,"igious":36872,"ĠEucl":36873,"608":36874,"Ġstrand":36875,"ĠDirt":36876,"ĠLift":36877,"suits":36878,"ĠControls":36879,"RAW":36880,"Ġcowardly":36881,"ĠUmb":36882,"Growing":36883,"mington":36884,"Ġ339":36885,"ĠCommit":36886,"Ġnonviolent":36887,"Ġcontaminants":36888,"Ġacrylic":36889,"ĠMAP":36890,"Ġ269":36891,"Ġdegrading":36892,"Ġmiracles":36893,"ĠEstablishment":36894,"despite":36895,"cry":36896,"Ġpauses":36897,"Ġmythical":36898,"Ġtwenties":36899,"Actually":36900,"phan":36901,"recorded":36902,"Ġunwillingness":36903,"engineering":36904,"avored":36905,"Ġdevout":36906,"item":36907,"Ġbunny":36908,"ĠMerchants":36909,"Ġconsumes":36910,"508":36911,"Ġlex":36912,"ĠClause":36913,"Ġchecklist":36914,"Sus":36915,"uther":36916,".#":36917,"Bit":36918,"uay":36919,"bf":36920,"Ġpopulace":36921,"Ġ316":36922,"Ġcombust":36923,"Ġnano":36924,"Ġpopul":36925,"Indust":36926,"Ġcapitalists":36927,"ĠFiles":36928,"Bang":36929,"Ġkosher":36930,"atile":36931,"Ġincrim":36932,"OVER":36933,"Ġmelee":36934,"ymph":36935,"ĠPupp":36936,"evin":36937,"ĠMolecular":36938,"Ġmisinterpret":36939,"vc":36940,"olithic":36941,"ĠSimpsons":36942,"Ġshrew":36943,"Ġselectively":36944,"ĠDrain":36945,"mittedly":36946,"conservative":36947,"True":36948,"Using":36949,"562":36950,"apon":36951,"Ġapprentice":36952,"Mas":36953,"ĠBattlefield":36954,"Ġfing":36955,"Ġconcoct":36956,"ĠVIS":36957,"ĠHuss":36958,"Ġdetects":36959,"ĠFriedrich":36960,"Ġlatitude":36961,"Custom":36962,"ĠÙ":36963,"ĠBones":36964,"whose":36965,"Ġredirected":36966,"aligned":36967,"ĠNeighbor":36968,"ĠAmen":36969,"ĠMarble":36970,"Beyond":36971,"Ġbiomark":36972,"Ġerroneous":36973,"Atlanta":36974,"Ġmasturb":36975,"ĠAssoci":36976,"Albert":36977,"Ġcigar":36978,"ĠFraz":36979,"ethe":36980,"skinned":36981,"Ford":36982,"throp":36983,"Acc":36984,"Ġtricked":36985,"Ġoverwhelm":36986,"Ġimplements":36987,"ĠGeForce":36988,"Ġbounces":36989,"Ġmoderator":36990,"910":36991,"ĠButterfly":36992,"ĠIllegal":36993,"ĠSubject":36994,"RET":36995,"ĠFreeze":36996,"ĠNewt":36997,"Ġuterus":36998,"696":36999,"Ġ267":37000,"tk":37001,"Ġdodged":37002,"liam":37003,"Ġparasite":37004,"obal":37005,"ĠHubble":37006,"Ġtheology":37007,"âĢĶ\"":37008,"height":37009,"Ale":37010,"employment":37011,"ĠWallet":37012,"cessive":37013,"Ġ404":37014,"Ġsimilarity":37015,"zens":37016,"Ġdumps":37017,"Ġdepress":37018,"Ġlifeless":37019,"535":37020,"oard":37021,"Scotland":37022,"Ġbelievable":37023,"Ġcalculator":37024,"ĠNaked":37025,"Ġremission":37026,"Ġoranges":37027,"ĠSections":37028,"Ġentangled":37029,"Ġuncanny":37030,"Ġteaspoons":37031,"vr":37032,"ĠPorn":37033,"Organ":37034,"Ġbund":37035,"Doug":37036,"ĠGHz":37037,"Major":37038,"abus":37039,"Bell":37040,"avier":37041,"Ġimplanted":37042,"RON":37043,"Fle":37044,"462":37045,"509":37046,"Ġgoggles":37047,"Ġmanuscript":37048,"NOT":37049,"ĠCanaveral":37050,"ĠDID":37051,"Season":37052,"HAEL":37053,"Edge":37054,"appiness":37055,"DIS":37056,"Ġplotted":37057,"Ġwrought":37058,"Ġquarantine":37059,"Ġrearr":37060,"itage":37061,"Ġsocket":37062,"Ġbrig":37063,"Ġunbelievably":37064,"abytes":37065,"TG":37066,"Ġ444":37067,"ĠOffic":37068,"Ġacquaintances":37069,"ĠComparison":37070,"Nine":37071,"ĠFeast":37072,"758":37073,"YC":37074,"Ġfiner":37075,"ĠStrawberry":37076,"Ġeternity":37077,"liament":37078,"urrency":37079,"ĠCortana":37080,"ĠSabbath":37081,"Ġsprinkle":37082,"unker":37083,"ĠUE":37084,"flies":37085,"Ġblender":37086,"Ġacutely":37087,"emark":37088,"ĠAffect":37089,"Politics":37090,"Ġsane":37091,"Ġcorrosion":37092,"Ġspirituality":37093,"Ġredeemed":37094,"Ġingrained":37095,"manager":37096,"joined":37097,"ĠDumb":37098,"ĠHeight":37099,"Ġseventeen":37100,"Ġ640":37101,"Ġreviewer":37102,"Ġwallpaper":37103,"Ġnurs":37104,"Ġsubset":37105,"703":37106,"Ġsymbolism":37107,"Ġdudes":37108,"Ġmismatch":37109,"gans":37110,"please":37111,"ĠKE":37112,"Ġatom":37113,"004":37114,"ionic":37115,"Ġservings":37116,"Ġproxies":37117,"Ġtranscription":37118,"yx":37119,"bowl":37120,"iscovery":37121,"ĠScotch":37122,"brace":37123,"riter":37124,"ĠDesktop":37125,"Ġlimestone":37126,"æ":37127,"Neg":37128,"013":37129,"Ġformulas":37130,"Ġeval":37131,"Ġzombies":37132,"GU":37133,"ĠHermes":37134,"Ġbrist":37135,"Mand":37136,"Ġmastery":37137,"Ġgoverns":37138,"Ġconstrued":37139,"region":37140,"Ġemitted":37141,"Vice":37142,"060":37143,"Jennifer":37144,"mol":37145,"Ġjealousy":37146,"Ġingenuity":37147,"bug":37148,"olitical":37149,"Ġperce":37150,"ĠSapp":37151,"dim":37152,"utral":37153,"Ġinterrogated":37154,"Gate":37155,"Ġamber":37156,"911":37157,"ĠEveryday":37158,"ĠDDR":37159,"ĠBlades":37160,"Ġnifty":37161,"Ġmurderers":37162,"Ġpresumption":37163,"Pitt":37164,"Div":37165,"ĠDestination":37166,"having":37167,"Ġprolifer":37168,"Ġbreaker":37169,"ĠBW":37170,"Ġcourier":37171,"Try":37172,"ĠBUR":37173,"itized":37174,"Ġcompress":37175,"Ġrepetition":37176,"ĠTik":37177,"Ġdivergence":37178,"Ġcube":37179,"everyone":37180,"ĠPoles":37181,"418":37182,"ĠHighly":37183,"468":37184,"Jeremy":37185,"Ġcontradictions":37186,"Ġmanure":37187,"Sad":37188,"pletion":37189,"626":37190,"Ġ279":37191,"Ġfrivolous":37192,"ĠCanaan":37193,"olor":37194,"Ġincapac":37195,"ĠGentle":37196,"Ġinsomnia":37197,"ĠJing":37198,"688":37199,"ĠViews":37200,"Ġsyll":37201,"486":37202,"antom":37203,"Ġcog":37204,"aintain":37205,"ĠDVDs":37206,"Ġ318":37207,"archy":37208,"Ġreprodu":37209,"Ġconcedes":37210,"Brook":37211,"Ġinterpreting":37212,"Ġextracting":37213,"Ġess":37214,"uning":37215,"ĠMathematics":37216,"iably":37217,"Ġmultit":37218,"ĠActs":37219,"iliated":37220,"Foreign":37221,"Ġflaming":37222,"ĠCoup":37223,"Ġglitches":37224,"Ġdifferentiation":37225,"ihadi":37226,"ĠDrone":37227,"Ġincompatible":37228,"asher":37229,"documented":37230,"agons":37231,"wark":37232,"Ġshielding":37233,"ĠCorrect":37234,"romising":37235,"uned":37236,"Ġconduit":37237,"ĠDiablo":37238,"Ġbeginner":37239,"Ġarchived":37240,"smanship":37241,"ĠTBD":37242,"digy":37243,"Ġ322":37244,"Ġ268":37245,"ĠTears":37246,"ĠPriority":37247,"Italy":37248,"Ġ^":37249,"annot":37250,"different":37251,"Joy":37252,"Ġbreathed":37253,"heon":37254,"Ġracists":37255,"Ġvascular":37256,"Between":37257,"etition":37258,"ĠLikely":37259,"icans":37260,"529":37261,"ĠMonsters":37262,"agy":37263,"Orange":37264,"hide":37265,"SIM":37266,"Ġdeceive":37267,"ĠDAR":37268,"Ġshattering":37269,"Ġow":37270,"peak":37271,"Ġpreferable":37272,"Ġpiping":37273,"ĠLEDs":37274,"ĠCOMMUN":37275,"ĠConstruct":37276,"008":37277,"Ġdissatisfied":37278,"ĠKNOW":37279,"ĠFrame":37280,"ĠToast":37281,"Ġadore":37282,"history":37283,"Soviet":37284,"reporting":37285,"Ġ266":37286,"pract":37287,"ĠSauce":37288,"686":37289,"ievers":37290,"ĠDomain":37291,"ousand":37292,"768":37293,"Cos":37294,"609":37295,"432":37296,"Ġtransl":37297,"oof":37298,"Ġ292":37299,"Turkish":37300,"ĠPOLIT":37301,"Harris":37302,"bj":37303,"Ġrodents":37304,"556":37305,"Ġintellectuals":37306,"Ġinteroper":37307,"ixt":37308,"Ġunbiased":37309,"itia":37310,"Ġ504":37311,"Ġbuttocks":37312,"ĠFlam":37313,"Ġchrom":37314,"Ġ259":37315,"shock":37316,"ĠRJ":37317,"ĠLich":37318,"422":37319,"Ġcondom":37320,"phen":37321,"Ġvigilante":37322,"Ġowl":37323,"Ġdwellings":37324,"Ġarchaeologists":37325,"Ġ680":37326,"RAY":37327,"Ġ1921":37328,"Ġ625":37329,"ĠPLAN":37330,"alde":37331,"030":37332,"abbling":37333,"Wave":37334,"Ni":37335,"Ġfurthe":37336,"JS":37337,"Ġpsycho":37338,"ĠFrançois":37339,"Ġundergrad":37340,"Ġsuccessors":37341,"Ġpadded":37342,"introdu":37343,"Ġreasoned":37344,"Ġvas":37345,"creen":37346,"onsequ":37347,"starter":37348,"Court":37349,"ĠHIS":37350,"Ġplaster":37351,"Ġranger":37352,"Ġ298":37353,"esters":37354,"Ġglare":37355,"ype":37356,"Ġcompute":37357,"Ali":37358,"mallow":37359,"Ġmasculine":37360,"ĠExamination":37361,"improve":37362,"Ġdeclass":37363,"Ġdecoration":37364,"ĠFIG":37365,"abre":37366,"Ġstale":37367,"abling":37368,"ĠRusty":37369,"ĠASAP":37370,"Ġadjusts":37371,"Ġbluff":37372,"density":37373,"Ġdisse":37374,"Ġcensor":37375,"ervatives":37376,"Ġkettle":37377,"Ġskeptics":37378,"fd":37379,"Imm":37380,"461":37381,"Ġadvantageous":37382,"419":37383,"ĠPresents":37384,"482":37385,"ĠRewards":37386,"Ġovershadow":37387,"Alabama":37388,"ĠCPC":37389,"Ġsock":37390,"ĠChurches":37391,"hidden":37392,"Ġcringe":37393,"ĠHOR":37394,"PB":37395,"Pretty":37396,"Hong":37397,"?),":37398,"687":37399,"Ġgrocer":37400,"472":37401,"565":37402,"itent":37403,"Ġpartake":37404,"wait":37405,"usters":37406,"Ġcones":37407,"Ġconcurrently":37408,"Ġlevers":37409,"Ġaroma":37410,"ĠDrill":37411,"498":37412,"804":37413,"ithering":37414,"Ġ355":37415,"Ġlegion":37416,"Ġvitri":37417,"Ġcondu":37418,"Angel":37419,"OWER":37420,"Ġ{*":37421,"Simon":37422,"Ġsynthesis":37423,"ĠContainer":37424,"sheet":37425,"Bi":37426,"ĠRaspberry":37427,"Ġ328":37428,"anders":37429,"ĠBlossom":37430,"ĠFINAL":37431,"acid":37432,"Ġborderline":37433,"Aut":37434,"Ġoriginate":37435,"Ġtransm":37436,"Ġbuffalo":37437,"atial":37438,"ĠCraigslist":37439,"Ġcredential":37440,"Ġdisbanded":37441,"Ġunprotected":37442,"ĠZer":37443,"waukee":37444,"diagn":37445,"1999":37446,"doc":37447,"ellig":37448,"Ġwarheads":37449,"ĠADS":37450,"verified":37451,"ĠHAM":37452,"785":37453,"Cu":37454,"Ġenorm":37455,"ĠSkill":37456,"\\":37457,"Ġbashing":37458,"Ġloudspe":37459,"during":37460,"Ġdebunked":37461,"adequ":37462,"Ġuh":37463,"Feed":37464,"ificial":37465,"pred":37466,"ĠPassing":37467,"Kyle":37468,"enance":37469,"ĠMex":37470,"itect":37471,"Ġcavern":37472,"Ġtrop":37473,"ĠEliot":37474,"753":37475,"Ġencountering":37476,"Ġsulf":37477,"Always":37478,"ĠGest":37479,"Ġadditive":37480,"Ġ278":37481,"Ġloops":37482,"liberal":37483,"urion":37484,"ĠRefresh":37485,"ĠDynasty":37486,"Ġsweaty":37487,"Ġsails":37488,"protection":37489,"ĠRooms":37490,"ĠEXT":37491,"few":37492,"ĠPaid":37493,"Ġ377":37494,"Ġcolonialism":37495,"Ġchuckle":37496,"Ġarmour":37497,"Ġsoftly":37498,"661":37499,"Building":37500,"ĠAMER":37501,"Ġbabe":37502,"Ġshif":37503,"Sem":37504,"Ġdisembark":37505,"ĠSubstance":37506,"Stone":37507,"Ġdialect":37508,"ĠAph":37509,"Ġspreadsheet":37510,"ierra":37511,"Ġlineage":37512,"ĠCust":37513,"ĠBabe":37514,"Ġwra":37515,"ĠMafia":37516,"Ġflakes":37517,"ĠEVER":37518,"cong":37519,"ĠCreation":37520,"loo":37521,"ĠAmpl":37522,"ĠSpectre":37523,"012":37524,"geons":37525,"Ġswarm":37526,"ĠPale":37527,"ĠSeek":37528,"itures":37529,"Ġarri":37530,"Ġredistribution":37531,"campaign":37532,"ĠAbility":37533,"579":37534,"ournament":37535,"locks":37536,"Ġnests":37537,"ĠConstantine":37538,"Ġwhisper":37539,"Ġshrouded":37540,"changed":37541,"ĠEnhanced":37542,"Ġ920":37543,"Ġglob":37544,"Tam":37545,"Ġoutwe":37546,"Ġilliter":37547,"Ġsurg":37548,"Nap":37549,"ĠAerial":37550,"iferation":37551,"Egypt":37552,"ERO":37553,"Ġantip":37554,"environment":37555,"machine":37556,"Ġrupture":37557,"treatment":37558,"internal":37559,"Ġinfiltrate":37560,"Ġgratification":37561,"Uber":37562,"Ġunequal":37563,"Ġflav":37564,"Lord":37565,"tein":37566,"ĠLOT":37567,"Ġbullshit":37568,"Ġoriginals":37569,"Ġminced":37570,"Ġmultiply":37571,"ayson":37572,"Ġrecomm":37573,"Ġreceptors":37574,"Ġflashlight":37575,"Ġinhuman":37576,"Future":37577,"Ġpuzzling":37578,"Ġrouters":37579,"Ġuncontroll":37580,"responsible":37581,"Ġcellul":37582,"ĠTablet":37583,"Ġbolted":37584,"Ġpermissible":37585,"adra":37586,"picture":37587,"ODY":37588,"BRE":37589,"Iraq":37590,"Total":37591,"rising":37592,"Ġ273":37593,"nv":37594,"Ġ327":37595,"alysed":37596,"infect":37597,"Ġ1912":37598,"ĠVT":37599,"ĠLazarus":37600,"ictive":37601,"Bu":37602,"ĠNEVER":37603,"ĠCODE":37604,"ĠModified":37605,"fetched":37606,"ĠTrap":37607,"mob":37608,"Ġupkeep":37609,"WARD":37610,"Ġbrewed":37611,"Ġsaliva":37612,"Ġ1923":37613,"Ġsteroid":37614,"rather":37615,"ĠVER":37616,"Ġcontextual":37617,"Ont":37618,"ĠLSD":37619,"agine":37620,"Ġaudible":37621,"ĠMeta":37622,"erek":37623,"aults":37624,"ĠOttoman":37625,"ĠIncludes":37626,"Ġocc":37627,"678":37628,"ipple":37629,"Ġcontrasted":37630,"014":37631,"ĠLenin":37632,"Ġomega":37633,"885":37634,"civil":37635,"Ġoverload":37636,"},\"":37637,"Ġprogrammers":37638,"Ġgeometry":37639,"?).":37640,"shift":37641,"ĠClancy":37642,"nr":37643,"verb":37644,"Ġ760":37645,"Ġstaggered":37646,"Playing":37647,"ĠSmile":37648,"Ġcomplains":37649,"ĠSloven":37650,"Ġdisobedience":37651,"creator":37652,"Ġly":37653,"incoln":37654,"emp":37655,"Ġcrate":37656,"ĠPledge":37657,"ĠGPUs":37658,"protected":37659,"Vo":37660,"medium":37661,"Ġacet":37662,"603":37663,"478":37664,"469":37665,"Further":37666,"Ġsensed":37667,"Lock":37668,"Ġcrabs":37669,"ĠChains":37670,"ĠNEO":37671,"Ġexperimented":37672,"ĠRhythm":37673,"802":37674,"Ġhormonal":37675,"491":37676,"ĠMedian":37677,"Ġevaluates":37678,"ippi":37679,"Ġremovable":37680,"Ġvector":37681,"ilant":37682,"TERN":37683,"Ġpurch":37684,"ĠBind":37685,"athering":37686,"Ġcords":37687,"Lib":37688,"Ġdamned":37689,"orc":37690,"ĠEverywhere":37691,"Ġgorilla":37692,"ystem":37693,"fail":37694,"Ġecstasy":37695,"allion":37696,"Sea":37697,"Ġuploading":37698,"ĠSpecific":37699,"Ġreinforcement":37700,"cerned":37701,"ĠDollars":37702,"Twenty":37703,"OX":37704,"ADD":37705,"Ġbraces":37706,"Ġraven":37707,"Ġ1890":37708,"Ġcirculate":37709,"udden":37710,"Disney":37711,"ĠNope":37712,"ĠBagg":37713,"ĠBuddha":37714,"rael":37715,"urus":37716,"ĠKarma":37717,"Ġcurl":37718,"Ġflips":37719,"Ġbearer":37720,"Ġmisunderstand":37721,"Ġabras":37722,"ĠAssassin":37723,"Fact":37724,"Ġinterf":37725,"Ġvantage":37726,"ĠGenocide":37727,"Ġdeducted":37728,"Sep":37729,"McC":37730,"Jessica":37731,"ĠBackup":37732,"Ian":37733,"urnal":37734,"Ġlaborers":37735,"438":37736,"ĠContinuous":37737,"ĠNBN":37738,"Cool":37739,"mitting":37740,"ĠNormandy":37741,"Ġpurchaser":37742,"Ġacquainted":37743,"Ġblogging":37744,"route":37745,"marine":37746,"Ġstartled":37747,"6000":37748,"ĠRadical":37749,"kiss":37750,"ĠBlitz":37751,"express":37752,"Ġ601":37753,"hent":37754,"Ġtink":37755,"pires":37756,"launch":37757,"sg":37758,"ĠEffects":37759,"Ġstiffness":37760,"ĠAllies":37761,"Ġthirsty":37762,"Ġmyst":37763,"Ġlogger":37764,"Ġstances":37765,"ĠEvaluation":37766,"090":37767,"Ġproclaiming":37768,"Ġhypocritical":37769,"496":37770,"Ġcaus":37771,"ĠKappa":37772,"ĠLann":37773,"ĠScientist":37774,"Ġempath":37775,"etrical":37776,"lege":37777,"Hom":37778,"Aud":37779,"ĠColors":37780,"ĠStraw":37781,"each":37782,"ĠPatron":37783,"Ġnuance":37784,"send":37785,"ourney":37786,"ĠPhen":37787,"Ġamino":37788,"ĠSeconds":37789,"Sn":37790,"ĠCiv":37791,"Ġconglomer":37792,"Ġ411":37793,"versely":37794,"487":37795,"prises":37796,"Ġ277":37797,"necessary":37798,"Ġdope":37799,"Late":37800,"Ġrake":37801,"ĠBrigham":37802,"ogun":37803,"ĠSTATES":37804,"ĠGaal":37805,"Ġintellig":37806,"Ġglacier":37807,"destruct":37808,"ĠZucker":37809,"484":37810,"Ġ332":37811,"ĠArist":37812,"Ġprotagonists":37813,"Ġgraveyard":37814,"names":37815,"ĠPax":37816,"Ġthresholds":37817,"Seeing":37818,"Ġmunitions":37819,"Ġcontradicts":37820,"684":37821,"Ġ529":37822,"ĠConcent":37823,"ĠBlessed":37824,"Hz":37825,"Ġinhibit":37826,"Ġshenanigans":37827,"ĠSpear":37828,"Ġoverlay":37829,"ritis":37830,"ilus":37831,"Ġvariance":37832,"Ġoverpower":37833,"viol":37834,"erning":37835,"Ġpolarization":37836,"aito":37837,"GV":37838,"493":37839,"Keeping":37840,"Ġpaternity":37841,"ĠHappiness":37842,"oops":37843,"sb":37844,"xit":37845,"ophysical":37846,"Ġconclusive":37847,"Arch":37848,"Ġmiser":37849,"Ġsuffice":37850,"ĠStout":37851,"Ġhrs":37852,"643":37853,"Ġprincipled":37854,"azine":37855,"atorium":37856,"ĠFairy":37857,"Ġinfiltrated":37858,"ĠHier":37859,"ĠMIA":37860,"inders":37861,"Ġrebutt":37862,"Ġxx":37863,"Ġfeats":37864,"izzle":37865,"Ġ780":37866,"668":37867,"Ġrepressive":37868,"ĠYugoslavia":37869,"sole":37870,"704":37871,"ĠRPG":37872,"ĠTroll":37873,"packing":37874,"ĠDatabase":37875,"ĠVelvet":37876,"ĠRELEASE":37877,"ablish":37878,"smoking":37879,"ĠBottle":37880,"ĠFully":37881,"ĠLean":37882,"Ġobjectively":37883,"ĠFounding":37884,"ĠClassics":37885,"Ġmosaic":37886,"473":37887,"Ġrooft":37888,"Ġcentrally":37889,"Ġdismissive":37890,"Ġparasites":37891,"009":37892,"Ġcursed":37893,"Ġvex":37894,"Ġeconom":37895,"ĠBore":37896,"enery":37897,"ĠFundamental":37898,"ĠOmni":37899,"489":37900,"714":37901,"Ġforegoing":37902,"Ġfragment":37903,"oros":37904,"070":37905,"ĠFaust":37906,"Ġsucking":37907,"Ġnode":37908,"Ġrighteous":37909,"ĠPowered":37910,"426":37911,"HQ":37912,"Ġchronically":37913,"ĠBAL":37914,"Ġprest":37915,"Ġrapists":37916,"ĠRelationship":37917,"ĠCHR":37918,"Ġlinen":37919,"Ġnumerical":37920,"oters":37921,"Ġiterations":37922,"ttes":37923,"ĠENTER":37924,"Ġrabbi":37925,"Ġhoard":37926,"Ġmerciless":37927,"Ġrobes":37928,"ĠSpray":37929,"Ġadvers":37930,"ilantro":37931,"483":37932,"Ġfungus":37933,"Ġalcoholism":37934,"anasia":37935,"ĠCruiser":37936,"Ġmorals":37937,"cision":37938,"measures":37939,"Ġsabot":37940,"Ġrecol":37941,"ĠSaur":37942,"ĠError":37943,"Ġmysteriously":37944,"sle":37945,"Ġfeminists":37946,"д":37947,"ackle":37948,"ĠMarxist":37949,"Ġselves":37950,"Ġdoorway":37951,"Ġdiscard":37952,"Ġbandits":37953,"ĠDive":37954,"ameless":37955,"TRY":37956,"Ġgull":37957,"Ġrepublican":37958,"sr":37959,"ĠDynamo":37960,"Ġembryo":37961,"MENTS":37962,"ĠLOW":37963,"Ġ319":37964,"Ġgly":37965,"Ġcowork":37966,"Coll":37967,"Ġcris":37968,"ĠBanana":37969,"reality":37970,"Ġmobilization":37971,"unal":37972,"Updated":37973,"Crew":37974,"ĠGideon":37975,"Ġvines":37976,"Ġknitting":37977,"Ġdag":37978,"ĠSurv":37979,"Ġvacc":37980,"Ġimpulses":37981,"Northern":37982,"Ġnanop":37983,"allows":37984,"UTH":37985,"Ġflashbacks":37986,"alsa":37987,"Ġ282":37988,"Ġtransmissions":37989,"ĠAlmighty":37990,"Office":37991,"ĠBride":37992,"ĠBeasts":37993,"othy":37994,"ĠClouds":37995,"ĠDyn":37996,"ĠJolly":37997,"District":37998,"Ġveget":37999,"Ġantit":38000,"ĠSmoking":38001,"hess":38002,"Ġcompose":38003,"Ġreligiously":38004,"ĠHY":38005,"Ġfluorescent":38006,"rame":38007,"ĠMeier":38008,"ĠSQ":38009,"benefit":38010,"Thirty":38011,"559":38012,"ĠCance":38013,"586":38014,"Ġgrouped":38015,"Ġphys":38016,"Ġrebellious":38017,"ĠBASE":38018,"chid":38019,"582":38020,"ĠLessons":38021,"ĠWonderful":38022,"ODE":38023,"uctions":38024,"Ġbarbaric":38025,"rahim":38026,"635":38027,"Ġcloves":38028,"ĠNIH":38029,"ossession":38030,"Employ":38031,"Ġliberate":38032,"Gro":38033,"Ġmagician":38034,"ountain":38035,"FORM":38036,"533":38037,"Ġunpredict":38038,"rity":38039,"Ġfaked":38040,"plets":38041,"ppelin":38042,"Living":38043,"Ġnearer":38044,"Ġsuperiors":38045,"Ur":38046,"Ġheroism":38047,"Ġbearded":38048,"006":38049,"Cole":38050,"1970":38051,"Ġsill":38052,"ĠReduce":38053,"OLOG":38054,"onel":38055,"Billy":38056,"ĠPainter":38057,"ansas":38058,"Ġintermediary":38059,"trump":38060,"ĠMith":38061,"otom":38062,"434":38063,"Ġterrit":38064,"Wa":38065,"Ġsuprem":38066,"Rh":38067,"liction":38068,"ĠDEAD":38069,"Ġbothers":38070,"503":38071,"Ġfrogs":38072,"Ġsprinkled":38073,"Ġnil":38074,"628":38075,"Private":38076,"ĠKGB":38077,"Ġoverriding":38078,"Ġdeceived":38079,"698":38080,"idium":38081,"Ġseeker":38082,"Final":38083,"Ġsubconscious":38084,"Ġwom":38085,"Ġcass":38086,"Ġchicks":38087,"Ġverifying":38088,"ective":38089,"inia":38090,"ĠDetection":38091,"MH":38092,"fortable":38093,"ĠISPs":38094,"Ġcrumble":38095,"ĠRecap":38096,"598":38097,"ummies":38098,"export":38099,"Irish":38100,"Ġlil":38101,"ĠRapt":38102,"ĠRIGHT":38103,"Ġanecdotal":38104,"Ġpiercing":38105,"deck":38106,"Liber":38107,"Books":38108,"Ġassassin":38109,"Tur":38110,"revolution":38111,"ĠSheep":38112,"ĠPublishers":38113,"EMS":38114,"iosis":38115,"finder":38116,"ĠCuriosity":38117,"ARB":38118,"ĠConvers":38119,"IVES":38120,"clave":38121,"ĠChaos":38122,"ĠMim":38123,"ĠCostume":38124,"Ġtwe":38125,"Ġintim":38126,"757":38127,"berto":38128,"Ġ261":38129,"VPN":38130,"cribed":38131,"ĠVerb":38132,"cb":38133,"Ġaxle":38134,"Ġsandwic":38135,"Ice":38136,"ĠThermal":38137,"654":38138,"709":38139,"ĠPact":38140,"ĠEnsure":38141,"izable":38142,"497":38143,"Ġbloodstream":38144,"Aw":38145,"Ġleakage":38146,"Ġalleg":38147,"ĠMelody":38148,"681":38149,"Austin":38150,"428":38151,"Ġsummarized":38152,"ĠDefendants":38153,"ĠVader":38154,"Ê":38155,"Ġ1880":38156,"Ġassemb":38157,"YOU":38158,"GREEN":38159,"jury":38160,"4000":38161,"Ġvenerable":38162,"Ġcomputational":38163,"Ġperpetuate":38164,"Ġtorpedo":38165,"Ġaborted":38166,"Ġrhetorical":38167,"ĠOvert":38168,"Ġacknowledgment":38169,"essment":38170,"ĠIGN":38171,"ĠSheen":38172,"571":38173,"Ġcontag":38174,"Ġcultiv":38175,"Ġspawn":38176,"mess":38177,"Dur":38178,"Ġvortex":38179,"ixties":38180,"ĠBlow":38181,"Sum":38182,"Åį":38183,"Rom":38184,"ĠRadeon":38185,"Fed":38186,"Ġameric":38187,"ĠAnth":38188,"Ġantic":38189,"Ġfortress":38190,"Cold":38191,"ĠPredict":38192,"Fake":38193,"Ġilluminate":38194,"Find":38195,"Ġintellectually":38196,"Ġgon":38197,"alker":38198,"Ġinvoice":38199,"IELD":38200,"Ġfools":38201,"ĠEnding":38202,"-(":38203,"Ġalk":38204,"ĠControlled":38205,"Ġpurposefully":38206,"ĠChronic":38207,"Ġrele":38208,"ĠOps":38209,"Party":38210,"ethnic":38211,"ĠSpecifications":38212,"ffee":38213,"ĠTeach":38214,"ulas":38215,"Ġenslaved":38216,"onomy":38217,"Ġtenets":38218,"Ġammonia":38219,"Ġ1913":38220,"Ġdripping":38221,"612":38222,"659":38223,"ĠSagan":38224,"Ġinaccur":38225,"Ġabol":38226,"ĠLIKE":38227,"Ġvisualization":38228,"learn":38229,"anon":38230,"cipline":38231,"Ġadaptations":38232,"Ġwaiter":38233,"nergy":38234,"507":38235,"ĠDK":38236,"YD":38237,"Ġpedest":38238,"Sense":38239,"ĠObst":38240,"Ġresurrection":38241,"ĠSPECIAL":38242,"Unlike":38243,"Ġlia":38244,"Ġpersuasive":38245,"iatrics":38246,"ONEY":38247,"esthetic":38248,"494":38249,"zik":38250,"Ġfract":38251,"ĠOutput":38252,"ĠBers":38253,"rozen":38254,"ĠRevis":38255,"Ġdraconian":38256,"Words":38257,"asions":38258,"ĠClintons":38259,"CU":38260,"History":38261,"Ġtwilight":38262,"iform":38263,"Ġdispl":38264,"progress":38265,"ĠIO":38266,"Ġcannibal":38267,"Michelle":38268,"Ġnerv":38269,"Ġcontexts":38270,"ĠHorses":38271,"Ġanatomy":38272,"ĠLegislation":38273,"ĠBloody":38274,"Ġunwittingly":38275,"Ġinquired":38276,"ĠZip":38277,"ĠDesigns":38278,"Ġirritating":38279,"Ġunison":38280,"ĠRG":38281,"aviour":38282,"Ġpseudo":38283,"ĠVenom":38284,"Ġobscured":38285,"Ġner":38286,"uked":38287,"ORGE":38288,"Ġmomentarily":38289,"olyn":38290,"Syrian":38291,"Ġmicroscopic":38292,"Ġmistress":38293,"Less":38294,"Ġawoke":38295,"Ġtutor":38296,"esome":38297,"ollar":38298,"egg":38299,"UTE":38300,"Buzz":38301,"Ġattainment":38302,"Ġdiscriminating":38303,"::":38304,"Ġ525":38305,"azard":38306,"ĠBrist":38307,"oras":38308,"Ġveterin":38309,"jing":38310,"idon":38311,"ĠAustral":38312,"arious":38313,"ĠGrav":38314,"anol":38315,"ĠQuran":38316,"Ġbleach":38317,"588":38318,"ĠOsw":38319,"Ġdiffered":38320,"typ":38321,"ĠSIL":38322,"failed":38323,"436":38324,"Ġpalms":38325,"ĠFail":38326,"idespread":38327,"Ġchap":38328,"ĠIMAGES":38329,"ACP":38330,"matched":38331,"Ġjaws":38332,"MHz":38333,"Nik":38334,"ĠHume":38335,"OSH":38336,"Ġpresume":38337,"secut":38338,"ĠDied":38339,"ĠBreat":38340,"gins":38341,"prison":38342,"ĠUR":38343,"ĠROS":38344,"isitions":38345,"Ġpelvic":38346,"exclusive":38347,"522":38348,"689":38349,"FN":38350,"Ġener":38351,"Ġdispers":38352,"Ġcohorts":38353,"shut":38354,"ĠLoad":38355,"needs":38356,"azaki":38357,"inoa":38358,"Inside":38359,"usra":38360,"ighters":38361,"Ġ271":38362,"Ġsubordinate":38363,"ĠHOL":38364,"ĠGlow":38365,"Ġincred":38366,"ĠMadame":38367,"Ġoats":38368,"Ġdeviation":38369,"ĠApproach":38370,"Ġnarc":38371,"bart":38372,"bole":38373,"ĠSHE":38374,"effects":38375,"ĠADA":38376,"Ġmuse":38377,"Squ":38378,"Ġneuroscience":38379,"ĠValues":38380,"engu":38381,"Ġdosage":38382,"Ġwhispers":38383,"Ġnaughty":38384,"ĠFarming":38385,"Recently":38386,"Ġrelapse":38387,"rentice":38388,"UGH":38389,"Ġdarkened":38390,"appings":38391,"ĠSlaughter":38392,"ĠAnim":38393,"Ġovertly":38394,"poses":38395,"Ġdeficient":38396,"Ġnecks":38397,"Iron":38398,"Ġphysiological":38399,"ĠLiang":38400,"Ġlear":38401,"Ġcelestial":38402,"Ġpistols":38403,"Ġeyebrow":38404,"915":38405,"ratch":38406,"cephal":38407,"ĠPSU":38408,"Ġphotograp":38409,"ĠGaul":38410,"Ġuncontrolled":38411,"ĠJoined":38412,"652":38413,"itory":38414,"Ġ274":38415,"GAN":38416,"imester":38417,"essional":38418,"Ø©":38419,"Ġuncons":38420,"THER":38421,"Ġpaternal":38422,"Zero":38423,"ugen":38424,"538":38425,"Ġende":38426,"Ġ505":38427,"movie":38428,"Lind":38429,"Ġscorn":38430,"ulty":38431,"Ġpesky":38432,"Ġ8000":38433,"677":38434,"Ġhomophobia":38435,"ranch":38436,"Ġnarciss":38437,"ĠVoyager":38438,"ĠHELP":38439,"528":38440,"edly":38441,"Ġdetract":38442,"Hope":38443,"787":38444,"ĠMerlin":38445,"Ġgrids":38446,"KI":38447,"Mu":38448,"ĠSelected":38449,"select":38450,"ĠModer":38451,"ĠFeet":38452,"Ġrename":38453,"intensity":38454,"Wilson":38455,"Ġ414":38456,"leave":38457,"Ready":38458,"intuitive":38459,"Ġmeager":38460,"Franc":38461,"DH":38462,"Ġrhy":38463,"ĠPillar":38464,"ĠDOE":38465,"minist":38466,"ĠGrave":38467,"isible":38468,"Ess":38469,"Ġempt":38470,"Ġpatched":38471,"ĠAbortion":38472,"rals":38473,"Ġdow":38474,"Ġcrawled":38475,"igrate":38476,"Virginia":38477,"Ġconting":38478,"Ġorphans":38479,"ĠCrimean":38480,"Ġdyn":38481,"Ġshadowy":38482,"sound":38483,"ailable":38484,"Ġ293":38485,"vm":38486,"Ġaccompanies":38487,"Meanwhile":38488,"JR":38489,"ĠDirections":38490,"Ġadolescence":38491,"Ġpenetrated":38492,"bars":38493,"Rev":38494,"Ta":38495,"ĠSkywalker":38496,"ĠFires":38497,"concept":38498,"ĠSIG":38499,"554":38500,"currently":38501,"Ġ----------------":38502,"ĠWHITE":38503,"767":38504,"rors":38505,"PDF":38506,"Ġcasing":38507,"673":38508,"Ġdisapprove":38509,"1800":38510,"ĠWeed":38511,"Ġinhib":38512,"Ġmorbid":38513,"433":38514,"Ġawfully":38515,"Ts":38516,"Maria":38517,"Ġillusions":38518,"Ġtotalitarian":38519,"ollo":38520,"Ġsuppl":38521,"Ġsarc":38522,"ĠRGB":38523,"Ġlauncher":38524,"Ġbadass":38525,"ĠSyd":38526,"Ġscrape":38527,"ĠCLA":38528,"Ġcircum":38529,"657":38530,"Ġnucleus":38531,"ĠUkip":38532,"Ġmodem":38533,"ĠJou":38534,"adders":38535,"Ġwiser":38536,"thereal":38537,"Ġdemocr":38538,"ĠInvalid":38539,"Mine":38540,"Ġmanifested":38541,"meat":38542,"MORE":38543,"Larry":38544,"acements":38545,"Ġspecimen":38546,"results":38547,"Ġswallowing":38548,"Ġpigeon":38549,"tons":38550,"ĠLose":38551,"Ġquartz":38552,"Ġintraven":38553,"Ġ412":38554,"alyst":38555,"Ġengraved":38556,"client":38557,"ĠADV":38558,"ĠShared":38559,"Ġrites":38560,"Ġhysterical":38561,"ĠHUM":38562,"Cow":38563,"orously":38564,"Ġpleasures":38565,"democratic":38566,"Ġamph":38567,"Ġnib":38568,"rieg":38569,"Ġcalculates":38570,"Ġfrying":38571,"favorite":38572,"Ġantim":38573,"ĠDoom":38574,"monitor":38575,"Want":38576,"Ġtemplates":38577,"558":38578,"iever":38579,"Photos":38580,",,":38581,"ĠSync":38582,"Ġconfronts":38583,"kept":38584,"dt":38585,"ĠERROR":38586,"ETF":38587,"578":38588,"Ġspor":38589,"718":38590,"ivation":38591,"ĠHaskell":38592,"Ca":38593,"Ġdick":38594,"Ġcivilized":38595,"Ġblah":38596,"enough":38597,"Ġoccup":38598,"Ġ334":38599,"antically":38600,"584":38601,"ĠDolphin":38602,"ĠStarts":38603,"Ġfanatic":38604,"ت":38605,"imag":38606,"Ġmicrobial":38607,"freedom":38608,"cult":38609,"wra":38610,"Ġ423":38611,"RIPT":38612,"601":38613,"BTC":38614,"atmeal":38615,"653":38616,"agogue":38617,"Ġderives":38618,"Wolf":38619,"466":38620,"Susan":38621,"ĠPassage":38622,"ARDS":38623,"Guy":38624,"Council":38625,"Ġerotic":38626,"pure":38627,"ĠMemories":38628,"ĠWikileaks":38629,"elines":38630,"Ġanth":38631,"Capital":38632,"807":38633,"ĠEggs":38634,"cv":38635,"ctors":38636,"Ġshatter":38637,"Ġesteem":38638,"vity":38639,"ĠVulcan":38640,"effic":38641,"ĠBELOW":38642,"Ġplatoon":38643,"Commun":38644,"oustic":38645,"Amy":38646,"Freedom":38647,"ppo":38648,"Ja":38649,"ĠConan":38650,"Ġinsepar":38651,"scene":38652,"Ġurinary":38653,"gain":38654,"Hillary":38655,"ĠTAM":38656,"Hist":38657,"Ġmechan":38658,"ĠRobots":38659,"Leader":38660,"Ġcartridges":38661,"Ġwhistleblowers":38662,"ĠSPL":38663,"Labour":38664,"unction":38665,"Ġfaithfully":38666,"Ġcoarse":38667,"Ġsynth":38668,"ĠLV":38669,"Ġjustifying":38670,"439":38671,"Victoria":38672,"ĠProceedings":38673,"alogy":38674,"Ġmorph":38675,"Ġcove":38676,"Ġlaughable":38677,"ECA":38678,"Ġ670":38679,"aturated":38680,"ĠSouls":38681,"ĠSleeping":38682,"Ly":38683,"ĠRetro":38684,"Ġastroph":38685,"Ġseism":38686,"atherine":38687,"ĠHercules":38688,"Ġfuse":38689,"ĠHL":38690,"Ġunintentionally":38691,"ĠRé":38692,"iery":38693,"Ġconco":38694,"Ġeras":38695,"recent":38696,"Ġlaunchers":38697,"ĠVolcano":38698,"ĠJace":38699,"Ġterminating":38700,"ĠIde":38701,"zee":38702,"asonic":38703,"itone":38704,"Ġnutshell":38705,"Ġbip":38706,"dies":38707,"Ġ286":38708,"Ġnood":38709,"ĠFathers":38710,"alys":38711,"Ġtheor":38712,"???":38713,"548":38714,"674":38715,"efined":38716,"806":38717,"âĻ":38718,"697":38719,"Ġdecap":38720,"ĠFN":38721,"Ġbureaucr":38722,"ĠGoat":38723,"ĠShang":38724,"Ġsemin":38725,"Ġthroats":38726,"Ġmoth":38727,"herer":38728,"Democratic":38729,"ixtures":38730,"impl":38731,"ĠLogo":38732,"ortunate":38733,"Ġclumsy":38734,"Ġinnocuous":38735,"ĠBlend":38736,"abulary":38737,"ĠFaces":38738,"Ġpornographic":38739,"px":38740,"Information":38741,"Ġfluoride":38742,"Ġatroc":38743,"Ġdelta":38744,"whatever":38745,"ossier":38746,"ĠNoir":38747,"ĠYao":38748,"551":38749,"undred":38750,"Ġmillennium":38751,"Ġferal":38752,"Ġconvinc":38753,"cano":38754,"imsy":38755,"angles":38756,"Ġsterile":38757,"ĠMenu":38758,"779":38759,"ĠCrack":38760,"Ġabundantly":38761,"ĠmL":38762,"Ġinfiltration":38763,"ĠDefinition":38764,"733":38765,"oubt":38766,"Ġorbital":38767,"Ġpiss":38768,"Ġbeet":38769,"679":38770,"Ġcounteract":38771,"ĠALE":38772,"ulative":38773,"crew":38774,"Ġliberating":38775,"ĠDull":38776,"Speaking":38777,"Sadly":38778,"Ġmisfortune":38779,"Ġdolphin":38780,"557":38781,"Ġbould":38782,"ĠTorah":38783,"ĠConfederacy":38784,"421":38785,"Ġorbits":38786,"ocused":38787,"beer":38788,"Rand":38789,"ĠORIG":38790,"Ġmuc":38791,"LER":38792,"ĠMisty":38793,"Ġinexpl":38794,"Ġreptiles":38795,"Ġaven":38796,"blocking":38797,"ĠPASS":38798,"Ġarisen":38799,"ĠMock":38800,"Ġops":38801,"Ġshin":38802,"524":38803,"Ġdigestion":38804,"Soft":38805,"irect":38806,"POL":38807,"ĠSpell":38808,"Level":38809,"Ġhex":38810,"Ġbitcoins":38811,"ĠHungry":38812,"VL":38813,"ĠRealm":38814,"RELATED":38815,"Delta":38816,"Pri":38817,"Ġrejoice":38818,"ĠLatter":38819,"LG":38820,"Ġstupidity":38821,"Ġdonkey":38822,"nova":38823,"Vill":38824,"Ġdecomp":38825,"Ġexternally":38826,"Ġsequest":38827,"815":38828,"Ġshortcut":38829,"riminal":38830,"Hun":38831,"EH":38832,"Ġregiment":38833,"Case":38834,"definition":38835,"Ġappendix":38836,"ĠPlayed":38837,"associated":38838,"izens":38839,"ĠVag":38840,"Ġflung":38841,"Ġfru":38842,"Ġcoil":38843,"________________________":38844,"Ġselects":38845,"Ġsolves":38846,"aea":38847,"985":38848,"Tomorrow":38849,"Ġsear":38850,"APE":38851,"492":38852,"Ġenlightened":38853,"Ġnonexistent":38854,"ĠPotato":38855,"Ghost":38856,"Ġrichness":38857,"ĠKarin":38858,"Ġfamilial":38859,"ĠJA":38860,"Regardless":38861,"Ġepis":38862,"GD":38863,"Ġinsanely":38864,"ĠPhill":38865,"Block":38866,"Finding":38867,"omal":38868,"Ġdecipher":38869,"ĠSwap":38870,"derived":38871,"ĠOFFIC":38872,"Support":38873,"Ġnylon":38874,"Ġexaggeration":38875,"Ġevangelicals":38876,"Ġbearings":38877,"587":38878,"Ġlocale":38879,"Ġpowerfully":38880,"Ġappropriated":38881,"itates":38882,"irlfriend":38883,"cule":38884,"ĠSomewhere":38885,"747":38886,"ĠInteresting":38887,"464":38888,"Ġelong":38889,"Ġdegrade":38890,"rafted":38891,"Ġtutorials":38892,"905":38893,"ĠIntervention":38894,"Ġuniqueness":38895,"Ġ284":38896,"Ġexplorers":38897,"Ġnucle":38898,"ĠMillenn":38899,"511":38900,"ĠReneg":38901,"Ġexecut":38902,"urai":38903,"leon":38904,"Ġdeserts":38905,"ĠCig":38906,"Ġsuggestive":38907,"instead":38908,"Ġlousy":38909,"Ġenigmatic":38910,"594":38911,"Know":38912,"rollment":38913,"ipher":38914,"Ġhumanities":38915,"Ġmodifying":38916,".....":38917,"Ġdegraded":38918,"Ġsuppressing":38919,"Ġeman":38920,"abouts":38921,"functional":38922,"ĠOU":38923,"ĠRelax":38924,"786":38925,"esses":38926,"ĠLogin":38927,"spec":38928,"ĠWWF":38929,"Ġ364":38930,"ĠIsis":38931,"Wisconsin":38932,"Ġequival":38933,"ĠCollector":38934,"ibilities":38935,"malink":38936,"acea":38937,"Ġchained":38938,"Ġarist":38939,"Ġdisadvantages":38940,"ĠBrus":38941,"limits":38942,"ĠDmit":38943,"544":38944,"ĠRecipe":38945,"Ġhabitual":38946,".):":38947,"ĠPRODUCT":38948,"772":38949,"Ġrept":38950,"Ġpathology":38951,"Ġresurrected":38952,"uders":38953,"Ġlingu":38954,"Ġdenomination":38955,"Ġfirewall":38956,"scient":38957,"Ġvaliant":38958,"Kansas":38959,"516":38960,"Ġcontemporaries":38961,"Roman":38962,"Ġaccompan":38963,"Ġantennas":38964,"ĠXan":38965,"Ġelectromagnetic":38966,"ĠNek":38967,"alien":38968,"indle":38969,"Ġgraphene":38970,"Ġgraceful":38971,"syn":38972,"ĠBosh":38973,"Ġ1908":38974,"Ġsuccumb":38975,"Technology":38976,"Ġtoxin":38977,"myra":38978,"essert":38979,"Hell":38980,"Gil":38981,"Ġdiarr":38982,"imeters":38983,"Ġexplo":38984,"Ġgeometric":38985,"ĠNavigation":38986,"cern":38987,"Ġprogrammer":38988,"oÄŁan":38989,"Ġdodging":38990,"ĠLU":38991,"573":38992,"inters":38993,"Ġserum":38994,"Ġuber":38995,"Ġmanga":38996,"762":38997,"ĠOccasionally":38998,"437":38999,"ĠTheme":39000,"Ġimmature":39001,"Ġactivating":39002,"ĠTruly":39003,"د":39004,"osion":39005,"Age":39006,"TIME":39007,"Silver":39008,"sand":39009,"ulnerable":39010,"Ġcram":39011,"Large":39012,"ĠAnger":39013,"icators":39014,"431":39015,"ĠHonest":39016,"zip":39017,"Ġdism":39018,"Ġfades":39019,"ĠPik":39020,"Ast":39021,"sequent":39022,"Ġunsigned":39023,"xious":39024,"creation":39025,"Ġ395":39026,"ottenham":39027,"Ġundesirable":39028,"ugal":39029,"ĠDivide":39030,"lp":39031,"563":39032,"ĠPOP":39033,"ĠCET":39034,"session":39035,"Ġoccurrences":39036,"chu":39037,"ĠACS":39038,"ĠProsecut":39039,"Ġhypnot":39040,"rely":39041,"ERG":39042,"Ven":39043,"Republicans":39044,"inez":39045,"ĠImplementation":39046,"Ġsprang":39047,"Ġobs":39048,"Defense":39049,"Ġunexpl":39050,"ĠPAGE":39051,"ĠTent":39052,"ĠNeurolog":39053,"Ġintuition":39054,"759":39055,"Ġterrestrial":39056,"Ġmorphine":39057,"Ġ.\"":39058,"ĠHydra":39059,"651":39060,"Ġneoliberal":39061,"683":39062,"Ġabnormalities":39063,"quant":39064,"Ġmonastery":39065,"jac":39066,"ĠReaction":39067,"Ġcontraceptive":39068,"ĠBalls":39069,"Ġapost":39070,"676":39071,"ĠHELL":39072,"approximately":39073,"Ġvibrations":39074,"COR":39075,"ĠCPUs":39076,"Ġcontin":39077,"Ġsemblance":39078,"Ġshorth":39079,"tip":39080,"ĠChips":39081,"makes":39082,"Ġprett":39083,"Ġconspicuous":39084,"ĠAmp":39085,"Ġvisualize":39086,"Hu":39087,"sorry":39088,"nai":39089,"ĠArcade":39090,"rimination":39091,"obin":39092,"Ġvampire":39093,"773":39094,"ĠCaucasus":39095,"Medic":39096,"ĠGitHub":39097,"ĠWicked":39098,"ĠFet":39099,"Krist":39100,"998":39101,"Ġfrontal":39102,"Ġ283":39103,"ndum":39104,"Ġidols":39105,"ĠMSG":39106,"ĠShuttle":39107,"ĠTowards":39108,"Ġsaturation":39109,"Ġ®":39110,"Ġcradle":39111,"eteen":39112,"Ġprejudices":39113,"separ":39114,"ĠSoda":39115,"ynam":39116,"Ġnause":39117,"Ġpenetrating":39118,"ĠVampire":39119,"Ġmole":39120,"Ġgoogle":39121,"earance":39122,"583":39123,"Ġdomin":39124,"727":39125,"Kind":39126,"Ġcust":39127,"manuel":39128,"ĠAstro":39129,"Roger":39130,"JO":39131,"killed":39132,"ĠDisapp":39133,"833":39134,"ĠEQU":39135,"Ġprecedence":39136,"mberg":39137,"641":39138,"ĠRoller":39139,"Ġspecifying":39140,"035":39141,"phil":39142,"Ġpowdered":39143,"Ġblot":39144,"Ġdeline":39145,"Bruce":39146,"536":39147,"Ġpim":39148,"leasing":39149,"vacc":39150,"RN":39151,"Ġspacing":39152,"Ġhangar":39153,"ĠPlot":39154,"537":39155,"legraph":39156,"596":39157,"Ġpolyg":39158,"doi":39159,"ĠNerd":39160,"installed":39161,"ĠSeeds":39162,"ĠPlays":39163,"ĠRomance":39164,"layer":39165,"Ġunsu":39166,"Ġcurric":39167,"Mi":39168,"restrial":39169,"ĠNiño":39170,"ĠProper":39171,"Ġpores":39172,"Giving":39173,"aeus":39174,"Middle":39175,"liber":39176,"Ġcombatants":39177,"ĠBulk":39178,"Ġ502":39179,"Ġstru":39180,"ĠLonely":39181,"Companies":39182,"inence":39183,"Autom":39184,"Ġfearsome":39185,"Ġsummar":39186,"Ġrotated":39187,"ĠPLA":39188,"ĠFAT":39189,"572":39190,"ĠSkies":39191,"iour":39192,"Ġintimately":39193,"amera":39194,"Ġ475":39195,"623":39196,"Ġirrig":39197,"Ġboosters":39198,"Ġtransmitting":39199,"DOWN":39200,"ĠAble":39201,"Ġfuriously":39202,"spirit":39203,"Ġgrun":39204,"Ġbible":39205,"ĠAdmir":39206,"Ġ§":39207,"ĠRaise":39208,"Ġflowering":39209,"uxe":39210,"ravis":39211,"urther":39212,"ĠScientology":39213,"pathy":39214,"Ġruth":39215,"Ġtempor":39216,"Ġwhispered":39217,"ogly":39218,"coord":39219,"chlor":39220,"processing":39221,"iott":39222,"ĠTY":39223,"wik":39224,"abolic":39225,"ĠUnable":39226,"ĠLiterary":39227,"ĠpH":39228,"Eastern":39229,"Craig":39230,"Fear":39231,"Ġinventions":39232,"ĠNost":39233,"Ġafflicted":39234,"ĠSwamp":39235,"INST":39236,"Jerry":39237,"Ġprope":39238,"ĠLancet":39239,"Ġrefres":39240,"ĠPrinciples":39241,"ĠLys":39242,"ERAL":39243,"addock":39244,"Ġcynicism":39245,"Ġmassacres":39246,"roo":39247,"Ġcollagen":39248,"Johnny":39249,"Keith":39250,"Italian":39251,"553":39252,"Dad":39253,"Neither":39254,"cler":39255,"ilers":39256,"Ġassass":39257,"Travel":39258,"672":39259,"Ġeaves":39260,"ATOR":39261,"Ġoily":39262,"581":39263,"ateful":39264,"728":39265,"Ġchiefly":39266,"tical":39267,"enes":39268,"ĠWouldn":39269,"ĠJacket":39270,"ĠSuit":39271,"Ġindustrialized":39272,"ĠNose":39273,"ĠSECTION":39274,"Ġredd":39275,"Ġcavity":39276,"Ġconn":39277,"Shield":39278,"Ġtongues":39279,"Ġsuccinct":39280,"views":39281,"ĠMUST":39282,"oliath":39283,"Ġlimitless":39284,"Ġapocalyptic":39285,"ĠAtlantis":39286,"DNA":39287,"ilded":39288,"ĠDresden":39289,"nit":39290,"Ġsubdiv":39291,"gressive":39292,"701":39293,"hops":39294,"alist":39295,"Ġunintentional":39296,"Ġpsychic":39297,"Ġcontrovers":39298,"Ġforeground":39299,"Ġnaïve":39300,"Ġfolders":39301,"icist":39302,"Ġdrawbacks":39303,"ĠToxic":39304,"ophy":39305,"ĠMasonic":39306,"Ġcis":39307,"olated":39308,"Ġdepletion":39309,"Rap":39310,"692":39311,"Ġinver":39312,"ĠFAQ":39313,"Ġmeanings":39314,"Ġbisc":39315,"ĠRage":39316,"Ġresear":39317,"Ep":39318,"Ġunbeat":39319,"ĠComponents":39320,"bub":39321,"ĠInterface":39322,"Isa":39323,"ĠArgon":39324,"Ġdenomin":39325,"Ġmammal":39326,"519":39327,"Ġsizing":39328,"imbabwe":39329,"ĠReplacement":39330,"Georgia":39331,"ĠParticipation":39332,"Ġmelts":39333,"Ġfemin":39334,"514":39335,"Ġseams":39336,"513":39337,"ĠGaw":39338,"Ġbrood":39339,"Mit":39340,"Ġannoyance":39341,"Ġequilibrium":39342,"Ġpatri":39343,"Ġ338":39344,"561":39345,"mentioned":39346,"ĠVotes":39347,"Ġintoler":39348,"Ġstrikingly":39349,"Ġ352":39350,"Ġskeletal":39351,"616":39352,"isition":39353,"Ġfluor":39354,"provided":39355,"517":39356,"Ġclimates":39357,"Ġsensibilities":39358,"ĠFrequ":39359,"onite":39360,"Kenn":39361,"Ġmagnets":39362,"assis":39363,"Ġprerequisite":39364,"Ġ>>>":39365,"Ġscree":39366,"google":39367,"ĠMirage":39368,"Ġevict":39369,"Peace":39370,"Ġmissionaries":39371,"617":39372,"748":39373,"rient":39374,"ĠSTATS":39375,"Bird":39376,"ĠShiva":39377,"ĠBlessing":39378,"Ġredundancy":39379,"Ġphotoc":39380,"ĠOnes":39381,"754":39382,"alert":39383,"urous":39384,"Ġfolklore":39385,"ĠIdeal":39386,"sheets":39387,"according":39388,"Hor":39389,"Cle":39390,"ĠEdit":39391,"671":39392,"olitics":39393,"ĠESC":39394,"Ġparaly":39395,"Ġorgasm":39396,"speak":39397,"ð":39398,"Ġsneaky":39399,"Ġswords":39400,"Ġfandom":39401,"776":39402,"ĠScandinav":39403,"Ġdarts":39404,"546":39405,"cerpt":39406,"ĠGifts":39407,"Ġmagically":39408,"phys":39409,"Laughs":39410,"ĠSour":39411,"ources":39412,"789":39413,"ĠEps":39414,"ository":39415,"uality":39416,"literally":39417,"Ġheavens":39418,"FUL":39419,"Ġie":39420,"ĠISP":39421,"Ġwink":39422,"Ġweeping":39423,"Ġdocking":39424,"ACY":39425,"iece":39426,"Ġsignifies":39427,"guns":39428,"Sac":39429,"Leave":39430,"imation":39431,"Ġunex":39432,"uctive":39433,"ĠFees":39434,"ĠPortable":39435,"ĠInvestigator":39436,"pill":39437,"rehensible":39438,"Ġpotency":39439,"803":39440,"Ġembodiment":39441,"overty":39442,"shine":39443,"REL":39444,"ĠMPH":39445,"ĠPatriarch":39446,"Ġaspirin":39447,"Ġrinse":39448,"Ġinher":39449,"ograms":39450,"ĠTHREE":39451,"qt":39452,"ipples":39453,"Ġdehuman":39454,"Ġslander":39455,"Ġflora":39456,"brow":39457,"Ġblindly":39458,"ectar":39459,"endish":39460,"Ġpigment":39461,"cellent":39462,"Ġyells":39463,"ĠLust":39464,"ĠAttacks":39465,"ĠSyndicate":39466,"otin":39467,"gress":39468,"reenshot":39469,"picking":39470,"Ġacupuncture":39471,"images":39472,"glas":39473,"ĠPolicies":39474,"Ġintestinal":39475,"1998":39476,"ULE":39477,"runs":39478,"ĠNing":39479,"ĠAsuka":39480,"ĠSkull":39481,"Motor":39482,"Ġdefund":39483,"Ġattaching":39484,"ĠBAD":39485,"Ġquarrel":39486,"Child":39487,"Dog":39488,"issan":39489,"irmation":39490,"Ġinline":39491,"ĠLover":39492,"Ġcyan":39493,"entary":39494,"awareness":39495,"Ġtraveller":39496,"âĢIJ":39497,"Ġbeasts":39498,"Ġboobs":39499,"ĠDeadly":39500,"Ġplutonium":39501,"ĠIntellectual":39502,"Jam":39503,"Ġconsec":39504,"663":39505,"ĠVegan":39506,"Ġ331":39507,"uron":39508,"ĠHEL":39509,"reements":39510,"Ġclone":39511,"Ġoutputs":39512,"oult":39513,"ĠDOM":39514,"ĠNX":39515,"Ze":39516,"909":39517,"brate":39518,"arations":39519,"ĠJindal":39520,"Ġbooklet":39521,"amide":39522,"Ġscraping":39523,"Sol":39524,"Date":39525,"796":39526,"Ġfulf":39527,"Ġskeletons":39528,"Ġsaints":39529,"ĠCurious":39530,"Han":39531,"Ġrepud":39532,"osity":39533,"ĠGravity":39534,"Ġmetadata":39535,"Focus":39536,"Ġthrott":39537,"ĠProgramming":39538,"Break":39539,"erver":39540,"Ġknight":39541,"yrs":39542,"Ġ376":39543,"sat":39544,"auto":39545,"Ġbroom":39546,"Ġnerd":39547,"Political":39548,"022":39549,"-------------":39550,"oulos":39551,"Ġrelic":39552,"Ġenactment":39553,"rious":39554,"ĠUniform":39555,"Teen":39556,"Colorado":39557,"055":39558,"Ġangled":39559,"bolt":39560,"ĠNeander":39561,"ĠDism":39562,"thanks":39563,"Polit":39564,"ersion":39565,"dro":39566,"install":39567,"Jake":39568,"hz":39569,"Ġ770":39570,"ĠCommodore":39571,"lahoma":39572,"Ġshri":39573,"Ġ....":39574,"Ġ7000":39575,"scope":39576,"Ġgenesis":39577,"Ġresided":39578,"ĠRivals":39579,"Ġsarcastic":39580,"Ġelicit":39581,"Ġmultiplied":39582,"uitous":39583,"Ġoppress":39584,"ĠPROT":39585,"Ġperpetually":39586,"ĠAdds":39587,"Ġbuffers":39588,"Ġmush":39589,"Ġ354":39590,"Ġpresc":39591,"ĠKung":39592,"682":39593,"Education":39594,"Ġpled":39595,"bsp":39596,"Ġconfessions":39597,"Ġrevocation":39598,"Micro":39599,"ĠHobby":39600,"ĠFatal":39601,"STAR":39602,"Ġworkspace":39603,"Ġtransformations":39604,"Ġportals":39605,"orned":39606,"figured":39607,"Ġlinguistic":39608,"pperc":39609,"ergus":39610,"Fel":39611,"ĠIntent":39612,"Ġ289":39613,"Ġdelinquent":39614,"Ġhandwriting":39615,"Ġvap":39616,"576":39617,"redited":39618,"736":39619,"Ġpsychiatry":39620,"GMT":39621,"Ġdisingen":39622,"Ġcrou":39623,"801":39624,"Ġmalice":39625,"itutes":39626,"ĠTiff":39627,"Ġstink":39628,"574":39629,"Story":39630,"Modern":39631,"ĠGly":39632,"Jamie":39633,"Ġadvertis":39634,"Ġhiber":39635,"Ġinfiltr":39636,"Ġelector":39637,"rovers":39638,"ĠFist":39639,"peed":39640,"ĠClassical":39641,"592":39642,"Ġconscientious":39643,"Surv":39644,"Text":39645,"ĠDrunk":39646,"Ġsupplemented":39647,"THIS":39648,"Ġtimid":39649,"Ġstacking":39650,"rites":39651,"Ġrebirth":39652,"Ġbalcon":39653,"Ġyawn":39654,"rosc":39655,"axy":39656,"Hart":39657,"ĠOPER":39658,"996":39659,"Ġrabid":39660,"ĠTick":39661,"Ġgrinning":39662,"elfth":39663,"045":39664,"Ġjustifies":39665,"ĠPirate":39666,"ĠSalary":39667,"Ġmirac":39668,"613":39669,"inately":39670,"ĠLIN":39671,"Ġinadequ":39672,"NPR":39673,"iddled":39674,"storage":39675,"Ġseventy":39676,"onet":39677,"Ġgastro":39678,"FIR":39679,"Ġrodent":39680,"629":39681,"ĠInclude":39682,"ĠCategories":39683,"ĠLiterally":39684,"Ġpree":39685,"aunder":39686,"ĠLOL":39687,"694":39688,"Ġindef":39689,"Ped":39690,"Ġmenstru":39691,"Ġcensored":39692,"Ġconfigure":39693,"Ġoverest":39694,"igenous":39695,"Ġrectangular":39696,"ĠMIS":39697,"ĠMub":39698,"Ġwitches":39699,"izards":39700,"Ġobnoxious":39701,"ĠLoll":39702,"ĠSEM":39703,"Ġspiritually":39704,"Ġcoer":39705,"Ġmodesty":39706,"butt":39707,"Ġedits":39708,"ĠShall":39709,"sburgh":39710,"Ġ1911":39711,"Rex":39712,"manent":39713,"ĠLithuan":39714,"Ġpointers":39715,"ativity":39716,"retch":39717,"Ġcascade":39718,"ĠRagnarok":39719,"ĠPainting":39720,"ĠATL":39721,"Born":39722,"Ġpadding":39723,"whel":39724,"Ġgrotesque":39725,"Ġtheorists":39726,"forcer":39727,"ĠJinn":39728,"Ġrenal":39729,"jamin":39730,"ĠFEC":39731,".\"\"":39732,"redict":39733,"Ġoppos":39734,"opted":39735,"Sel":39736,"ipment":39737,"752":39738,"792":39739,"Pur":39740,"Ġvolt":39741,"Ġflap":39742,"ĠCASE":39743,"Ġdyed":39744,"orers":39745,"becca":39746,",.":39747,"ifice":39748,"ubes":39749,"Ġyr":39750,"DW":39751,"Ġalteration":39752,"ĠSimpl":39753,"Ġunequiv":39754,"756":39755,"Dou":39756,"Ġplunder":39757,"Ġcommons":39758,"Ġstag":39759,"ĠZeal":39760,"avanaugh":39761,"Self":39762,"none":39763,"EGIN":39764,"Ġflashback":39765,"VAL":39766,"Gab":39767,"ĠCapture":39768,"ĠBrilliant":39769,"ĠDisk":39770,"ĠMood":39771,"Ġhaun":39772,"Ġrotting":39773,"ĠCobra":39774,"Ġpsychopath":39775,"Ġhelper":39776,"Starting":39777,"ĠOrbit":39778,"Ġcaf":39779,"Half":39780,"Volume":39781,"aptop":39782,"ĠSaga":39783,"azor":39784,"593":39785,"774":39786,"ĠCaucasian":39787,"compan":39788,"ĠVERY":39789,"GES":39790,"Ġvomit":39791,"Ġdispro":39792,"ĠMechanics":39793,"Ġ385":39794,"Ġmystical":39795,"AFTA":39796,"Ġbacter":39797,"availability":39798,"Ġhairc":39799,"ĠVec":39800,"rypt":39801,"Ġmanipulative":39802,"shell":39803,"ĠWeird":39804,"jab":39805,"ĠByr":39806,"Bow":39807,"uin":39808,"Ġquot":39809,"MX":39810,"Ġ960":39811,"ĠSharia":39812,"ĠWeapon":39813,"ĠPowerPoint":39814,"Ġstitching":39815,"Ġconstraint":39816,"âľ":39817,"ulic":39818,"597":39819,"omedical":39820,"ĠSupplemental":39821,"ĠSurve":39822,"ĠSubcommittee":39823,"ĠDarkness":39824,"Ġpython":39825,"LU":39826,"Ġ402":39827,"ĠQuan":39828,"ĠModerate":39829,"clusively":39830,"Ġextrap":39831,"Ġlatt":39832,"ĠSTUD":39833,"oslav":39834,"Ġsymb":39835,"battle":39836,"flash":39837,"ĠDeploy":39838,"Ġmicrobiome":39839,"Ġingested":39840,"Ġdistort":39841,"Ġassimil":39842,"Ġmobs":39843,"illet":39844,"Gre":39845,"Ġ294":39846,"Ġforbids":39847,"ĠEfficiency":39848,"ĠClan":39849,"763":39850,"Ġdragons":39851,"States":39852,"ĠMAKE":39853,"ĠBOOK":39854,"ĠRuns":39855,"ĠUX":39856,"EED":39857,"Whoever":39858,"ionics":39859,"worldly":39860,"ĠMermaid":39861,"Ġbenz":39862,"Info":39863,"523":39864,"Ġbiod":39865,"ĠPoison":39866,"ceivable":39867,"Services":39868,"ATIVE":39869,"ĠItem":39870,"Ġdisav":39871,"Ġheter":39872,"Ġasteroids":39873,"ĠWooden":39874,"Ġelectroly":39875,"assadors":39876,"nance":39877,"reflect":39878,"Ġattent":39879,"iphany":39880,"Ġspaceship":39881,"Ġbegg":39882,"algia":39883,"Ax":39884,"Ġidiosyncr":39885,"Ġinserting":39886,"ĠCSS":39887,"ĠLET":39888,"ĠStrikes":39889,"ossibly":39890,"Exp":39891,"Opp":39892,"dden":39893,"Ġplayable":39894,"ĠJM":39895,"Ġlawfully":39896,"ĠBlink":39897,"Ġ413":39898,"Ġoverpowered":39899,"Ġcommenter":39900,"Track":39901,"Ġmethyl":39902,"Ġfermented":39903,"Ġinvaders":39904,"ĠMoves":39905,"Ġcommunicates":39906,"rint":39907,"ĠTray":39908,"jug":39909,"Ġsuperf":39910,"ochet":39911,"ĠJelly":39912,"Ġestrogen":39913,"Dom":39914,"mix":39915,"Gun":39916,"ochemistry":39917,"952":39918,"Ġovere":39919,"ĠPlaintiff":39920,"ĠPilgrim":39921,"ĠSERVICES":39922,"ĠExpend":39923,"ĠFRE":39924,"Ġsmelling":39925,"ĠSpaces":39926,"bris":39927,"Mission":39928,"Ġarter":39929,"Ġautonom":39930,"Lisa":39931,"ĠPercent":39932,"NK":39933,"ĠLimits":39934,"Ġ356":39935,"Recent":39936,"ĠSiberian":39937,"etermin":39938,"nets":39939,"ĠSword":39940,"essee":39941,"Ùĩ":39942,"icycle":39943,"Ġparas":39944,"Ġrud":39945,"Ġscrib":39946,"Ġ1860":39947,"Shop":39948,"orld":39949,"Ġpept":39950,"ENSE":39951,"Ġanimations":39952,"ership":39953,"Search":39954,"ĠUSSR":39955,"washed":39956,"Ġpromulg":39957,"Ġdetainee":39958,"Ġunderest":39959,"ĠAppropri":39960,"Left":39961,"Update":39962,"Wallet":39963,"idently":39964,"ĠBicycle":39965,"Ġgorge":39966,"abyte":39967,"ĠMinecraft":39968,"rike":39969,"997":39970,"Tesla":39971,"Often":39972,"ĠTHESE":39973,"Ġregression":39974,"Hen":39975,"Ġsnippets":39976,"irds":39977,"Ġprinces":39978,"Ġwastes":39979,"ĠWond":39980,"itimate":39981,"ĠMongol":39982,"ĠkW":39983,"Ġidiots":39984,"Ġforeigner":39985,"Upon":39986,"Ġbackdoor":39987,"umph":39988,"ĠSquirrel":39989,"Ġtyped":39990,"Ġblockers":39991,"Vote":39992,"ĠPossibly":39993,"geist":39994,"ĠTRANS":39995,"Ġtitan":39996,"VG":39997,"Ġmicrobi":39998,"Ġinteracts":39999,"Ġmasc":40000,"Ġfinite":40001,"Ġcutoff":40002,"ornings":40003,"Ġprototyp":40004,"Ġcompan":40005,"mology":40006,"ĠBOX":40007,"Cre":40008,"Bot":40009,"grading":40010,"PET":40011,"Ġinsidious":40012,"ĠFranch":40013,"orians":40014,"ĠAUT":40015,"ĠCrush":40016,"589":40017,"question":40018,"anguard":40019,"Ġabsurdity":40020,"?\",":40021,"Hum":40022,"Ġliberalism":40023,"Ġpostwar":40024,"Gener":40025,"Personally":40026,"889":40027,"Bul":40028,"Ġlighthouse":40029,"Ġ291":40030,"VK":40031,"ĠExposure":40032,"Ġsubtract":40033,"ometime":40034,"arbon":40035,"ĠThieves":40036,"anus":40037,"ĠLibertarian":40038,"Raw":40039,"Ġsolvent":40040,"Ġcorros":40041,"Ġsignific":40042,"Ġscholarly":40043,"024":40044,"Ġfetish":40045,"Ġlarvae":40046,"Ġcatast":40047,"Ġtraitor":40048,"ijing":40049,"Demand":40050,"math":40051,"Ġconceivable":40052,"either":40053,"acl":40054,"ĠArrows":40055,"627":40056,"ĠFrankenstein":40057,"entious":40058,"Ġimitation":40059,"amn":40060,"ĠSTOP":40061,"Ġcripp":40062,"zag":40063,"ĠZed":40064,"797":40065,"Along":40066,"Ġwont":40067,"Ġfolds":40068,"Shar":40069,"ĠCommentary":40070,"ĠLibraries":40071,"ĠThunderbolt":40072,"itud":40073,"Toy":40074,"Ġincidentally":40075,"ĠResp":40076,"Ġordinarily":40077,"Ġvanish":40078,"acterial":40079,"Minnesota":40080,"rank":40081,"614":40082,"ĠExam":40083,"Got":40084,"Ġsnipers":40085,"ETHOD":40086,"dirty":40087,"igsaw":40088,"Obs":40089,"ĠAuthors":40090,"Ġillustrating":40091,"782":40092,"864":40093,"Ġblinded":40094,"transfer":40095,"Ġspawning":40096,"ĠDiary":40097,"ĠDNS":40098,"CG":40099,"someone":40100,"Ġcruc":40101,"Morgan":40102,"Learn":40103,"API":40104,"toc":40105,"STAT":40106,"ĠFlame":40107,"aganda":40108,"ĠBenef":40109,"stuff":40110,"SEA":40111,"Ġincest":40112,"Normally":40113,"ĠRU":40114,"Ġarsenic":40115,"isine":40116,"ĠTG":40117,"Type":40118,"regn":40119,"Cass":40120,"Touch":40121,"Site":40122,"Ġpict":40123,"Ġcorrupted":40124,"729":40125,"Ġnineteen":40126,"Ġparaph":40127,"Ġtavern":40128,"Ġretard":40129,"ĠKaf":40130,"Ġcolleg":40131,"bucks":40132,"imum":40133,"ĠCandle":40134,"ĠMisc":40135,"ĠAwesome":40136,"edited":40137,"ĠDN":40138,"otomy":40139,"Ġdisclaimer":40140,"798":40141,"ĠGoodbye":40142,"ucle":40143,"atom":40144,"Judge":40145,"cipl":40146,"Ġinexplicable":40147,"iddler":40148,"781":40149,"Ġempirical":40150,"Veter":40151,"Ġascert":40152,"Ġaest":40153,"Ġlaz":40154,"binary":40155,"Ġ358":40156,"contained":40157,"Ġmultipl":40158,"ocado":40159,"Ġdelusional":40160,"Ġaeros":40161,"udence":40162,"Ġjargon":40163,"estine":40164,"Ġarbitrarily":40165,"Ġprick":40166,"BACK":40167,"amines":40168,"Mess":40169,"Knowing":40170,"ublic":40171,"ĠWarfare":40172,"Ġsignify":40173,"Ġfragmentation":40174,"Tex":40175,"Ġnin":40176,"Ġdise":40177,"882":40178,"hospital":40179,"volent":40180,"Need":40181,"Ġinfer":40182,"Sony":40183,"783":40184,"YING":40185,"Ġinfinity":40186,"ĠFortress":40187,"Ġmustache":40188,"Ġcorresponds":40189,"DX":40190,"Ġunmarried":40191,"ĠCruel":40192,"Ġ1901":40193,"Ġappropri":40194,"ZI":40195,"Ġphosph":40196,"901":40197,"IFE":40198,"Ġ347":40199,"Ġconvoluted":40200,"ĠApost":40201,"htm":40202,"Ġilluminating":40203,"568":40204,"Ġassassinate":40205,"Ġparam":40206,"Ġimpractical":40207,"cedes":40208,"ĠProcedure":40209,"ĠMouth":40210,"Battle":40211,"Ġ451":40212,"Sand":40213,"Ġcontamin":40214,"Hour":40215,"Cell":40216,"BIL":40217,"Ġprecon":40218,"ĠScor":40219,"Ġconfig":40220,"ĠMuscle":40221,"Ġhive":40222,"Ġunderworld":40223,"plement":40224,"Ġpostage":40225,"Ġinterpersonal":40226,"Ġpierced":40227,"Ġcharms":40228,"oscopic":40229,"ASC":40230,"ĠDex":40231,"render":40232,"png":40233,"Ġcritiques":40234,"992":40235,"ĠVinyl":40236,"Bear":40237,"idia":40238,"ĠTemp":40239,"Ġcyn":40240,"ĠBCE":40241,"Ġpatriarchal":40242,"Ġantagonist":40243,"ĠGMO":40244,"Ġunnatural":40245,"Race":40246,"imeo":40247,"ĠUkrainians":40248,"Train":40249,"Ġ329":40250,"ritten":40251,"igil":40252,"Lin":40253,"alus":40254,"*****":40255,"olded":40256,"ĠPegasus":40257,"Bas":40258,"photos":40259,"Ġ820":40260,"Ġsquadron":40261,"ESE":40262,"Ġ373":40263,"Uk":40264,"Lost":40265,"Store":40266,"ĠScenes":40267,"JJ":40268,"Ġlick":40269,"Tyler":40270,"cius":40271,"lishing":40272,"ocl":40273,"Ġassoci":40274,"ensitivity":40275,"entanyl":40276,"Rum":40277,"Ġ443":40278,"onding":40279,"Ġpedals":40280,"ĠPsychological":40281,"Ġthro":40282,"Network":40283,"591":40284,"Pick":40285,"Ġchords":40286,"ĠHound":40287,"entials":40288,"faces":40289,"ĠYin":40290,"ugi":40291,"bows":40292,"ĠForms":40293,"886":40294,"Ox":40295,"Ġ351":40296,"Ġmating":40297,"Ġchirop":40298,"916":40299,"Ġexpend":40300,"Ġusefulness":40301,"Marvel":40302,"ĠStretch":40303,"omez":40304,"ĠJS":40305,"Hal":40306,"fle":40307,"ĠCountdown":40308,"ĠLH":40309,"assian":40310,"vd":40311,"ĠTranscript":40312,"ĠExtrem":40313,"idine":40314,"ustainable":40315,"ederal":40316,"ĠOwl":40317,"Ġcreed":40318,"ĠGrateful":40319,"Ġprenatal":40320,"________________________________":40321,"ĠElements":40322,"â̦)":40323,"nesia":40324,"ARGET":40325,"Ġboredom":40326,"Ġdepictions":40327,"verbal":40328,"ĠeSports":40329,"Laura":40330,"ilage":40331,"ĠGalactic":40332,"Investigators":40333,"Ġscattering":40334,"instein":40335,"ĠExperiment":40336,"ĠRecre":40337,"Ġregul":40338,"Ġrelent":40339,"STE":40340,"Ġslicing":40341,"igans":40342,"raped":40343,"ĠDeter":40344,"Ġsmoker":40345,"ĠWikimedia":40346,"pages":40347,"Ted":40348,"713":40349,"Ġpuberty":40350,"Ġhars":40351,"ĠStarter":40352,"patch":40353,"leeve":40354,"Ġ346":40355,"ĠAccessories":40356,"ventions":40357,"ĠSTAND":40358,"ĠUrug":40359,"ĠOccupy":40360,"Ġbinds":40361,"ĠBubble":40362,"Ġincorporation":40363,"Ġstereotypical":40364,"Ġgor":40365,"987":40366,"Ġevils":40367,"tower":40368,"Ġastronomer":40369,"Ble":40370,"ĠNid":40371,"ĠWidow":40372,"Ġpaw":40373,"Ġinnoc":40374,"ĠOWN":40375,"Ġtofu":40376,"drops":40377,"ĠEval":40378,"693":40379,"Collins":40380,"penter":40381,"ĠNib":40382,"Ġsmokes":40383,"Ġ1850":40384,"Ġtechno":40385,"oooo":40386,"ĠUnic":40387,"ĠKirin":40388,"\":[\"":40389,"Ġincrements":40390,"989":40391,"oodoo":40392,"ĠCyborg":40393,"Ġcures":40394,"ĠOW":40395,"ĠAnnex":40396,"behavior":40397,"/-":40398,"Ġbuggy":40399,"onent":40400,"Bey":40401,"Ġsummarize":40402,"putable":40403,"Ġfri":40404,"Gi":40405,"urances":40406,"ĠAppalach":40407,"Ġhegemony":40408,"ĠOrigins":40409,"Ġconnectors":40410,"ĠAST":40411,"object":40412,"ĠSlay":40413,"Arm":40414,"oston":40415,"ĠEVEN":40416,"Ġprophecy":40417,"Bright":40418,"ĠVector":40419,"Marg":40420,"omical":40421,"Holy":40422,"ĠRPM":40423,"ĠReceiver":40424,"Ġtracts":40425,"boss":40426,"Ġblurry":40427,"aspx":40428,"DES":40429,"Ġcess":40430,"ĠAster":40431,"anything":40432,"levard":40433,"unciation":40434,"jong":40435,"Ġiv":40436,"Common":40437,"ĠDistance":40438,"imus":40439,"outheast":40440,"Ġcir":40441,"ĠCato":40442,"Ġinscribed":40443,"ersed":40444,"Ġanarchy":40445,"Ġplagiar":40446,"Ġthug":40447,"Actor":40448,"ĠTant":40449,"Researchers":40450,"remember":40451,"Ġitch":40452,"Ġrefill":40453,"Ġsucker":40454,"ĠWANT":40455,"RAG":40456,"rencies":40457,"ĠTape":40458,"Ġattaches":40459,"nb":40460,"Tan":40461,"Ġappend":40462,"Ġalas":40463,"951":40464,"panel":40465,"Climate":40466,"icrobial":40467,"Brandon":40468,"ĠFreud":40469,"Ġfungi":40470,"Ġcommenters":40471,"ĠDelicious":40472,"Ġhitherto":40473,"conv":40474,"Ġchemist":40475,"Ġdenominations":40476,"ĠBehavior":40477,"comed":40478,"ĠLantern":40479,"ĠFloating":40480,"magic":40481,"ĠBarbar":40482,"bender":40483,"iliar":40484,"unny":40485,"Ġretracted":40486,"atars":40487,"ĠLovely":40488,"Ġinfinitely":40489,"Ġhumili":40490,"Ġinterestingly":40491,"Ġmunicip":40492,"ĠPanic":40493,"Ġcomprehension":40494,"ĠMassacre":40495,"Ġpersuasion":40496,"enf":40497,"Ġcoded":40498,"higher":40499,"chart":40500,"umbered":40501,"ĠIndigo":40502,"Ġthinker":40503,"Ġgoof":40504,"ĠPetition":40505,"fascist":40506,"absor":40507,"Ġassay":40508,"ĠClassification":40509,"Ġhalluc":40510,"speech":40511,"issues":40512,"Ġinexper":40513,"ĠLibre":40514,"Ġsling":40515,"zech":40516,"Ġpouch":40517,"ĠOffense":40518,"ĠHF":40519,"Fight":40520,"026":40521,"ĠTrident":40522,"fm":40523,"Ġintox":40524,"Ġ465":40525,"colonial":40526,"ovies":40527,"794":40528,"Techn":40529,"undreds":40530,"Ġchildish":40531,"arenthood":40532,"ĠShade":40533,"Host":40534,"Ġdirectional":40535,"reader":40536,"rimp":40537,"ĠEater":40538,"prep":40539,"Ġmeas":40540,"Ġlatch":40541,"inant":40542,"nels":40543,"finished":40544,"application":40545,"Board":40546,"Ġfiller":40547,"ivably":40548,"CAST":40549,"Ġstereotyp":40550,"Ġwarranties":40551,"ĠProbe":40552,"Ġspontaneously":40553,"Ġtropes":40554,"Meg":40555,"ĠHandling":40556,"hemer":40557,"986":40558,"ĠSly":40559,"plates":40560,"Ġmolten":40561,"ĠHIT":40562,"strings":40563,"Ġcentrif":40564,"ĠENG":40565,"Indeed":40566,"Ġ429":40567,"Ġsly":40568,"Ġ490":40569,"Ġhordes":40570,"boot":40571,"691":40572,"ihara":40573,"Ġsubversive":40574,"Russell":40575,"aceous":40576,"wk":40577,"Ġreverence":40578,"Ġingenious":40579,"holiday":40580,"eligible":40581,"ĠTactical":40582,"978":40583,"herence":40584,"Ġgimm":40585,"Ġarchaic":40586,"Ġadam":40587,"Ġ297":40588,"Father":40589,"ĠLerner":40590,"Ġhesitated":40591,"Safety":40592,"Ġawakened":40593,"ueller":40594,"Ġextrater":40595,"Ġmummy":40596,"ĠBuddhism":40597,"Ġ359":40598,"Ġlegions":40599,"Ġprehistoric":40600,"ancouver":40601,"Ġmelancholy":40602,"ĠEnemy":40603,"ĠSyl":40604,"ĠRobo":40605,"verting":40606,"ĠBullets":40607,"essler":40608,"Ġmarvelous":40609,"ĠBened":40610,"Ġsavior":40611,"omever":40612,"Bee":40613,"Ġrapp":40614,"Ġpredomin":40615,"ĠScripture":40616,"Ġsnapshots":40617,"Ġunrem":40618,"Ġsquid":40619,"ĠBuddh":40620,"ĠSantorum":40621,"Internet":40622,"avoid":40623,"Ġunamb":40624,"Ġ296":40625,"Ġnexus":40626,"Ġinterchangeable":40627,"ockets":40628,"Ġfoll":40629,"ĠOPT":40630,"023":40631,"²":40632,"Ġhereditary":40633,"Ġvape":40634,"=\"":40635,"1996":40636,"س":40637,"Emergency":40638,"Ġneb":40639,"Ġisot":40640,"Ġdiam":40641,"stairs":40642,"ĠAppendix":40643,"venient":40644,"Ġinvol":40645,"Ġtheorist":40646,"Ġconqu":40647,"Mich":40648,"ĠSort":40649,"antasy":40650,"dating":40651,"771":40652,"Ġape":40653,"Ġindemn":40654,"ween":40655,"Games":40656,"ascal":40657,"Muslims":40658,"Ġleaflets":40659,"Ġtraverse":40660,"Ġtransgress":40661,"Ġflushed":40662,"893":40663,"lasses":40664,"obos":40665,"ooming":40666,"Ġtou":40667,"mast":40668,"âģ":40669,"751":40670,"Either":40671,"Ġgrate":40672,"urgy":40673,"Ġendowed":40674,"ĠRasm":40675,"Nat":40676,"odka":40677,"olon":40678,"iants":40679,"Ġsensations":40680,"Ġsituational":40681,"pox":40682,"Figure":40683,"Ġslime":40684,"Ġ421":40685,"ollow":40686,"Ġanesthesia":40687,"adult":40688,"ĠPiece":40689,"994":40690,"ĠAnalog":40691,"Iv":40692,"flo":40693,"Ġdomest":40694,"Ġcabal":40695,"Ġgarg":40696,"Ġrabb":40697,"REC":40698,"ISTORY":40699,"Friend":40700,"Ġancestor":40701,"ĠLets":40702,"Ġelf":40703,"Ġlobb":40704,"ĠAdren":40705,"silver":40706,"astical":40707,"Ġstitch":40708,"028":40709,"Hug":40710,"Ġmoss":40711,"ompl":40712,"Ġunob":40713,"883":40714,"Ġcortex":40715,"olutely":40716,"052":40717,"Seattle":40718,"restling":40719,"endment":40720,"Ġ366":40721,"ventus":40722,"ĠRated":40723,"ĠClever":40724,"Ġcloak":40725,"phrase":40726,"flake":40727,"Ġphilosophies":40728,"784":40729,"Ġskulls":40730,"wake":40731,"oru":40732,"ĠACTION":40733,"Ġcomprom":40734,"ĠManufacturer":40735,"ĠImprove":40736,"Ns":40737,"ĠRevenge":40738,"lords":40739,"Ġ417":40740,"iddles":40741,"Ġcondesc":40742,"tiny":40743,"Ġchloride":40744,"greg":40745,"ĠREST":40746,"subject":40747,"Ġundes":40748,"ftime":40749,"Ġbottleneck":40750,"ĠZombie":40751,"Ġhabitable":40752,"Ġcigars":40753,"Ġenlarg":40754,"icester":40755,"ðĿ":40756,"regulation":40757,"arters":40758,"Ġformulations":40759,"Ġadhesive":40760,"Ġ344":40761,"pod":40762,"etitive":40763,"Ġcontinuum":40764,"aghd":40765,"Ġ701":40766,"Ġdisband":40767,"Tu":40768,"Ġcivilisation":40769,"ĠPCI":40770,"Ġcrooked":40771,"ammy":40772,"Ġbrim":40773,"Jr":40774,"ĠBunker":40775,"plot":40776,"Ġwielded":40777,"Ġcaricature":40778,"ĠInfinite":40779,"piracy":40780,"aretz":40781,"Ġstares":40782,"incinnati":40783,"agents":40784,"ĠObamaCare":40785,"asuring":40786,"ansion":40787,"Ġastonished":40788,"iovascular":40789,"Bio":40790,"Ġadvisable":40791,"Ġsender":40792,"887":40793,"Led":40794,"DN":40795,"Ġaggregation":40796,"ĠInnocent":40797,"ĠTransactions":40798,"worms":40799,"ĠWorm":40800,"Ġ363":40801,"ĠBiblical":40802,"rared":40803,"Ġgazing":40804,"chant":40805,"Ġsubordinates":40806,"1600":40807,"actually":40808,"olition":40809,"ĠRTX":40810,"ĠPyramid":40811,"alph":40812,"ĠFPS":40813,"Ġerrone":40814,"ĠLR":40815,"Scientists":40816,"Ġincons":40817,"Ġbrittle":40818,"027":40819,"ĠBowser":40820,"Rub":40821,"links":40822,"ĠWik":40823,"ussion":40824,"Marsh":40825,"resents":40826,"Clean":40827,"Ġbrute":40828,"ĠInventory":40829,"1100":40830,"ĠATK":40831,"793":40832,"Ġcaveats":40833,"ĠKnot":40834,"IRT":40835,"ĠCanad":40836,"isma":40837,"entin":40838,"Own":40839,"Ġ455":40840,"Ġlesions":40841,"ĠAres":40842,"ĠKali":40843,"Ġpaws":40844,"Auto":40845,"Ġdiscrim":40846,"044":40847,"ĠCOUN":40848,"Ġ1905":40849,"Ġexperien":40850,"Ġ406":40851,"achelor":40852,"Ġscarcely":40853,"Ġsynchronized":40854,"Rat":40855,"Blake":40856,"Ġrewriting":40857,"Ġcannons":40858,"stem":40859,"Apparently":40860,"Ġleveling":40861,"?]":40862,"Ġfins":40863,"ĠTone":40864,"ogether":40865,"Sound":40866,"Ġmicrosc":40867,"ĠAsylum":40868,"Ġindividuality":40869,"Ġ432":40870,"lease":40871,"Chuck":40872,"Ġhating":40873,"Ġleftists":40874,"ĠPersonality":40875,"ĠBundle":40876,"Dutch":40877,"Ġtransformer":40878,"iami":40879,"ĠTradition":40880,"ĠRecipes":40881,"Ġdiscour":40882,"Viol":40883,"Ext":40884,"ĠOliv":40885,"ashington":40886,"Ġmillennia":40887,"Ġpsychiatrists":40888,"ĠTrilogy":40889,"inction":40890,"Ġdisliked":40891,"088":40892,"954":40893,"Ġoverloaded":40894,"Ġopium":40895,"acus":40896,"resources":40897,"mud":40898,"ometry":40899,"Hit":40900,"Ġguild":40901,"Ġabyss":40902,"884":40903,"ensity":40904,"ĠDifference":40905,"Electric":40906,"authent":40907,"Ġdownloadable":40908,"ellar":40909,"ĠSavior":40910,"ĠFRI":40911,"Ġ445":40912,"Ġincidental":40913,"Ġanalogue":40914,"ounters":40915,"ĠBuilder":40916,"Ġnarration":40917,"ategor":40918,"raise":40919,"Ġindoctr":40920,"Aren":40921,"Ġbaptism":40922,"Ġobe":40923,"Ġtubing":40924,"apsed":40925,"Fortunately":40926,"gered":40927,"Pict":40928,"Ġmastering":40929,"ĠHIM":40930,"ĠObesity":40931,"Ġornament":40932,"advant":40933,"ĠCous":40934,"032":40935,"cells":40936,"Ġpreclude":40937,"Ġanecdote":40938,"Ġpatriarchy":40939,"ĠSending":40940,"Pie":40941,"Ġdepressive":40942,"ĠEnds":40943,"712":40944,"zos":40945,"icka":40946,"Ġ1906":40947,"Anti":40948,"vana":40949,"ĠRestrict":40950,"Ġprotr":40951,"Ġusername":40952,"Ġparach":40953,"1997":40954,"imental":40955,"rower":40956,"carb":40957,"033":40958,"Ġobligatory":40959,"Ġwillful":40960,"Ġsnail":40961,"json":40962,"izarre":40963,"Ġmiscar":40964,"Ġdopamine":40965,"л":40966,"Ġapplic":40967,"Ġnervously":40968,"YY":40969,"alez":40970,"ĠSoviets":40971,"ĠMister":40972,"Ġcrates":40973,"Ġheavenly":40974,"Ġdoct":40975,"048":40976,"Ġ2400":40977,"ivia":40978,"adies":40979,"Phone":40980,"asks":40981,"Ġperenn":40982,"Ġcomposing":40983,"Ġraiding":40984,"requent":40985,"ibli":40986,"ĠFeedback":40987,"cellaneous":40988,"ĠContracts":40989,"ĠCasting":40990,"vim":40991,"Cut":40992,"Ġabbrevi":40993,"Ġintest":40994,"ricted":40995,"969":40996,"nostic":40997,"Ġinverted":40998,"ĠEG":40999,"aiden":41000,"ĠClaud":41001,"ĠiP":41002,"urized":41003,"Emily":41004,"Ġ353":41005,"Ġ((":41006,"ammad":41007,"Reb":41008,"plom":41009,"YES":41010,"connection":41011,"ĠWra":41012,"ĠMerch":41013,"Ġether":41014,"Elizabeth":41015,"Chip":41016,"relevant":41017,"URA":41018,"Ġantioxidant":41019,"ĠChron":41020,"Ġtheological":41021,"HCR":41022,"ruits":41023,"Body":41024,"enezuel":41025,"Few":41026,"adder":41027,"Ġinducing":41028,"ĠDarth":41029,"Ġimplicitly":41030,"Ġoverfl":41031,"Ġrelics":41032,"Must":41033,"ĠAnswers":41034,"Ġretina":41035,"ĠSlowly":41036,"ĠShib":41037,"software":41038,"Ġ\"\"":41039,"hack":41040,"Apart":41041,"told":41042,"Ger":41043,"Civil":41044,"problem":41045,"Ġslang":41046,"Ġtactile":41047,"Ġtabl":41048,"ĠAscension":41049,"Ġhumankind":41050,"Howard":41051,"rescent":41052,"ĠReleases":41053,"arijuana":41054,"Christopher":41055,"ĠWarden":41056,"blogspot":41057,"ĠVari":41058,"idency":41059,"ĠHandler":41060,"Round":41061,"MJ":41062,"Ġrhyth":41063,"Tai":41064,"terson":41065,"Ġ,\"":41066,"portation":41067,"ĠOrbital":41068,"Ġfantas":41069,"Ġattribut":41070,"Ġdiagram":41071,"atech":41072,"1992":41073,"ibl":41074,"Woman":41075,"ternally":41076,"Days":41077,"Ġdebunk":41078,"ĠPhant":41079,"ĠOath":41080,"sharp":41081,"Ġclaws":41082,"Lots":41083,"Incre":41084,"Aff":41085,"hooting":41086,"rect":41087,"Ġaltru":41088,"Ġwors":41089,"Ġtho":41090,"Ġ349":41091,"clusions":41092,"Ġpseudonym":41093,"Bec":41094,"Ġphosphorus":41095,"ivic":41096,"Ġ348":41097,"otent":41098,"Ġub":41099,"Ġcoales":41100,"regate":41101,"Ġ1870":41102,"Ġglide":41103,"treated":41104,"ĠSymb":41105,"Ġenchant":41106,"Besides":41107,"stocks":41108,"Ġ388":41109,"--------------":41110,"interpret":41111,"ouple":41112,"Ġdrawback":41113,"ĠRevised":41114,"Ġanat":41115,"Ġpsychosis":41116,"ب":41117,"Ġdiffuse":41118,"Ġaffidav":41119,"elve":41120,"amination":41121,"ĠTackle":41122,"hunter":41123,"env":41124,"Ġchests":41125,"Ġsubter":41126,"Ġconquest":41127,"Ġfidelity":41128,"Ġinfringing":41129,"opathic":41130,"ĠGrip":41131,"ĠKeyboard":41132,"Ġobjectionable":41133,"Ġmetabol":41134,"ĠGö":41135,"Room":41136,"...)":41137,"KEN":41138,"assic":41139,"Ġgeop":41140,"Tro":41141,"Ġcursing":41142,"Ġdile":41143,"Ġultraviolet":41144,"inarily":41145,"Ġdistilled":41146,"sect":41147,"ĠShooter":41148,"uckles":41149,"Ġdistortions":41150,"Map":41151,"Doctor":41152,"Ġinstalls":41153,"oire":41154,"Ġstarch":41155,"ociation":41156,"Lev":41157,"Ġscripture":41158,"Ġsalient":41159,"ilitating":41160,"wb":41161,"ĠSov":41162,"ĠDamn":41163,"Grey":41164,"Ġ980":41165,"Ġjung":41166,"Ġlicking":41167,"029":41168,"ĠDian":41169,"ĠBabylon":41170,"к":41171,"ĠRomantic":41172,"Ġguesses":41173,"ĠFren":41174,"Generally":41175,"ultural":41176,"istence":41177,"Ġiniti":41178,"Ġ341":41179,"ĠSlave":41180,"ultan":41181,"ĠTrash":41182,"ĠEmpty":41183,"ĠHundred":41184,"ĠDirective":41185,"Anderson":41186,"Advertisement":41187,"RH":41188,"ĠOo":41189,"ĠHik":41190,"peg":41191,"Sup":41192,"ĠXT":41193,"Ġencrypt":41194,"selage":41195,"ĠThrone":41196,"Ġconsecut":41197,"Li":41198,"ĠVirus":41199,"ĠCookies":41200,"SHIP":41201,"Ġflavorful":41202,"odynamics":41203,"animal":41204,"spread":41205,"ĠIPCC":41206,"jobs":41207,"ernand":41208,"ĠHaunted":41209,"Ġintolerable":41210,"ĠLAR":41211,"ixtape":41212,"Ġneur":41213,"Ġcausal":41214,"ĠPsychiatry":41215,"ĠVim":41216,"Ġgenomic":41217,"duration":41218,"ĠUsername":41219,"ategy":41220,"Ġunic":41221,"ĠKILL":41222,"blooded":41223,"Ġcaucuses":41224,"ĠPOLITICO":41225,"Spanish":41226,"Ġobedience":41227,"Ġinconven":41228,"MAT":41229,"Ġbends":41230,"ĠImprovements":41231,"Ġrelig":41232,"ĠForth":41233,"ĠLumia":41234,"uces":41235,"Ġunim":41236,"ĠStatistical":41237,"kb":41238,"auntlet":41239,"ĠDisco":41240,"ĠInstruction":41241,"ooo":41242,"ĠDictionary":41243,"culated":41244,"Adv":41245,"ĠAvatar":41246,"ictional":41247,"Ġcentr":41248,"ifles":41249,"orks":41250,"skill":41251,"Ġlatex":41252,"ĠPagan":41253,"Ġdevast":41254,"Ġprol":41255,"896":41256,"Product":41257,"968":41258,"Ġfrench":41259,"083":41260,"ĠCluster":41261,"cloth":41262,"ĠFilter":41263,"ĠDisorders":41264,"etimes":41265,"Ġinstinctively":41266,"ĠBritann":41267,"Ġaft":41268,"ĠVict":41269,"Ġâĺħ":41270,"Ġperverse":41271,"Ġcontraceptives":41272,"ĠHannibal":41273,"escap":41274,"ĠApostle":41275,"ĠXiao":41276,"ĠMagnum":41277,"Ġphosphate":41278,"Ġ399":41279,"utable":41280,"Ġsten":41281,"Ġwearer":41282,"Ġsmug":41283,"ĠInfluence":41284,"Ġ384":41285,"Truth":41286,"struction":41287,"Ġmaniac":41288,"ĠMagnetic":41289,"ousands":41290,"Ġsemen":41291,"dir":41292,"ĠTornado":41293,"Ġexplos":41294,"1995":41295,"Xi":41296,"Steel":41297,"057":41298,"Barn":41299,"Fan":41300,"ĠChatt":41301,"Chem":41302,"ĠFold":41303,"bees":41304,"1080":41305,"ĠMaze":41306,"ierre":41307,"oeuv":41308,"Cand":41309,"odium":41310,"mmm":41311,"ereo":41312,"Ġreactionary":41313,"Ġacidic":41314,"ĠRemoval":41315,"Ġnont":41316,"031":41317,"ĠTerminator":41318,"ĠVendor":41319,"enemy":41320,"Ġreconstructed":41321,"ĠGalileo":41322,"Ġtesters":41323,"albeit":41324,"uminium":41325,"Ġrite":41326,"ĠInput":41327,"committee":41328,"Ġjour":41329,"gements":41330,"Ġgerm":41331,"Dick":41332,"ĠRequirements":41333,"omsday":41334,"Î":41335,"ISSION":41336,"Ġmolded":41337,"Ġrye":41338,"Attorney":41339,"population":41340,"Ġrepet":41341,"Sync":41342,"breaks":41343,"Ġbanished":41344,"Ġraspberry":41345,"Ġammo":41346,"Ġorthodox":41347,"Ġwebcam":41348,"ĠAsc":41349,"vl":41350,"1989":41351,"Ġdiscipl":41352,"Ġmoreover":41353,"Ġexplodes":41354,"1960":41355,"Ġpropositions":41356,"Protect":41357,"Ġsexes":41358,"physical":41359,"ĠAthena":41360,"ocent":41361,"ĠGothic":41362,"ĠRacial":41363,"istani":41364,"Ġhelium":41365,"ĠPresumably":41366,"Ġperman":41367,"becue":41368,"ĠHW":41369,"rued":41370,"ĠCNS":41371,"DEP":41372,"ĠManifest":41373,"2500":41374,"ĠMyst":41375,"Economic":41376,"Prot":41377,"Ġledge":41378,"Ġimitate":41379,"ĠTotally":41380,"ĠBeaut":41381,"OIL":41382,"Ġ1440":41383,"Moscow":41384,"ĠSets":41385,"merga":41386,"Ġlesbians":41387,"Walker":41388,"Move":41389,"ĠSOM":41390,"ĠPsy":41391,"strument":41392,"Ġiter":41393,"ĠTosh":41394,"oola":41395,"ĠAntiqu":41396,"ĠShining":41397,"Ġobservational":41398,"VW":41399,"rophe":41400,"034":41401,"Ġcontiguous":41402,"Ġstarve":41403,"sure":41404,"Ġnegate":41405,"Ġmindless":41406,"tf":41407,"Ġdownwards":41408,"046":41409,"riors":41410,"Ġreverted":41411,"ĠAthe":41412,"Bra":41413,"eah":41414,"Rachel":41415,"Hung":41416,"Join":41417,"ĠRaces":41418,"Ġmutant":41419,"Ġuncond":41420,"Ġusability":41421,"NESS":41422,"haust":41423,"036":41424,"Ġobscurity":41425,"Ġimperialism":41426,"Ġemitting":41427,"Ġideologically":41428,"ĠIro":41429,"erva":41430,"ĠIzzy":41431,"ĠLevels":41432,"onym":41433,"ĠConspiracy":41434,"ĠSapphire":41435,"Ul":41436,"Ġhuh":41437,"ochem":41438,"Ġbehaves":41439,"ĠMesh":41440,"Ark":41441,"Ġvec":41442,"ĠActions":41443,"Ġdistinguishing":41444,"ĠTsarnaev":41445,"ĠEndurance":41446,"ederation":41447,"itant":41448,"Ġstreetcar":41449,"041":41450,"ĠAval":41451,"ĠCompanion":41452,"ĠCartoon":41453,"Ġcalculus":41454,"993":41455,"eq":41456,"ĠVanilla":41457,"MAC":41458,"wolves":41459,"fg":41460,"Ġfermentation":41461,"Ġinformants":41462,"Ġsudo":41463,"Ġperipher":41464,"Ġindign":41465,"parts":41466,"detail":41467,"femin":41468,"blade":41469,"Ġinserts":41470,"Ġoffsets":41471,"Ġantidepressants":41472,"Ġphr":41473,"Ġresultant":41474,"biology":41475,"Ġacquies":41476,"UFF":41477,"****************":41478,"ĠPenalty":41479,"Ġrever":41480,"heric":41481,"ĠShadows":41482,"command":41483,"Ġreprint":41484,"089":41485,"empty":41486,"ĠTAG":41487,"stim":41488,"FK":41489,"Ġkins":41490,"uggle":41491,"imura":41492,"wit":41493,"Kill":41494,"Beck":41495,"Ocean":41496,"Ġlabyrinth":41497,"ĠNorse":41498,"IENCE":41499,"Ġ+++":41500,"DoS":41501,"gm":41502,"Ġbarbar":41503,"ĠCeres":41504,"Ġhashing":41505,"eworthy":41506,"Ġrecite":41507,"Ġelectrodes":41508,"Ġconformity":41509,"response":41510,"olate":41511,"Ġ357":41512,"Snap":41513,"Crime":41514,"Ġpointer":41515,"ĠTIT":41516,"Ġdistinctions":41517,"Ġ427":41518,"ĠÙĪ":41519,"abases":41520,"Mars":41521,"ĠSpiritual":41522,"Ġimpuls":41523,"Philadelphia":41524,"1994":41525,"Ġcunning":41526,"Ġfram":41527,"Ġinco":41528,"Ġomnip":41529,"imize":41530,"ervative":41531,"Gy":41532,"Drug":41533,"Ġcarniv":41534,"ĠSailor":41535,"download":41536,"ĠBeetle":41537,"ĠEarthqu":41538,"izontal":41539,"Alan":41540,"Nice":41541,"Prior":41542,"MAG":41543,"Ġautobi":41544,"ĠBrill":41545,"Ġpredominant":41546,"ĠMessiah":41547,"REM":41548,"ĠSlip":41549,"ĠWebs":41550,"ademic":41551,"<":41552,"ĠVessel":41553,"vari":41554,"Code":41555,"Ġbeetle":41556,"projects":41557,"BAT":41558,"Ġpsychotic":41559,"Ġunderside":41560,"Ġrefute":41561,"Considering":41562,"kees":41563,"wd":41564,"priority":41565,"Ġtwentieth":41566,"Ġatheist":41567,"amina":41568,"Ġeuphem":41569,"Ġtripod":41570,"ĠTrayvon":41571,"ĠNON":41572,"2200":41573,"ĠNPC":41574,"ependence":41575,"ĠMHz":41576,"ĠBung":41577,"Ġpane":41578,"Ġaboriginal":41579,"ĠPLUS":41580,"igers":41581,"ĠSexy":41582,"MF":41583,"Chall":41584,"Ay":41585,"ilingual":41586,"adj":41587,"Ġfrown":41588,"successful":41589,"stack":41590,"Ġic":41591,"ĠSeah":41592,"Ġconsequ":41593,"bugs":41594,"ĠScand":41595,"ĠCurve":41596,"Nob":41597,"ĠHoo":41598,"ĠKissinger":41599,"ĠTimeline":41600,"Ġmt":41601,"Description":41602,"YP":41603,"ĠInstallation":41604,"levision":41605,"Ġanthropology":41606,"itzerland":41607,"iaries":41608,"kward":41609,"robat":41610,"Ġcarbohydrate":41611,"Phot":41612,"оÐ":41613,"ĠSQL":41614,"Disc":41615,"Ġdataset":41616,"ynski":41617,"Ġfiat":41618,"ĠDres":41619,"ĠFavor":41620,"ĠHalls":41621,"Alt":41622,"PART":41623,"Spider":41624,"Ġdisabling":41625,"RG":41626,"Ward":41627,"aturation":41628,"Ġwillfully":41629,"Ġlockout":41630,"ĠShutdown":41631,"956":41632,"Ġcommunists":41633,"Against":41634,"Ore":41635,"ĠRik":41636,"ĠASD":41637,"ĠOnion":41638,"Ġparticulars":41639,"Analy":41640,"checked":41641,"selected":41642,"romy":41643,"ĠAkira":41644,"Ġcongr":41645,"Choice":41646,"Ġbos":41647,"organisms":41648,"Ġfrowned":41649,"Tok":41650,"Bir":41651,"ĠScrib":41652,"Ġrealms":41653,"Ġcoercive":41654,"1993":41655,"021":41656,"âĢĵâĢĵ":41657,"athetic":41658,"rior":41659,"Ġfolly":41660,"ĠAMERICA":41661,"Ġcassette":41662,"953":41663,"Ġabsorbs":41664,"043":41665,"quad":41666,"''.":41667,"ĠExtract":41668,"Ġ424":41669,"Whit":41670,"Dun":41671,"Ġexerted":41672,"Ġbrethren":41673,"ĠChronicles":41674,"eric":41675,"Mot":41676,"Ġendings":41677,"piration":41678,"Ġpredetermined":41679,"ĠAirl":41680,"Ġgasp":41681,"Ġ367":41682,"Ġexclaim":41683,"cation":41684,"sort":41685,"idden":41686,"missive":41687,"ع":41688,"oice":41689,"same":41690,"Ott":41691,"Ġscatter":41692,"Flight":41693,"ĠTOD":41694,"Stra":41695,"amia":41696,"IZE":41697,"Ġcompressor":41698,"ixels":41699,"lethal":41700,"ĠExperimental":41701,"Ing":41702,"knife":41703,"Ġvanishing":41704,"ĠRequired":41705,"Stat":41706,"ĠPlex":41707,"spection":41708,"ĠBakr":41709,"Amazing":41710,"Ġbreaths":41711,"rots":41712,"OSP":41713,"Ġ840":41714,"Wars":41715,"OGR":41716,"Ġ372":41717,"ĠKhe":41718,"inous":41719,"lightly":41720,"ĠRounds":41721,"Ġrefinement":41722,"property":41723,"Ġmetaph":41724,"oultry":41725,"istor":41726,"Ġintestine":41727,"eus":41728,"ĠWilhelm":41729,"ĠBane":41730,"emption":41731,"oubtedly":41732,"ĠVirtue":41733,"'),":41734,"Ħ¢":41735,"Ġappar":41736,"ĠTranslation":41737,"Quite":41738,"Ġphysicists":41739,"Ġpriesthood":41740,"Ġallowable":41741,"Saint":41742,"OSED":41743,"bind":41744,"Ġtorches":41745,"osexual":41746,"Cruz":41747,"ertility":41748,"ĠAES":41749,"Ġascended":41750,"Ġmuzzle":41751,"Ġelectors":41752,"ĠKrug":41753,"Ġcc":41754,"classic":41755,"ĠMace":41756,"Å«":41757,"Ġâ̦\"":41758,"ĠTEST":41759,"gomery":41760,"Person":41761,"Ġtranslations":41762,"ĠDys":41763,"ĠConsent":41764,"Ġ361":41765,"alos":41766,"Ġallerg":41767,"ĠWast":41768,"ĠChecks":41769,"cerning":41770,"Ġlizard":41771,"Ġrevolutions":41772,"Ġtether":41773,"Ġminimized":41774,"ĠReverse":41775,"itely":41776,"iguous":41777,"athing":41778,"Flow":41779,"Moving":41780,"Ġ409":41781,"047":41782,"Ġsnug":41783,"Nich":41784,"Ġcartridge":41785,"YL":41786,"Ġforwarding":41787,"umerous":41788,"ĠAbedin":41789,"iolet":41790,"tick":41791,"ĠTransform":41792,"Grant":41793,"Ġsubtitles":41794,"ĠEmin":41795,"ghost":41796,"ĠKurd":41797,"Ġfireball":41798,"compatible":41799,"Ġprojectiles":41800,"amorph":41801,"ĠSatisf":41802,"Ġquirks":41803,"Ġrecept":41804,"spective":41805,"Ġgraphical":41806,"ĠPicard":41807,"ĠAuthent":41808,"ĠSponge":41809,"Army":41810,"ĠLumin":41811,"ĠSOME":41812,"Ġsolitude":41813,"ĠSHOULD":41814,"ĠFasc":41815,"opez":41816,"types":41817,"gallery":41818,"OLOGY":41819,"shake":41820,"Ġ369":41821,"Ġreused":41822,"Ġ378":41823,"Ġexorc":41824,"Ġdocs":41825,"Yu":41826,"ĠGOD":41827,"ocrine":41828,"location":41829,"fif":41830,"Grid":41831,"Ġpowd":41832,"Ġ'[":41833,"Ġposterior":41834,"Thompson":41835,"Table":41836,"oslov":41837,"ĠGoddess":41838,"odon":41839,"ĠSTD":41840,"Ġresponsiveness":41841,"stab":41842,"absolute":41843,"Enough":41844,"ĠEssence":41845,"ĠUpgrade":41846,"hematically":41847,"Subscribe":41848,"alsh":41849,"repl":41850,"Ġselector":41851,"ĠLength":41852,"Ġtemporal":41853,"Tele":41854,"ocalyptic":41855,"ĠDeaths":41856,"rl":41857,"Target":41858,"ĠOrn":41859,"ongh":41860,"Ġ1909":41861,"Quest":41862,"Place":41863,"ĠDisabled":41864,"Ġascending":41865,"giene":41866,"ĠMSI":41867,"ivil":41868,"Ġcaval":41869,"Ġintermitt":41870,"Ġsalts":41871,"Apr":41872,"059":41873,"ĠKeeper":41874,"emis":41875,"ĠEternal":41876,"SER":41877,"estones":41878,"Ġrudimentary":41879,"Ġpooled":41880,"ĠAlright":41881,"Ġdiagrams":41882,"ydia":41883,"Jacob":41884,"Ġarchitectures":41885,"ĠUSPS":41886,"Ġfootnote":41887,"ĠBrav":41888,"ĠLeopard":41889,"Ġvirtuous":41890,"ploma":41891,"ĠHIP":41892,"Ġhorizontally":41893,"olith":41894,"Prop":41895,"ĠApocalypse":41896,"Syria":41897,"ĠShowdown":41898,"constitutional":41899,"Independent":41900,"ĠMiliband":41901,"ĠTracks":41902,"adle":41903,"ĠESL":41904,"ĠFIGHT":41905,"Ġjohn":41906,"é":41907,"benef":41908,"eware":41909,"ĠTABLE":41910,"ĠVeg":41911,"ainers":41912,"Ġresolves":41913,"Warren":41914,"ĠRanked":41915,"possibly":41916,"bian":41917,"simple":41918,"Ġuniformly":41919,"ĠSlash":41920,"otton":41921,"ĠAbsent":41922,"agically":41923,"ĠPieces":41924,"Station":41925,"ĠBeware":41926,"ĠDiscrimination":41927,"Ġponies":41928,"Import":41929,"utory":41930,"ĠParas":41931,"Phoenix":41932,"Lat":41933,"UTC":41934,"push":41935,"astically":41936,"urrent":41937,"untarily":41938,"Ġparanormal":41939,"Ġglanced":41940,"Ġmanifestations":41941,"ĠNeuroscience":41942,"irgin":41943,"ROM":41944,"Ġ($)":41945,"Ġ379":41946,"missing":41947,"Ġmercenaries":41948,"Ġenumer":41949,"ĠShant":41950,"Ws":41951,"wered":41952,"Ġbuffs":41953,"ultane":41954,"ĠRohing":41955,"igger":41956,"Ring":41957,"Ġmanifests":41958,"Fat":41959,"ĠReduced":41960,"ĠMinerva":41961,"uart":41962,"ĠArmory":41963,"orange":41964,"igible":41965,"Ġphysiology":41966,"Ut":41967,"Ġparchment":41968,"ĠFired":41969,"trap":41970,"oggle":41971,"mson":41972,"ĠPoster":41973,"Ġbount":41974,"import":41975,"maximum":41976,"Ġ422":41977,"ĠFemin":41978,"Ġnodding":41979,"Ġinscription":41980,"Results":41981,"GRE":41982,"icative":41983,"Ġcognition":41984,"Ġions":41985,"ĠBite":41986,"Ġneutron":41987,"Ġduplication":41988,"ĠZIP":41989,"ĠQuit":41990,"Ġgrasping":41991,"ĠDaylight":41992,"Ġlayouts":41993,"CLA":41994,"reason":41995,"ĠHuh":41996,"Ġpige":41997,"ĠBomber":41998,"Produ":41999,"Ġgland":42000,"ĠAbsolute":42001,"writ":42002,"Ġmassac":42003,"Ġfixation":42004,"device":42005,"yz":42006,"ĠGOT":42007,"ĠDying":42008,"adjust":42009,"grain":42010,"Ġdeform":42011,"Ġtypew":42012,"Ġdagger":42013,"ĠTuring":42014,"ĠBucc":42015,"Heavy":42016,"Ġcommod":42017,"files":42018,"ogeneous":42019,"roth":42020,"Buff":42021,"Ġbookmark":42022,"porary":42023,"Medical":42024,"Um":42025,"Ġtranslucent":42026,"ĠAnxiety":42027,"ĠCorinthians":42028,"optional":42029,"PUT":42030,"Ġcrucifix":42031,"alloween":42032,"ĠVK":42033,"Ġblu":42034,"ĠCorinth":42035,"Mount":42036,"Ġmembranes":42037,"particip":42038,"Ġextraord":42039,"Ġstimulated":42040,"leneck":42041,"Ġspecifies":42042,"Sin":42043,"lash":42044,"Edited":42045,"Ġfused":42046,"Nin":42047,"ĠBungie":42048,"ĠTooth":42049,"WATCH":42050,"Nav":42051,"Initially":42052,"+)":42053,"ĠAncest":42054,"Ġtransmitter":42055,"ĠVolks":42056,"ezvous":42057,"ĠNirvana":42058,"ĠCald":42059,"font":42060,"Und":42061,"remlin":42062,"ichever":42063,"ĠHeal":42064,"shall":42065,"Ġattribution":42066,"authorized":42067,"ĠINTO":42068,"acteria":42069,"ĠTsu":42070,"ĠPlane":42071,"iphate":42072,"igraph":42073,"chev":42074,"Ġinverse":42075,"ifest":42076,"Players":42077,"!!\"":42078,"ĠContrast":42079,"1984":42080,"Ġsevent":42081,"colour":42082,"ĠRational":42083,"virtual":42084,"Ġfec":42085,"ĠETH":42086,"ĠPru":42087,"Õ":42088,"asma":42089,"Cur":42090,"Ġassigns":42091,"Ġridic":42092,"Todd":42093,"ulton":42094,"ĠDefendant":42095,"opsis":42096,"Ġpercentile":42097,"shr":42098,"wagen":42099,"Ġ368":42100,"SIGN":42101,"Screen":42102,"reprene":42103,"Ġerection":42104,"ĠFreak":42105,"ĠStard":42106,"stained":42107,"Ġcla":42108,"fet":42109,"ramids":42110,"QL":42111,"avorable":42112,"ĠTCP":42113,"nown":42114,"ulence":42115,"similar":42116,"Ġlinkage":42117,"ercise":42118,"Path":42119,"LECT":42120,"ĠCollections":42121,"ĠModule":42122,"Ġcs":42123,"Current":42124,"Ġmono":42125,"ĠAlv":42126,"ĠDude":42127,"Ġhypers":42128,"Ġ2600":42129,"surface":42130,"Ġpredictor":42131,"ĠColomb":42132,"Prof":42133,"anqu":42134,"natal":42135,"Ġadultery":42136,"ĠGenerations":42137,"clerosis":42138,"Ġ371":42139,"Ġenlightenment":42140,"onomic":42141,"Ġsatir":42142,"ĠBasics":42143,"Graham":42144,"ĠRove":42145,"Ġadul":42146,"Shut":42147,"ocious":42148,"Ġhandc":42149,"BW":42150,"ĠCognitive":42151,"visible":42152,"Ġinev":42153,"Ġ978":42154,"ĠSupported":42155,"Ġarrays":42156,"Ġalienation":42157,"Weight":42158,"ĠkWh":42159,"Ġwarped":42160,"Ġ386":42161,"lance":42162,"Ġherpes":42163,"ĠPHP":42164,"Ġclaimant":42165,"uitive":42166,"Ġpussy":42167,"Ġcorpus":42168,"ĠAo":42169,"Qual":42170,"ĠXVI":42171,"requ":42172,"Ġsympt":42173,"mination":42174,"Ġhairy":42175,"ĠBattles":42176,"owntown":42177,"Roberts":42178,"Ġnec":42179,"ablo":42180,"AMD":42181,"internet":42182,"Tar":42183,"direction":42184,"ouston":42185,"ĠGlock":42186,"ĠYanukovych":42187,"ogens":42188,"rogram":42189,"otype":42190,"ĠPt":42191,"tenance":42192,"Ġaromatic":42193,"oxin":42194,"Vert":42195,"Ġsociop":42196,"cible":42197,"Db":42198,"________________":42199,"Third":42200,"ĠShips":42201,"!.":42202,"expensive":42203,"WOR":42204,"primary":42205,"Ġ666":42206,"Ġdecaying":42207,"Ġclustered":42208,"Ġbeetles":42209,"ĠHogwarts":42210,"Ġheaders":42211,"ĠJudah":42212,"Ġscen":42213,"Ġcosmos":42214,"ĠGenetic":42215,"blems":42216,"Ġfeeble":42217,"NOW":42218,"NSA":42219,"Ġadminist":42220,"ĠDocker":42221,"portion":42222,"gression":42223,"Ġ1904":42224,"heard":42225,"Ġinhab":42226,"ĠLeaves":42227,"Ġcortisol":42228,"atinum":42229,"unknown":42230,"ĠObserv":42231,"ĠPhilosophy":42232,"Ide":42233,"Ġcopyrighted":42234,"surv":42235,"ĠLocations":42236,"Ġglands":42237,"ĠKnife":42238,"ĠEmber":42239,"ĠUnicorn":42240,"Ġhaste":42241,"Ġkinderg":42242,"ĠTerrit":42243,"ĠKoran":42244,"Ġaval":42245,"addon":42246,"ĠNero":42247,"\"]":42248,"Ġ392":42249,"comfort":42250,"Ġclothed":42251,"ashtra":42252,"mode":42253,"Ġ??":42254,"!\",":42255,"Ġknob":42256,"EMP":42257,"norm":42258,"ĠAgo":42259,"RECT":42260,"Denver":42261,"Ġ1907":42262,"ĠBombs":42263,"Sche":42264,"Ġtriangular":42265,"Ġperv":42266,"rises":42267,"Jes":42268,"Ġcalibration":42269,"Ġts":42270,"Same":42271,"ĠAxe":42272,"ĠMei":42273,"multi":42274,"Ġexerc":42275,"orney":42276,"Ware":42277,"abul":42278,"ĠFior":42279,"Eventually":42280,"ĠGrizz":42281,"Past":42282,"married":42283,"Ġscram":42284,"ĠCache":42285,"posure":42286,"Ġheav":42287,"ĠShirt":42288,"powder":42289,"complex":42290,"Doc":42291,"arus":42292,"Pi":42293,"Ġcurv":42294,"ĠTopic":42295,"Ġ.)":42296,"Ġwills":42297,"philis":42298,"gui":42299,"leground":42300,"Eth":42301,"Strike":42302,"Kid":42303,"Ġdelegated":42304,"Soon":42305,"Ġwast":42306,"gage":42307,"Ġprosecut":42308,"Ġ374":42309,"opolis":42310,"chest":42311,"ensation":42312,"Ġredes":42313,"Ġpresum":42314,"Portland":42315,"Ġannihil":42316,"yssey":42317,"Ġforks":42318,"Ġvitro":42319,"walker":42320,"ĠPsal":42321,"ĠStealth":42322,"Quick":42323,"ĠBaghd":42324,"ĠDrift":42325,"//":42326,"Ġinvincible":42327,"ĠGAM":42328,"Ġcastles":42329,"Ġbondage":42330,"ĠBalloon":42331,"Amid":42332,"individual":42333,"tis":42334,"ĠGuides":42335,"xe":42336,"Cong":42337,"URI":42338,"ĠHH":42339,"PHOTOS":42340,"ĠASIC":42341,"burst":42342,"ahon":42343,"ĠFIX":42344,"ilib":42345,"Ġ457":42346,"ĠLogged":42347,"à¹":42348,"Creat":42349,"inatory":42350,"column":42351,"ĠAugustus":42352,"suggest":42353,"pret":42354,"ĠParan":42355,"Ġsubsistence":42356,"wx":42357,"×":42358,"aleigh":42359,"dash":42360,"ĠMana":42361,"Ko":42362,"opausal":42363,"Ġbene":42364,"ĠSabb":42365,"ĠGhosts":42366,"Ġ1830":42367,"ĠHats":42368,"ĠHive":42369,"Perfect":42370,"Ġsocialists":42371,"Ġtumult":42372,"EGA":42373,"ĠNAME":42374,"Android":42375,"assembled":42376,"phis":42377,"Stage":42378,"Char":42379,"Double":42380,"Ġinsign":42381,"IED":42382,"perial":42383,"ĠEMP":42384,"mx":42385,"Ġskept":42386,"Ġwifi":42387,"Ġparad":42388,"ĠFrequency":42389,"Dist":42390,"nil":42391,"iots":42392,"å":42393,"Message":42394,"Furthermore":42395,"Ġhideous":42396,"ĠLDL":42397,"ĠFault":42398,"ĠDimensions":42399,"ĠImplement":42400,"fram":42401,"Ġamaz":42402,"ĠIndones":42403,"ĠTile":42404,"Ġlar":42405,"gc":42406,"Ġcorrelate":42407,"Ġensl":42408,"mite":42409,"Ġhomosexuals":42410,"Ġagric":42411,"8000":42412,"Ġcuring":42413,"rament":42414,"Ġrecons":42415,"ocene":42416,"ENTION":42417,"Ġcommunion":42418,"ĠFunction":42419,"iple":42420,"Ġredund":42421,"Ġcalibrated":42422,"Ġcontribut":42423,"ĠHuck":42424,"limit":42425,"ĠFedora":42426,"ĠTsuk":42427,"brates":42428,"Ġ1903":42429,"ozo":42430,"visual":42431,"ĠDiscipline":42432,"chains":42433,"ĠOCD":42434,"Ġexpended":42435,"0002":42436,"Ġsty":42437,"ĠNightmare":42438,"ĠReplace":42439,"ounty":42440,"fn":42441,"1900":42442,"ĠEpidem":42443,"ĠFW":42444,"Ġgul":42445,"ĠTomato":42446,"ĠPerse":42447,"wl":42448,"ĠFormation":42449,"Scan":42450,"cosystem":42451,"Brand":42452,"Ġ398":42453,"Ġcaptives":42454,"Ġ×":42455,"ESCO":42456,"ĠEnder":42457,"lesh":42458,"ĠAscend":42459,"poly":42460,"eous":42461,"Ġhyster":42462,"Murray":42463,"phe":42464,"Ġradiator":42465,"esthes":42466,"Ġopin":42467,"Ġconspic":42468,"intosh":42469,"Ġwitchcraft":42470,"ĠCFR":42471,"ussian":42472,"escent":42473,"locking":42474,"Ġnonsensical":42475,"uala":42476,"ĠSerial":42477,"1991":42478,"ĠCalm":42479,"containing":42480,"Ġstimulates":42481,"Ġ448":42482,"Pir":42483,"ĠâĨĴ":42484,"ĠDiver":42485,"Ġmanuscripts":42486,"ĠGaia":42487,"Ñĥ":42488,"Learning":42489,"Ġnipple":42490,"reads":42491,"Ġandroid":42492,"ĠMeditation":42493,"Ġincomprehensible":42494,"edded":42495,"Ġdescendant":42496,"ĠMorty":42497,"Luckily":42498,"ARCH":42499,"ausible":42500,"Dig":42501,"shared":42502,"ĠClip":42503,"Ġtrope":42504,"Ġnarcissistic":42505,"ventures":42506,"Ġcuriously":42507,"ĠCosmos":42508,"Aust":42509,"Lay":42510,"ĠShard":42511,"ĠRecorded":42512,"Ġ458":42513,"........":42514,"Ġperish":42515,"ĠExample":42516,"luent":42517,"Ġapes":42518,"ĠHitch":42519,"Ġholiest":42520,"Ġamplifier":42521,"minent":42522,"xxxxxxxx":42523,"inite":42524,"Ġgenomes":42525,"ĠGuilty":42526,"mult":42527,"Ġorc":42528,"Ġnipples":42529,"Side":42530,"Ġlogically":42531,"Ġdatasets":42532,"ĠTitanium":42533,"Ġrotor":42534,"undle":42535,"handled":42536,"nexpected":42537,"Ġdw":42538,"Ġdiagonal":42539,"ĠAnimated":42540,"Ġnumbering":42541,"Forest":42542,"ĠâĨ":42543,"Prin":42544,"Ġchemically":42545,"ĠGithub":42546,"Ġaph":42547,"ĠFaster":42548,"ĠTinker":42549,"ikini":42550,"Dest":42551,"dri":42552,"Manufact":42553,"isance":42554,"Return":42555,"Alert":42556,"elcome":42557,"ĠMMR":42558,"Ġresid":42559,"ĠLIC":42560,"Ġspecificity":42561,"zanne":42562,"Ġanyways":42563,"Ġ426":42564,"Scot":42565,"astery":42566,"Via":42567,"ĠBlocks":42568,"Ġactivates":42569,"Ġabstinence":42570,"Ġchronological":42571,"Soul":42572,"ĠSchne":42573,"Ġwatts":42574,"AUT":42575,"Ġcalcul":42576,"Simply":42577,"Emb":42578,"ceptive":42579,"ĠCatholicism":42580,"obook":42581,"ĠBits":42582,"ĠMbps":42583,"Ġindignation":42584,"Ġshorthand":42585,"Active":42586,"ĠLimbaugh":42587,"ĠCapcom":42588,"adesh":42589,"Ġclipping":42590,"ĠInstructor":42591,"Secret":42592,"___":42593,"Fer":42594,"rawling":42595,"ĠReward":42596,"Ġweep":42597,"Ġmotherboard":42598,"Above":42599,"metry":42600,"ĠPTS":42601,"Ġbombard":42602,"abetes":42603,".--":42604,"Lens":42605,"Comb":42606,"basic":42607,"ĠREALLY":42608,"Later":42609,"Ġ383":42610,"Ġpositional":42611,"olesc":42612,"Ġcrotch":42613,"ĠMDMA":42614,"requently":42615,"ĠPants":42616,"Ġ433":42617,"uctor":42618,"Ġillumination":42619,"ĠÙħ":42620,"ocrin":42621,"Ġpamph":42622,"atio":42623,"etc":42624,"Ġrestores":42625,"ĠProtector":42626,"Develop":42627,"ĠMew":42628,"trop":42629,"ĠSlayer":42630,"Ti":42631,"ĠNotwithstanding":42632,"Match":42633,"LIST":42634,"IDES":42635,"ĠThick":42636,"Ġdisks":42637,"Kin":42638,"Ġghetto":42639,"ĠObjects":42640,"Ġprism":42641,"ĠNether":42642,"Ġvul":42643,"iky":42644,"]:":42645,"ĠDetail":42646,"Ġfucked":42647,"!?":42648,"anium":42649,"Ġlords":42650,"ilities":42651,"ĠEthnic":42652,"static":42653,"$$":42654,"evidence":42655,"Ġmainline":42656,"Ġpeasant":42657,"ĠEnhance":42658,"ĠForced":42659,"virt":42660,"Ġii":42661,"Ġsymm":42662,"Ġconverter":42663,"ularity":42664,"Ġrepent":42665,"num":42666,"ĠScrew":42667,"ĠFTA":42668,"Ġmarines":42669,"hetto":42670,"blow":42671,"Ġado":42672,"ĠTypical":42673,"Ġoverw":42674,"ĠBerm":42675,"keley":42676,"Song":42677,"hao":42678,"valid":42679,"EXT":42680,"ĠProvides":42681,"âĺħâĺħ":42682,"ĠOdin":42683,"Shot":42684,"Ġgamma":42685,"Princ":42686,"asonry":42687,"ĠAccuracy":42688,"Ġcriterion":42689,"Ġdescriptive":42690,"Gall":42691,"gray":42692,"ĠCalcul":42693,"Ġaxes":42694,"ĠCommunists":42695,"ĠRebellion":42696,"Success":42697,"tg":42698,"Ġâĺ":42699,"Ġmultiplier":42700,"ravity":42701,"Thus":42702,"URL":42703,"Ġalternatively":42704,"duction":42705,"Ġsarcast":42706,"ĠCarth":42707,"ĠUSL":42708,"ĠInvisible":42709,"larg":42710,"pleted":42711,"pathic":42712,"Additionally":42713,"ĠCao":42714,"Ġlatent":42715,"ĠSurge":42716,"MEN":42717,"communications":42718,"ĠArray":42719,"Pink":42720,"commit":42721,"isodes":42722,"earcher":42723,"Ukraine":42724,"ĠAnthrop":42725,"incial":42726,"Ġquotations":42727,"adena":42728,"Ġwhining":42729,"Ġretri":42730,"ĠAssass":42731,"elligent":42732,"ĠPERSON":42733,"Py":42734,"Send":42735,"ĠâĪĴ":42736,"DON":42737,"Ġwatt":42738,"description":42739,"POS":42740,"Ġrepro":42741,"destroy":42742,"icidal":42743,"Ġmidrange":42744,"Ġinfographic":42745,"interesting":42746,"category":42747,"Flash":42748,"ĠInvasion":42749,"ĠExodus":42750,"restricted":42751,"Ġinference":42752,"dding":42753,"mingham":42754,"Ġcircumst":42755,"Wi":42756,"ĠHast":42757,"Ġsubjug":42758,"Ġwhispering":42759,"-.":42760,"Ġadren":42761,"ĠPattern":42762,"BOX":42763,"ĠEnhancement":42764,"Exc":42765,"ĠBucket":42766,"ĠGUN":42767,"deen":42768,"ĠHomo":42769,"1985":42770,"Ġclo":42771,"Ġsnippet":42772,"Ġ1896":42773,"TPP":42774,"Seg":42775,"success":42776,";\"":42777,"ĠMUCH":42778,"Author":42779,"Ġreplication":42780,"Ġhallucinations":42781,"Inv":42782,"ĠAware":42783,"ĠViper":42784,"kai":42785,"frames":42786,"ĠTHANK":42787,"ĠSHA":42788,"wordpress":42789,"Ġbc":42790,"CIA":42791,"arrison":42792,"Ġalloc":42793,"ĠAlz":42794,"letcher":42795,"ĠDaredevil":42796,"iversary":42797,"Ġmanuals":42798,"Catholic":42799,"feat":42800,"Ġkinetic":42801,"JB":42802,"yeah":42803,"ĠLDS":42804,"Ġppm":42805,"ĠADC":42806,"pring":42807,"cence":42808,"Ġclasp":42809,"Ġsetups":42810,"Ġdeity":42811,"ĠIndra":42812,"ĠWander":42813,"Ġantib":42814,"Otherwise":42815,"ombie":42816,"Bitcoin":42817,"ipop":42818,"expression":42819,"Animal":42820,"ĠResurrection":42821,"ĠMoral":42822,"ĠSDK":42823,"Ġwretched":42824,"ogenous":42825,"species":42826,"Ġchuckled":42827,"Thor":42828,"Ġ428":42829,"avery":42830,"ĠPry":42831,"asures":42832,"ĠErn":42833,"apor":42834,"Ġinnumerable":42835,"Ġbaptized":42836,"ĠExplosive":42837,"Ġelves":42838,"idges":42839,"ĠParadox":42840,"Close":42841,"aldehyde":42842,"construct":42843,"Ġvirginity":42844,"Poll":42845,"assin":42846,"Doctors":42847,"Pos":42848,"NECT":42849,"Moreover":42850,"Commercial":42851,"cknowled":42852,"1988":42853,"Ġquotation":42854,"marriage":42855,"ĠBapt":42856,"ĠSina":42857,"ĠGloves":42858,"gian":42859,"Ġconfounding":42860,"URRENT":42861,"Dean":42862,"Brew":42863,"thur":42864,"pty":42865,"immune":42866,"ĠSQU":42867,"Ġcounterfe":42868,"rider":42869,"Ġinferred":42870,"ĠDimension":42871,"ĠToad":42872,"Ġafterlife":42873,"ĠHERO":42874,"Indiana":42875,"seek":42876,"Ġdistinguishes":42877,"ĠQur":42878,"ĠMethods":42879,"combat":42880,"Ġcateg":42881,"ĠStruggle":42882,"teness":42883,"liquid":42884,"Ġblinking":42885,"ĠCONTIN":42886,"iae":42887,"Ġaerobic":42888,"Ġstrugg":42889,"Ġegalitarian":42890,"hello":42891,"orrect":42892,"ĠAbandon":42893,"Ġferment":42894,"Area":42895,"idem":42896,"ĠMania":42897,"Ġjs":42898,"ĠBALL":42899,"Running":42900,"Ġregenerate":42901,"iquid":42902,"Uh":42903,"Crystal":42904,"ĠItal":42905,"ĠHeavenly":42906,"в":42907,"CRIPTION":42908,"Consumer":42909,"dust":42910,"amiliar":42911,"ĠRhino":42912,"Rocket":42913,"Ġreversible":42914,"kok":42915,"ĠSketch":42916,"Ġshotguns":42917,"apses":42918,"Ġdetach":42919,"ĠCells":42920,"artist":42921,"rily":42922,"ĠRestore":42923,"Scar":42924,"Ġevid":42925,"Ġspaced":42926,"ĠContributions":42927,"Ġ418":42928,"ĠMystic":42929,"Ġobfusc":42930,"Russ":42931,"wings":42932,"Pear":42933,"osite":42934,"Nusra":42935,"urations":42936,"ovie":42937,"icago":42938,"ĠConcepts":42939,"Ġstimuli":42940,"Ġaroused":42941,"aughty":42942,"Talking":42943,"ĠPrompt":42944,"Across":42945,"ĠPlaint":42946,"Ġbranching":42947,"Thankfully":42948,"Original":42949,"Esc":42950,"ĠTechnician":42951,"fleet":42952,"usher":42953,"Mos":42954,"livion":42955,"oenix":42956,"Ġhr":42957,"ibble":42958,"Ġindent":42959,"ĠFinished":42960,"Department":42961,"ĠINFO":42962,"Movie":42963,"++":42964,"THING":42965,"Ġtimers":42966,"rocket":42967,"Natural":42968,"lime":42969,"Ġangular":42970,"osure":42971,"Ġdynamically":42972,"Ġpacif":42973,"ĠProcessor":42974,"Ġdisgu":42975,"Ġmoderators":42976,"Ġceases":42977,"Ġinertia":42978,"Ġpaperback":42979,"yton":42980,"ĠHuma":42981,"Ġprohibitions":42982,"Ġgestation":42983,"Bomb":42984,"termin":42985,"Ġcaric":42986,"oS":42987,"tc":42988,"Cop":42989,"raved":42990,"Ġeighty":42991,"ĠEnable":42992,"Ġimplementations":42993,"Ġconquering":42994,"ĠFinder":42995,"window":42996,"Gra":42997,"Ġfonts":42998,"laughter":42999,"Ġcolonization":43000,"ĠDOD":43001,")!":43002,",)":43003,"ĠGeral":43004,"ĠSpoiler":43005,"ĠComponent":43006,"Ġgist":43007,"hiro":43008,"Ġlicens":43009,"nesses":43010,"Ġkarma":43011,"?\".":43012,"OPA":43013,"Ġsquats":43014,"ĠRAND":43015,"Ġorally":43016,"document":43017,"olars":43018,"Ġpresumptive":43019,"Pers":43020,"OAD":43021,"ufficient":43022,"LESS":43023,"Hidden":43024,"ORK":43025,"xs":43026,"Ġmathematician":43027,"ĠGloss":43028,"Ġannihilation":43029,"Ġmanifold":43030,"Ry":43031,"Thunder":43032,"Yan":43033,"Activ":43034,"Ġworldly":43035,"TED":43036,"marg":43037,"ĠStun":43038,"ryce":43039,"ĠVG":43040,"Isn":43041,"ĠCyn":43042,"Expl":43043,"IRED":43044,"Ġcompr":43045,"Ġindisc":43046,"Boss":43047,"()":43048,"berman":43049,"ĠBegins":43050,"ujah":43051,"ornia":43052,"hetical":43053,"Ġcivilizations":43054,"Ġfundamentalist":43055,"strap":43056,"Forward":43057,"ettlement":43058,"Ġprophetic":43059,"glers":43060,"bending":43061,"Terry":43062,"Ġidi":43063,"Ġtrunc":43064,"Ġcreeps":43065,"intel":43066,"switch":43067,"ailand":43068,"Ġinstaller":43069,"GOP":43070,"Ġ499":43071,"ĠParallel":43072,"Cru":43073,"Ġ\"@":43074,"Ġ396":43075,"ĠUnlock":43076,"Raven":43077,"Corn":43078,"Ġcircadian":43079,"Ġ********************************":43080,"iliate":43081,"ĠFunctional":43082,"Ġpronouns":43083,"ĠSatoshi":43084,"Ġstim":43085,"Gay":43086,"Iss":43087,"ĠThief":43088,"atellite":43089,"Ġshards":43090,"Ġphil":43091,"protein":43092,"Ġalters":43093,"Poor":43094,"Typically":43095,"KER":43096,"ociate":43097,"Ġemits":43098,"recy":43099,"Ġmechanically":43100,"Ġ...\"":43101,"nature":43102,"sys":43103,"ysc":43104,"Ġwavelengths":43105,"pattern":43106,"insured":43107,"Ġparasitic":43108,"ĠLCS":43109,"ĠPACs":43110,"Ġheals":43111,"ĠCCP":43112,"ĠHacker":43113,"Ġpsy":43114,"ĠBeans":43115,"Ġdemonic":43116,"JV":43117,"Ġatmosp":43118,"equality":43119,"Ġairst":43120,"Ġincarn":43121,"ynthesis":43122,"Ġequations":43123,"tch":43124,"ĠHUGE":43125,"ĠChanged":43126,"itatively":43127,"Job":43128,"gaming":43129,"Ġ1899":43130,"ĠMorsi":43131,"Ġconjecture":43132,"riad":43133,"Ġprimates":43134,"ĠArtemis":43135,"ĠThro":43136,"Ġbiologically":43137,"Church":43138,"topia":43139,"recomm":43140,"Ġgradient":43141,"Ġful":43142,"Ġbastard":43143,"CHO":43144,"IUM":43145,"sleep":43146,"Construction":43147,"raints":43148,"vable":43149,"ionage":43150,"Ġcomrade":43151,"Ġpopulate":43152,"Ġnerds":43153,"ĠXie":43154,"result":43155,"ĠImper":43156,"Ġpamphlet":43157,"Ku":43158,"Ġbackend":43159,"ificent":43160,"etus":43161,"Ġdisson":43162,"config":43163,"Ġsuc":43164,"Ġwavelength":43165,"external":43166,"owder":43167,"Ġpredis":43168,"eenth":43169,"Det":43170,"andem":43171,"Ġ1865":43172,"ĠDefeat":43173,"Individual":43174,"Ġretrieving":43175,"stories":43176,"Ġdesolate":43177,"Ġlett":43178,"Ġunpublished":43179,"Ġpassively":43180,"Ġdissertation":43181,"raits":43182,"abee":43183,"ĠResist":43184,"Robin":43185,"Ġbenevolent":43186,"blast":43187,"Offic":43188,"snap":43189,"vernment":43190,"Ġextermin":43191,"wt":43192,"bitious":43193,"hibited":43194,"Insp":43195,"posted":43196,"ĠYugoslav":43197,"rational":43198,"adapt":43199,"ĠAtari":43200,"Ġplugin":43201,"oglobin":43202,"efeated":43203,"ĠHRC":43204,"cko":43205,"ilver":43206,"ĠDestruction":43207,"gewater":43208,"ĠRadiation":43209,"Ġimprison":43210,"origin":43211,"antine":43212,"ĠPublication":43213,"Ġhealer":43214,"istered":43215,"ĠTHEIR":43216,"hazard":43217,"Contract":43218,"Ġmediated":43219,"Ġindexed":43220,"ĠSYSTEM":43221,"Labor":43222,"Blade":43223,"Ġyog":43224,"Champ":43225,"Gordon":43226,"IAS":43227,"Ġnineteenth":43228,"animous":43229,"begin":43230,"ĠHolo":43231,"Planet":43232,"udding":43233,"default":43234,"ĠOMG":43235,"Ġwond":43236,"wm":43237,"pend":43238,"Extreme":43239,"Ġinterstellar":43240,"ASED":43241,"ĠBerks":43242,"Ġprimal":43243,"Foot":43244,"Ġinadvert":43245,"amboo":43246,"ĠLeica":43247,"Events":43248,"ĠPigs":43249,"RAFT":43250,"ï":43251,"ĠGentleman":43252,"Multiple":43253,"ĠPsychiatric":43254,"Ġdespise":43255,"ĠZionism":43256,"ĠSSL":43257,"shit":43258,"Ġthreaded":43259,"Ġartifact":43260,"Ġmitochondrial":43261,"ĠLayer":43262,"inus":43263,"podcast":43264,"Ġawaken":43265,"Management":43266,"Ġdelusions":43267,"grey":43268,"Ġpseud":43269,"agonal":43270,"ĠHirosh":43271,"Georg":43272,"Dragon":43273,"Stack":43274,"ohm":43275,"Ġvener":43276,"Row":43277,"Ġsandbox":43278,"Ġblinding":43279,"razen":43280,"Ġ389":43281,"Ġcrappy":43282,"Ġlith":43283,"antha":43284,"Ġplurality":43285,"ĠDAC":43286,"inently":43287,"intage":43288,"Ġ1902":43289,"ĠDepend":43290,"Ġelapsed":43291,"==":43292,"ĠGenie":43293,"Bush":43294,"ĠPlanetary":43295,"Bah":43296,"ĠKira":43297,"emn":43298,"Month":43299,"allic":43300,"coded":43301,"VOL":43302,"Ġ[...]":43303,"ĠRampage":43304,"Ġ(*":43305,"Production":43306,"licts":43307,"Ġinoc":43308,"Cour":43309,"Ġspurious":43310,"Ġultras":43311,"ggles":43312,"Ġdelusion":43313,"ĠRacer":43314,"ĠPrism":43315,"FH":43316,"uppet":43317,"Ġcultured":43318,"Ġ436":43319,"aneously":43320,"اÙĦ":43321,"ĠMissions":43322,"monton":43323,"criptions":43324,"ificate":43325,"Cause":43326,"Ġ1898":43327,"ocaust":43328,"Ġbri":43329,"ĠShoals":43330,"ommod":43331,"alted":43332,"ogenesis":43333,"warn":43334,"illus":43335,"vv":43336,"Ġcontam":43337,"ĠLesbian":43338,"Ġcavalry":43339,"ĠPresence":43340,"rehens":43341,"tool":43342,"accessible":43343,"Ġ(~":43344,"ĠLicensed":43345,"Ġprophets":43346,"Ġboulder":43347,"mean":43348,"akura":43349,"Ġunres":43350,"ĠCinnamon":43351,"Leaks":43352,"........................":43353,"Contact":43354,"Ġassassins":43355,"ĠGreenwald":43356,"dk":43357,"amazon":43358,"Ġagreeable":43359,"ernandez":43360,"Easy":43361,"PLA":43362,"ĠBigfoot":43363,"Ġconvent":43364,"Ġempires":43365,"Ġ387":43366,"Ġgrasped":43367,"Ġruby":43368,"Ġreconc":43369,"Warning":43370,"atem":43371,"Ġretrieval":43372,"ĠFDR":43373,"ĠReaper":43374,"orem":43375,"ĠLuo":43376,"hig":43377,"ĠArmor":43378,"tp":43379,"ĠInterpret":43380,"Conservative":43381,"ĠSodium":43382,"Ġbead":43383,"Ġpropagate":43384,"claw":43385,"href":43386,"ĠPaste":43387,"Ġomit":43388,"Boost":43389,"Diamond":43390,"goo":43391,"Ġanomal":43392,"ĠDISTRICT":43393,"Greek":43394,"warning":43395,"Ġdespised":43396,"Karl":43397,"AGES":43398,"Ġserotonin":43399,"ESSION":43400,"_______":43401,"ĠCollider":43402,"auldron":43403,"Ġsquee":43404,"Control":43405,"ffield":43406,"cycles":43407,"Legal":43408,"xa":43409,"minimum":43410,"ĠGeneric":43411,"Circ":43412,"·":43413,"Behind":43414,"guide":43415,"Ground":43416,"roying":43417,"ĠGrail":43418,"Ġthee":43419,"Ġ9000":43420,"Batman":43421,"Brother":43422,"Ġnons":43423,"RW":43424,"saf":43425,"ĠCroat":43426,"tainment":43427,"sci":43428,"Ye":43429,"Range":43430,"Ey":43431,"perature":43432,"ĠDracula":43433,"oreal":43434,"Fighting":43435,"Ġreleg":43436,"Ġcoupling":43437,"Tracker":43438,"tyard":43439,"Mut":43440,"Military":43441,"lamm":43442,"ittens":43443,"ĠCRC":43444,"ĠXiang":43445,"Ġorthodoxy":43446,"ĠGoth":43447,"Ġalgorith":43448,"ĠAthen":43449,"Ġtyrann":43450,"ĠTorrent":43451,"IDs":43452,"ĠGENERAL":43453,"ĠASUS":43454,"rastructure":43455,"Faith":43456,"models":43457,"rentices":43458,"ĠCurse":43459,"Ġcalibr":43460,"attled":43461,"monary":43462,"Ġpenet":43463,"aclysm":43464,"album":43465,"Ġremnant":43466,"Ġfung":43467,"itiveness":43468,"thodox":43469,"Ġunlocks":43470,"Ġprobabilities":43471,"Ġster":43472,"Ġscrim":43473,"Ġanalytic":43474,"Urban":43475,"âĢĶâĢĶâĢĶâĢĶ":43476,"Craft":43477,"Ġbrut":43478,"1986":43479,"Section":43480,"raged":43481,"arij":43482,"Hero":43483,"ĠHebdo":43484,"ĠEmpress":43485,"Ġvivo":43486,"ĠPublications":43487,"Ġcannabinoids":43488,"arrett":43489,"Ġbounded":43490,"Ġquests":43491,"Ġomin":43492,"ĠRuler":43493,"ĠYue":43494,"ridges":43495,"Ġpeasants":43496,"ĠAlloy":43497,"Desk":43498,"ULAR":43499,"Ġthor":43500,"ĠOvers":43501,"ĠTome":43502,"mk":43503,"Ġ1050":43504,"Ġshroud":43505,"Ġdistribut":43506,"weapons":43507,"ĠAuthorization":43508,"ĠPoke":43509,"ĠAlternate":43510,"scan":43511,"artisan":43512,"ĠGems":43513,"ĠForums":43514,"atonin":43515,"viron":43516,"Rog":43517,"duct":43518,"Ġtabletop":43519,"crow":43520,"/)":43521,"ĠStainless":43522,"ottest":43523,"Ġreborn":43524,"anchez":43525,"cium":43526,"ĠNicarag":43527,"elfare":43528,"Ġupd":43529,"ritic":43530,"bm":43531,"Ġ608":43532,"ĠSlightly":43533,"ĠDrops":43534,"ISO":43535,"ĠiT":43536,"xiety":43537,"ĠGawker":43538,"omination":43539,"ĠReached":43540,"Student":43541,"Drop":43542,"MET":43543,"ĠKubrick":43544,"1950":43545,"ĠTuls":43546,"Ġcomputed":43547,"depending":43548,"ĠCosmetic":43549,"udget":43550,"Lex":43551,"icut":43552,"ĠDepth":43553,"Ġ1893":43554,"ahah":43555,"Ġath":43556,"fights":43557,"thia":43558,"Ġoccult":43559,"Wheel":43560,"ĠSega":43561,"Ġtheolog":43562,"reement":43563,")--":43564,"Ġunus":43565,"ĠGamma":43566,"Looks":43567,"Ġellipt":43568,"Ġairflow":43569,"ĠHimself":43570,"Ġpagan":43571,"ĠRei":43572,"Ġpilgr":43573,"ĠSubmission":43574,"Region":43575,"Ġinsertion":43576,"Ġsket":43577,"Ġsatisfies":43578,"ĠPixie":43579,"Ġcontempl":43580,"abbit":43581,"ĠReplay":43582,"ĠGalile":43583,"ĠGodzilla":43584,"Ġarithmetic":43585,"iasm":43586,"1987":43587,"ĠFeminist":43588,"Liter":43589,"ĠDisable":43590,"ouble":43591,"essors":43592,"Ġfors":43593,"Ġensu":43594,"Putting":43595,"ĠMSM":43596,"Cond":43597,"emade":43598,"Ġindistinguishable":43599,"Magn":43600,"Ġms":43601,"MAL":43602,"ĠBF":43603,"dm":43604,"iltration":43605,"irection":43606,"ĠSpir":43607,"Gb":43608,"ĠIbn":43609,"Abs":43610,"imens":43611,"RNA":43612,"============":43613,"Ġ655":43614,"ĠConversion":43615,"imilation":43616,"igion":43617,"ĠSomew":43618,"mL":43619,"Border":43620,"Ë":43621,"Factor":43622,"Number":43623,"Ġejac":43624,"Cho":43625,"Ġrighteousness":43626,"ĠPATH":43627,"ĠElys":43628,"ouched":43629,"Ġmultic":43630,"Ġfaculties":43631,"ĠEarthquake":43632,"ĠReferences":43633,"ensitive":43634,"Ġimpat":43635,"Ġ................":43636,"buff":43637,"Ġ1895":43638,"colo":43639,"Vi":43640,"Ġubiqu":43641,"ĠChev":43642,"Fish":43643,"ĠBlueprint":43644,"CHQ":43645,"Ġlinem":43646,"ĠFlavor":43647,"Ġcrimson":43648,"ĠAbstract":43649,"arette":43650,"plete":43651,"ranean":43652,"Dash":43653,"Ġdimensional":43654,"Cub":43655,"ttle":43656,"ĠDSM":43657,"Ġinstantaneous":43658,"esy":43659,"Ġepoch":43660,"Brit":43661,"ĠÎ":43662,"ECD":43663,"Ġwarp":43664,"obyl":43665,"ubric":43666,"Ġutilitarian":43667,"Ġsummarizes":43668,"letal":43669,"Ord":43670,"opath":43671,"tained":43672,"ghai":43673,"Ġwhis":43674,"insert":43675,"Ġphon":43676,"rils":43677,"Ġearthly":43678,"ĠAlic":43679,"ĠPCIe":43680,"Ġfurthermore":43681,"ocard":43682,"Ġuter":43683,"ĠAdmin":43684,"ographics":43685,"ĠConstantin":43686,"gravity":43687,"iPhone":43688,"Ġwasteland":43689,"Ġfps":43690,"Tip":43691,"Ġmurm":43692,"paces":43693,"ĠSamurai":43694,"ĠFOIA":43695,"ĠRadiant":43696,"ĠUnreal":43697,"Ġmicrow":43698,"usterity":43699,"zyme":43700,"itbart":43701,"metadata":43702,"Dat":43703,"ĠMoons":43704,"ĠProtestants":43705,"ungle":43706,"Ġvideog":43707,"pid":43708,"Ġdisple":43709,"aucus":43710,"Ġcoils":43711,"ĠDwar":43712,"fixed":43713,"Alice":43714,"Ġgarrison":43715,"ĠVelocity":43716,"ĠJehovah":43717,"Ġfascists":43718,"ĠCHO":43719,"jl":43720,"Ġmetaphors":43721,"ĠSiege":43722,"scientific":43723,"Ä«":43724,"Slow":43725,"hex":43726,"ĠBlaz":43727,"mediated":43728,"esthesia":43729,"ĠAvg":43730,"Ġbelie":43731,"Carter":43732,"Ġexposition":43733,"azeera":43734,"dial":43735,"Ġbask":43736,"Scale":43737,"Ġdisob":43738,"Ġgore":43739,"Ġhypocr":43740,"Ġphantom":43741,"ĠSynd":43742,"BLIC":43743,"pter":43744,"ĠScorpion":43745,"eor":43746,"ĠRecover":43747,"Ġsummoning":43748,"Ġorb":43749,"jump":43750,"Ġ768":43751,"ĠEnix":43752,"Spons":43753,",...":43754,"Wide":43755,"Ġparse":43756,"Ġdebtor":43757,"Ġpathological":43758,"Ġserpent":43759,"ĠFranç":43760,"reetings":43761,"Ġdeletion":43762,"Ġvolunt":43763,"ĠNotification":43764,"liga":43765,"Disk":43766,"Account":43767,"1979":43768,"Ġsymmetry":43769,"ĠBearing":43770,"ĠABV":43771,"ĠORDER":43772,"rpm":43773,"ĠFuck":43774,"?!\"":43775,"mask":43776,"Grade":43777,"neath":43778,"ocom":43779,"Detect":43780,"ryption":43781,"ĠAura":43782,"Ġinert":43783,"PLAY":43784,"gres":43785,"INTON":43786,"Deal":43787,"fficient":43788,"ĠVoid":43789,"gement":43790,"Ġscorp":43791,"Ġreincarn":43792,"ĠVapor":43793,"Ġ1840":43794,"Yellow":43795,"......":43796,"Ġparameter":43797,"ĠDISTR":43798,"ĠForgotten":43799,"Eat":43800,"izational":43801,"Witness":43802,"ĠDupl":43803,"Ġdogma":43804,"Ġzipper":43805,"ĠZeus":43806,"mage":43807,"ormal":43808,"Ġ\".":43809,"Ġecc":43810,"ĠSlot":43811,"ĠRegist":43812,"Others":43813,"VID":43814,"Windows":43815,"Ġshitty":43816,"ĠLethal":43817,"Monster":43818,"ĠExpression":43819,"tx":43820,"ythm":43821,"Were":43822,"ivalry":43823,"atcher":43824,"ĠFormat":43825,"ĠPlasma":43826,"Phys":43827,"laugh":43828,"Fu":43829,"java":43830,"roma":43831,"ĠIncreases":43832,"Ġlicensee":43833,"Ġmystic":43834,"Ġproto":43835,"ĠLoki":43836,"forcing":43837,"hots":43838,"Ġ->":43839,"Outside":43840,"ĠEndless":43841,"Ġachie":43842,"ĠTurtles":43843,"Ġconvin":43844,"JUST":43845,"Ġimmobil":43846,"ĠCauses":43847,"Ġclich":43848,"xes":43849,"ffiti":43850,"Ġhypot":43851,"Bat":43852,"Ġbigot":43853,"Personal":43854,"ĠPharmac":43855,"Lot":43856,"VERT":43857,"Ġbapt":43858,"idelines":43859,"Ġprox":43860,"MAP":43861,"Spirit":43862,"ĠSlug":43863,"Ġebook":43864,"eches":43865,"ĠAndromeda":43866,"Ġceremon":43867,"1975":43868,"PRE":43869,"Ġasshole":43870,"linear":43871,"Nevertheless":43872,"Ġwillpower":43873,"azel":43874,"Fif":43875,"andise":43876,"Ġextravag":43877,"ĠBuffy":43878,"Ġcorrelations":43879,"ptr":43880,"Progress":43881,"shape":43882,"ĠSymbol":43883,"arag":43884,"ĠContext":43885,"ucer":43886,"1983":43887,"ĠMyster":43888,"Pain":43889,"Login":43890,"mbol":43891,"codes":43892,"RANT":43893,"Ġoverse":43894,"opot":43895,"STEM":43896,"enser":43897,"ĠCosmic":43898,"Spl":43899,"ritional":43900,"ĠPharaoh":43901,"ĠRemix":43902,"xon":43903,"ĠXII":43904,"Ġunman":43905,"Ġimmedi":43906,"Ġmonog":43907,"ĠLX":43908,"Ġabstraction":43909,"ocolate":43910,"ĠDonkey":43911,"Ġ!!":43912,"ĠLIA":43913,"shed":43914,"rules":43915,"Ġcalc":43916,"ĠAutob":43917,"anmar":43918,"eworks":43919,"notations":43920,"Ġtenancy":43921,"ĠPetraeus":43922,"dp":43923,"amphetamine":43924,"ĠCortex":43925,"rw":43926,"Ġprojectile":43927,"Ġintrinsically":43928,"Route":43929,"Ġnegoti":43930,"anuts":43931,"Analysis":43932,"redits":43933,"ĠGG":43934,"thread":43935,"ĠChosen":43936,"Years":43937,"otyp":43938,"ĠNCT":43939,"udic":43940,"ochemical":43941,"Neigh":43942,"Ġfishes":43943,"ĠFloat":43944,"Print":43945,"okia":43946,"Ġbarb":43947,"quote":43948,"Lew":43949,"Ġannoun":43950,"istors":43951,"Reading":43952,"ACTION":43953,"Ġintakes":43954,"ĠBeet":43955,"matter":43956,"Swe":43957,"Ther":43958,"Ġtyrant":43959,"ĠPsycho":43960,"ĠDestroy":43961,"Ġesoteric":43962,"Ġbiom":43963,"idious":43964,"Merc":43965,"hran":43966,"ĠBaal":43967,"seconds":43968,"Ġsuperhuman":43969,"ancel":43970,"Ġworshipped":43971,"Ġwebs":43972,"Ġviolet":43973,"ĠMetallic":43974,"eday":43975,"ordering":43976,"Nut":43977,"Ġconstructs":43978,"olescent":43979,"Unit":43980,"otypes":43981,"Ġembryonic":43982,"perm":43983,"Nature":43984,"ĠDecre":43985,"levant":43986,"Ġss":43987,"+(":43988,"ĠDoctrine":43989,"puters":43990,"Ġsaline":43991,"orsche":43992,"1111":43993,"values":43994,"Ġutopian":43995,"ĠBooster":43996,"Technical":43997,"ì":43998,"ĠLIMITED":43999,"nir":44000,"Ġclones":44001,"Performance":44002,"aple":44003,"Ġshudder":44004,"Ġcontempor":44005,"lator":44006,"ĠOops":44007,"Ġammon":44008,"Ġdavid":44009,"Ġbom":44010,"bish":44011,"Ġdetectable":44012,"Ġmultiplying":44013,"Ġreddit":44014,"Prim":44015,"Ġmedial":44016,"Ġsubstrate":44017,"ĠSanskrit":44018,"Spect":44019,"ĠMagical":44020,"Ġarcane":44021,"align":44022,"Ġ1861":44023,"Ġneocons":44024,"Ì":44025,"ĠBounty":44026,"ĠContinent":44027,"Ġhurd":44028,"alions":44029,"Ġgeneralized":44030,"ĠInsect":44031,"Ġsimul":44032,"actual":44033,"advert":44034,"ukong":44035,"Resp":44036,"ĠWarcraft":44037,"Hunter":44038,"hyper":44039,"ĠBreach":44040,"ught":44041,"Ġcomputation":44042,"react":44043,"Feel":44044,"ĠCheong":44045,"Ġslut":44046,"Ġgalactic":44047,"Ġtaunt":44048,"Enjoy":44049,"Ġreprinted":44050,"Word":44051,"ĠHandbook":44052,"amins":44053,"exit":44054,"Wo":44055,"Ġadherents":44056,"Counter":44057,"ĠNode":44058,"ĠTwisted":44059,"Ġgrinned":44060,"universal":44061,"ĠAmon":44062,"Ġaster":44063,"ĠEquip":44064,"!\".":44065,"Ġanalogous":44066,"rients":44067,"alky":44068,"ĠQian":44069,"Ġspont":44070,"docs":44071,"Ġcontemplation":44072,"Ġrevolutionaries":44073,"Ġpreset":44074,"ĠAmendments":44075,"Ġexecutes":44076,"ĠDuration":44077,"Ġcompulsion":44078,"Ġstagger":44079,"ynamic":44080,"blem":44081,"];":44082,"Higher":44083,"Balt":44084,"heast":44085,"Ġcorp":44086,"awei":44087,"Motion":44088,"Mis":44089,"Ġadventurer":44090,"eger":44091,"Ġarsen":44092,"ĠVoltage":44093,"ĠEVENTS":44094,"Salt":44095,"issance":44096,"DK":44097,"Ship":44098,"Ġunwitting":44099,"Ton":44100,"ĠPROGRAM":44101,"Ġtentacles":44102,"erness":44103,"thirst":44104,"Fig":44105,"fty":44106,"ĠTolkien":44107,"Sleep":44108,"ĠExplain":44109,"Pub":44110,"ĠBounce":44111,"ĠDemo":44112,"Ġ1897":44113,"ĠSPI":44114,"intern":44115,"********":44116,"ĠKills":44117,"ĠZombies":44118,"Single":44119,"ratom":44120,"ĠClaw":44121,"hid":44122,"asel":44123,"Shock":44124,"erential":44125,"Ġupgr":44126,"holy":44127,"Ġ\\":44128,"aghetti":44129,"Ġthence":44130,"genic":44131,"papers":44132,"1982":44133,"ravel":44134,"ĠUNIVERS":44135,"Charge":44136,"ĠDelay":44137,"ibrary":44138,"ĠHDD":44139,"olson":44140,"Ġenchanted":44141,"Wr":44142,"graph":44143,"Ġcorro":44144,"ept":44145,"etsu":44146,"ĠQin":44147,"Û":44148,"Ġantidepressant":44149,"ĠCerberus":44150,"Ġappe":44151,"ĠDEFENSE":44152,"Ġdysph":44153,"split":44154,"zilla":44155,"attr":44156,"Clar":44157,"Äĵ":44158,"hov":44159,"IRC":44160,"hibition":44161,"'/":44162,"ĠURLs":44163,"Draft":44164,"Prep":44165,"ĠLanguages":44166,"ĠTravels":44167,"ceiver":44168,"aturally":44169,"pair":44170,"ĠALWAYS":44171,"aaaa":44172,"ĠTenth":44173,"ĠNAD":44174,"Serv":44175,"ĠUID":44176,"cens":44177,"ĠLearned":44178,"Ġtraject":44179,"Ġmoaning":44180,"ĠNare":44181,"Ġingen":44182,"Ġsurn":44183,"Ġfloppy":44184,"breeding":44185,"uph":44186,"rossover":44187,"Understanding":44188,"Glass":44189,"Ġruntime":44190,"gp":44191,"Ġâľĵ":44192,"Ġcyt":44193,"bley":44194,"agall":44195,"Ġunworthy":44196,"otine":44197,"Ġchromosome":44198,"utters":44199,"Ġµ":44200,"Ġexpans":44201,"Ġdement":44202,"Ġinsurrection":44203,"Ġsurviv":44204,"genre":44205,"ospital":44206,"ĠPlato":44207,"ĠTrigger":44208,"selection":44209,"ilege":44210,"Ġsegreg":44211,"itizens":44212,"ĠRAID":44213,"Pure":44214,"hetti":44215,"ĠFailed":44216,"ĠCharacters":44217,"ĠCreep":44218,"akra":44219,"Ec":44220,"ĠAristotle":44221,"Lim":44222,"error":44223,"yrus":44224,"umably":44225,">>":44226,"Ġtsun":44227,"knowledge":44228,"Cert":44229,"bable":44230,"hesion":44231,"ĠProcedures":44232,"Ġmarkup":44233,"ideo":44234,"Ġrhet":44235,"ĠChapters":44236,"ĠChecking":44237,"mega":44238,"Ġphotons":44239,"required":44240,"Unknown":44241,"ĠDrawn":44242,"Ġvari":44243,"EEK":44244,"Ġcompuls":44245,"Ġcloning":44246,"ccoli":44247,"Ġ1070":44248,"Ġkindred":44249,"Ġdiscl":44250,"ĠCind":44251,"Collect":44252,"Ġchromosomes":44253,"phant":44254,"ĠKafka":44255,"Ġeverlasting":44256,"Ġmercenary":44257,"ĠHmm":44258,"----":44259,"riber":44260,"Ġdoubtless":44261,"Ġsusceptibility":44262,"beta":44263,"notice":44264,"Ġcrochet":44265,"Ġrespir":44266,"Ġphilosophers":44267,"ĠExtras":44268,"Ġseparat":44269,"shown":44270,"iblings":44271,"Hispanic":44272,"copy":44273,"Tang":44274,"Knight":44275,"Ġpursu":44276,"ĠAnime":44277,"Ġlipid":44278,"ggies":44279,"levels":44280,"phalt":44281,"ĠCompleted":44282,"bral":44283,"Ġcerv":44284,"ĠAfric":44285,"ĠPhar":44286,"Color":44287,"ogene":44288,"ĠCompan":44289,"memory":44290,"Dust":44291,"ĠXIV":44292,"ĠConsole":44293,"').":44294,"Ġ1888":44295,"byn":44296,"Ġpolygamy":44297,"Auth":44298,"BUT":44299,"istine":44300,"Ġsacr":44301,"Ġabsor":44302,"ijah":44303,"ĠNeural":44304,"olester":44305,"ql":44306,"Already":44307,"Creating":44308,"ĠStarg":44309,"ĠPhilos":44310,"Consider":44311,"Ġrepositories":44312,"cludes":44313,"ĠBuffer":44314,"ĠPerspect":44315,"Ġcomput":44316,"Stew":44317,"iamond":44318,"ĠJudgment":44319,"OVA":44320,"angible":44321,"Ġoxid":44322,"Ġepigen":44323,"Ġsidel":44324,"ĠEag":44325,"devices":44326,"icone":44327,"1920":44328,"atism":44329,"beard":44330,"ĠGujar":44331,"ĠPlaystation":44332,"Ġglances":44333,"ĠCOMPLE":44334,"VERTIS":44335,"ukemia":44336,"Edit":44337,"Tickets":44338,"Square":44339,"ĠSerpent":44340,"Ġtransporter":44341,"MQ":44342,"ĠMongo":44343,"1967":44344,"ibaba":44345,"Ġtimet":44346,"sylvania":44347,"Latin":44348,"osaurs":44349,"Ġhumanoid":44350,"Ġcannabinoid":44351,"Ġdisciple":44352,"Psych":44353,"Ġimpro":44354,"Ġmc":44355,"Raid":44356,"Letter":44357,"ificant":44358,"ĠPortug":44359,"ĠFreem":44360,"Ġappell":44361,"ĠMushroom":44362,"Ġclans":44363,"Ġsinful":44364,"Ġingestion":44365,"ĠDirectory":44366,"abetic":44367,"Ġantigen":44368,"Ġimagin":44369,"mitter":44370,"!!!!!":44371,"ĠDPR":44372,"leness":44373,"\":\"\",\"":44374,"ĠAUTHOR":44375,"Ġgrunt":44376,"Ġflickering":44377,"Cath":44378,"asury":44379,"Ġnozzle":44380,"Secure":44381,"Stre":44382,"ĠBIT":44383,"Ġdeviations":44384,"Professor":44385,"bilt":44386,"ĠConscious":44387,"Ġinterrupts":44388,"ĠMormons":44389,"ĠCutter":44390,"Bed":44391,"ipient":44392,"ĠGhostbusters":44393,"Cart":44394,"endas":44395,"ĠExecution":44396,"ycle":44397,"Ġwedd":44398,"Sold":44399,"Ġvanquished":44400,"Regarding":44401,"Depending":44402,"']":44403,"atron":44404,"oidal":44405,"Cube":44406,"Studio":44407,":/":44408,"ĠExplosion":44409,"activate":44410,"pport":44411,"fuck":44412,"Whe":44413,"Ġsmir":44414,"Ġwidgets":44415,"urses":44416,"izard":44417,")*":44418,"icho":44419,"ĠVersus":44420,"ĠIntroduced":44421,"osaurus":44422,"1977":44423,"forum":44424,"Gray":44425,"Program":44426,"righteous":44427,"endum":44428,"ĠScare":44429,"Ġresists":44430,"*)":44431,"ĠCombo":44432,"Ġsockets":44433,"Ġaston":44434,"LAB":44435,"Ġmutated":44436,"eworld":44437,"DEF":44438,"Trend":44439,"âĢĶ-":44440,"Ġpropagation":44441,"Ġemancipation":44442,"collection":44443,"ĠDifferences":44444,"Tweet":44445,"Ġmajesty":44446,")...":44447,"sylv":44448,"Ġadapters":44449,"Ġmilliseconds":44450,"Jews":44451,"ĠPatreon":44452,"phasis":44453,"ĠHTTP":44454,"onnaissance":44455,"ENDED":44456,"ĠIntro":44457,"qs":44458,"Ġsuperflu":44459,"*.":44460,"Ġminions":44461,"ĠStupid":44462,"Ġspecialization":44463,"ĠPikachu":44464,"Ġappellant":44465,"Training":44466,"circle":44467,"Interest":44468,"Ġfallacy":44469,"ĠDinosaur":44470,"ĠTHEM":44471,"Ġdirectories":44472,"Ġmasturbation":44473,"ĠStain":44474,"1978":44475,"odied":44476,"Ġexqu":44477,"ĠRats":44478,"swick":44479,"Ġemptiness":44480,"ĠXeon":44481,"Ġthereto":44482,"ĠEngels":44483,"ĠSupplement":44484,"Chan":44485,"Ġundead":44486,"ĠNoct":44487,"erest":44488,"ĠQuery":44489,"ĠSOLD":44490,"thritis":44491,"ĠEncounter":44492,"Ġvectors":44493,"Econom":44494,"Rogue":44495,"Ġgelatin":44496,"Rot":44497,"Flickr":44498,"Ġcaching":44499,"Ġloader":44500,"ĠELE":44501,"Ġcamoufl":44502,"Commission":44503,"Ġ1886":44504,"Ġcombos":44505,"ĠAwakening":44506,"Ġfeudal":44507,"Ġasses":44508,"ASY":44509,"atalie":44510,"Ġpanties":44511,"ĠMono":44512,"selves":44513,"Download":44514,"Ġvampires":44515,"------":44516,"ishop":44517,"User":44518,"Ġimperialist":44519,"ĠGOODMAN":44520,"1973":44521,"Vel":44522,"Struct":44523,"ĠUFOs":44524,"drivers":44525,"ĠOptional":44526,"uably":44527,"ĠPrinciple":44528,"verett":44529,"taining":44530,"Ġ1889":44531,"ĠCommunism":44532,"auder":44533,"Keys":44534,"lore":44535,"ĠMedieval":44536,"Hyd":44537,"weapon":44538,"Register":44539,"ĠHighlander":44540,"ĠRFC":44541,"Demon":44542,"ardless":44543,"ĠOrche":44544,"Kick":44545,"pixel":44546,"address":44547,"OUP":44548,"Brain":44549,"ĠMorph":44550,"bash":44551,"ĠANG":44552,"ĠIdle":44553,"ĠLucifer":44554,"Ġcorrelates":44555,"Ġgazed":44556,"colm":44557,"ĠKard":44558,"Solar":44559,"ĠVariable":44560,"ĠPACK":44561,"Ġfuzz":44562,"Ġanonym":44563,"ĠECO":44564,"feature":44565,"ĠEsports":44566,"ĠAnthropology":44567,"cise":44568,"manac":44569,"ĠSupports":44570,"rists":44571,"Quant":44572,"istical":44573,"çļĦ":44574,"Ġdexterity":44575,"monster":44576,"ordial":44577,"Mob":44578,"DEC":44579,"ĠConj":44580,"entric":44581,"1981":44582,"ECTION":44583,"ietal":44584,"ĠUses":44585,"ĠArmageddon":44586,"ĠCapitalism":44587,"Ub":44588,"iazep":44589,"helps":44590,"ouls":44591,"grim":44592,"ĠEthiop":44593,"tesy":44594,"Ġclipboard":44595,"Ġchimpanzees":44596,"PLIC":44597,"Sexual":44598,"wallet":44599,"ĠRect":44600,"ocytes":44601,"ĠHels":44602,"lace":44603,"Damn":44604,"Ġblasp":44605,"ildo":44606,"ĠRober":44607,"APD":44608,"ĠWCS":44609,"ippery":44610,"ellectual":44611,"Ġ$(":44612,"Ġuniverses":44613,"Ġholster":44614,"Ġshading":44615,"Ġinflic":44616,"else":44617,"ĠShiny":44618,"ĠAVG":44619,"Lower":44620,"ĠMayhem":44621,"Originally":44622,"Crypt":44623,"SHARE":44624,"ĠBeir":44625,"!:":44626,"Ġrepentance":44627,"WHAT":44628,".......":44629,"Ġauditory":44630,"aaa":44631,"ĠLoot":44632,"ciples":44633,"Ġcontem":44634,"Ġphoton":44635,"æľ":44636,"omach":44637,"ĠWhedon":44638,"ĠValid":44639,"asonable":44640,"pha":44641,"assad":44642,"ĠPse":44643,"Heat":44644,"Ġplugins":44645,"Ġclenched":44646,"ĠAmeric":44647,"transform":44648,"ĠEnh":44649,"agnetic":44650,"usalem":44651,"sych":44652,"Wed":44653,"replace":44654,"ĠKinect":44655,"shield":44656,"Sax":44657,"ividually":44658,"Ġfunctionally":44659,"Ġ:)":44660,"typically":44661,"Opening":44662,"Fa":44663,"ĠSELECT":44664,"Ġsamurai":44665,"Ġhorde":44666,"entle":44667,"sth":44668,"Changes":44669,"Pin":44670,"ithing":44671,"illance":44672,"ĠEmblem":44673,"ĠMicha":44674,"crypt":44675,"ĠObjective":44676,"ophys":44677,"Ġavg":44678,"poon":44679,"Ġreadable":44680,"ĠRx":44681,"allel":44682,"Sit":44683,"gom":44684,"ureau":44685,"ĠDoodle":44686,"Ġdungeon":44687,"($":44688,"Nintendo":44689,"\"],\"":44690,"Notes":44691,"Grab":44692,"Prosecutors":44693,"Advanced":44694,"Ġ1862":44695,"ĠVeter":44696,"Ġjurisd":44697,"ĠLauncher":44698,"Catal":44699,"udder":44700,"Ġresidues":44701,"Ġregress":44702,"ĠConquer":44703,"osal":44704,"ĠDice":44705,"************":44706,"braska":44707,"ipolar":44708,"Ġathe":44709,"bringing":44710,"Suddenly":44711,"ĠIEEE":44712,"verbs":44713,"Ġdelet":44714,"ipeg":44715,"Previous":44716,"]\"":44717,"Ġsidebar":44718,"illac":44719,"Property":44720,"α":44721,"REP":44722,"Ġauthenticated":44723,"gypt":44724,"uilding":44725,"ĠGing":44726,"Ġwart":44727,"Birth":44728,"Ġobedient":44729,"ĠXuan":44730,"ĠTYPE":44731,"Ġinhibits":44732,"1972":44733,"humans":44734,"IENT":44735,"Ġyoutube":44736,"Shortly":44737,"ophen":44738,"ĠWinc":44739,"ĠWrit":44740,"AUD":44741,"ĠHobbit":44742,"emphasis":44743,"ĠWonders":44744,"Ġtwitch":44745,"ĠProphe":44746,"Berry":44747,"ĠGinny":44748,"ĠBurst":44749,"ĠGenerator":44750,"Ġepile":44751,"ĠBalanced":44752,"GPU":44753,"maps":44754,"Ġneurotrans":44755,"ĠIRC":44756,"Ġ\"$":44757,"Create":44758,"Particip":44759,"ĠMarxism":44760,"Ġthou":44761,"ĠMortal":44762,"Ġ�":44763,"Ġninja":44764,"inburgh":44765,"Ġappro":44766,"ĠPistol":44767,"Jar":44768,"Ġprophes":44769,"classes":44770,"Ġanarchist":44771,"Ġextant":44772,"message":44773,"itaire":44774,"Ġ1863":44775,"ĠProl":44776,"Ġpropell":44777,"Ġimpossibility":44778,"Ġpropos":44779,"itamin":44780,"Rating":44781,"olphin":44782,"Ġmitochond":44783,"versions":44784,"Liberal":44785,"ishy":44786,"Ġspherical":44787,"ĠSurvive":44788,"FREE":44789,"rawler":44790,"Metal":44791,"ĠStarship":44792,"Ġ=================================================================":44793,"ĠDharma":44794,"ĠSeller":44795,"Ġwrapper":44796,"Experience":44797,"Integ":44798,"Customer":44799,"hammad":44800,"Ġunanim":44801,"Jenn":44802,"Ġschizophren":44803,"agree":44804,"ĠEVENT":44805,"Shell":44806,"Ġfractions":44807,"1968":44808,"Ġextermination":44809,"ĠSniper":44810,"Ġpronoun":44811,"ĠHitman":44812,"xp":44813,"resource":44814,"WIND":44815,"Ġhierarchical":44816,"Ġted":44817,"Changing":44818,"Ġplaus":44819,"Transform":44820,"Ġbicy":44821,"imentary":44822,"Fuck":44823,"Mini":44824,"Ġoverc":44825,"ĠOptimus":44826,"outer":44827,"helial":44828,"akening":44829,"fx":44830,"Ġnig":44831,"Ġ+/-":44832,"ĠVICE":44833,"Ġnm":44834,"1976":44835,"ĠRitual":44836,"ĠTyrann":44837,"Ġscriptures":44838,"inical":44839,"ĠNull":44840,"ourgeois":44841,"dra":44842,"Ġpious":44843,"Ġneuron":44844,"Ġcolonists":44845,"ĠNebula":44846,"apply":44847,"Sah":44848,"Marx":44849,"Ġhypotheses":44850,"notation":44851,"acists":44852,"Math":44853,"Manager":44854,"Library":44855,"audi":44856,"Ġmp":44857,"ergic":44858,"Ġwizards":44859,"fw":44860,"DVD":44861,"ĠScala":44862,"Different":44863,"ampoo":44864,"ĠDread":44865,"abbage":44866,"Rus":44867,"ĠDumbledore":44868,"keleton":44869,"elsh":44870,"esian":44871,"ĠCorsair":44872,"Tier":44873,"ĠCelest":44874,"Ġnoun":44875,"Ġlucid":44876,"requisites":44877,"Ġgenus":44878,"Event":44879,"1974":44880,"ĠSatanic":44881,"iox":44882,"ĠHandle":44883,"ĠDestroyer":44884,"Ġinvocation":44885,"ĠXD":44886,"modified":44887,"Gam":44888,"ĠRPC":44889,"Ġsubsystem":44890,"Compared":44891,"odan":44892,"ĠPassive":44893,"ĠHelmet":44894,"nutrition":44895,"riction":44896,"HOW":44897,"Jess":44898,"Ġpiston":44899,"imately":44900,"Ġhypoc":44901,"ĠCelestial":44902,"MRI":44903,"Ġcompiler":44904,"ĠBadge":44905,"ĠRevelation":44906,"Ġintrig":44907,"Grad":44908,"ĠSPACE":44909,"Poly":44910,"ĠVul":44911,"Ġtrembling":44912,"Ġindepend":44913,"doctor":44914,"Certain":44915,"emet":44916,"Password":44917,"Ġgasped":44918,"Ġpronunciation":44919,"Fuel":44920,"ĠSPEC":44921,"assets":44922,"Extra":44923,"Ġformatting":44924,"Ġmods":44925,"\"!":44926,"akedown":44927,"Ġcircuitry":44928,"ĠTRUE":44929,"ĠVeil":44930,"Ġsighed":44931,"Charg":44932,"eals":44933,"Ġworkaround":44934,"Ġank":44935,"ĠScrolls":44936,"Ġdiffusion":44937,"Ġamps":44938,"ĠTempest":44939,"adata":44940,"Ġphenomen":44941,"Ġ???":44942,"Ġpopup":44943,"Ġinhibition":44944,"Ġaliases":44945,"erity":44946,"agraph":44947,"Jew":44948,"Ġbec":44949,"Classic":44950,"comment":44951,"usable":44952,"rodu":44953,"ĠEnlightenment":44954,"Ġinvis":44955,"Ġbiochemical":44956,"latest":44957,"ĠGMOs":44958,"ĠSocialism":44959,"Ġpollut":44960,"Ġeluc":44961,"Js":44962,"orthern":44963,"PDATED":44964,"alyses":44965,"Experts":44966,"Blog":44967,"ĠDemocr":44968,"etooth":44969,"pause":44970,"âĢ¢âĢ¢":44971,"ĠShinji":44972,"Ġdystop":44973,"Sources":44974,"ĠBrach":44975,"np":44976,"ĠXY":44977,"Ġneurot":44978,"assembly":44979,"Ġbourgeois":44980,"ĠReson":44981,"ĠIDE":44982,"Ġrecoil":44983,"raq":44984,"ĠAvenger":44985,"Paper":44986,"UTF":44987,"ĠWrest":44988,"ĠSimulation":44989,"elaide":44990,"ĠDMCA":44991,"utm":44992,"1963":44993,"Ġarcs":44994,"Ġmaximal":44995,"Ġcyl":44996,"Ġphilosoph":44997,"enium":44998,"Ġrelativity":44999,"ĠMacintosh":45000,"Ġpneum":45001,"LOC":45002,"Ġgoddamn":45003,"SHA":45004,"Ġlocalization":45005,"ĠPHI":45006,"Ġhierarch":45007,"Ġatheists":45008,"±":45009,"Luck":45010,"ĠJugg":45011,"options":45012,"alore":45013,"Edward":45014,"Monitor":45015,"Ġneoc":45016,"numbered":45017,"Arc":45018,"ĠCodes":45019,"ĠHallow":45020,"olitan":45021,"sections":45022,"ĠEzek":45023,"Ġamy":45024,"task":45025,"ĠCLS":45026,"ĠValkyrie":45027,"Ġcircumference":45028,"amac":45029,"ĠNotting":45030,"Ġproverb":45031,"Spec":45032,"Ġelemental":45033,"ĠBitcoins":45034,"Except":45035,"Release":45036,"ADVERTISEMENT":45037,"Complete":45038,"phrine":45039,"Ġspores":45040,"random":45041,"neum":45042,"trigger":45043,"ocide":45044,"Ġlongitudinal":45045,"isec":45046,"peat":45047,"Ġprecept":45048,"Wing":45049,"ĠâĹ":45050,"otropic":45051,"mouse":45052,"ĠWitcher":45053,"ĠAppearance":45054,"ROR":45055,"Ġ||":45056,"aird":45057,"Blu":45058,"Ġincomp":45059,"ĠFirefly":45060,"update":45061,"Loc":45062,"Ġnihil":45063,"hesive":45064,"Quality":45065,"youtu":45066,"Seriously":45067,"Ġannot":45068,"ĠCoins":45069,"Visit":45070,"lc":45071,"----------":45072,"Ġdiction":45073,"Ġafore":45074,"Ġimmortality":45075,"ĠForbidden":45076,"Allah":45077,"ĠPartial":45078,"ĠGears":45079,"Ġtrance":45080,"Hat":45081,"irez":45082,"ĠSATA":45083,"Ġelectrode":45084,"ĠLinear":45085,"rikes":45086,"Ġderiv":45087,"ĠXue":45088,"Fine":45089,"ĠIgnore":45090,"desc":45091,"DOM":45092,"Simple":45093,"orescence":45094,"Previously":45095,"Ġcircumcision":45096,"Sphere":45097,"Ġrenown":45098,"SET":45099,"ilight":45100,"ĠByzantine":45101,"EXP":45102,"Ġwhine":45103,"Missing":45104,"Lt":45105,"Guide":45106,"Ġhippocampus":45107,"Ġwip":45108,"yrights":45109,"Ġsubmer":45110,"Maker":45111,"Switch":45112,"Ġspectral":45113,"nect":45114,"Ãį":45115,"Ġreven":45116,"WER":45117,"Adding":45118,"ĠCONTROL":45119,"asper":45120,"0000000":45121,"ynt":45122,"annabin":45123,"ĠAliens":45124,"ĠPCR":45125,"asketball":45126,"ricia":45127,"ĠUnch":45128,"Tap":45129,"Ġpracticable":45130,"ĠUsage":45131,"Ġsoluble":45132,"Scroll":45133,"Random":45134,"Ġmoan":45135,"ĠPuppet":45136,"Dim":45137,"Attack":45138,"Ġspears":45139,"Ġrectangle":45140,"Ġamuse":45141,"ĠDoct":45142,"reon":45143,"ĠReset":45144,"vag":45145,"unin":45146,"ĠBris":45147,"ĠSwarm":45148,"Model":45149,"Standing":45150,"Ġdenotes":45151,"{":45152,"ĠLizard":45153,"nesty":45154,"Ġwor":45155,"Ġamplification":45156,"ĠInferno":45157,"Cover":45158,"SAM":45159,"respective":45160,"Shift":45161,"Ġlibertarians":45162,"Runner":45163,"ĠRevelations":45164,"Spr":45165,"ĠCrusader":45166,"Ġcaffe":45167,"Patch":45168,"stros":45169,"ĠImmortal":45170,"Ġinsofar":45171,"itance":45172,"ĠValhalla":45173,"Ġradial":45174,"Beast":45175,"sync":45176,"Ġ--------":45177,"ĠPathfinder":45178,"iless":45179,"operator":45180,"Choose":45181,"Ġdecode":45182,"Ġvou":45183,"ĠMutant":45184,"ĠCVE":45185,"Female":45186,"Ġoxidation":45187,"inational":45188,"dB":45189,"Scope":45190,"Wan":45191,"ĠBought":45192,"ĠDietary":45193,"rotein":45194,"Present":45195,"aukee":45196,"Ġtotem":45197,"Ġsatur":45198,"wagon":45199,"Builder":45200,"ĠBulg":45201,"Ġsects":45202,"Flo":45203,"ombat":45204,"ĠHermione":45205,"aughs":45206,"Ġhydra":45207,"paren":45208,"ë":45209,"Whereas":45210,"tsky":45211,"Ġchall":45212,"WORK":45213,"opian":45214,"rican":45215,"vati":45216,"ĠHTTPS":45217,"Ġwrink":45218,"Ġthrob":45219,"habi":45220,"Ġiodine":45221,"omorph":45222,"ĠScion":45223,"Hunt":45224,"Written":45225,"iosity":45226,"ĠBrowser":45227,"Ġsinners":45228,"culosis":45229,"Ġunconsciously":45230,"0100":45231,"Ġanarchists":45232,"Pull":45233,"FFER":45234,"Ġpandemonium":45235,"matically":45236,"Rush":45237,"Ġpurified":45238,"ĠCyan":45239,"ĠDifficulty":45240,"«":45241,"Aside":45242,"oggles":45243,"untu":45244,"iege":45245,"iberal":45246,"ĠCOUR":45247,"eteenth":45248,"weeney":45249,"biased":45250,"ĠDecay":45251,"quart":45252,"alysis":45253,"Ġstere":45254,"ellect":45255,"Ġkernels":45256,"juven":45257,"ĠJPEG":45258,"indal":45259,"topic":45260,"Ġidentifier":45261,"åı":45262,"Ġepid":45263,"1969":45264,"Ġpoisons":45265,"sym":45266,"mop":45267,"LOCK":45268,"axe":45269,"cohol":45270,"ctory":45271,"Ġadject":45272,"Skin":45273,"ĠFract":45274,"ĠSHAR":45275,"echo":45276,"thood":45277,"Ġencoding":45278,"Ġrelational":45279,"Len":45280,"Bone":45281,"agara":45282,"uggish":45283,"ĠTanks":45284,"Stats":45285,"lihood":45286,"Mult":45287,"Graph":45288,"ĠCannot":45289,"ĠSpac":45290,"handler":45291,"ĠShit":45292,"Ġmorp":45293,"controller":45294,"udeau":45295,"Screenshot":45296,"Development":45297,"Gear":45298,"Ġtong":45299,"ĠColossus":45300,"rylic":45301,"STRUCT":45302,"capitalist":45303,"Ġsupplementation":45304,"Parts":45305,"pb":45306,"oppy":45307,"pite":45308,"processor":45309,"Ġexplanatory":45310,"Environmental":45311,"Compl":45312,"Gaming":45313,"arently":45314,"Ġconcess":45315,"Ġathlet":45316,"forestation":45317,"orsi":45318,"igmat":45319,"Ġencoded":45320,"misc":45321,"Ġproofs":45322,"ĠRevision":45323,"Ġmathematic":45324,"Ġconstitu":45325,"fficiency":45326,"Ġlightsaber":45327,"gz":45328,"erate":45329,"ournals":45330,"Comment":45331,"Ġpercept":45332,".\"[":45333,"ĠTechniques":45334,"coins":45335,"Shape":45336,"venant":45337,"ĠPrinted":45338,"Native":45339,"ĠGors":45340,"pecting":45341,"ĠDuel":45342,"Ġadmins":45343,"Flor":45344,"ĠDeus":45345,"cham":45346,"ĠRails":45347,"ceptor":45348,"naire":45349,"ĠSquid":45350,"ĠWarranty":45351,"SPEC":45352,"ensis":45353,"FUN":45354,"stellar":45355,"Select":45356,"llular":45357,"arget":45358,"ĠUncharted":45359,"Details":45360,"rison":45361,"Ġsyntax":45362,"chanted":45363,"Ġ-----":45364,"Ġthats":45365,"Registration":45366,"ĠSaber":45367,"ethical":45368,"Ġcryptography":45369,"atown":45370,"Ġdependencies":45371,"nw":45372,"Ġvehement":45373,"Ġrationality":45374,"ĠThou":45375,"Ġ----":45376,"rador":45377,"Ġenh":45378,"ĠCrate":45379,"STATE":45380,"/(":45381,"Ġdelim":45382,"CEPT":45383,"monkey":45384,"pai":45385,"uracy":45386,"Ġmortals":45387,"Sanders":45388,"ĠSeraph":45389,"-\"":45390,"1945":45391,"endix":45392,":'":45393,"ĠLegs":45394,"Exper":45395,"ĠKrypt":45396,"clinton":45397,"Ġuphe":45398,"Vers":45399,"Similarly":45400,"ressor":45401,"leans":45402,"LOG":45403,"cific":45404,"Ġ].":45405,"-)":45406,"resist":45407,"Pred":45408,"Latest":45409,"ilyn":45410,"Ġblob":45411,"Ġdevils":45412,"ĠIllusion":45413,"erella":45414,"Ġyak":45415,"method":45416,"Ġ698":45417,"Shadow":45418,"velt":45419,"Ġsomet":45420,"xc":45421,"Ġtriangles":45422,"netic":45423,"Calling":45424,"ĠDRM":45425,"Ġtriglycer":45426,"Ġinhibited":45427,"Ġnep":45428,"Ġalgebra":45429,"ascar":45430,"laim":45431,"Ġappl":45432,"1971":45433,"Bernie":45434,"Eh":45435,"Ġundefined":45436,"âĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶ":45437,"Sys":45438,"ournaments":45439,"Solid":45440,"Ġhep":45441,"ĠMales":45442,"Agent":45443,"Ġpsychedel":45444,"Wik":45445,"Ġdoctrines":45446,"rection":45447,"Compare":45448,"âĺ":45449,"Ġcertific":45450,"Ġsubstr":45451,"ĠCitation":45452,"ĠAFB":45453,"ĠBecame":45454,"Ġaristocracy":45455,"aryl":45456,"Ġanatomical":45457,"ocumented":45458,"ĠAssy":45459,"ĠFORM":45460,"Traditional":45461,"azines":45462,"Content":45463,"furt":45464,"Ġscripting":45465,"Ġcloaked":45466,"Ġunint":45467,"ĠCivilization":45468,"Desktop":45469,"ĠRagnar":45470,"Ġcurses":45471,"Ġobservable":45472,"ĠSpock":45473,"ĠPyr":45474,"Ġelectrom":45475,"ĠLump":45476,"oresc":45477,"ĠAttribution":45478,"egal":45479,"achusetts":45480,"Ġmarqu":45481,"âϦ":45482,"Ġcursor":45483,"ascist":45484,"1966":45485,"edit":45486,"lisher":45487,"ocyte":45488,"Writer":45489,"BILITIES":45490,"ĠUpload":45491,"Ġtreacher":45492,"Ġrecomb":45493,"Ġknights":45494,"Ġimmutable":45495,"ĠPly":45496,"Ġatten":45497,"ĠPassed":45498,"Flying":45499,"icipated":45500,"querade":45501,"ĠZot":45502,"CRE":45503,"ĠCursed":45504,"ickr":45505,"ĠDroid":45506,"thereum":45507,"Ġadjective":45508,"DIT":45509,"Ġtob":45510,"Ġinit":45511,"ĠPenet":45512,"Ġignor":45513,"Ġexalted":45514,"ĠDwell":45515,"assemb":45516,"Ġsentient":45517,"Ġ``":45518,"ĠGoo":45519,"Professional":45520,"othing":45521,"rupted":45522,"olics":45523,"ĠSetup":45524,"Thu":45525,"Campaign":45526,"Secondly":45527,"clipse":45528,"hibit":45529,"amate":45530,"SUP":45531,"ĠSuppose":45532,"submit":45533,"ĠDebian":45534,"Ġantid":45535,"Ġentert":45536,"ysical":45537,"ĠGladiator":45538,"ĠSTL":45539,"ĠBugs":45540,"ĠMech":45541,"ĠCoffin":45542,"itored":45543,"ICLE":45544,"Mist":45545,"Ġinfall":45546,"votes":45547,"actly":45548,"Occ":45549,"ĠConquest":45550,"alach":45551,"Ġintertw":45552,"reverse":45553,"amiya":45554,"icularly":45555,"edom":45556,"ĠLuxem":45557,"Fra":45558,"urrencies":45559,"Ġnobility":45560,"Tab":45561,"Beer":45562,"Ġ10000":45563,"Ġincor":45564,"Ġmelanch":45565,"Depth":45566,"Firstly":45567,"usr":45568,"ĠWiki":45569,"hhhh":45570,"ĠProxy":45571,"Ġantagonists":45572,"Ġtransistor":45573,"ĠRelic":45574,"ĠPrometheus":45575,"Ġ1280":45576,"Coun":45577,"ĠMedals":45578,"stats":45579,"Assembly":45580,"inished":45581,"cemic":45582,"Ġadventurers":45583,"Ġcd":45584,"Supporters":45585,"ĠYs":45586,"])":45587,"Ġneglig":45588,"Request":45589,"Ġwhore":45590,"Ġovercl":45591,"_-":45592,"partial":45593,"amd":45594,"Ġfructose":45595,"Ġdivid":45596,"Administ":45597,"amples":45598,"Boo":45599,"akery":45600,"owered":45601,"hester":45602,"Links":45603,"GROUND":45604,"ethy":45605,"Ġincarcer":45606,"Ġincap":45607,"Drag":45608,"ĠElastic":45609,"âĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶâĢĶ":45610,"Ultra":45611,"AAAA":45612,"Order":45613,"ĠMysteries":45614,"Ġcanonical":45615,"Ign":45616,"Ġanimate":45617,"wegian":45618,"ggle":45619,"Hash":45620,"Arg":45621,"verty":45622,"Ġanalges":45623,"ouver":45624,"ittees":45625,"ĠAsgard":45626,"______":45627,"Mix":45628,"1964":45629,"Rate":45630,"Ġarousal":45631,"pheus":45632,"undai":45633,"hetamine":45634,"ĠMysterious":45635,"Alright":45636,"ĠHerod":45637,"riott":45638,"ĠAnarchy":45639,"ĠArche":45640,"Question":45641,"Chapter":45642,"Token":45643,"ĠSphere":45644,"Ġinduces":45645,"Audio":45646,"Normal":45647,"Ġprophe":45648,"ĠValiant":45649,"Tag":45650,"Relations":45651,"Ġblinked":45652,"onyms":45653,"ĠVortex":45654,"Ġdb":45655,"emonic":45656,"Phase":45657,"Ġkingdoms":45658,"Twe":45659,"ĠLORD":45660,"plementation":45661,"ĠConstantinople":45662,"helm":45663,"ĠFlesh":45664,"Ġthumbnail":45665,"ledged":45666,"ĠPROG":45667,"Ġdisbel":45668,"ĠLikes":45669,"ĠGamer":45670,"renches":45671,"hattan":45672,"Index":45673,"pecially":45674,"ĠJiu":45675,"Ġwhats":45676,"erion":45677,"xf":45678,"ĠPerception":45679,"Alien":45680,"Capt":45681,"ãĢĤ":45682,"joining":45683,"nesium":45684,"ĠSocrates":45685,"Icon":45686,"animate":45687,"ocalypse":45688,"ĠTactics":45689,"assador":45690,"Veh":45691,"src":45692,",-":45693,"Ġvisc":45694,"ĠDiscord":45695,"initial":45696,"atana":45697,"Size":45698,"Claim":45699,"ffect":45700,"iciary":45701,"Ġturret":45702,"reset":45703,"Ï":45704,"wrap":45705,"ulnerability":45706,"ĠInsert":45707,"Ġirrad":45708,"ognitive":45709,"clips":45710,"uncle":45711,"chemy":45712,"ottesville":45713,"Write":45714,"earances":45715,"1965":45716,"MIC":45717,"Ġmanag":45718,"Ġtelesc":45719,"Termin":45720,"Guest":45721,"Ġdenote":45722,"Failure":45723,"ograp":45724,"âĢķ":45725,"Ġscrolls":45726,"ĠArmored":45727,"Ġrecomp":45728,"Ġplaceholder":45729,"ĠISBN":45730,"ĠBelief":45731,"emporary":45732,"Asset":45733,"arcer":45734,"haar":45735,"assium":45736,"%:":45737,"ernal":45738,"ĠLv":45739,"atible":45740,"Pand":45741,"oubted":45742,"Lie":45743,"bial":45744,"STEP":45745,"Ġpresets":45746,"Ġstatist":45747,"Sund":45748,"reshold":45749,"endium":45750,"\");":45751,"Software":45752,"Ġbasal":45753,"ĠYose":45754,"Ġmortg":45755,"ocry":45756,"Ġsubreddit":45757,"omorphic":45758,"ĠLoaded":45759,"berra":45760,"vg":45761,"orkshire":45762,"ĠChrys":45763,"Repeat":45764,"ĠSimulator":45765,"rx":45766,"gex":45767,"Linux":45768,"ĠInstruct":45769,"irable":45770,"Ġmosquit":45771,"ĠManga":45772,"iOS":45773,"Ġsynt":45774,"Ġclitor":45775,"Ġlobe":45776,"ĠDelete":45777,"CVE":45778,"fortunately":45779,"Enc":45780,"vertising":45781,"Ġanten":45782,"Ġfif":45783,"Study":45784,"prev":45785,"ossus":45786,"Nar":45787,"Decl":45788,"erala":45789,"ĠPrototype":45790,"UGE":45791,"1001":45792,"Ġ---------":45793,"deals":45794,"odcast":45795,"TPS":45796,"Ġcodec":45797,"ittee":45798,"isexual":45799,"ĠBreaker":45800,"menu":45801,"ĠURI":45802,"('":45803,"ĠFiorina":45804,"ĠApostles":45805,"ĠWitches":45806,"raint":45807,"addafi":45808,"ersive":45809,"yrim":45810,"Ġmosa":45811,"Ġrog":45812,"Ear":45813,"âĺħ":45814,"Ġcaloric":45815,"matical":45816,"yrics":45817,"ĠKrugman":45818,"axter":45819,"1016":45820,"Ġsep":45821,"ĠExtend":45822,"ropolitan":45823,"thren":45824,"ologne":45825,"atomic":45826,"Naturally":45827,"Pros":45828,"gencies":45829,"akens":45830,"Male":45831,"Ġcausation":45832,"omnia":45833,"Comments":45834,"eeee":45835,"iquette":45836,"Ġcytok":45837,"ename":45838,"details":45839,"Ġdestruct":45840,"leep":45841,"ĠCavern":45842,"ĠInvention":45843,"ueless":45844,"Ġsubsection":45845,"outhern":45846,"metic":45847,"blogs":45848,"ĠPacks":45849,"ĠArduino":45850,"hhh":45851,"elligence":45852,"imity":45853,"ĠUltron":45854,"astrous":45855,"Ġbiome":45856,"ĠHover":45857,"Ġprivile":45858,"igham":45859,"apest":45860,"ĠYoshi":45861,"Artist":45862,".\",":45863,"gamer":45864,"Virgin":45865,"Tea":45866,"ĠDoomsday":45867,"ĠðŁĻĤ":45868,"terday":45869,"ĠCommando":45870,"ĠAchieve":45871,"chrom":45872,"Ġcryptographic":45873,"Ġrebell":45874,"Specifically":45875,"â̦â̦â̦â̦":45876,"ĠEternity":45877,"Ġemulation":45878,"ĠSERV":45879,"ĠMiscellaneous":45880,"ĠParticipant":45881,"duc":45882,"vp":45883,"ĠSparkle":45884,"ategories":45885,"Ġdecrypt":45886,"ĠGNOME":45887,"activation":45888,"Ġanarch":45889,"owler":45890,"adiator":45891,"itars":45892,"ĠTHEN":45893,")\",":45894,"åħ":45895,"Ġembod":45896,"vae":45897,"âĺĨ":45898,"Member":45899,"Ġrm":45900,"nyder":45901,"ĠLeviathan":45902,"Gaza":45903,"erenn":45904,"Chicken":45905,"ĠDefinitive":45906,"ĠBolshe":45907,"ĠJagu":45908,"gorith":45909,"loader":45910,"exe":45911,".........":45912,"ĠReceived":45913,"ĠProto":45914,"ĠLocked":45915,"Posts":45916,"ankind":45917,"Clock":45918,"ĠCLI":45919,"Throw":45920,"dL":45921,"epad":45922,"ĠAtmosp":45923,"Ġmk":45924,"ĠSteal":45925,"uple":45926,"reference":45927,"ĠGNU":45928,"adelphia":45929,"scripts":45930,"ilaterally":45931,"ĠMods":45932,"odus":45933,"ignty":45934,"REF":45935,"Ġhypothesized":45936,"issors":45937,"Ġanus":45938,"HUD":45939,"rices":45940,"Draw":45941,"Computer":45942,"Below":45943,"uthor":45944,"ĠTact":45945,"=$":45946,"00000000":45947,"Ġcaut":45948,"Sharp":45949,"depend":45950,"Ġtatt":45951,"Goal":45952,"Sounds":45953,"zona":45954,"anyon":45955,"ricanes":45956,"ĠUSAF":45957,"Jump":45958,"Bottom":45959,"etermination":45960,"ĠPles":45961,"Ġhypothes":45962,"Reference":45963,"Ġswall":45964,"Ġmaneu":45965,"rifice":45966,"ĠVeh":45967,"Ġtex":45968,"geoning":45969,"ĠâľĶ":45970,"Mach":45971,"eanor":45972,"%);":45973,"archives":45974,"Ġencyclopedia":45975,"ĠPreferences":45976,"damage":45977,"Done":45978,"Ġcoefficient":45979,"ĠCreatures":45980,"Ġital":45981,"ivari":45982,"Revolution":45983,"Ġnob":45984,"Diff":45985,"Ġabbre":45986,"Writ":45987,"ĠDOS":45988,"redd":45989,"Ġsplend":45990,"orest":45991,"flame":45992,"Ġdevs":45993,"Ġ==":45994,"ĠPuzzle":45995,"Ġgit":45996,"MOD":45997,"ĠArgument":45998,"ĠAbyss":45999,"Studies":46000,"ophob":46001,"uild":46002,"scill":46003,"fp":46004,"Ġplur":46005,"Delete":46006,"ĠFALSE":46007,"FIL":46008,"Ġmicrobiota":46009,"ĠIPv":46010,"Stud":46011,"ortal":46012,"ĠDivinity":46013,"ounter":46014,"ä¸":46015,"Naz":46016,"stals":46017,"ihilation":46018,"Ġpersecut":46019,"ĠPlanes":46020,"viation":46021,"Driver":46022,"ĠEEG":46023,"Unity":46024,"Premium":46025,"ĠSiren":46026,"ĠPaleo":46027,"earchers":46028,"Pract":46029,"Ö":46030,"VII":46031,"mosp":46032,"Ġidentifiers":46033,"Near":46034,"achu":46035,"Apps":46036,"tackle":46037,"COLOR":46038,"Ġperpendicular":46039,"viks":46040,"ecided":46041,"ĠDota":46042,"icons":46043,"Ġpsi":46044,"Brave":46045,"Ġunimagin":46046,"ĠATI":46047,"OOL":46048,"Gender":46049,"ĠSwords":46050,"oples":46051,"Rank":46052,"olphins":46053,"Ġdeities":46054,"ĠXIII":46055,"м":46056,"ĠKraken":46057,"ĠLEVEL":46058,"stasy":46059,"ĠBabel":46060,"Hours":46061,"Avoid":46062,"Mech":46063,"Multi":46064,"Ġect":46065,"Occup":46066,"panic":46067,"Ġmutants":46068,"Evidence":46069,"Tips":46070,"Ġvolts":46071,"Exit":46072,"xb":46073,"planet":46074,"avez":46075,"features":46076,")]":46077,"lol":46078,"ĠNeph":46079,"ĠSanct":46080,"Ġimpover":46081,"................................":46082,"Sty":46083,"Email":46084,"Torrent":46085,"Ġgluc":46086,"ĠSins":46087,"ĠIncarn":46088,"ĠWITHOUT":46089,"ĠPanzer":46090,"ĠAssignment":46091,"versible":46092,"Strange":46093,"ITNESS":46094,"incible":46095,"ZX":46096,"ĠMySQL":46097,"Ġconson":46098,"Ġoxidative":46099,"Machine":46100,"Impro":46101,"Parent":46102,"ĠMetroid":46103,"Educ":46104,"Ġdismant":46105,"dx":46106,"ĠPersona":46107,"ĠHDL":46108,"Americ":46109,"Users":46110,"Ġeighteenth":46111,"WARNING":46112,"ĠLists":46113,"ĠCanter":46114,"ĠTrotsky":46115,"Ġhaha":46116,"]'":46117,"ĠEncyclopedia":46118,"admin":46119,"ĠACTIONS":46120,"idav":46121,"ο":46122,"ĠFTP":46123,"Ġquar":46124,"ongyang":46125,"â̦â̦â̦â̦â̦â̦â̦â̦":46126,"Ġsynchronization":46127,"DEM":46128,"riched":46129,"Ġnegro":46130,"Bench":46131,"Ġfilament":46132,"Ġdecoding":46133,"obj":46134,"Ġjoystick":46135,"Decre":46136,"ĠBolshevik":46137,"Virtual":46138,"ĠSacrament":46139,"xd":46140,"BILL":46141,"-+-+":46142,"¶":46143,"anchester":46144,"Pokemon":46145,"Ġslic":46146,"iameter":46147,"errilla":46148,"Exactly":46149,"\"'":46150,"getic":46151,"3333":46152,"solete":46153,"Ġincorpor":46154,"Ġio":46155,"------------":46156,"Ġantiquity":46157,"ATURES":46158,"Policy":46159,"oppable":46160,"Ġ=>":46161,"ODUCT":46162,"otide":46163,"Ú":46164,"Ġnormative":46165,"Fac":46166,"Ġshaman":46167,"element":46168,"Plex":46169,"INTER":46170,"etsk":46171,"ĠGauntlet":46172,"ĠBIOS":46173,"×ķ":46174,"riet":46175,"Rew":46176,"uristic":46177,"urches":46178,"ĠChomsky":46179,"ixir":46180,"package":46181,"Owner":46182,"Ġschematic":46183,"Assistant":46184,"Ġemanc":46185,"Ġarchetype":46186,"Initial":46187,"intent":46188,"Ġfilib":46189,"ispers":46190,"Flag":46191,"Tank":46192,"Ġinsurg":46193,"Ġapproximation":46194,"Ġsemantic":46195,"Ġsubtitle":46196,"Font":46197,"Ġintimid":46198,"Ġhath":46199,"tools":46200,"gob":46201,"Process":46202,"slave":46203,"ĠJUSTICE":46204,"âĻ¥":46205,"ĠHardcore":46206,"Discover":46207,"Ġexch":46208,"ptive":46209,"units":46210,"ĠDjango":46211,"itudinal":46212,"Ġpc":46213,"akespeare":46214,"ospace":46215,"Ġhorny":46216,"auth":46217,"ĠSkyrim":46218,"ENGTH":46219,"perors":46220,"ĠVulkan":46221,"Ġchimpan":46222,"Ġremem":46223,"Ġopacity":46224,"Ġ:(":46225,"ushima":46226,"Ġawoken":46227,"Ġsacrament":46228,"Beginning":46229,"escape":46230,"Anim":46231,"Ġadvant":46232,"ĠRequires":46233,"output":46234,"Ġdroid":46235,"Yep":46236,"rieving":46237,"Ġpt":46238,"ĠShotgun":46239,"ĠOsiris":46240,"disabled":46241,"ĠRadius":46242,"Medium":46243,"ĠScient":46244,"ĠRept":46245,"ymm":46246,"Ġcp":46247,"ĠLabyrinth":46248,"poral":46249,"Ġ'(":46250,"Hack":46251,"ĠTechnique":46252,"/,":46253,"Ġambig":46254,"Basic":46255,"Ġretrie":46256,"VICE":46257,"BIP":46258,"ragon":46259,"phies":46260,"uminum":46261,"ĠFei":46262,"lesi":46263,"Ġsemantics":46264,"ĠHz":46265,"ĠUnderworld":46266,"Ġendot":46267,"olesterol":46268,"ourning":46269,"Ġcaches":46270,"ĠYug":46271,"Legendary":46272,"ĠDocumentation":46273,"ĠSpiral":46274,"ĠClone":46275,"bnb":46276,"ĠâĶ":46277,"ustom":46278,"Mp":46279,"gettable":46280,"agonist":46281,"Ġneuronal":46282,"culus":46283,"enum":46284,"cules":46285,"Ġmuttered":46286,"ctica":46287,"necess":46288,"ĠSubtle":46289,"Ġsolder":46290,"Environment":46291,"oneliness":46292,"orage":46293,"â̦.\"":46294,"nesota":46295,"agements":46296,"Ùİ":46297,"WHERE":46298,"ĠGDDR":46299,"Scient":46300,"ĠMulcair":46301,"ĠRena":46302,"________________________________________________________________":46303,"antics":46304,"Ġtorped":46305,"Brow":46306,"ossal":46307,"Category":46308,"Regular":46309,"remote":46310,"ãģ":46311,"ĠCoil":46312,"ritch":46313,"specified":46314,"Average":46315,"Ġfingert":46316,"entity":46317,"atibility":46318,"ampunk":46319,"ĠScriptures":46320,"Ġunequ":46321,"arettes":46322,"arching":46323,"Ġastron":46324,"Ġnumeric":46325,"ĠeBook":46326,"remove":46327,"onday":46328,"Ġmetaphysical":46329,"ĠGoku":46330,"Element":46331,"ĠRuin":46332,"Norm":46333,"Ġtox":46334,"puff":46335,"Ġharmonic":46336,"ĠAgility":46337,"ĠHearthstone":46338,"Ġmana":46339,"Points":46340,"Ġconduc":46341,"ĠPersia":46342,"-----":46343,"license":46344,"Application":46345,"assert":46346,"Reader":46347,"ĠSacrifice":46348,"float":46349,"inctions":46350,"byter":46351,"Ġfundament":46352,"\"â̦":46353,"Fourth":46354,"Effective":46355,"ĠMeow":46356,"ĠErrors":46357,"ĠIcar":46358,"ĠMMO":46359,"Ġapostles":46360,"Ġfaintly":46361,"component":46362,"bably":46363,"uggage":46364,"ĠMPG":46365,"krit":46366,"container":46367,"ixture":46368,"ĠPOV":46369,"izabeth":46370,"onut":46371,"isdom":46372,"trace":46373,"ĠSDL":46374,"Interestingly":46375,"ĠExplan":46376,"lesiastical":46377,"ternal":46378,"Bug":46379,"Ġmetabolites":46380,"geries":46381,"Ġsupra":46382,"ĠMakoto":46383,"orget":46384,"racuse":46385,"][":46386,"ĠPrelude":46387,"peria":46388,"tube":46389,"ĠCatalog":46390,"ĠGoblin":46391,"QUEST":46392,"ĠINCLUD":46393,"ĠVERS":46394,"erguson":46395,"Ġcommandments":46396,"ĠUDP":46397,"itle":46398,"ι":46399,"domain":46400,"roximately":46401,"ĠTLS":46402,"ongevity":46403,"Ġmodulation":46404,"Ġdidnt":46405,"ĠCalories":46406,"Applications":46407,"ormon":46408,"Ġsd":46409,"dullah":46410,"Ġcous":46411,"ĠDARK":46412,"clip":46413,"ĠPsychiat":46414,"ĠTanz":46415,"ĠCharisma":46416,"ĠMerge":46417,"ĠKDE":46418,"requires":46419,"urdue":46420,"Ġdecimal":46421,"Ġâī¥":46422,"ĠAuth":46423,"ebted":46424,"ĠTempl":46425,"ĠâĢº":46426,"Ultimate":46427,"Ġmammalian":46428,"advertising":46429,"Ġdominion":46430,"Ġacron":46431,"ĠWem":46432,"ĠHeist":46433,"oiler":46434,"FLAG":46435,"ovember":46436,"Syn":46437,"Ġgodd":46438,"ĠPyth":46439,"Ġglyc":46440,"ĠHelpful":46441,"Ġgad":46442,"chedel":46443,"Similar":46444,"Ġ¶":46445,"Ġnp":46446,"ĠREPL":46447,"Fill":46448,"ĠSunder":46449,"etsy":46450,"ĠPAX":46451,"ĠFemales":46452,"ĠKingdoms":46453,"Ġwhistlebl":46454,"Hide":46455,"serial":46456,"ĠEnemies":46457,"ĠPeb":46458,"Ġpiety":46459,"ifact":46460,"esity":46461,"bsite":46462,"esides":46463,"Ġported":46464,"Ġamygdala":46465,"ĠGerr":46466,"afety":46467,"Ġadip":46468,"(\"":46469,"Ġcf":46470,"Ġurl":46471,"unia":46472,"icro":46473,"Austral":46474,"ĠConfig":46475,"accompanied":46476,"isite":46477,"Ġtextual":46478,"\">":46479,"Ġanecd":46480,"Ġ\",":46481,"angular":46482,"ĠUnicode":46483,"Proof":46484,"Ġmultiplication":46485,"Address":46486,"Ġbytes":46487,"lems":46488,"uterte":46489,"Episode":46490,"oshop":46491,"ritical":46492,"Adjust":46493,"argument":46494,"\\'":46495,"Rober":46496,"pection":46497,"Agg":46498,"äº":46499,"interrupted":46500,"ĠDebor":46501,"Ġlair":46502,"Various":46503,"isively":46504,"ĠStatic":46505,"ohyd":46506,"ĠEchoes":46507,"UID":46508,"raught":46509,"Bott":46510,"Ġapostle":46511,"ĠCentauri":46512,"oxicity":46513,"ibling":46514,"Ġparalle":46515,"inav":46516,"Crit":46517,"ĠTyph":46518,"Ġhig":46519,"ĠEDITION":46520,"Ġcoord":46521,"uish":46522,"sectional":46523,"inki":46524,"Title":46525,"anyahu":46526,"osterone":46527,"Ġdesper":46528,"ribly":46529,"Legend":46530,"afort":46531,"Org":46532,"Ġempir":46533,"ĠQuake":46534,"SSL":46535,"ioxide":46536,"åľ":46537,"Ġenz":46538,"urtle":46539,"BSD":46540,"Rust":46541,"ospels":46542,"Rare":46543,"Ġpartitions":46544,"Ġheresy":46545,"overy":46546,"Ġmonop":46547,"Pixel":46548,"odder":46549,"Option":46550,"withstanding":46551,"Transfer":46552,"Ġarrog":46553,"skip":46554,"ĠSSH":46555,"ĠSph":46556,"Ġcallback":46557,"PIN":46558,"Ġpdf":46559,"Ġplaint":46560,"cipled":46561,"reenshots":46562,"Ġparsing":46563,"::::::::":46564,"ioxid":46565,"Ġhereafter":46566,"ĠFunctions":46567,"ĠBulgar":46568,"Ġintu":46569,"DOC":46570,"Location":46571,"Hyper":46572,"ageddon":46573,"Evil":46574,"illions":46575,"Introduction":46576,"Physical":46577,"ĠLayout":46578,"âķ":46579,"------------------------":46580,"ĠRodham":46581,"ĠPatterns":46582,"Delivery":46583,"Ġdistur":46584,"ĠVolunte":46585,"ĠGUI":46586,"Ġclen":46587,"Ġinacc":46588,"ĠBallistic":46589,"ĠSprite":46590,"Privacy":46591,"theme":46592,"dump":46593,"ĠByte":46594,"ĠIncre":46595,"apult":46596,"ĠWrath":46597,"ensibly":46598,"NOTE":46599,"ounge":46600,"ustomed":46601,"ochond":46602,"ĠQt":46603,"Primary":46604,"Ġsidew":46605,"Root":46606,"gregation":46607,"SQL":46608,"ĠSOFTWARE":46609,"Gallery":46610,"ĠDungeon":46611,"ĠVengeance":46612,"->":46613,"steam":46614,"Ġfrivol":46615,"Ġpid":46616,"filter":46617,"Ġfacult":46618,"doms":46619,"Tool":46620,"1959":46621,"Ġprefix":46622,"Ġcomma":46623,"relative":46624,"Ġformatted":46625,"appropriately":46626,"Ġmd":46627,"xxx":46628,"ĠAuthentication":46629,"ĠWTC":46630,"Ġvulner":46631,"reditary":46632,"Steam":46633,"Tx":46634,"ĠGHC":46635,"Increased":46636,"forcement":46637,"ĠGuant":46638,"bernatorial":46639,"Entry":46640,"ĠWarp":46641,"ĠCreature":46642,"ĠAmmunition":46643,"Ġclust":46644,"ĠInher":46645,"Ġunbel":46646,"RGB":46647,"ĠMankind":46648,"ĠPlague":46649,"Ġ=================================":46650,"psc":46651,"Intern":46652,"tml":46653,"ĠCrusade":46654,"inflamm":46655,"Storage":46656,"token":46657,"inse":46658,"False":46659,"Adult":46660,"Pokémon":46661,"PLIED":46662,"Ġglac":46663,"ĠDwarf":46664,"sequence":46665,"Ġmagnification":46666,"ĠIlluminati":46667,"hedral":46668,"param":46669,"regon":46670,".\",\"":46671,"Eva":46672,"igree":46673,"Object":46674,"Ġoptimizations":46675,"uador":46676,"mmmm":46677,"ullivan":46678,"Ġ[\"":46679,"ĠDusk":46680,"Ġtrig":46681,"Ġiss":46682,"Ġhypert":46683,"Ġperspect":46684,"Ġassum":46685,":,":46686,"Ġinterpol":46687,"Asked":46688,"Boot":46689,"LIB":46690,"Loading":46691,"Ident":46692,"upuncture":46693,"ioch":46694,"Ġprefrontal":46695,"delay":46696,"ĠPoké":46697,"bestos":46698,"overe":46699,"Elf":46700,"eteria":46701,"ĠSneak":46702,"bians":46703,"ĠARTICLE":46704,"Xbox":46705,"encrypted":46706,"ync":46707,"ĠNietzsche":46708,"Nonetheless":46709,"Ġ±":46710,"ĠPrimal":46711,"ĠFlare":46712,"Ġconflic":46713,"ĠRune":46714,"Tes":46715,"cellence":46716,"Mega":46717,"ĠEntity":46718,"chrome":46719,"iatures":46720,"Ġuninstall":46721,"Winner":46722,"aimon":46723,"Ġhomebrew":46724,"Ruby":46725,"araoh":46726,"itime":46727,"Ġpotion":46728,"ĠAllows":46729,"ogyn":46730,"osuke":46731,"Limited":46732,"Ġmacros":46733,"ERROR":46734,"gling":46735,"Ġtodd":46736,"repre":46737,"ĠSakura":46738,"erker":46739,"items":46740,"FIG":46741,"ĠUnle":46742,"Ġhardness":46743,"Split":46744,"Ġarous":46745,"ocally":46746,"Ġì":46747,"ĠEVE":46748,"pleasant":46749,"ihil":46750,"ĠRouter":46751,"ĠLucius":46752,"readable":46753,"Ġtremb":46754,"Dro":46755,"Ġblaster":46756,"Ġbourgeoisie":46757,"NUM":46758,"Alternative":46759,"flags":46760,"GAME":46761,"ebook":46762,"ĠIPM":46763,"Ġcorrel":46764,"Setting":46765,"Frame":46766,"Ġatheism":46767,"Interested":46768,"Liquid":46769,"stanbul":46770,"Lv":46771,"Ġtits":46772,"Ġdc":46773,"×Ļ×":46774,"Ġdoctr":46775,"background":46776,"tsy":46777,"ĠCtrl":46778,"ĠCompatibility":46779,"idae":46780,"example":46781,"perture":46782,"Ġguid":46783,"ĠWinged":46784,"Command":46785,"ridor":46786,"bool":46787,"comments":46788,"ĠImmunity":46789,"Nit":46790,"Statement":46791,"Ġmanif":46792,"ĠIntake":46793,"Bloom":46794,"txt":46795,"context":46796,"input":46797,"achus":46798,"proc":46799,"Ñĭ":46800,"Ġdisemb":46801,"ospons":46802,"utical":46803,"ĠRender":46804,"Ironically":46805,"ursday":46806,"ĠExile":46807,"lishes":46808,"iets":46809,"orescent":46810,"cair":46811,"ĠSubjects":46812,"ĠDungeons":46813,"Ġiii":46814,"neapolis":46815,"ĠBlaster":46816,"Ġphp":46817,"ORED":46818,"ĠSLI":46819,"Ġelig":46820,"ĠIdentified":46821,"ĠBrawl":46822,"bytes":46823,"ĠCTR":46824,"Ġsched":46825,"Assuming":46826,"Bound":46827,"ĠMathemat":46828,"razil":46829,"ĠAstral":46830,"mble":46831,"untled":46832,"Ġmech":46833,"ĠDagger":46834,"ĠUseful":46835,"nesday":46836,"tarians":46837,"AMY":46838,"Camera":46839,"node":46840,"pict":46841,"ginx":46842,"Ġyea":46843,">>>>>>>>":46844,"paragraph":46845,"ĠSupplementary":46846,"9999":46847,"ĠAlchemist":46848,"uzzle":46849,"igun":46850,"ĠCalculator":46851,"ĠApplicant":46852,"hift":46853,"ĠGPL":46854,"Ġencode":46855,"Crash":46856,"ĠNutr":46857,"kHz":46858,"TABLE":46859,"intestinal":46860,"andom":46861,"archive":46862,"Ëľ":46863,"Registered":46864,"Questions":46865,"Remote":46866,"ethyst":46867,"Ġgren":46868,"ĠTexture":46869,"Ġseiz":46870,"Anyway":46871,"ĠVariant":46872,"ê":46873,"Adapt":46874,"ittered":46875,"meta":46876,"ambers":46877,"ĠRuins":46878,"ĠChimera":46879,"password":46880,"ĠReboot":46881,"Ġcaster":46882,"Ġamplitude":46883,"Position":46884,"Ġnotation":46885,"Ġsecretion":46886,"Excellent":46887,"delete":46888,"aminer":46889,"ä»":46890,"Exec":46891,"ĠKenobi":46892,"Interview":46893,"ontent":46894,"ospel":46895,"Ġtuber":46896,"CONT":46897,"roups":46898,"Ġemulator":46899,"Ġjava":46900,"0200":46901,"Ġnested":46902,"Ġfert":46903,")).":46904,"Dex":46905,"ĠSora":46906,"Ġpotions":46907,"ĠAnon":46908,"aah":46909,"Ġdunno":46910,"Ġμ":46911,"Ġmethodological":46912,"itles":46913,"phia":46914,"Beg":46915,"Rules":46916,"ĠXML":46917,"Ġflask":46918,"ĠShogun":46919,"Ġ2048":46920,"atchewan":46921,"Ġfuckin":46922,"Built":46923,"Ġbour":46924,"Ġdisag":46925,"yss":46926,"ĠÏ":46927,"Spoiler":46928,"Wiki":46929,"Ġmorphology":46930,"Ġendors":46931,"Ġdungeons":46932,"dragon":46933,")),":46934,"Ġhous":46935,"Ġoverwhel":46936,"SAY":46937,"abwe":46938,"--------------------------------":46939,"Ġepist":46940,"Ġpalp":46941,"ĠExtensions":46942,"ĠMistress":46943,"ĠUkrain":46944,"================":46945,"edience":46946,"abama":46947,"ĠLua":46948,"ĠOffline":46949,"ĠKonami":46950,"unicip":46951,"ĠMachina":46952,"Specific":46953,"Ġpresupp":46954,"ĠGEAR":46955,"rition":46956,"rences":46957,"successfully":46958,"Ġ1024":46959,"Platform":46960,"}}":46961,"clude":46962,"roxy":46963,"Ġpromot":46964,"ĠAdapter":46965,"rocal":46966,"ĠMasquerade":46967,"Panel":46968,"Language":46969,"elsius":46970,"Push":46971,"abase":46972,"ĠdB":46973,"argon":46974,"ĠRemoved":46975,"amph":46976,"ĠWyr":46977,"Ġindisp":46978,"ĠOkin":46979,"aepernick":46980,"moil":46981,"Continue":46982,"00007":46983,"ĠJournals":46984,"TAG":46985,"ĠRemastered":46986,"Ġsymp":46987,"methyl":46988,"Overview":46989,"umeric":46990,"ĠCodex":46991,".$":46992,"ranged":46993,"Sym":46994,"ĠVerse":46995,"ĠEnabled":46996,"ĠFUCK":46997,"ĠHearth":46998,"Ġbrill":46999,"ĠChaser":47000,"Beh":47001,"ĠAlchemy":47002,"Oracle":47003,"roleum":47004,"ĠVoldemort":47005,"();":47006,"Ġcollaps":47007,"Visual":47008,"ĠAngular":47009,"ĠOsc":47010,"ichita":47011,"Ġcig":47012,"Ġtoolbar":47013,"ĠEnlight":47014,"ÑĮ":47015,"ε":47016,"aliation":47017,"ĠLovecraft":47018,"jri":47019,"ĠInterstellar":47020,"Ġdebugging":47021,"Ġparentheses":47022,"ĠInit":47023,"Located":47024,"Weak":47025,"ĠPvP":47026,"ĠCloak":47027,"uture":47028,"iths":47029,"asionally":47030,"FACE":47031,"Introdu":47032,"');":47033,"slot":47034,"aturday":47035,"ĠNiet":47036,"Ġpuzz":47037,"!!!!!!!!":47038,"folios":47039,"Ç":47040,"Ġverbs":47041,"ĠFrames":47042,"ĠAmbro":47043,"Ġmillisec":47044,"ĠRebell":47045,"ylum":47046,"PASS":47047,"ĠConfiguration":47048,"μ":47049,"brids":47050,"vantage":47051,"Ġ['":47052,"ĠScy":47053,"Benef":47054,"gradation":47055,"ĠOrc":47056,"Resources":47057,"Awesome":47058,"ĠMilitia":47059,"POST":47060,"Ġbinaries":47061,"Mode":47062,"Ġkb":47063,"ĠWARRANT":47064,"hemy":47065,"Desc":47066,"alion":47067,"Ġwiki":47068,"Ġcommer":47069,"Serial":47070,"ĠUncommon":47071,"ignore":47072,"Ġconstructor":47073,"ctl":47074,"Ġ):":47075,"ĠVerify":47076,"Notice":47077,"ĠRPGs":47078,"uckland":47079,"Ġincre":47080,"Pinterest":47081,"ĠDefinitions":47082,"iband":47083,"Ġtd":47084,"Ġsubscrib":47085,"Shin":47086,"ĠGadget":47087,"Document":47088,"å®":47089,"Requ":47090,"QUIRE":47091,"ĠQuadro":47092,"ĠUnix":47093,"Enlarge":47094,"thens":47095,"\"...":47096,"gebra":47097,"pload":47098,"alogue":47099,"vironments":47100,"Strength":47101,"ĠPID":47102,"ĠInvaders":47103,"HOME":47104,"Atl":47105,"ĠBlizz":47106,"ĠWidth":47107,"ĠOpenGL":47108,"zx":47109,"$,":47110,"Ġå":47111,"cig":47112,"lectic":47113,"relation":47114,"Ġfeas":47115,"undown":47116,"Said":47117,"ν":47118,"��":47119,"english":47120,"ĠTokens":47121,"ĠALEC":47122,"OOOO":47123,"isconsin":47124,"Ġconstants":47125,"ĠTemplar":47126,"Accept":47127,"Ġmascul":47128,"enegger":47129,"ampires":47130,"Rated":47131,"lua":47132,"ucl":47133,"ĠSequence":47134,"ĠNRS":47135,"STD":47136,"Cra":47137,"autions":47138,"ĠKernel":47139,"oleon":47140,"htaking":47141,"ancial":47142,"Pages":47143,"orthodox":47144,"ropy":47145,"EEE":47146,"Ġtranssexual":47147,"?????":47148,"Ġsurpr":47149,"arthy":47150,"ĠPsychic":47151,"Ġdorsal":47152,"cember":47153,"joice":47154,"/+":47155,"verend":47156,"uint":47157,"Ġderog":47158,"Subject":47159,"hemat":47160,"!]":47161,"Ġ);":47162,"Ġmeshes":47163,"Ġreperc":47164,"ĠTerran":47165,"åĪ":47166,"Load":47167,"å¹":47168,"ikarp":47169,"rompt":47170,"Ġgoblins":47171,"ĠShattered":47172,"tests":47173,"Spread":47174,"ĠNaruto":47175,"Ġpredic":47176,"Hyp":47177,"ĠArkham":47178,"ĠNASL":47179,"Material":47180,"Rule":47181,"raviolet":47182,"ĠKlingon":47183,"Memory":47184,"acers":47185,"Known":47186,"Important":47187,"Ġα":47188,"Ġtraged":47189,"Ġshalt":47190,"Ġiso":47191,"ĠJSON":47192,"Instant":47193,"Ġpg":47194,"Ġexponent":47195,"formance":47196,"bitcoin":47197,"DOS":47198,"cheat":47199,"Ġrook":47200,"ĠBiol":47201,"noticed":47202,"Ġtwent":47203,"ĠRedux":47204,"ĠBorderlands":47205,"Supported":47206,"TRUMP":47207,"Ġturrets":47208,"include":47209,"Effect":47210,"Ġdisg":47211,"ophical":47212,"ĠFaction":47213,"wiki":47214,"Ġsrc":47215,"Laun":47216,"TIT":47217,"Ġorbs":47218,"Ġincompet":47219,"Ġdescriptor":47220,"ĠTrog":47221,"Contribut":47222,"ĠGodd":47223,"inances":47224,"Ult":47225,"lyak":47226,"âĢ¢âĢ¢âĢ¢âĢ¢":47227,"stitial":47228,"essim":47229,"Graphics":47230,"ubis":47231,"Ġegreg":47232,"DEV":47233,"Ġannotations":47234,"Yang":47235,"ĠDruid":47236,"ĠInquisition":47237,"ohydrate":47238,"Critical":47239,"æĸ":47240,"Sample":47241,"ĠPref":47242,"ĠUnleashed":47243,"ĠAccessed":47244,"Ġconceptions":47245,"Minor":47246,"pard":47247,"prus":47248,"Factory":47249,"thinkable":47250,"Ġexecutable":47251,"chapter":47252,"inyl":47253,"Display":47254,"ilater":47255,"Released":47256,"ĠDirectX":47257,"aneers":47258,"Ġ______":47259,"ĠHilbert":47260,"Options":47261,"Ġsorcery":47262,"esm":47263,"ÏĦ":47264,"Ġdescript":47265,"ĠTycoon":47266,"psons":47267,"Ġcov":47268,"Launch":47269,"ogeneity":47270,"Ġsacrific":47271,"ADRA":47272,"netflix":47273,"flix":47274,"usage":47275,"properties":47276,"attach":47277,"req":47278,"Resource":47279,"requisite":47280,"1007":47281,"ĠMIDI":47282,"ĠZoro":47283,"Tue":47284,"hower":47285,"dds":47286,"ynasty":47287,"headers":47288,"Ġdisproportion":47289,"omaly":47290,"Ġvim":47291,"inces":47292,"edient":47293,"ĠWraith":47294,"ilibrium":47295,"Hig":47296,"ĠFrie":47297,"Meat":47298,"ldom":47299,"KNOWN":47300,"orgetown":47301,"Improve":47302,"10000":47303,"Ġretarded":47304,"Disclaimer":47305,"Ġunfocused":47306,"ĠUnsure":47307,"ĠElixir":47308,"idth":47309,"atural":47310,"ĠErr":47311,"Critics":47312,"ĠBows":47313,"ifferent":47314,"proxy":47315,"Lic":47316,"aucas":47317,"rolet":47318,"ĠCoC":47319,"Ġdoesnt":47320,"phabet":47321,"Version":47322,"Ġhepat":47323,"gif":47324,"izophren":47325,"ãĥ»":47326,"ĠGutenberg":47327,"β":47328,"phans":47329,"Scene":47330,"Ġaccomp":47331,"ilings":47332,"rypted":47333,"aceae":47334,"arantine":47335,"heses":47336,"iasco":47337,"lopp":47338,"ĠGSL":47339,"disk":47340,"ãĢģ":47341,"0010":47342,"ĠOutbreak":47343,"Column":47344,"odox":47345,"atform":47346,"ĠThrust":47347,"ĠSVG":47348,"Enhanced":47349,"¯":47350,"Tools":47351,"rogens":47352,"xus":47353,"Available":47354,"zbollah":47355,"è¡":47356,"osate":47357,"usb":47358,"ordes":47359,"Matrix":47360,"ĠBlazing":47361,"ascus":47362,"ĠSovere":47363,"hement":47364,"*:":47365,"amaru":47366,"Ġparsed":47367,"Bonus":47368,"otrop":47369,"spell":47370,"ancock":47371,"ĠEnchant":47372,"vP":47373,"ĠReferred":47374,"Ġalot":47375,"ĠRuntime":47376,"ĠFn":47377,"CPU":47378,"ĠNicotine":47379,"External":47380,"ĠNightmares":47381,"Ġentropy":47382,"kB":47383,"ĠRealms":47384,"Ġ##":47385,"Ġsubmar":47386,"ĠSlime":47387,"itual":47388,"ĠBastard":47389,"Ġacknowled":47390,"Magazine":47391,"rendered":47392,"ircraft":47393,"CSS":47394,"Numbers":47395,"Pg":47396,"utenant":47397,"ĠPalest":47398,"ĠRoose":47399,"udicrous":47400,"anooga":47401,"Unt":47402,"Ġcapacitor":47403,"Ġschema":47404,"hematic":47405,"ĠPinball":47406,"endars":47407,"Ġ===":47408,"nsic":47409,"ipedia":47410,"Ġchromos":47411,"ĠmRNA":47412,"Ct":47413,"ĠPaladin":47414,"sonian":47415,"Ġæ":47416,"ajor":47417,"repeat":47418,"ortex":47419,"ĠHeroic":47420,"ĠHera":47421,"ociated":47422,"Ġdebug":47423,"osher":47424,"upiter":47425,"_.":47426,"Ġsys":47427,"ĠDownloads":47428,"','":47429,"Adventure":47430,"FORE":47431,"ocument":47432,"arning":47433,"Ġmiscon":47434,"vidia":47435,"Cod":47436,"ibraries":47437,"buffer":47438,"cdn":47439,"ĠModes":47440,"tarian":47441,"ĠPyro":47442,"ĠFixes":47443,"ĠâĪ":47444,"ĠCf":47445,"Testing":47446,"Byte":47447,"nants":47448,"oufl":47449,"ĠCipher":47450,"Aim":47451,"ĠAfgh":47452,"ĠStarCraft":47453,"intendent":47454,"akespe":47455,"Apply":47456,">>>":47457,"Lenin":47458,"ĠShaman":47459,"%\"":47460,"ĠFrenzy":47461,"illusion":47462,"===":47463,"Website":47464,"Allow":47465,"ĠBinary":47466,"ensable":47467,"ĠEmpires":47468,"Ġpromul":47469,"ormonal":47470,"ileaks":47471,"ĠAmmo":47472,"assies":47473,"atican":47474,"avior":47475,"ĠIter":47476,"1024":47477,"uesday":47478,"ĠAppears":47479,"achine":47480,"Problem":47481,"ousy":47482,"ramid":47483,"nox":47484,"··":47485,"omething":47486,"ĠPurg":47487,"artney":47488,"Ġ0000":47489,"psey":47490,"Ġglutamate":47491,"ĠActivate":47492,"Repl":47493,"Priv":47494,"cyclop":47495,"ĠHispan":47496,"atsuki":47497,"Likewise":47498,"JOHN":47499,"POSE":47500,"pherd":47501,"schild":47502,"Ġsuffix":47503,"åIJ":47504,"Ġoptionally":47505,"ĠRecomm":47506,"ĠSpawn":47507,"ARDIS":47508,"Ġinconsist":47509,"Ġenglish":47510,"Beta":47511,"ĠContains":47512,"uddenly":47513,"Ġls":47514,"Dynamic":47515,"åĽ":47516,"Ġ{{":47517,"dq":47518,"Hmm":47519,"oliberal":47520,"ĠCarnage":47521,"ĠRebirth":47522,"incerity":47523,"Ġproletariat":47524,"ĠCrafting":47525,"Explore":47526,"Ġeld":47527,"ĠAnarch":47528,"Ġ(>":47529,"ĠClockwork":47530,"ĠProced":47531,"APTER":47532,"ĠSorcerer":47533,"âĶ":47534,"ĠSnape":47535,"elist":47536,"Balance":47537,"Tube":47538,"Ġ--------------------":47539,"Ġnostalg":47540,"ACTED":47541,"ĠVID":47542,"soever":47543,"ignt":47544,"Ġhypothal":47545,"ĠObj":47546,"igure":47547,"ĠElves":47548,"gorithm":47549,"Romney":47550,"idable":47551,"renheit":47552,"aptic":47553,"Ġnonex":47554,"Profile":47555,"Ġscient":47556,"ĠAchievements":47557,"ĠReload":47558,"Products":47559,"ampire":47560,"pread":47561,"ĠYamato":47562,"Thread":47563,"ĠFML":47564,"ĠForsaken":47565,"Statistics":47566,"Ġ([":47567,"utsu":47568,"nces":47569,"...?":47570,"upload":47571,"Typ":47572,"ĠReflex":47573,"Dial":47574,"Ġspawns":47575,"Server":47576,"Ġacquaint":47577,"iterranean":47578,"='":47579,"Device":47580,"ר":47581,"ocaly":47582,"Remove":47583,"Ġ=====":47584,"Ġabdom":47585,"ideos":47586,"Dual":47587,"Fax":47588,"Ġbesie":47589,"ĠAdin":47590,"Ġdescrib":47591,"Ġiod":47592,"Limit":47593,"aunders":47594,"ĠAssassins":47595,"xxxx":47596,"ulner":47597,"Shipping":47598,"Item":47599,"fortune":47600,"Ġcipher":47601,"mA":47602,"acerb":47603,"ebus":47604,"Ġmodifiers":47605,"Added":47606,"prisingly":47607,"Dir":47608,"ĠArchangel":47609,"umbnails":47610,"Huh":47611,"ĠWARN":47612,"Role":47613,"usional":47614,"Ġcortical":47615,"ĠSCP":47616,"ĠException":47617,"ĠWarhammer":47618,")))":47619,"](":47620,"Ġsynaptic":47621,"Ġcached":47622,"archment":47623,"Ġtarg":47624,"Filter":47625,"ĠHades":47626,"Ġprinc":47627,"halla":47628,"ptoms":47629,"Ïģ":47630,"ructose":47631,"termination":47632,"Ġcompe":47633,"define":47634,"Ġprosec":47635,"require":47636,"ĠCorpse":47637,"Abstract":47638,"********************************":47639,"Used":47640,"ĠIbid":47641,"trak":47642,"ä¸Ń":47643,"ĠGABA":47644,"åĬ":47645,"ĠHegel":47646,"Jere":47647,"odore":47648,"í":47649,"namese":47650,"Origin":47651,"ĠMastery":47652,"gerald":47653,"Charges":47654,"--------------------":47655,"Forge":47656,"comings":47657,"åį":47658,"Ġ(&":47659,"Ġgrap":47660,"Mask":47661,"ĠGundam":47662,"generic":47663,"ĠMalf":47664,"raphics":47665,"Internal":47666,"ourge":47667,"Ġirresist":47668,"sterdam":47669,"Ġendogenous":47670,"Export":47671,"Ġë":47672,"poons":47673,"Ġabund":47674,"ĠQuantity":47675,"Issue":47676,"âĪĴ":47677,"cknow":47678,"Anonymous":47679,"ĠDRAG":47680,"Wikipedia":47681,"Ġsubdu":47682,"iverpool":47683,"apesh":47684,"Ability":47685,"ĠCentOS":47686,"iseum":47687,"lycer":47688,"Untitled":47689,"Ġlineback":47690,"Ġtomat":47691,"byte":47692,"tile":47693,"linux":47694,"Palest":47695,"canon":47696,"FAULT":47697,"ĠkHz":47698,"Ġhelic":47699,"ĠIGF":47700,"WARE":47701,"Feature":47702,"ĠGraveyard":47703,"ĠNemesis":47704,"akuya":47705,"inement":47706,"Ġwhence":47707,"ractical":47708,"Ping":47709,"tesque":47710,"scroll":47711,"espie":47712,"Ġasynchronous":47713,"ocre":47714,"Measure":47715,"morph":47716,"std":47717,"Settings":47718,"Course":47719,"Ġ],":47720,"Ïĥ":47721,"Documents":47722,"estern":47723,"Ġtf":47724,"Ġcircumcised":47725,"geant":47726,"Ġconject":47727,"ĠFolder":47728,"outube":47729,"ĠMedline":47730,"Status":47731,"ctr":47732,"anoia":47733,"ĠPowerShell":47734,"Chel":47735,"Loop":47736,"Ġresize":47737,"aphael":47738,"workshop":47739,"velength":47740,"hover":47741,"flush":47742,"Ġβ":47743,"Task":47744,"pedia":47745,"ptin":47746,"bidden":47747,"windows":47748,"ĠCaucas":47749,"aml":47750,"isoft":47751,"Ġrs":47752,"cgi":47753,"urrection":47754,"miah":47755,"ÏĤ":47756,"Ġplaythrough":47757,"Reddit":47758,"׾":47759,"Ġannotation":47760,"Ġnobles":47761,"seq":47762,"mares":47763,"Ġwik":47764,"foreseen":47765,"RPG":47766,"Ġreper":47767,"aredevil":47768,"arcity":47769,"/\"":47770,"Ġ});":47771,"Ġdiscont":47772,"ĠBinding":47773,"answered":47774,"Mesh":47775,"ĠMPEG":47776,"Ġperceptual":47777,"OTAL":47778,"ursive":47779,"ãģĦ":47780,"Ġplun":47781,"onential":47782,"ãĤ":47783,"ĠReloaded":47784,"iscopal":47785,"ĠDespair":47786,"FIX":47787,"Ġheterogeneity":47788,",[":47789,"ichick":47790,"DCS":47791,"Ġcooldown":47792,"................":47793,"Ġsomew":47794,"Battery":47795,"stract":47796,"Attempt":47797,"allery":47798,"ĠNept":47799,"Ġtac":47800,"ĠElemental":47801,"Function":47802,"Ġbindings":47803,"versive":47804,"ĠWarlock":47805,"Response":47806,"ĠNPCs":47807,"ollower":47808,"ĠReborn":47809,"Ġphenotype":47810,"uscript":47811,"Ġpecul":47812,"!/":47813,"Unique":47814,"ĠFreeBSD":47815,"ĠChero":47816,"Ġcolle":47817,"gently":47818,"Empty":47819,"rss":47820,"Ġdd":47821,"forge":47822,"ĠTraps":47823,"×Ķ":47824,"iblical":47825,"---------":47826,"uminati":47827,"login":47828,"asus":47829,"xual":47830,"ĠMiko":47831,"ĠDrac":47832,"ssh":47833,"Submit":47834,"ĠMultiplayer":47835,"leanor":47836,"Orig":47837,"anism":47838,"peror":47839,"ĠESV":47840,"Ġencour":47841,"å°":47842,"ĠPLoS":47843,"ĠCrusher":47844,"ocrates":47845,"ynchronous":47846,"§":47847,"ĠLuffy":47848,"Lastly":47849,"Ġdiffere":47850,"okane":47851,"Enh":47852,"ursor":47853,"Ġapopt":47854,"ĠTotem":47855,"ä½":47856,"Honest":47857,"xml":47858,"Created":47859,"Ġteleport":47860,"NRS":47861,"ccess":47862,"ilitary":47863,"ackets":47864,"Ġenchantment":47865,"ĠCunning":47866,"ortmund":47867,"Altern":47868,"Alternatively":47869,"ĠLuthor":47870,"Publisher":47871,"GBT":47872,"çĶ":47873,"Activity":47874,"Ġleptin":47875,"æĪ":47876,"ĠStarfleet":47877,"å¸":47878,"oooooooo":47879,"Ġlawy":47880,"Frag":47881,"ת":47882,"yright":47883,"cookie":47884,"Finish":47885,"wikipedia":47886,"ĠAbilities":47887,"interface":47888,"Ġglared":47889,"Engineers":47890,"ĠAtk":47891,"oteric":47892,"Ġbyte":47893,"ossibility":47894,"Label":47895,"ĠCSV":47896,"Ġè":47897,"ĠOblivion":47898,"android":47899,"rehensive":47900,"ĠCommands":47901,"clud":47902,"ĠTutorial":47903,"retched":47904,"irlwind":47905,"conserv":47906,"ministic":47907,"void":47908,"ernels":47909,"alias":47910,"ĠDraco":47911,"desktop":47912,"ĠMormonism":47913,"oÄŁ":47914,"kef":47915,"Ġtimestamp":47916,"WAYS":47917,"ãģĹ":47918,"\"(":47919,"eneg":47920,"CHAT":47921,"Ġnpm":47922,"ĠGrenade":47923,"rongh":47924,"dinand":47925,"Definition":47926,"ĠInteger":47927,"Ġmodifier":47928,"Ġdex":47929,"ĠParameters":47930,"andestine":47931,"ĠSHALL":47932,"Purchase":47933,"enaries":47934,"Ġstarship":47935,"Armor":47936,"Skill":47937,"Ġlookup":47938,"verages":47939,"Minimum":47940,"ĠBleach":47941,"Ġdf":47942,"inosaur":47943,"ixel":47944,"Zip":47945,"temp":47946,"ruby":47947,"Fram":47948,"sword":47949,"Minecraft":47950,"strous":47951,"Client":47952,"ĠBarbarian":47953,"æĹ":47954,"USER":47955,"ĠMehran":47956,"axies":47957,"ermanent":47958,"ĠHeader":47959,"ablishment":47960,"hyde":47961,"Snake":47962,"ĠTelesc":47963,"Pocket":47964,"Ġ........":47965,"Destroy":47966,"Method":47967,"ĠZup":47968,"olulu":47969,"Ġunemploy":47970,"Temp":47971,"ĠExplicit":47972,"人":47973,"cache":47974,"innamon":47975,"Ġunavoid":47976,"Summary":47977,"Ġappre":47978,"Ġtaxp":47979,"XXX":47980,"ieval":47981,"ĠSummon":47982,"å¤":47983,"Lear":47984,"ibliography":47985,"CLASS":47986,"dimension":47987,"ĠHorde":47988,"Ġfilesystem":47989,"ĠQiao":47990,"obbies":47991,"DIR":47992,"Ġimpedance":47993,"éĩ":47994,"Names":47995,"ĠDrupal":47996,"Applic":47997,"imei":47998,"ynchron":47999,"Ire":48000,"ĠMinion":48001,"ĠHaste":48002,"ä¿":48003,"Ġ(=":48004,"LinkedIn":48005,"Maps":48006,"ifacts":48007,"Damage":48008,"odynam":48009,"ĠShroud":48010,"Ancient":48011,"enhagen":48012,"Tact":48013,"anship":48014,"aturdays":48015,"ãģ«":48016,"ikhail":48017,"ãģ®":48018,"framework":48019,"lication":48020,"â̦]":48021,"Plug":48022,"ĠLilith":48023,"browser":48024,"offset":48025,"ĠJuda":48026,"ciating":48027,"console":48028,"Ġ=================":48029,"._":48030,"ĠPuzz":48031,"OPLE":48032,"erial":48033,"OHN":48034,"ĠGolem":48035,"ierrez":48036,"Ġ},":48037,"inition":48038,"insula":48039,"ĠEntered":48040,"greSQL":48041,"ĠFlask":48042,"ĠXCOM":48043,"fixes":48044,"ĠWeasley":48045,"arser":48046,"Ġrc":48047,"microsoft":48048,"HHHH":48049,"INFO":48050,"rehend":48051,"Ġpolymorph":48052,"Button":48053,"âī":48054,"QUI":48055,"twitch":48056,"jriwal":48057,"ĠSaiyan":48058,"Ġadherent":48059,"acters":48060,"arthed":48061,"âĢł":48062,"Ġfoss":48063,"ã":48064,"Quote":48065,"ependent":48066,"Ġhorr":48067,"UGC":48068,"Weiss":48069,"styles":48070,"advertisement":48071,"Credits":48072,"Lua":48073,"ĠUCH":48074,"Ġhorrend":48075,"Ġminion":48076,">,":48077,"ãĥ³":48078,"Ġinclud":48079,"Compar":48080,"Ġ[]":48081,"Ġ(<":48082,"Phones":48083,"paralleled":48084,"HTML":48085,"Ġ(%":48086,"raltar":48087,"Ġamd":48088,"Maximum":48089,"ĠSolitaire":48090,"SCP":48091,"ĠVaugh":48092,"ĠCLR":48093,"database":48094,"module":48095,"̶":48096,"Capture":48097,"Window":48098,"ubuntu":48099,"Includes":48100,"ĠUriel":48101,"ORPG":48102,"κ":48103,"âĪ":48104,"ä¸Ģ":48105,"Ġdexter":48106,"ĠGlac":48107,"slice":48108,"HAHAHAHA":48109,"\\\"":48110,"lations":48111,"ÙIJ":48112,"ĠAUTH":48113,"earch":48114,"ĠSocket":48115,"Character":48116,"Sort":48117,"Ġindist":48118,"/_":48119,"ĠAntar":48120,"ifix":48121,"Ġlich":48122,"variable":48123,"_(":48124,"Ġgui":48125,"Herm":48126,"elvet":48127,"è¯":48128,"Developer":48129,"Ġkcal":48130,"ciation":48131,"Transaction":48132,"Ġdocker":48133,"###":48134,"ĠVegeta":48135,"Result":48136,"ocamp":48137,"aughtered":48138,"Increase":48139,"aples":48140,"iannopoulos":48141,"zbek":48142,"estyles":48143,"emonium":48144,"è¿":48145,"ĠFANT":48146,"Reason":48147,"Elsewhere":48148,"\"\"":48149,"ĠArtifact":48150,"Authent":48151,"herical":48152,"Ġmembr":48153,"socket":48154,"Elsa":48155,"Condition":48156,"Ġlapt":48157,"Ġsorcerer":48158,"Layer":48159,"apters":48160,"Ġveter":48161,"Myth":48162,"ensical":48163,"ÏĢ":48164,"noxious":48165,"Ġunpre":48166,"Flags":48167,"OOOOOOOO":48168,"Ġincent":48169,"Combat":48170,"Session":48171,"Ġteleportation":48172,"éĢ":48173,"ortment":48174,"Admin":48175,"Fixed":48176,"×Ļ":48177,"Ġconfir":48178,"ãģŁ":48179,"morrow":48180,"osponsors":48181,"\\/":48182,"ictionary":48183,"Num":48184,"Ġquir":48185,"åº":48186,"à¨":48187,"Ġ<<":48188,"Attempts":48189,"ãģ§":48190,"λ":48191,"Features":48192,"XXXX":48193,"Ġinflamm":48194,"VERSION":48195,"ortality":48196,"spawn":48197,"ratulations":48198,"Ġcharism":48199,"Ġ&&":48200,"Dialogue":48201,"luster":48202,"<<":48203,"args":48204,"redients":48205,"Ġpredicate":48206,"qqa":48207,"etheus":48208,"Ġ(!":48209,"Ġshowc":48210,"cmd":48211,"bringer":48212,"Ġcoh":48213,"Input":48214,"ĠFANTASY":48215,"Ġfict":48216,"Blocks":48217,"Install":48218,"vector":48219,"umblr":48220,"agnar":48221,"Array":48222,"Ġembry":48223,"Ġtheoret":48224,"Ġhref":48225,"irrel":48226,"irements":48227,"iations":48228,"Ġ(/":48229,"Thumbnail":48230,"Ġhashes":48231,"^^":48232,"Copy":48233,"Ġeq":48234,"translation":48235,"Favorite":48236,"Fail":48237,"Ġogre":48238,"isites":48239,"Merit":48240,"ãģ¦":48241,"DATA":48242,"rarily":48243,"igmatic":48244,"Sequ":48245,"Els":48246,"ãģª":48247,"lehem":48248,"requency":48249,"aughed":48250,"Ġdistingu":48251,"Ġartific":48252,"Ġdwarves":48253,"Í":48254,"resy":48255,"~~":48256,"sofar":48257,"ideon":48258,"ozyg":48259,"EEEE":48260,"ĠMelee":48261,"大":48262,"tumblr":48263,"ssl":48264,"Wra":48265,"ONSORED":48266,"Ġvowel":48267,"},":48268,"Vari":48269,"cientious":48270,"Node":48271,"Ġsorce":48272,"========":48273,"perse":48274,"Detailed":48275,"isphere":48276,"Background":48277,"ĺħ":48278,"Redd":48279,"ìĿ":48280,"ãģ¨":48281,"ĠCTRL":48282,"Ġç":48283,"iculty":48284,"ername":48285,"Ġns":48286,"Deploy":48287,"Ġhapp":48288,"Ġ///":48289,"Begin":48290,"Ġgp":48291,"$.":48292,"Output":48293,"Suggest":48294,"×IJ":48295,"ĠToggle":48296,"Ġnutrit":48297,"Ġ\\\"":48298,"Ġpreval":48299,"Ġsubreddits":48300,"Menu":48301,"Amount":48302,"ĠWasteland":48303,"Ġsprites":48304,"Ġshader":48305,"Ġ;)":48306,"NAME":48307,"CLUD":48308,"Ġgoblin":48309,"Refer":48310,"ÙĴ":48311,"á¹":48312,"Improved":48313,"endiary":48314,"Ġassail":48315,"chieve":48316,"reply":48317,"Ġcontrad":48318,"cients":48319,"GROUP":48320,"Controller":48321,"omsky":48322,"chemist":48323,"packages":48324,"ombies":48325,"scl":48326,"Ġibn":48327,"çĽ":48328,":(":48329,"ĠMinotaur":48330,"niper":48331,"====":48332,"Ġsubsc":48333,"è¦":48334,"Ġinteger":48335,"Ġ\"-":48336,"Ġtheorem":48337,"utenberg":48338,"Trigger":48339,"github":48340,"ä¼":48341,"##":48342,"xtap":48343,"oké":48344,"ilial":48345,"idepress":48346,":\\":48347,"Param":48348,"Correction":48349,"ïve":48350,"Chest":48351,"ש":48352,"ĠÏĦ":48353,"Ġrespawn":48354,"Ġrall":48355,"Ġcreatine":48356,"umsy":48357,"ĠTemplate":48358,"foo":48359,"query":48360,"Ġmanufact":48361,"Hardware":48362,"iframe":48363,"Ġ-------":48364,"Ġrecip":48365,"ĠAttributes":48366,"Ġforeskin":48367,"ãĤĭ":48368,"ãĥĦ":48369,"uania":48370,"................................................................":48371,"Ġphylogen":48372,"eaturing":48373,"Ġsprite":48374,"Ġinvari":48375,"DonaldTrump":48376,"({":48377,"ĠMalfoy":48378,"Gamer":48379,"ĠPlugin":48380,"γ":48381,"Query":48382,"ĠPuzzles":48383,"inventory":48384,"trl":48385,"Insert":48386,"Ġawa":48387,"ĠWerewolf":48388,"Ġhorizont":48389,"×ŀ":48390,"Ġcunt":48391,"]]":48392,"ĠByz":48393,"Mouse":48394,"Ġ[[":48395,"ĠCthulhu":48396,"ĠDRAGON":48397,"Default":48398,"ĠPresbyter":48399,"Ġff":48400,"Ġorcs":48401,"Construct":48402,"ĠDebug":48403,"Ġ*/":48404,"×ij":48405,"Ġembr":48406,"License":48407,"css":48408,"incinn":48409,"Prosecut":48410,"Ġsugg":48411,"å¾":48412,"ĠUndead":48413,"æĿ":48414,"Ġfs":48415,"Ġthw":48416,"Vector":48417,"åĮ":48418,"settings":48419,"å¯":48420,"Ġssh":48421,"ĠConverted":48422,"ãĤĴ":48423,"risome":48424,"Ġagre":48425,"Collection":48426,"cmp":48427,"puter":48428,"alloc":48429,"Ġé":48430,"ascade":48431,"ĠSpells":48432,"Ġ:-)":48433,"Haunted":48434,"Ġadolesc":48435,"FORMATION":48436,"ĠImperium":48437,"ãĥ¼":48438,"Supplement":48439,"Render":48440,"Theme":48441,"ĠTorment":48442,"([":48443,"ëĭ":48444,"Ġhtml":48445,"Ġjuven":48446,"ĠSiber":48447,"Ġdaemon":48448,"ivariate":48449,"objects":48450,"negie":48451,"Ġindu":48452,"landish":48453,"Meta":48454,"Impl":48455,"Ġglyph":48456,"Ġ-->":48457,"Ġstreng":48458,"agascar":48459,"guyen":48460,"((":48461,")[":48462,"ĠNorn":48463,"Ġhippocamp":48464,"Ġ¯":48465,"îĢ":48466,"Connection":48467,"PATH":48468,"mbuds":48469,"ĠShards":48470,"Ġadvoc":48471,"Ġsimulac":48472,"âĸij":48473,"!?\"":48474,"ĠPotion":48475,"Ġamulet":48476,"ĠFnatic":48477,"Ġcryptoc":48478,"wav":48479,"radius":48480,"pkg":48481,"ĠMFT":48482,"æĢ":48483,"Ġtoile":48484,"Items":48485,"ifference":48486,"errors":48487,"ĠCelt":48488,"Ġunpop":48489,"ilogy":48490,"6666":48491,"hesda":48492,"Instruct":48493,"å·":48494,"Materials":48495,"ettings":48496,"Percent":48497,"Ġresistor":48498,"tymology":48499,"Ġdeprecated":48500,"Ġgrep":48501,"ĠWRITE":48502,"Ġtriv":48503,"Ġscrut":48504,"[/":48505,"anyl":48506,"skirts":48507,"MSN":48508,"ĠCodec":48509,"ecd":48510,"Anth":48511,"){":48512,"%]":48513,"veyard":48514,"aspberry":48515,"ãĢ":48516,"Reward":48517,"rha":48518,"Stretch":48519,"]-":48520,"Prev":48521,"Context":48522,"Ġlinux":48523,"HAHA":48524,"perties":48525,"ĠVIDE":48526,"Domain":48527,"Ġmurd":48528,"ĠLegions":48529,"apache":48530,"æŃ":48531,"Pause":48532,"Temperature":48533,"ufact":48534,"igslist":48535,"ĠRetrieved":48536,"èª":48537,"ãģĮ":48538,"Ingredients":48539,"ruary":48540,"dyl":48541,"Alias":48542,"ĠÎĶ":48543,"Ġinval":48544,"amsung":48545,"!--":48546,"olean":48547,"æī":48548,"ãģ¯":48549,"Ġcoefficients":48550,"ĠDHCP":48551,"âĨĴ":48552,"utonium":48553,":[":48554,"âĹ":48555,"cli":48556,"Container":48557,"å¼":48558,"nexus":48559,"SOURCE":48560,"Ò":48561,"=/":48562,"Ġmysql":48563,"ĠGained":48564,"Ġ/*":48565,"uncture":48566,"Ġstatically":48567,"âĸł":48568,"æĺ¯":48569,"æ°":48570,"estamp":48571,"Cache":48572,"ulkan":48573,"staking":48574,"apter":48575,"ãģ¾":48576,"Ġμg":48577,"Ġtremend":48578,"ĠPiercing":48579,"naissance":48580,"ĠHealer":48581,"Enabled":48582,"éģ":48583,"âĸ":48584,"ĠThumbnails":48585,"Ġhither":48586,"Format":48587,"utherland":48588,"íķ":48589,"Ġdestro":48590,"fff":48591,"execute":48592,"msg":48593,"romancer":48594,"ĠCanaver":48595,"ĠVaults":48596,"oided":48597,"iage":48598,"Ġimg":48599,"summary":48600,"]);":48601,"ĠABE":48602,"ĠGamergate":48603,"utherford":48604,"Ġoverwrite":48605,"enment":48606,"æķ":48607,"Ġsystemd":48608,"tif":48609,"]).":48610,"ãĤ¤":48611,"Widget":48612,"======":48613,"(-":48614,"Ġ\"+":48615,"ĠIncarnation":48616,"æĥ":48617,"���":48618,"GUI":48619,"èĥ":48620,"forums":48621,"Ġrunes":48622,"Ġâī¤":48623,"Ġdefic":48624,"Distance":48625,"directory":48626,"ĠHorus":48627,"iltr":48628,"ortium":48629,"Ġ./":48630,"bda":48631,"owship":48632,"ĠâĨij":48633,"}.":48634,"åĩ":48635,"1027":48636,"Weapons":48637,"lucent":48638,"Ġauth":48639,";;":48640,"Recommended":48641,"Ġsurv":48642,"Ġvm":48643,"ĠStronghold":48644,"Ġparan":48645,"ĠTrance":48646,"æĺ":48647,"Ġsovere":48648,"Ġcorrid":48649,"ĠPwr":48650,"Ġ[/":48651,"Ġseq":48652,"Population":48653,"Ġ[];":48654,"Ġreferen":48655,"ĠInstr":48656,"ĠStamina":48657,"kernel":48658,"Python":48659,"-+":48660,"Ġallele":48661,"éĽ":48662,"isode":48663,"ä¸į":48664,"otonin":48665,"modules":48666,"Notable":48667,"Spell":48668,"\\\\":48669,"Pref":48670,"Ġdatas":48671,"setup":48672,"Ġhapl":48673,"Height":48674,"åĭ":48675,"ãģ£":48676,"]),":48677,"Handle":48678,"umenthal":48679,"Package":48680,"Ġenthus":48681,"Ġunsus":48682,"Narr":48683,"Examples":48684,"FAQ":48685,"REDACTED":48686,"Ġnotor":48687,"Enable":48688,"Pattern":48689,"aeda":48690,">.":48691,"CHECK":48692,"Ġ����":48693,"Ġ'.":48694,"Ġãĥ":48695,"append":48696,"����":48697,"gemony":48698,"terness":48699,"ĠHaku":48700,"NVIDIA":48701,"queue":48702,"Bind":48703,"Ġneigh":48704,"armor":48705,"retty":48706,"LOD":48707,"plugins":48708,"Ġ/>":48709,"TYPE":48710,"Ġ4096":48711,"-------":48712,"Preview":48713,"FML":48714,"Ġproletarian":48715,"zees":48716,"enfranch":48717,"ãģĨ":48718,"Ctrl":48719,"Module":48720,"ĠSurviv":48721,"ĠStarcraft":48722,"rored":48723,"reddit":48724,"Ġrul":48725,"Ġtx":48726,"Ġmage":48727,"Sword":48728,"Ġ~/":48729,"Effects":48730,"éļ":48731,"ä¹":48732,"Sensor":48733,"Solution":48734,"ãģĻ":48735,"Arcade":48736,"Ġpredec":48737,"Values":48738,"Length":48739,"Ġfortun":48740,"ttp":48741,"\"[":48742,"tmp":48743,"ĠBerserker":48744,"åĨ":48745,"ositories":48746,"Ġcouncill":48747,"ffff":48748,"));":48749,"Recipe":48750,"ĠASCII":48751,"âĦ¢:":48752,"ä":48753,"Ġhorm":48754,"=>":48755,"sers":48756,"ãģĭ":48757,"Recommend":48758,"['":48759,"agame":48760,"Animation":48761,"aucuses":48762,"Discussion":48763,"Ġhelicop":48764,"å¿":48765,"Float":48766,"Component":48767,"instance":48768,"Ġfoo":48769,"localhost":48770,"=-":48771,"Offset":48772,"Psy":48773,"ĠGohan":48774,"buquerque":48775,"Ġdefe":48776,"chwitz":48777,"parse":48778,"Ġdors":48779,"Ġspons":48780,"Ġasync":48781,"agonists":48782,"Ġindo":48783,".>>":48784,"ĠDisciple":48785,"Ġfilename":48786,"rency":48787,"ĠDise":48788,"Ġ\"/":48789,"template":48790,"ãĤ¹":48791,"swers":48792,"Ġ++":48793,"Ġ[(":48794,"thora":48795,"ĠDepths":48796,"livious":48797,"Ġdisadvant":48798,"foundland":48799,"Upload":48800,"Ġ§§":48801,"Ġsophistic":48802,";}":48803,"izont":48804,"\"}":48805,"estial":48806,"Ranked":48807,"ĠOccupations":48808,"LEASE":48809,"ĠOgre":48810,"folder":48811,"Plot":48812,"farious":48813,"Ġsuscept":48814,"Types":48815,"Discuss":48816,"Ġ'/":48817,"æµ":48818,"earable":48819,"æ³":48820,"Tile":48821,"iatus":48822,"åŃ":48823,"Ġreperto":48824,"Helper":48825,"Returns":48826,"ä¸Ĭ":48827,"imaru":48828,"Ġreq":48829,"Ġdissatisf":48830,"multipl":48831,"}{":48832,"-[":48833,"itial":48834,"*/":48835,"Config":48836,"Example":48837,"ĠjQuery":48838,"Mods":48839,"ĠGPIO":48840,"Ġlaun":48841,"layout":48842,"cised":48843,"Ġ......":48844,"+++":48845,"prototype":48846,"Exception":48847,"Ġsubsections":48848,"Ġresemb":48849,"Ġâĩ":48850,"ĠPubMed":48851,"username":48852,"Ġaggro":48853,"éĥ":48854,"Ġ};":48855,"ĠMages":48856,"ryu":48857,"apons":48858,"Optional":48859,"ĠAncients":48860,"ãĤĬ":48861,"Quotes":48862,"oaded":48863,"Ġsuspic":48864,"inline":48865,"omial":48866,"ĠMahjong":48867,"auntlets":48868,"Ġanarchism":48869,"Ġsubclass":48870,"ĠMLG":48871,"...]":48872,"Dialog":48873,"uphem":48874,"Ġrecursive":48875,"7601":48876,"frac":48877,"Else":48878,"ĠSeverus":48879,"},{\"":48880,"ĠCLIENT":48881,"Ġjavascript":48882,"sama":48883,"ĠLearns":48884,"ãĤĤ":48885,"Upgrade":48886,"Listener":48887,"Ġsnipp":48888,"Ġrune":48889,"ĠTTL":48890,"ertation":48891,"olicy":48892,"=\"\"":48893,"«ĺ":48894,"Ġexpr":48895,"ovych":48896,"Ġãģ":48897,"_-_":48898,"munition":48899,"////":48900,"func":48901,">>>>":48902,"Provider":48903,"Ïī":48904,"BUG":48905,"Ġ[-":48906,"Ġarrang":48907,"merce":48908,"ãĥ":48909,"incarn":48910,"Valid":48911,"ĠAether":48912,"ãĤĵ":48913,"ĠUTF":48914,"ĠMonstrous":48915,"ãĤĮ":48916,"hedon":48917,"áµ":48918,":#":48919,"ĠFrieza":48920,"padding":48921,"Reviewer":48922,"Ġpsychiat":48923,"yrinth":48924,"ĠâĶĤ":48925,"hillary":48926,"Static":48927,"Newsletter":48928,"Avg":48929,"Ġfn":48930,"Topic":48931,"choes":48932,"Ġnewsp":48933,"á¸":48934,"Ġ[+":48935,"~~~~~~~~~~~~~~~~":48936,":]":48937,"apego":48938,"buf":48939,"Translation":48940,"ById":48941,"Ġmmol":48942,"ãĥ¼ãĥ":48943,"å½":48944,"ãĤī":48945,"Ġparser":48946,"ãĥª":48947,"`,":48948,"Lair":48949,")}":48950,"ypes":48951,"adobe":48952,"Ġancest":48953,"ernel":48954,"ĠNULL":48955,"ç«":48956,"anguages":48957,"Increases":48958,"æĦ":48959,"utorial":48960,"ithmetic":48961,"dll":48962,"ĠArcane":48963,"çī":48964,"Ġtc":48965,"urtles":48966,"èĪ":48967,"Bytes":48968,"Slot":48969,"ĠBahá":48970,"Weapon":48971,"widget":48972,"querque":48973,"Ġembodiments":48974,"å¥":48975,"WARN":48976,"swer":48977,"thumbnails":48978,"FFFF":48979,"inguishable":48980,"Ġâī":48981,"Ġ${":48982,"AAAAAAAA":48983,"Conclusion":48984,"ĻĤ":48985,"disable":48986,"Rect":48987,"Ġsubp":48988,"Ġ().":48989,"ĠDetected":48990,"èĢ":48991,"[]":48992,"Ġcoerc":48993,"ĠmM":48994,"recated":48995,"fusc":48996,"ĠSorce":48997,"çĶŁ":48998,").[":48999,"Ġ})":49000,"mobi":49001,"yip":49002,"Acknowled":49003,"ternity":49004,"iqueness":49005,"ython":49006,"><":49007,"Ġstd":49008,"Url":49009,"Ġnamespace":49010,"Ġtion":49011,"oother":49012,"Ó":49013,"Ġhemor":49014,"Ġrg":49015,"ventory":49016,"ãĤ¢":49017,"anamo":49018,"Socket":49019,"Topics":49020,"apeshifter":49021,"gnu":49022,"Ġdetrim":49023,"`.":49024,"romeda":49025,"çIJ":49026,"Ġlambda":49027,"Compan":49028,"Variable":49029,"Ġusb":49030,"ĠAdamant":49031,"ournal":49032,"Ġcovari":49033,"ãĥ©":49034,"éĸ":49035,"åİ":49036,"otaur":49037,"Ġ(),":49038,"Marginal":49039,"ãģı":49040,"Ġphysic":49041,"adeon":49042,"RESULTS":49043,"200000":49044,"ãģį":49045,"udeb":49046,"ãģĵ":49047,"COMPLE":49048,"Ġmsg":49049,"ghazi":49050,"/*":49051,"ĠDeity":49052,"Ġdisapp":49053,"Availability":49054,"Ġillum":49055,"à©":49056,"ptives":49057,",âĢĶ":49058,"chnology":49059,"Ġaccur":49060,"Ġapi":49061,"Obj":49062,"ãĤ«":49063,"ãĤ¸":49064,"ä¹ĭ":49065,"ËĪ":49066,"Ġtcp":49067,"Required":49068,".<":49069,"\".[":49070,"Ġ~/.":49071,"Ġobser":49072,"RFC":49073,"Ġintegers":49074,"åī":49075,"Installation":49076,"Ô":49077,"ó":49078,"csv":49079,"ãĥ«":49080,"ĠNoticed":49081,"âĸĵ":49082,"Tumblr":49083,"Reply":49084,"||":49085,"Ġconclud":49086,"Ġ))":49087,"ebin":49088,"sql":49089,"Closure":49090,"++++":49091,"],[":49092,"âĹı":49093,"Ġprolet":49094,"Ġ>=":49095,"estinal":49096,"Ġ[*":49097,"ĠInquisitor":49098,"Ġcmd":49099,"FINE":49100,"CRIP":49101,"Ġvertex":49102,"TeX":49103,"///":49104,"Ö¼":49105,"iscons":49106,"Ġmyster":49107,"Changed":49108,"timeout":49109,"irtual":49110,"Methods":49111,"Ġcerts":49112,"texture":49113,"Roaming":49114,"Proxy":49115,"Override":49116,"éĹ":49117,"utf":49118,"python":49119,"ĠRarity":49120,"ilitarian":49121,"çľ":49122,"().":49123,"æł":49124,"Ġbuf":49125,"åij":49126,"çķ":49127,"Ġ*.":49128,"umerable":49129,"~~~~":49130,"å¦":49131,"Ġsimultane":49132,"Ġjson":49133,"Requires":49134,"Ġperl":49135,"Interface":49136,"rupal":49137,":":49242,"itialized":49243,"HTTP":49244,"Trivia":49245,"Sov":49246,"wrapper":49247,"={":49248,"ĠAzerb":49249,"aeper":49250,"Ġneighb":49251,"initions":49252,"Ġsts":49253,"ĠSasuke":49254,"#$":49255,"uliffe":49256,"æĸ¹":49257,"++++++++++++++++":49258,"ĠElven":49259,"ãģĤ":49260,"Ġartif":49261,"Folder":49262,"Ġà¨":49263,"åĤ":49264,"Ġphyl":49265,"uggest":49266,"blance":49267,"ãģł":49268,"Requirements":49269,"Usage":49270,"Ġinitialized":49271,"ã쮿":49272,"conservancy":49273,"ĠReincarn":49274,")|":49275,"Ġantioxid":49276,"ĠClicker":49277,"Ġunlaw":49278,"Ġ\\(":49279,"ãĥĪ":49280,"Ġ[*]":49281,"Characters":49282,"////////":49283,"ãĢIJ":49284,"ãĤ·":49285,"webkit":49286,"ãĢij":49287,"Ġxp":49288,"alkyrie":49289,"Console":49290,"());":49291,"ĠKorra":49292,"\"))":49293,"oooooooooooooooo":49294,"Timer":49295,"////////////////":49296,"yout":49297,"engeance":49298,"emetery":49299,"Ġmages":49300,"mods":49301,"Null":49302,"Ġphilos":49303,"ascript":49304,"Ġaddon":49305,"ĠâĸĪ":49306,"emale":49307,"----------------------------------------------------------------":49308,"Ġ\\\\":49309,"=[":49310,"ĠParables":49311,"ãĥĨ":49312,"VALUE":49313,"Ġ@@":49314,"Ġuint":49315,"${":49316,"cpp":49317,"%%":49318,"Ġ(âĪĴ":49319,"utils":49320,"prefix":49321,"å°Ĩ":49322,"ãĥŃ":49323,"Completed":49324,"Ġgoto":49325,"ãĤ¯":49326,"Winged":49327,"perty":49328,"[\"":49329,"ãĥİ":49330,"ĠScythe":49331,"Ġæľ":49332,"Ġ!=":49333,"Buffer":49334,"docker":49335,"ĠWATCHED":49336,"èĢħ":49337,"())":49338,"Ġdst":49339,"SIZE":49340,"ĠDemonic":49341,"Ġresil":49342,"ãĤ¿":49343,"Ġpione":49344,"cpu":49345,"++)":49346,"TEXT":49347,"Ġdiscrep":49348,"debian":49349,"quished":49350,"Ġacknow":49351,"Ġtrave":49352,"Ġgcc":49353,"Catalog":49354,"ctrl":49355,"ĠMoroc":49356,"Ġcpu":49357,"Ġ];":49358,"ĠSorceress":49359,"Introduced":49360,"Frames":49361,"Ġcondem":49362,"¶æ":49363,"~~~~~~~~":49364,"ĠEmacs":49365,"][/":49366,"Ġglim":49367,"Init":49368,"ĠPrimordial":49369,"ãĥĥ":49370,"Ġ+=":49371,"Ġblat":49372,"à¼":49373,"------------------------------------------------":49374,"gpu":49375,"ãĥĥãĥĪ":49376,"Ġxml":49377,"Ġboolean":49378,"References":49379,"Ġ?)":49380,"Ġsatell":49381,"Queue":49382,"Ġpestic":49383,"Ġ}}":49384,"Attribute":49385,"Ġdx":49386,"ĠDefin":49387,"Synopsis":49388,"..................":49389,"ãĥ¬":49390,"plugin":49391,"Disable":49392,"0000000000000000":49393,")\\":49394,"ĠIchigo":49395,"println":49396,"rontal":49397,"Setup":49398,"Ġ��������":49399,"å§":49400,"âĸº":49401,"ĠPengu":49402,"ailability":49403,"Duration":49404,"Timeout":49405,"ãĢĮ":49406,"Ġbehav":49407,"Reviewed":49408,"Ġtoget":49409,"\\.":49410,"lished":49411,"Ġthous":49412,"Ġperpend":49413,"ecause":49414,"Layout":49415,"è»":49416,"ĠDexterity":49417,"unsigned":49418,"+=":49419,"[[":49420,"ĠRunes":49421,"ãĤ¦":49422,"};":49423,"})":49424,"FTWARE":49425,"ength":49426,"milo":49427,"duino":49428,"天":49429,"ĠClojure":49430,"ļé":49431,"ãĥ¥":49432,"gradient":49433,"Ġ\"\"\"":49434,"âĨij":49435,"@#":49436,"JSON":49437,"Ġproport":49438,"addr":49439,"});":49440,"ãĥIJ":49441,"ä¸ī":49442,"Ġtmp":49443,"å£":49444,"../":49445,"zsche":49446,"Ġâμ":49447,"Entity":49448,"æ©Ł":49449,"ĠâĶľâĶĢâĶĢ":49450,"filename":49451,"{{":49452,"@@":49453,"ĠSeym":49454,"Ġ/**":49455,"ĠSummoner":49456,"Quantity":49457,"ç·":49458,"Attach":49459,"Ġbool":49460,"Texture":49461,"Ġopio":49462,".}":49463,"ãĥĭ":49464,"integer":49465,"Ġregex":49466,"Ġnomine":49467,"ription":49468,"ãģ®ç":49469,"ãĥķ":49470,"Ġsubparagraph":49471,"GGGG":49472,"Ġexplan":49473,"Header":49474,"Spawn":49475,"toggle":49476,"²¾":49477,"Abyss":49478,"expr":49479,"ĠZerg":49480,"ĠGrimoire":49481,"Contents":49482,"Instance":49483,"cyclopedia":49484,"ãĥĹ":49485,"ĠTakeru":49486,"=(":49487,"代":49488,"\\)":49489,"Ġrgb":49490,"htt":49491,"bryce":49492,"Ġlivest":49493,"ĠAnnotations":49494,"âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ":49495,"berus":49496,"ntil":49497,"Ġskelet":49498,"callback":49499,"åħī":49500,"Joined":49501,"ãĤª":49502,"Ġargs":49503,"artifacts":49504,"Ġå¤":49505,"ÃĽ":49506,"ãĥŀ":49507,"Streamer":49508,"}\"":49509,"Ġunden":49510,"ãĥģ":49511,"Īè":49512,"ãĥ£":49513,"Ġ0004":49514,"Ġ\\'":49515,"ãĤ°":49516,"ĠCONFIG":49517,"Ġ#####":49518,"``":49519,"anguage":49520,"Ġ*)":49521,"Template":49522,"MODE":49523,"Ġ00000000":49524,"'';":49525,">":49625,"Ġlvl":49626,"Footnote":49627,"Iter":49628,"####":49629,"ãĥij":49630,"ĠCarbuncle":49631,"Ġ[+]":49632,"Ġmathemat":49633,"Allows":49634,"Ġ4090":49635,"Async":49636,"ģ«":49637,"Ͻ":49638,"))))":49639,"á½":49640,"Ġcx":49641,"Ġansw":49642,"{\"":49643,"ãĥŁ":49644,"addons":49645,"Filename":49646,"Appearances":49647,"ĠãĢĮ":49648,"Ġaddr":49649,"Ġcharact":49650,"glomer":49651,"Advertisements":49652,"Ġdracon":49653,"ĠFenrir":49654,"Ġ();":49655,"ĠCitiz":49656,"acebook":49657,"Ġparams":49658,"]=":49659,"Ġsubscript":49660,"Ġentreprene":49661,"tnc":49662,"iversal":49663,"Ġmillenn":49664,"ithub":49665,"/>":49666,"Ġ\"{":49667,"Frameworks":49668,"avorite":49669,"Ġ])":49670,"Constructed":49671,"fml":49672,"ãĥį":49673,"################################":49674,"-|":49675,"¥ŀ":49676,"Ġwithd":49677,"ĠCth":49678,"AppData":49679,"Msg":49680,":{":49681,"ãĤ¨":49682,"Ġtuple":49683,"ç¥ŀ":49684,"Ġintrins":49685,"ĠCooldown":49686,"ategory":49687,"^{":49688,"ãĥĬ":49689,"''''":49690,"çͰ":49691,"ĠDEBUG":49692,"Ġcannabin":49693,"ocobo":49694,"Invalid":49695,"ãĥĢ":49696,"Compat":49697,"Ġ({":49698,"Removed":49699,"Ġconvol":49700,"}:":49701,"interstitial":49702,"Ġ\"":49721,"initialized":49722,"Ġexting":49723,"Poké":49724,"Parameters":49725,"¶ħ":49726,"########":49727,"NULL":49728,"ãĥĩ":49729,"groupon":49730,"\\-":49731,"ãĥı":49732,"ãĤ±":49733,"Ġsubsequ":49734,"ccording":49735,"ĠMODULE":49736,"ĠProtoss":49737,"\"},{\"":49738,"Ġ..............":49739,"Integer":49740,"endif":49741,"ãĥĻ":49742,"parser":49743,"lambda":49744,"Ġcarbohyd":49745,"ĠUnloaded":49746,"_{":49747,"âĸ¬âĸ¬":49748,"Ġdebian":49749,"]}":49750,"ãĤ¶":49751,"Parameter":49752,"ãĤ£":49753,"ãĤ»":49754,"Ġ$_":49755,"İĭ":49756,"Ġiterator":49757,"ãĤ¬":49758,"WINDOWS":49759,"CONCLUS":49760,"Ġ\"\\":49761,"umbn":49762,"(&":49763,"ãĥ©ãĥ³":49764,"usercontent":49765,"ometimes":49766,"METHOD":49767,"ãĥ¢":49768,"potion":49769,"ãĥ¯":49770,"everal":49771,"Ġweap":49772,"minecraft":49773,"================================":49774,"printf":49775,"ĠShinra":49776,"Ġreluct":49777,"\\\",":49778,"Runtime":49779,"xff":49780,"ĠAbyssal":49781,"akeru":49782,"Ġ\\(\\":49783,"\"/>":49784,"efficients":49785,"Ü":49786,"avascript":49787,"Ġbehavi":49788,"++;":49789,"=#":49790,"Attributes":49791,"âĵĺ":49792,"lvl":49793,"¬¼":49794,"/**":49795,"Gameplay":49796,"ĠLeilan":49797,">)":49798,"=\"/":49799,"Ġ));":49800,"ãĥĨãĤ£":49801,"ġ":49802,".":49836,"DEBUG":49837,"âĶģ":49838,"ãĢı":49839,"WithNo":49840,"Redditor":49841,"ĠâĶľ":49842,"Ġfmt":49843,"ãĢİ":49844,"Ġmsec":49845,"ĪĴ":49846,"eatures":49847,"itially":49848,"\"\"\"":49849,"ãĥ¼ãĤ¯":49850,"Textures":49851,"\"},":49852,"\"><":49858,"||||":49859,"ß":49860,"iterator":49861,"è£ħ":49862,"Ĥª":49863,"ojure":49864,"ãħĭãħĭ":49865,"ãĥ¼ãĥ³":49866,"Ġprintln":49867,"Ġ][":49868,"âĸĪâĸĪ":49869,"âķIJ":49870,"\\\":":49871,"senal":49872,"é¾į":49873,"é¾":49874,"Ġcryst":49875,"ãĥķãĤ¡":49876,"ĠCosponsors":49877,"ãĤ·ãĥ£":49878,"Magikarp":49879,"ĠMagicka":49880,"âĸĪâĸĪâĸĪâĸĪ":49881,",,,,,,,,":49882,"vertisement":49883,"âĶĢâĶĢâĶĢâĶĢ":49884,"ãĥķãĤ©":49885,"luaj":49886,"CLASSIFIED":49887,".''.":49888,"byss":49889,"Ġ{:":49890,"ĠNanto":49891,"Ġptr":49892,"Ġ%%":49893,"Ġteasp":49894,"[_":49895,"ãĥ¤":49896,"ħĭ":49897,"ŃĶ":49898,"Ġpci":49899,"Ġ\"<":49900,"GGGGGGGG":49901,"æĪ¦":49902,"--+":49903,"ãĤ®":49904,"Ġ())":49905,"âĸ¬":49906,"Ġsizeof":49907,"}}}":49908,";;;;;;;;":49909,">]":49910,"âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ":49911,"Vaults":49912,"Ġistg":49913,"Ġnewcom":49914,"=]":49915,"¿½":49916,"ĵĺ":49917,"{\\":49918,"Args":49919,"Ġexha":49920,"(\\":49921,"Ġunnecess":49922,"\"}],\"":49923,"ĠUNCLASSIFIED":49924,">(":49925,"ãĤ¢ãĥ«":49926,"æ©":49927,"70710":49928,"Ń·":49929,"ãĥ¼ãĥĨãĤ£":49930,"ĠSakuya":49931,"ãĥĥãĥī":49932,"ĠPyrrha":49933,"escription":49934,"VIDIA":49935,"================================================================":49936,"Ġlooph":49937,"=~":49938,"Ġcumbers":49939,"Ġ)]":49940,"govtrack":49941,"ĠãĤµ":49942,"Ġsubur":49943,"Þ":49944,"Ġâī¡":49945,"Interstitial":49946,"ãĥ¼ãĥĨ":49947,"Ġgobl":49948,"ãĥīãĥ©":49949,"oldown":49950,"ģĸ":49951,"Depths":49952,"Ġ());":49953,"Ġ._":49954,"20439":49955,"Ġç¥ŀ":49956,"ãģ®å®":49957,"ãĤ¼":49958,"Ġ$\\":49959,"âĹ¼":49960,"Ġencount":49961,"Ġ": 48457, + "Ġstreng": 48458, + "agascar": 48459, + "guyen": 48460, + "((": 48461, + ")[": 48462, + "ĠNorn": 48463, + "Ġhippocamp": 48464, + "Ġ¯": 48465, + "îĢ": 48466, + "Connection": 48467, + "PATH": 48468, + "mbuds": 48469, + "ĠShards": 48470, + "Ġadvoc": 48471, + "Ġsimulac": 48472, + "âĸij": 48473, + "!?\"": 48474, + "ĠPotion": 48475, + "Ġamulet": 48476, + "ĠFnatic": 48477, + "Ġcryptoc": 48478, + "wav": 48479, + "radius": 48480, + "pkg": 48481, + "ĠMFT": 48482, + "æĢ": 48483, + "Ġtoile": 48484, + "Items": 48485, + "ifference": 48486, + "errors": 48487, + "ĠCelt": 48488, + "Ġunpop": 48489, + "ilogy": 48490, + "6666": 48491, + "hesda": 48492, + "Instruct": 48493, + "å·": 48494, + "Materials": 48495, + "ettings": 48496, + "Percent": 48497, + "Ġresistor": 48498, + "tymology": 48499, + "Ġdeprecated": 48500, + "Ġgrep": 48501, + "ĠWRITE": 48502, + "Ġtriv": 48503, + "Ġscrut": 48504, + "[/": 48505, + "anyl": 48506, + "skirts": 48507, + "MSN": 48508, + "ĠCodec": 48509, + "ecd": 48510, + "Anth": 48511, + "){": 48512, + "%]": 48513, + "veyard": 48514, + "aspberry": 48515, + "ãĢ": 48516, + "Reward": 48517, + "rha": 48518, + "Stretch": 48519, + "]-": 48520, + "Prev": 48521, + "Context": 48522, + "Ġlinux": 48523, + "HAHA": 48524, + "perties": 48525, + "ĠVIDE": 48526, + "Domain": 48527, + "Ġmurd": 48528, + "ĠLegions": 48529, + "apache": 48530, + "æŃ": 48531, + "Pause": 48532, + "Temperature": 48533, + "ufact": 48534, + "igslist": 48535, + "ĠRetrieved": 48536, + "èª": 48537, + "ãģĮ": 48538, + "Ingredients": 48539, + "ruary": 48540, + "dyl": 48541, + "Alias": 48542, + "ĠÎĶ": 48543, + "Ġinval": 48544, + "amsung": 48545, + "!--": 48546, + "olean": 48547, + "æī": 48548, + "ãģ¯": 48549, + "Ġcoefficients": 48550, + "ĠDHCP": 48551, + "âĨĴ": 48552, + "utonium": 48553, + ":[": 48554, + "âĹ": 48555, + "cli": 48556, + "Container": 48557, + "å¼": 48558, + "nexus": 48559, + "SOURCE": 48560, + "Ò": 48561, + "=/": 48562, + "Ġmysql": 48563, + "ĠGained": 48564, + "Ġ/*": 48565, + "uncture": 48566, + "Ġstatically": 48567, + "âĸł": 48568, + "æĺ¯": 48569, + "æ°": 48570, + "estamp": 48571, + "Cache": 48572, + "ulkan": 48573, + "staking": 48574, + "apter": 48575, + "ãģ¾": 48576, + "Ġμg": 48577, + "Ġtremend": 48578, + "ĠPiercing": 48579, + "naissance": 48580, + "ĠHealer": 48581, + "Enabled": 48582, + "éģ": 48583, + "âĸ": 48584, + "ĠThumbnails": 48585, + "Ġhither": 48586, + "Format": 48587, + "utherland": 48588, + "íķ": 48589, + "Ġdestro": 48590, + "fff": 48591, + "execute": 48592, + "msg": 48593, + "romancer": 48594, + "ĠCanaver": 48595, + "ĠVaults": 48596, + "oided": 48597, + "iage": 48598, + "Ġimg": 48599, + "summary": 48600, + "]);": 48601, + "ĠABE": 48602, + "ĠGamergate": 48603, + "utherford": 48604, + "Ġoverwrite": 48605, + "enment": 48606, + "æķ": 48607, + "Ġsystemd": 48608, + "tif": 48609, + "]).": 48610, + "ãĤ¤": 48611, + "Widget": 48612, + "======": 48613, + "(-": 48614, + "Ġ\"+": 48615, + "ĠIncarnation": 48616, + "æĥ": 48617, + "���": 48618, + "GUI": 48619, + "èĥ": 48620, + "forums": 48621, + "Ġrunes": 48622, + "Ġâī¤": 48623, + "Ġdefic": 48624, + "Distance": 48625, + "directory": 48626, + "ĠHorus": 48627, + "iltr": 48628, + "ortium": 48629, + "Ġ./": 48630, + "bda": 48631, + "owship": 48632, + "ĠâĨij": 48633, + "}.": 48634, + "åĩ": 48635, + "1027": 48636, + "Weapons": 48637, + "lucent": 48638, + "Ġauth": 48639, + ";;": 48640, + "Recommended": 48641, + "Ġsurv": 48642, + "Ġvm": 48643, + "ĠStronghold": 48644, + "Ġparan": 48645, + "ĠTrance": 48646, + "æĺ": 48647, + "Ġsovere": 48648, + "Ġcorrid": 48649, + "ĠPwr": 48650, + "Ġ[/": 48651, + "Ġseq": 48652, + "Population": 48653, + "Ġ[];": 48654, + "Ġreferen": 48655, + "ĠInstr": 48656, + "ĠStamina": 48657, + "kernel": 48658, + "Python": 48659, + "-+": 48660, + "Ġallele": 48661, + "éĽ": 48662, + "isode": 48663, + "ä¸į": 48664, + "otonin": 48665, + "modules": 48666, + "Notable": 48667, + "Spell": 48668, + "\\\\": 48669, + "Pref": 48670, + "Ġdatas": 48671, + "setup": 48672, + "Ġhapl": 48673, + "Height": 48674, + "åĭ": 48675, + "ãģ£": 48676, + "]),": 48677, + "Handle": 48678, + "umenthal": 48679, + "Package": 48680, + "Ġenthus": 48681, + "Ġunsus": 48682, + "Narr": 48683, + "Examples": 48684, + "FAQ": 48685, + "REDACTED": 48686, + "Ġnotor": 48687, + "Enable": 48688, + "Pattern": 48689, + "aeda": 48690, + ">.": 48691, + "CHECK": 48692, + "Ġ����": 48693, + "Ġ'.": 48694, + "Ġãĥ": 48695, + "append": 48696, + "����": 48697, + "gemony": 48698, + "terness": 48699, + "ĠHaku": 48700, + "NVIDIA": 48701, + "queue": 48702, + "Bind": 48703, + "Ġneigh": 48704, + "armor": 48705, + "retty": 48706, + "LOD": 48707, + "plugins": 48708, + "Ġ/>": 48709, + "TYPE": 48710, + "Ġ4096": 48711, + "-------": 48712, + "Preview": 48713, + "FML": 48714, + "Ġproletarian": 48715, + "zees": 48716, + "enfranch": 48717, + "ãģĨ": 48718, + "Ctrl": 48719, + "Module": 48720, + "ĠSurviv": 48721, + "ĠStarcraft": 48722, + "rored": 48723, + "reddit": 48724, + "Ġrul": 48725, + "Ġtx": 48726, + "Ġmage": 48727, + "Sword": 48728, + "Ġ~/": 48729, + "Effects": 48730, + "éļ": 48731, + "ä¹": 48732, + "Sensor": 48733, + "Solution": 48734, + "ãģĻ": 48735, + "Arcade": 48736, + "Ġpredec": 48737, + "Values": 48738, + "Length": 48739, + "Ġfortun": 48740, + "ttp": 48741, + "\"[": 48742, + "tmp": 48743, + "ĠBerserker": 48744, + "åĨ": 48745, + "ositories": 48746, + "Ġcouncill": 48747, + "ffff": 48748, + "));": 48749, + "Recipe": 48750, + "ĠASCII": 48751, + "âĦ¢:": 48752, + "ä": 48753, + "Ġhorm": 48754, + "=>": 48755, + "sers": 48756, + "ãģĭ": 48757, + "Recommend": 48758, + "['": 48759, + "agame": 48760, + "Animation": 48761, + "aucuses": 48762, + "Discussion": 48763, + "Ġhelicop": 48764, + "å¿": 48765, + "Float": 48766, + "Component": 48767, + "instance": 48768, + "Ġfoo": 48769, + "localhost": 48770, + "=-": 48771, + "Offset": 48772, + "Psy": 48773, + "ĠGohan": 48774, + "buquerque": 48775, + "Ġdefe": 48776, + "chwitz": 48777, + "parse": 48778, + "Ġdors": 48779, + "Ġspons": 48780, + "Ġasync": 48781, + "agonists": 48782, + "Ġindo": 48783, + ".>>": 48784, + "ĠDisciple": 48785, + "Ġfilename": 48786, + "rency": 48787, + "ĠDise": 48788, + "Ġ\"/": 48789, + "template": 48790, + "ãĤ¹": 48791, + "swers": 48792, + "Ġ++": 48793, + "Ġ[(": 48794, + "thora": 48795, + "ĠDepths": 48796, + "livious": 48797, + "Ġdisadvant": 48798, + "foundland": 48799, + "Upload": 48800, + "Ġ§§": 48801, + "Ġsophistic": 48802, + ";}": 48803, + "izont": 48804, + "\"}": 48805, + "estial": 48806, + "Ranked": 48807, + "ĠOccupations": 48808, + "LEASE": 48809, + "ĠOgre": 48810, + "folder": 48811, + "Plot": 48812, + "farious": 48813, + "Ġsuscept": 48814, + "Types": 48815, + "Discuss": 48816, + "Ġ'/": 48817, + "æµ": 48818, + "earable": 48819, + "æ³": 48820, + "Tile": 48821, + "iatus": 48822, + "åŃ": 48823, + "Ġreperto": 48824, + "Helper": 48825, + "Returns": 48826, + "ä¸Ĭ": 48827, + "imaru": 48828, + "Ġreq": 48829, + "Ġdissatisf": 48830, + "multipl": 48831, + "}{": 48832, + "-[": 48833, + "itial": 48834, + "*/": 48835, + "Config": 48836, + "Example": 48837, + "ĠjQuery": 48838, + "Mods": 48839, + "ĠGPIO": 48840, + "Ġlaun": 48841, + "layout": 48842, + "cised": 48843, + "Ġ......": 48844, + "+++": 48845, + "prototype": 48846, + "Exception": 48847, + "Ġsubsections": 48848, + "Ġresemb": 48849, + "Ġâĩ": 48850, + "ĠPubMed": 48851, + "username": 48852, + "Ġaggro": 48853, + "éĥ": 48854, + "Ġ};": 48855, + "ĠMages": 48856, + "ryu": 48857, + "apons": 48858, + "Optional": 48859, + "ĠAncients": 48860, + "ãĤĬ": 48861, + "Quotes": 48862, + "oaded": 48863, + "Ġsuspic": 48864, + "inline": 48865, + "omial": 48866, + "ĠMahjong": 48867, + "auntlets": 48868, + "Ġanarchism": 48869, + "Ġsubclass": 48870, + "ĠMLG": 48871, + "...]": 48872, + "Dialog": 48873, + "uphem": 48874, + "Ġrecursive": 48875, + "7601": 48876, + "frac": 48877, + "Else": 48878, + "ĠSeverus": 48879, + "},{\"": 48880, + "ĠCLIENT": 48881, + "Ġjavascript": 48882, + "sama": 48883, + "ĠLearns": 48884, + "ãĤĤ": 48885, + "Upgrade": 48886, + "Listener": 48887, + "Ġsnipp": 48888, + "Ġrune": 48889, + "ĠTTL": 48890, + "ertation": 48891, + "olicy": 48892, + "=\"\"": 48893, + "«ĺ": 48894, + "Ġexpr": 48895, + "ovych": 48896, + "Ġãģ": 48897, + "_-_": 48898, + "munition": 48899, + "////": 48900, + "func": 48901, + ">>>>": 48902, + "Provider": 48903, + "Ïī": 48904, + "BUG": 48905, + "Ġ[-": 48906, + "Ġarrang": 48907, + "merce": 48908, + "ãĥ": 48909, + "incarn": 48910, + "Valid": 48911, + "ĠAether": 48912, + "ãĤĵ": 48913, + "ĠUTF": 48914, + "ĠMonstrous": 48915, + "ãĤĮ": 48916, + "hedon": 48917, + "áµ": 48918, + ":#": 48919, + "ĠFrieza": 48920, + "padding": 48921, + "Reviewer": 48922, + "Ġpsychiat": 48923, + "yrinth": 48924, + "ĠâĶĤ": 48925, + "hillary": 48926, + "Static": 48927, + "Newsletter": 48928, + "Avg": 48929, + "Ġfn": 48930, + "Topic": 48931, + "choes": 48932, + "Ġnewsp": 48933, + "á¸": 48934, + "Ġ[+": 48935, + "~~~~~~~~~~~~~~~~": 48936, + ":]": 48937, + "apego": 48938, + "buf": 48939, + "Translation": 48940, + "ById": 48941, + "Ġmmol": 48942, + "ãĥ¼ãĥ": 48943, + "å½": 48944, + "ãĤī": 48945, + "Ġparser": 48946, + "ãĥª": 48947, + "`,": 48948, + "Lair": 48949, + ")}": 48950, + "ypes": 48951, + "adobe": 48952, + "Ġancest": 48953, + "ernel": 48954, + "ĠNULL": 48955, + "ç«": 48956, + "anguages": 48957, + "Increases": 48958, + "æĦ": 48959, + "utorial": 48960, + "ithmetic": 48961, + "dll": 48962, + "ĠArcane": 48963, + "çī": 48964, + "Ġtc": 48965, + "urtles": 48966, + "èĪ": 48967, + "Bytes": 48968, + "Slot": 48969, + "ĠBahá": 48970, + "Weapon": 48971, + "widget": 48972, + "querque": 48973, + "Ġembodiments": 48974, + "å¥": 48975, + "WARN": 48976, + "swer": 48977, + "thumbnails": 48978, + "FFFF": 48979, + "inguishable": 48980, + "Ġâī": 48981, + "Ġ${": 48982, + "AAAAAAAA": 48983, + "Conclusion": 48984, + "ĻĤ": 48985, + "disable": 48986, + "Rect": 48987, + "Ġsubp": 48988, + "Ġ().": 48989, + "ĠDetected": 48990, + "èĢ": 48991, + "[]": 48992, + "Ġcoerc": 48993, + "ĠmM": 48994, + "recated": 48995, + "fusc": 48996, + "ĠSorce": 48997, + "çĶŁ": 48998, + ").[": 48999, + "Ġ})": 49000, + "mobi": 49001, + "yip": 49002, + "Acknowled": 49003, + "ternity": 49004, + "iqueness": 49005, + "ython": 49006, + "><": 49007, + "Ġstd": 49008, + "Url": 49009, + "Ġnamespace": 49010, + "Ġtion": 49011, + "oother": 49012, + "Ó": 49013, + "Ġhemor": 49014, + "Ġrg": 49015, + "ventory": 49016, + "ãĤ¢": 49017, + "anamo": 49018, + "Socket": 49019, + "Topics": 49020, + "apeshifter": 49021, + "gnu": 49022, + "Ġdetrim": 49023, + "`.": 49024, + "romeda": 49025, + "çIJ": 49026, + "Ġlambda": 49027, + "Compan": 49028, + "Variable": 49029, + "Ġusb": 49030, + "ĠAdamant": 49031, + "ournal": 49032, + "Ġcovari": 49033, + "ãĥ©": 49034, + "éĸ": 49035, + "åİ": 49036, + "otaur": 49037, + "Ġ(),": 49038, + "Marginal": 49039, + "ãģı": 49040, + "Ġphysic": 49041, + "adeon": 49042, + "RESULTS": 49043, + "200000": 49044, + "ãģį": 49045, + "udeb": 49046, + "ãģĵ": 49047, + "COMPLE": 49048, + "Ġmsg": 49049, + "ghazi": 49050, + "/*": 49051, + "ĠDeity": 49052, + "Ġdisapp": 49053, + "Availability": 49054, + "Ġillum": 49055, + "à©": 49056, + "ptives": 49057, + ",âĢĶ": 49058, + "chnology": 49059, + "Ġaccur": 49060, + "Ġapi": 49061, + "Obj": 49062, + "ãĤ«": 49063, + "ãĤ¸": 49064, + "ä¹ĭ": 49065, + "ËĪ": 49066, + "Ġtcp": 49067, + "Required": 49068, + ".<": 49069, + "\".[": 49070, + "Ġ~/.": 49071, + "Ġobser": 49072, + "RFC": 49073, + "Ġintegers": 49074, + "åī": 49075, + "Installation": 49076, + "Ô": 49077, + "ó": 49078, + "csv": 49079, + "ãĥ«": 49080, + "ĠNoticed": 49081, + "âĸĵ": 49082, + "Tumblr": 49083, + "Reply": 49084, + "||": 49085, + "Ġconclud": 49086, + "Ġ))": 49087, + "ebin": 49088, + "sql": 49089, + "Closure": 49090, + "++++": 49091, + "],[": 49092, + "âĹı": 49093, + "Ġprolet": 49094, + "Ġ>=": 49095, + "estinal": 49096, + "Ġ[*": 49097, + "ĠInquisitor": 49098, + "Ġcmd": 49099, + "FINE": 49100, + "CRIP": 49101, + "Ġvertex": 49102, + "TeX": 49103, + "///": 49104, + "Ö¼": 49105, + "iscons": 49106, + "Ġmyster": 49107, + "Changed": 49108, + "timeout": 49109, + "irtual": 49110, + "Methods": 49111, + "Ġcerts": 49112, + "texture": 49113, + "Roaming": 49114, + "Proxy": 49115, + "Override": 49116, + "éĹ": 49117, + "utf": 49118, + "python": 49119, + "ĠRarity": 49120, + "ilitarian": 49121, + "çľ": 49122, + "().": 49123, + "æł": 49124, + "Ġbuf": 49125, + "åij": 49126, + "çķ": 49127, + "Ġ*.": 49128, + "umerable": 49129, + "~~~~": 49130, + "å¦": 49131, + "Ġsimultane": 49132, + "Ġjson": 49133, + "Requires": 49134, + "Ġperl": 49135, + "Interface": 49136, + "rupal": 49137, + ":": 49242, + "itialized": 49243, + "HTTP": 49244, + "Trivia": 49245, + "Sov": 49246, + "wrapper": 49247, + "={": 49248, + "ĠAzerb": 49249, + "aeper": 49250, + "Ġneighb": 49251, + "initions": 49252, + "Ġsts": 49253, + "ĠSasuke": 49254, + "#$": 49255, + "uliffe": 49256, + "æĸ¹": 49257, + "++++++++++++++++": 49258, + "ĠElven": 49259, + "ãģĤ": 49260, + "Ġartif": 49261, + "Folder": 49262, + "Ġà¨": 49263, + "åĤ": 49264, + "Ġphyl": 49265, + "uggest": 49266, + "blance": 49267, + "ãģł": 49268, + "Requirements": 49269, + "Usage": 49270, + "Ġinitialized": 49271, + "ã쮿": 49272, + "conservancy": 49273, + "ĠReincarn": 49274, + ")|": 49275, + "Ġantioxid": 49276, + "ĠClicker": 49277, + "Ġunlaw": 49278, + "Ġ\\(": 49279, + "ãĥĪ": 49280, + "Ġ[*]": 49281, + "Characters": 49282, + "////////": 49283, + "ãĢIJ": 49284, + "ãĤ·": 49285, + "webkit": 49286, + "ãĢij": 49287, + "Ġxp": 49288, + "alkyrie": 49289, + "Console": 49290, + "());": 49291, + "ĠKorra": 49292, + "\"))": 49293, + "oooooooooooooooo": 49294, + "Timer": 49295, + "////////////////": 49296, + "yout": 49297, + "engeance": 49298, + "emetery": 49299, + "Ġmages": 49300, + "mods": 49301, + "Null": 49302, + "Ġphilos": 49303, + "ascript": 49304, + "Ġaddon": 49305, + "ĠâĸĪ": 49306, + "emale": 49307, + "----------------------------------------------------------------": 49308, + "Ġ\\\\": 49309, + "=[": 49310, + "ĠParables": 49311, + "ãĥĨ": 49312, + "VALUE": 49313, + "Ġ@@": 49314, + "Ġuint": 49315, + "${": 49316, + "cpp": 49317, + "%%": 49318, + "Ġ(âĪĴ": 49319, + "utils": 49320, + "prefix": 49321, + "å°Ĩ": 49322, + "ãĥŃ": 49323, + "Completed": 49324, + "Ġgoto": 49325, + "ãĤ¯": 49326, + "Winged": 49327, + "perty": 49328, + "[\"": 49329, + "ãĥİ": 49330, + "ĠScythe": 49331, + "Ġæľ": 49332, + "Ġ!=": 49333, + "Buffer": 49334, + "docker": 49335, + "ĠWATCHED": 49336, + "èĢħ": 49337, + "())": 49338, + "Ġdst": 49339, + "SIZE": 49340, + "ĠDemonic": 49341, + "Ġresil": 49342, + "ãĤ¿": 49343, + "Ġpione": 49344, + "cpu": 49345, + "++)": 49346, + "TEXT": 49347, + "Ġdiscrep": 49348, + "debian": 49349, + "quished": 49350, + "Ġacknow": 49351, + "Ġtrave": 49352, + "Ġgcc": 49353, + "Catalog": 49354, + "ctrl": 49355, + "ĠMoroc": 49356, + "Ġcpu": 49357, + "Ġ];": 49358, + "ĠSorceress": 49359, + "Introduced": 49360, + "Frames": 49361, + "Ġcondem": 49362, + "¶æ": 49363, + "~~~~~~~~": 49364, + "ĠEmacs": 49365, + "][/": 49366, + "Ġglim": 49367, + "Init": 49368, + "ĠPrimordial": 49369, + "ãĥĥ": 49370, + "Ġ+=": 49371, + "Ġblat": 49372, + "à¼": 49373, + "------------------------------------------------": 49374, + "gpu": 49375, + "ãĥĥãĥĪ": 49376, + "Ġxml": 49377, + "Ġboolean": 49378, + "References": 49379, + "Ġ?)": 49380, + "Ġsatell": 49381, + "Queue": 49382, + "Ġpestic": 49383, + "Ġ}}": 49384, + "Attribute": 49385, + "Ġdx": 49386, + "ĠDefin": 49387, + "Synopsis": 49388, + "..................": 49389, + "ãĥ¬": 49390, + "plugin": 49391, + "Disable": 49392, + "0000000000000000": 49393, + ")\\": 49394, + "ĠIchigo": 49395, + "println": 49396, + "rontal": 49397, + "Setup": 49398, + "Ġ��������": 49399, + "å§": 49400, + "âĸº": 49401, + "ĠPengu": 49402, + "ailability": 49403, + "Duration": 49404, + "Timeout": 49405, + "ãĢĮ": 49406, + "Ġbehav": 49407, + "Reviewed": 49408, + "Ġtoget": 49409, + "\\.": 49410, + "lished": 49411, + "Ġthous": 49412, + "Ġperpend": 49413, + "ecause": 49414, + "Layout": 49415, + "è»": 49416, + "ĠDexterity": 49417, + "unsigned": 49418, + "+=": 49419, + "[[": 49420, + "ĠRunes": 49421, + "ãĤ¦": 49422, + "};": 49423, + "})": 49424, + "FTWARE": 49425, + "ength": 49426, + "milo": 49427, + "duino": 49428, + "天": 49429, + "ĠClojure": 49430, + "ļé": 49431, + "ãĥ¥": 49432, + "gradient": 49433, + "Ġ\"\"\"": 49434, + "âĨij": 49435, + "@#": 49436, + "JSON": 49437, + "Ġproport": 49438, + "addr": 49439, + "});": 49440, + "ãĥIJ": 49441, + "ä¸ī": 49442, + "Ġtmp": 49443, + "å£": 49444, + "../": 49445, + "zsche": 49446, + "Ġâμ": 49447, + "Entity": 49448, + "æ©Ł": 49449, + "ĠâĶľâĶĢâĶĢ": 49450, + "filename": 49451, + "{{": 49452, + "@@": 49453, + "ĠSeym": 49454, + "Ġ/**": 49455, + "ĠSummoner": 49456, + "Quantity": 49457, + "ç·": 49458, + "Attach": 49459, + "Ġbool": 49460, + "Texture": 49461, + "Ġopio": 49462, + ".}": 49463, + "ãĥĭ": 49464, + "integer": 49465, + "Ġregex": 49466, + "Ġnomine": 49467, + "ription": 49468, + "ãģ®ç": 49469, + "ãĥķ": 49470, + "Ġsubparagraph": 49471, + "GGGG": 49472, + "Ġexplan": 49473, + "Header": 49474, + "Spawn": 49475, + "toggle": 49476, + "²¾": 49477, + "Abyss": 49478, + "expr": 49479, + "ĠZerg": 49480, + "ĠGrimoire": 49481, + "Contents": 49482, + "Instance": 49483, + "cyclopedia": 49484, + "ãĥĹ": 49485, + "ĠTakeru": 49486, + "=(": 49487, + "代": 49488, + "\\)": 49489, + "Ġrgb": 49490, + "htt": 49491, + "bryce": 49492, + "Ġlivest": 49493, + "ĠAnnotations": 49494, + "âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ": 49495, + "berus": 49496, + "ntil": 49497, + "Ġskelet": 49498, + "callback": 49499, + "åħī": 49500, + "Joined": 49501, + "ãĤª": 49502, + "Ġargs": 49503, + "artifacts": 49504, + "Ġå¤": 49505, + "ÃĽ": 49506, + "ãĥŀ": 49507, + "Streamer": 49508, + "}\"": 49509, + "Ġunden": 49510, + "ãĥģ": 49511, + "Īè": 49512, + "ãĥ£": 49513, + "Ġ0004": 49514, + "Ġ\\'": 49515, + "ãĤ°": 49516, + "ĠCONFIG": 49517, + "Ġ#####": 49518, + "``": 49519, + "anguage": 49520, + "Ġ*)": 49521, + "Template": 49522, + "MODE": 49523, + "Ġ00000000": 49524, + "'';": 49525, + ">": 49625, + "Ġlvl": 49626, + "Footnote": 49627, + "Iter": 49628, + "####": 49629, + "ãĥij": 49630, + "ĠCarbuncle": 49631, + "Ġ[+]": 49632, + "Ġmathemat": 49633, + "Allows": 49634, + "Ġ4090": 49635, + "Async": 49636, + "ģ«": 49637, + "Ͻ": 49638, + "))))": 49639, + "á½": 49640, + "Ġcx": 49641, + "Ġansw": 49642, + "{\"": 49643, + "ãĥŁ": 49644, + "addons": 49645, + "Filename": 49646, + "Appearances": 49647, + "ĠãĢĮ": 49648, + "Ġaddr": 49649, + "Ġcharact": 49650, + "glomer": 49651, + "Advertisements": 49652, + "Ġdracon": 49653, + "ĠFenrir": 49654, + "Ġ();": 49655, + "ĠCitiz": 49656, + "acebook": 49657, + "Ġparams": 49658, + "]=": 49659, + "Ġsubscript": 49660, + "Ġentreprene": 49661, + "tnc": 49662, + "iversal": 49663, + "Ġmillenn": 49664, + "ithub": 49665, + "/>": 49666, + "Ġ\"{": 49667, + "Frameworks": 49668, + "avorite": 49669, + "Ġ])": 49670, + "Constructed": 49671, + "fml": 49672, + "ãĥį": 49673, + "################################": 49674, + "-|": 49675, + "¥ŀ": 49676, + "Ġwithd": 49677, + "ĠCth": 49678, + "AppData": 49679, + "Msg": 49680, + ":{": 49681, + "ãĤ¨": 49682, + "Ġtuple": 49683, + "ç¥ŀ": 49684, + "Ġintrins": 49685, + "ĠCooldown": 49686, + "ategory": 49687, + "^{": 49688, + "ãĥĬ": 49689, + "''''": 49690, + "çͰ": 49691, + "ĠDEBUG": 49692, + "Ġcannabin": 49693, + "ocobo": 49694, + "Invalid": 49695, + "ãĥĢ": 49696, + "Compat": 49697, + "Ġ({": 49698, + "Removed": 49699, + "Ġconvol": 49700, + "}:": 49701, + "interstitial": 49702, + "Ġ\"": 49721, + "initialized": 49722, + "Ġexting": 49723, + "Poké": 49724, + "Parameters": 49725, + "¶ħ": 49726, + "########": 49727, + "NULL": 49728, + "ãĥĩ": 49729, + "groupon": 49730, + "\\-": 49731, + "ãĥı": 49732, + "ãĤ±": 49733, + "Ġsubsequ": 49734, + "ccording": 49735, + "ĠMODULE": 49736, + "ĠProtoss": 49737, + "\"},{\"": 49738, + "Ġ..............": 49739, + "Integer": 49740, + "endif": 49741, + "ãĥĻ": 49742, + "parser": 49743, + "lambda": 49744, + "Ġcarbohyd": 49745, + "ĠUnloaded": 49746, + "_{": 49747, + "âĸ¬âĸ¬": 49748, + "Ġdebian": 49749, + "]}": 49750, + "ãĤ¶": 49751, + "Parameter": 49752, + "ãĤ£": 49753, + "ãĤ»": 49754, + "Ġ$_": 49755, + "İĭ": 49756, + "Ġiterator": 49757, + "ãĤ¬": 49758, + "WINDOWS": 49759, + "CONCLUS": 49760, + "Ġ\"\\": 49761, + "umbn": 49762, + "(&": 49763, + "ãĥ©ãĥ³": 49764, + "usercontent": 49765, + "ometimes": 49766, + "METHOD": 49767, + "ãĥ¢": 49768, + "potion": 49769, + "ãĥ¯": 49770, + "everal": 49771, + "Ġweap": 49772, + "minecraft": 49773, + "================================": 49774, + "printf": 49775, + "ĠShinra": 49776, + "Ġreluct": 49777, + "\\\",": 49778, + "Runtime": 49779, + "xff": 49780, + "ĠAbyssal": 49781, + "akeru": 49782, + "Ġ\\(\\": 49783, + "\"/>": 49784, + "efficients": 49785, + "Ü": 49786, + "avascript": 49787, + "Ġbehavi": 49788, + "++;": 49789, + "=#": 49790, + "Attributes": 49791, + "âĵĺ": 49792, + "lvl": 49793, + "¬¼": 49794, + "/**": 49795, + "Gameplay": 49796, + "ĠLeilan": 49797, + ">)": 49798, + "=\"/": 49799, + "Ġ));": 49800, + "ãĥĨãĤ£": 49801, + "ġ": 49802, + ".": 49836, + "DEBUG": 49837, + "âĶģ": 49838, + "ãĢı": 49839, + "WithNo": 49840, + "Redditor": 49841, + "ĠâĶľ": 49842, + "Ġfmt": 49843, + "ãĢİ": 49844, + "Ġmsec": 49845, + "ĪĴ": 49846, + "eatures": 49847, + "itially": 49848, + "\"\"\"": 49849, + "ãĥ¼ãĤ¯": 49850, + "Textures": 49851, + "\"},": 49852, + "\"><": 49858, + "||||": 49859, + "ß": 49860, + "iterator": 49861, + "è£ħ": 49862, + "Ĥª": 49863, + "ojure": 49864, + "ãħĭãħĭ": 49865, + "ãĥ¼ãĥ³": 49866, + "Ġprintln": 49867, + "Ġ][": 49868, + "âĸĪâĸĪ": 49869, + "âķIJ": 49870, + "\\\":": 49871, + "senal": 49872, + "é¾į": 49873, + "é¾": 49874, + "Ġcryst": 49875, + "ãĥķãĤ¡": 49876, + "ĠCosponsors": 49877, + "ãĤ·ãĥ£": 49878, + "Magikarp": 49879, + "ĠMagicka": 49880, + "âĸĪâĸĪâĸĪâĸĪ": 49881, + ",,,,,,,,": 49882, + "vertisement": 49883, + "âĶĢâĶĢâĶĢâĶĢ": 49884, + "ãĥķãĤ©": 49885, + "luaj": 49886, + "CLASSIFIED": 49887, + ".''.": 49888, + "byss": 49889, + "Ġ{:": 49890, + "ĠNanto": 49891, + "Ġptr": 49892, + "Ġ%%": 49893, + "Ġteasp": 49894, + "[_": 49895, + "ãĥ¤": 49896, + "ħĭ": 49897, + "ŃĶ": 49898, + "Ġpci": 49899, + "Ġ\"<": 49900, + "GGGGGGGG": 49901, + "æĪ¦": 49902, + "--+": 49903, + "ãĤ®": 49904, + "Ġ())": 49905, + "âĸ¬": 49906, + "Ġsizeof": 49907, + "}}}": 49908, + ";;;;;;;;": 49909, + ">]": 49910, + "âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ": 49911, + "Vaults": 49912, + "Ġistg": 49913, + "Ġnewcom": 49914, + "=]": 49915, + "¿½": 49916, + "ĵĺ": 49917, + "{\\": 49918, + "Args": 49919, + "Ġexha": 49920, + "(\\": 49921, + "Ġunnecess": 49922, + "\"}],\"": 49923, + "ĠUNCLASSIFIED": 49924, + ">(": 49925, + "ãĤ¢ãĥ«": 49926, + "æ©": 49927, + "70710": 49928, + "Ń·": 49929, + "ãĥ¼ãĥĨãĤ£": 49930, + "ĠSakuya": 49931, + "ãĥĥãĥī": 49932, + "ĠPyrrha": 49933, + "escription": 49934, + "VIDIA": 49935, + "================================================================": 49936, + "Ġlooph": 49937, + "=~": 49938, + "Ġcumbers": 49939, + "Ġ)]": 49940, + "govtrack": 49941, + "ĠãĤµ": 49942, + "Ġsubur": 49943, + "Þ": 49944, + "Ġâī¡": 49945, + "Interstitial": 49946, + "ãĥ¼ãĥĨ": 49947, + "Ġgobl": 49948, + "ãĥīãĥ©": 49949, + "oldown": 49950, + "ģĸ": 49951, + "Depths": 49952, + "Ġ());": 49953, + "Ġ._": 49954, + "20439": 49955, + "Ġç¥ŀ": 49956, + "ãģ®å®": 49957, + "ãĤ¼": 49958, + "Ġ$\\": 49959, + "âĹ¼": 49960, + "Ġencount": 49961, + "Ġ": 48457, + "Ġstreng": 48458, + "agascar": 48459, + "guyen": 48460, + "((": 48461, + ")[": 48462, + "ĠNorn": 48463, + "Ġhippocamp": 48464, + "Ġ¯": 48465, + "îĢ": 48466, + "Connection": 48467, + "PATH": 48468, + "mbuds": 48469, + "ĠShards": 48470, + "Ġadvoc": 48471, + "Ġsimulac": 48472, + "âĸij": 48473, + "!?\"": 48474, + "ĠPotion": 48475, + "Ġamulet": 48476, + "ĠFnatic": 48477, + "Ġcryptoc": 48478, + "wav": 48479, + "radius": 48480, + "pkg": 48481, + "ĠMFT": 48482, + "æĢ": 48483, + "Ġtoile": 48484, + "Items": 48485, + "ifference": 48486, + "errors": 48487, + "ĠCelt": 48488, + "Ġunpop": 48489, + "ilogy": 48490, + "6666": 48491, + "hesda": 48492, + "Instruct": 48493, + "å·": 48494, + "Materials": 48495, + "ettings": 48496, + "Percent": 48497, + "Ġresistor": 48498, + "tymology": 48499, + "Ġdeprecated": 48500, + "Ġgrep": 48501, + "ĠWRITE": 48502, + "Ġtriv": 48503, + "Ġscrut": 48504, + "[/": 48505, + "anyl": 48506, + "skirts": 48507, + "MSN": 48508, + "ĠCodec": 48509, + "ecd": 48510, + "Anth": 48511, + "){": 48512, + "%]": 48513, + "veyard": 48514, + "aspberry": 48515, + "ãĢ": 48516, + "Reward": 48517, + "rha": 48518, + "Stretch": 48519, + "]-": 48520, + "Prev": 48521, + "Context": 48522, + "Ġlinux": 48523, + "HAHA": 48524, + "perties": 48525, + "ĠVIDE": 48526, + "Domain": 48527, + "Ġmurd": 48528, + "ĠLegions": 48529, + "apache": 48530, + "æŃ": 48531, + "Pause": 48532, + "Temperature": 48533, + "ufact": 48534, + "igslist": 48535, + "ĠRetrieved": 48536, + "èª": 48537, + "ãģĮ": 48538, + "Ingredients": 48539, + "ruary": 48540, + "dyl": 48541, + "Alias": 48542, + "ĠÎĶ": 48543, + "Ġinval": 48544, + "amsung": 48545, + "!--": 48546, + "olean": 48547, + "æī": 48548, + "ãģ¯": 48549, + "Ġcoefficients": 48550, + "ĠDHCP": 48551, + "âĨĴ": 48552, + "utonium": 48553, + ":[": 48554, + "âĹ": 48555, + "cli": 48556, + "Container": 48557, + "å¼": 48558, + "nexus": 48559, + "SOURCE": 48560, + "Ò": 48561, + "=/": 48562, + "Ġmysql": 48563, + "ĠGained": 48564, + "Ġ/*": 48565, + "uncture": 48566, + "Ġstatically": 48567, + "âĸł": 48568, + "æĺ¯": 48569, + "æ°": 48570, + "estamp": 48571, + "Cache": 48572, + "ulkan": 48573, + "staking": 48574, + "apter": 48575, + "ãģ¾": 48576, + "Ġμg": 48577, + "Ġtremend": 48578, + "ĠPiercing": 48579, + "naissance": 48580, + "ĠHealer": 48581, + "Enabled": 48582, + "éģ": 48583, + "âĸ": 48584, + "ĠThumbnails": 48585, + "Ġhither": 48586, + "Format": 48587, + "utherland": 48588, + "íķ": 48589, + "Ġdestro": 48590, + "fff": 48591, + "execute": 48592, + "msg": 48593, + "romancer": 48594, + "ĠCanaver": 48595, + "ĠVaults": 48596, + "oided": 48597, + "iage": 48598, + "Ġimg": 48599, + "summary": 48600, + "]);": 48601, + "ĠABE": 48602, + "ĠGamergate": 48603, + "utherford": 48604, + "Ġoverwrite": 48605, + "enment": 48606, + "æķ": 48607, + "Ġsystemd": 48608, + "tif": 48609, + "]).": 48610, + "ãĤ¤": 48611, + "Widget": 48612, + "======": 48613, + "(-": 48614, + "Ġ\"+": 48615, + "ĠIncarnation": 48616, + "æĥ": 48617, + "���": 48618, + "GUI": 48619, + "èĥ": 48620, + "forums": 48621, + "Ġrunes": 48622, + "Ġâī¤": 48623, + "Ġdefic": 48624, + "Distance": 48625, + "directory": 48626, + "ĠHorus": 48627, + "iltr": 48628, + "ortium": 48629, + "Ġ./": 48630, + "bda": 48631, + "owship": 48632, + "ĠâĨij": 48633, + "}.": 48634, + "åĩ": 48635, + "1027": 48636, + "Weapons": 48637, + "lucent": 48638, + "Ġauth": 48639, + ";;": 48640, + "Recommended": 48641, + "Ġsurv": 48642, + "Ġvm": 48643, + "ĠStronghold": 48644, + "Ġparan": 48645, + "ĠTrance": 48646, + "æĺ": 48647, + "Ġsovere": 48648, + "Ġcorrid": 48649, + "ĠPwr": 48650, + "Ġ[/": 48651, + "Ġseq": 48652, + "Population": 48653, + "Ġ[];": 48654, + "Ġreferen": 48655, + "ĠInstr": 48656, + "ĠStamina": 48657, + "kernel": 48658, + "Python": 48659, + "-+": 48660, + "Ġallele": 48661, + "éĽ": 48662, + "isode": 48663, + "ä¸į": 48664, + "otonin": 48665, + "modules": 48666, + "Notable": 48667, + "Spell": 48668, + "\\\\": 48669, + "Pref": 48670, + "Ġdatas": 48671, + "setup": 48672, + "Ġhapl": 48673, + "Height": 48674, + "åĭ": 48675, + "ãģ£": 48676, + "]),": 48677, + "Handle": 48678, + "umenthal": 48679, + "Package": 48680, + "Ġenthus": 48681, + "Ġunsus": 48682, + "Narr": 48683, + "Examples": 48684, + "FAQ": 48685, + "REDACTED": 48686, + "Ġnotor": 48687, + "Enable": 48688, + "Pattern": 48689, + "aeda": 48690, + ">.": 48691, + "CHECK": 48692, + "Ġ����": 48693, + "Ġ'.": 48694, + "Ġãĥ": 48695, + "append": 48696, + "����": 48697, + "gemony": 48698, + "terness": 48699, + "ĠHaku": 48700, + "NVIDIA": 48701, + "queue": 48702, + "Bind": 48703, + "Ġneigh": 48704, + "armor": 48705, + "retty": 48706, + "LOD": 48707, + "plugins": 48708, + "Ġ/>": 48709, + "TYPE": 48710, + "Ġ4096": 48711, + "-------": 48712, + "Preview": 48713, + "FML": 48714, + "Ġproletarian": 48715, + "zees": 48716, + "enfranch": 48717, + "ãģĨ": 48718, + "Ctrl": 48719, + "Module": 48720, + "ĠSurviv": 48721, + "ĠStarcraft": 48722, + "rored": 48723, + "reddit": 48724, + "Ġrul": 48725, + "Ġtx": 48726, + "Ġmage": 48727, + "Sword": 48728, + "Ġ~/": 48729, + "Effects": 48730, + "éļ": 48731, + "ä¹": 48732, + "Sensor": 48733, + "Solution": 48734, + "ãģĻ": 48735, + "Arcade": 48736, + "Ġpredec": 48737, + "Values": 48738, + "Length": 48739, + "Ġfortun": 48740, + "ttp": 48741, + "\"[": 48742, + "tmp": 48743, + "ĠBerserker": 48744, + "åĨ": 48745, + "ositories": 48746, + "Ġcouncill": 48747, + "ffff": 48748, + "));": 48749, + "Recipe": 48750, + "ĠASCII": 48751, + "âĦ¢:": 48752, + "ä": 48753, + "Ġhorm": 48754, + "=>": 48755, + "sers": 48756, + "ãģĭ": 48757, + "Recommend": 48758, + "['": 48759, + "agame": 48760, + "Animation": 48761, + "aucuses": 48762, + "Discussion": 48763, + "Ġhelicop": 48764, + "å¿": 48765, + "Float": 48766, + "Component": 48767, + "instance": 48768, + "Ġfoo": 48769, + "localhost": 48770, + "=-": 48771, + "Offset": 48772, + "Psy": 48773, + "ĠGohan": 48774, + "buquerque": 48775, + "Ġdefe": 48776, + "chwitz": 48777, + "parse": 48778, + "Ġdors": 48779, + "Ġspons": 48780, + "Ġasync": 48781, + "agonists": 48782, + "Ġindo": 48783, + ".>>": 48784, + "ĠDisciple": 48785, + "Ġfilename": 48786, + "rency": 48787, + "ĠDise": 48788, + "Ġ\"/": 48789, + "template": 48790, + "ãĤ¹": 48791, + "swers": 48792, + "Ġ++": 48793, + "Ġ[(": 48794, + "thora": 48795, + "ĠDepths": 48796, + "livious": 48797, + "Ġdisadvant": 48798, + "foundland": 48799, + "Upload": 48800, + "Ġ§§": 48801, + "Ġsophistic": 48802, + ";}": 48803, + "izont": 48804, + "\"}": 48805, + "estial": 48806, + "Ranked": 48807, + "ĠOccupations": 48808, + "LEASE": 48809, + "ĠOgre": 48810, + "folder": 48811, + "Plot": 48812, + "farious": 48813, + "Ġsuscept": 48814, + "Types": 48815, + "Discuss": 48816, + "Ġ'/": 48817, + "æµ": 48818, + "earable": 48819, + "æ³": 48820, + "Tile": 48821, + "iatus": 48822, + "åŃ": 48823, + "Ġreperto": 48824, + "Helper": 48825, + "Returns": 48826, + "ä¸Ĭ": 48827, + "imaru": 48828, + "Ġreq": 48829, + "Ġdissatisf": 48830, + "multipl": 48831, + "}{": 48832, + "-[": 48833, + "itial": 48834, + "*/": 48835, + "Config": 48836, + "Example": 48837, + "ĠjQuery": 48838, + "Mods": 48839, + "ĠGPIO": 48840, + "Ġlaun": 48841, + "layout": 48842, + "cised": 48843, + "Ġ......": 48844, + "+++": 48845, + "prototype": 48846, + "Exception": 48847, + "Ġsubsections": 48848, + "Ġresemb": 48849, + "Ġâĩ": 48850, + "ĠPubMed": 48851, + "username": 48852, + "Ġaggro": 48853, + "éĥ": 48854, + "Ġ};": 48855, + "ĠMages": 48856, + "ryu": 48857, + "apons": 48858, + "Optional": 48859, + "ĠAncients": 48860, + "ãĤĬ": 48861, + "Quotes": 48862, + "oaded": 48863, + "Ġsuspic": 48864, + "inline": 48865, + "omial": 48866, + "ĠMahjong": 48867, + "auntlets": 48868, + "Ġanarchism": 48869, + "Ġsubclass": 48870, + "ĠMLG": 48871, + "...]": 48872, + "Dialog": 48873, + "uphem": 48874, + "Ġrecursive": 48875, + "7601": 48876, + "frac": 48877, + "Else": 48878, + "ĠSeverus": 48879, + "},{\"": 48880, + "ĠCLIENT": 48881, + "Ġjavascript": 48882, + "sama": 48883, + "ĠLearns": 48884, + "ãĤĤ": 48885, + "Upgrade": 48886, + "Listener": 48887, + "Ġsnipp": 48888, + "Ġrune": 48889, + "ĠTTL": 48890, + "ertation": 48891, + "olicy": 48892, + "=\"\"": 48893, + "«ĺ": 48894, + "Ġexpr": 48895, + "ovych": 48896, + "Ġãģ": 48897, + "_-_": 48898, + "munition": 48899, + "////": 48900, + "func": 48901, + ">>>>": 48902, + "Provider": 48903, + "Ïī": 48904, + "BUG": 48905, + "Ġ[-": 48906, + "Ġarrang": 48907, + "merce": 48908, + "ãĥ": 48909, + "incarn": 48910, + "Valid": 48911, + "ĠAether": 48912, + "ãĤĵ": 48913, + "ĠUTF": 48914, + "ĠMonstrous": 48915, + "ãĤĮ": 48916, + "hedon": 48917, + "áµ": 48918, + ":#": 48919, + "ĠFrieza": 48920, + "padding": 48921, + "Reviewer": 48922, + "Ġpsychiat": 48923, + "yrinth": 48924, + "ĠâĶĤ": 48925, + "hillary": 48926, + "Static": 48927, + "Newsletter": 48928, + "Avg": 48929, + "Ġfn": 48930, + "Topic": 48931, + "choes": 48932, + "Ġnewsp": 48933, + "á¸": 48934, + "Ġ[+": 48935, + "~~~~~~~~~~~~~~~~": 48936, + ":]": 48937, + "apego": 48938, + "buf": 48939, + "Translation": 48940, + "ById": 48941, + "Ġmmol": 48942, + "ãĥ¼ãĥ": 48943, + "å½": 48944, + "ãĤī": 48945, + "Ġparser": 48946, + "ãĥª": 48947, + "`,": 48948, + "Lair": 48949, + ")}": 48950, + "ypes": 48951, + "adobe": 48952, + "Ġancest": 48953, + "ernel": 48954, + "ĠNULL": 48955, + "ç«": 48956, + "anguages": 48957, + "Increases": 48958, + "æĦ": 48959, + "utorial": 48960, + "ithmetic": 48961, + "dll": 48962, + "ĠArcane": 48963, + "çī": 48964, + "Ġtc": 48965, + "urtles": 48966, + "èĪ": 48967, + "Bytes": 48968, + "Slot": 48969, + "ĠBahá": 48970, + "Weapon": 48971, + "widget": 48972, + "querque": 48973, + "Ġembodiments": 48974, + "å¥": 48975, + "WARN": 48976, + "swer": 48977, + "thumbnails": 48978, + "FFFF": 48979, + "inguishable": 48980, + "Ġâī": 48981, + "Ġ${": 48982, + "AAAAAAAA": 48983, + "Conclusion": 48984, + "ĻĤ": 48985, + "disable": 48986, + "Rect": 48987, + "Ġsubp": 48988, + "Ġ().": 48989, + "ĠDetected": 48990, + "èĢ": 48991, + "[]": 48992, + "Ġcoerc": 48993, + "ĠmM": 48994, + "recated": 48995, + "fusc": 48996, + "ĠSorce": 48997, + "çĶŁ": 48998, + ").[": 48999, + "Ġ})": 49000, + "mobi": 49001, + "yip": 49002, + "Acknowled": 49003, + "ternity": 49004, + "iqueness": 49005, + "ython": 49006, + "><": 49007, + "Ġstd": 49008, + "Url": 49009, + "Ġnamespace": 49010, + "Ġtion": 49011, + "oother": 49012, + "Ó": 49013, + "Ġhemor": 49014, + "Ġrg": 49015, + "ventory": 49016, + "ãĤ¢": 49017, + "anamo": 49018, + "Socket": 49019, + "Topics": 49020, + "apeshifter": 49021, + "gnu": 49022, + "Ġdetrim": 49023, + "`.": 49024, + "romeda": 49025, + "çIJ": 49026, + "Ġlambda": 49027, + "Compan": 49028, + "Variable": 49029, + "Ġusb": 49030, + "ĠAdamant": 49031, + "ournal": 49032, + "Ġcovari": 49033, + "ãĥ©": 49034, + "éĸ": 49035, + "åİ": 49036, + "otaur": 49037, + "Ġ(),": 49038, + "Marginal": 49039, + "ãģı": 49040, + "Ġphysic": 49041, + "adeon": 49042, + "RESULTS": 49043, + "200000": 49044, + "ãģį": 49045, + "udeb": 49046, + "ãģĵ": 49047, + "COMPLE": 49048, + "Ġmsg": 49049, + "ghazi": 49050, + "/*": 49051, + "ĠDeity": 49052, + "Ġdisapp": 49053, + "Availability": 49054, + "Ġillum": 49055, + "à©": 49056, + "ptives": 49057, + ",âĢĶ": 49058, + "chnology": 49059, + "Ġaccur": 49060, + "Ġapi": 49061, + "Obj": 49062, + "ãĤ«": 49063, + "ãĤ¸": 49064, + "ä¹ĭ": 49065, + "ËĪ": 49066, + "Ġtcp": 49067, + "Required": 49068, + ".<": 49069, + "\".[": 49070, + "Ġ~/.": 49071, + "Ġobser": 49072, + "RFC": 49073, + "Ġintegers": 49074, + "åī": 49075, + "Installation": 49076, + "Ô": 49077, + "ó": 49078, + "csv": 49079, + "ãĥ«": 49080, + "ĠNoticed": 49081, + "âĸĵ": 49082, + "Tumblr": 49083, + "Reply": 49084, + "||": 49085, + "Ġconclud": 49086, + "Ġ))": 49087, + "ebin": 49088, + "sql": 49089, + "Closure": 49090, + "++++": 49091, + "],[": 49092, + "âĹı": 49093, + "Ġprolet": 49094, + "Ġ>=": 49095, + "estinal": 49096, + "Ġ[*": 49097, + "ĠInquisitor": 49098, + "Ġcmd": 49099, + "FINE": 49100, + "CRIP": 49101, + "Ġvertex": 49102, + "TeX": 49103, + "///": 49104, + "Ö¼": 49105, + "iscons": 49106, + "Ġmyster": 49107, + "Changed": 49108, + "timeout": 49109, + "irtual": 49110, + "Methods": 49111, + "Ġcerts": 49112, + "texture": 49113, + "Roaming": 49114, + "Proxy": 49115, + "Override": 49116, + "éĹ": 49117, + "utf": 49118, + "python": 49119, + "ĠRarity": 49120, + "ilitarian": 49121, + "çľ": 49122, + "().": 49123, + "æł": 49124, + "Ġbuf": 49125, + "åij": 49126, + "çķ": 49127, + "Ġ*.": 49128, + "umerable": 49129, + "~~~~": 49130, + "å¦": 49131, + "Ġsimultane": 49132, + "Ġjson": 49133, + "Requires": 49134, + "Ġperl": 49135, + "Interface": 49136, + "rupal": 49137, + ":": 49242, + "itialized": 49243, + "HTTP": 49244, + "Trivia": 49245, + "Sov": 49246, + "wrapper": 49247, + "={": 49248, + "ĠAzerb": 49249, + "aeper": 49250, + "Ġneighb": 49251, + "initions": 49252, + "Ġsts": 49253, + "ĠSasuke": 49254, + "#$": 49255, + "uliffe": 49256, + "æĸ¹": 49257, + "++++++++++++++++": 49258, + "ĠElven": 49259, + "ãģĤ": 49260, + "Ġartif": 49261, + "Folder": 49262, + "Ġà¨": 49263, + "åĤ": 49264, + "Ġphyl": 49265, + "uggest": 49266, + "blance": 49267, + "ãģł": 49268, + "Requirements": 49269, + "Usage": 49270, + "Ġinitialized": 49271, + "ã쮿": 49272, + "conservancy": 49273, + "ĠReincarn": 49274, + ")|": 49275, + "Ġantioxid": 49276, + "ĠClicker": 49277, + "Ġunlaw": 49278, + "Ġ\\(": 49279, + "ãĥĪ": 49280, + "Ġ[*]": 49281, + "Characters": 49282, + "////////": 49283, + "ãĢIJ": 49284, + "ãĤ·": 49285, + "webkit": 49286, + "ãĢij": 49287, + "Ġxp": 49288, + "alkyrie": 49289, + "Console": 49290, + "());": 49291, + "ĠKorra": 49292, + "\"))": 49293, + "oooooooooooooooo": 49294, + "Timer": 49295, + "////////////////": 49296, + "yout": 49297, + "engeance": 49298, + "emetery": 49299, + "Ġmages": 49300, + "mods": 49301, + "Null": 49302, + "Ġphilos": 49303, + "ascript": 49304, + "Ġaddon": 49305, + "ĠâĸĪ": 49306, + "emale": 49307, + "----------------------------------------------------------------": 49308, + "Ġ\\\\": 49309, + "=[": 49310, + "ĠParables": 49311, + "ãĥĨ": 49312, + "VALUE": 49313, + "Ġ@@": 49314, + "Ġuint": 49315, + "${": 49316, + "cpp": 49317, + "%%": 49318, + "Ġ(âĪĴ": 49319, + "utils": 49320, + "prefix": 49321, + "å°Ĩ": 49322, + "ãĥŃ": 49323, + "Completed": 49324, + "Ġgoto": 49325, + "ãĤ¯": 49326, + "Winged": 49327, + "perty": 49328, + "[\"": 49329, + "ãĥİ": 49330, + "ĠScythe": 49331, + "Ġæľ": 49332, + "Ġ!=": 49333, + "Buffer": 49334, + "docker": 49335, + "ĠWATCHED": 49336, + "èĢħ": 49337, + "())": 49338, + "Ġdst": 49339, + "SIZE": 49340, + "ĠDemonic": 49341, + "Ġresil": 49342, + "ãĤ¿": 49343, + "Ġpione": 49344, + "cpu": 49345, + "++)": 49346, + "TEXT": 49347, + "Ġdiscrep": 49348, + "debian": 49349, + "quished": 49350, + "Ġacknow": 49351, + "Ġtrave": 49352, + "Ġgcc": 49353, + "Catalog": 49354, + "ctrl": 49355, + "ĠMoroc": 49356, + "Ġcpu": 49357, + "Ġ];": 49358, + "ĠSorceress": 49359, + "Introduced": 49360, + "Frames": 49361, + "Ġcondem": 49362, + "¶æ": 49363, + "~~~~~~~~": 49364, + "ĠEmacs": 49365, + "][/": 49366, + "Ġglim": 49367, + "Init": 49368, + "ĠPrimordial": 49369, + "ãĥĥ": 49370, + "Ġ+=": 49371, + "Ġblat": 49372, + "à¼": 49373, + "------------------------------------------------": 49374, + "gpu": 49375, + "ãĥĥãĥĪ": 49376, + "Ġxml": 49377, + "Ġboolean": 49378, + "References": 49379, + "Ġ?)": 49380, + "Ġsatell": 49381, + "Queue": 49382, + "Ġpestic": 49383, + "Ġ}}": 49384, + "Attribute": 49385, + "Ġdx": 49386, + "ĠDefin": 49387, + "Synopsis": 49388, + "..................": 49389, + "ãĥ¬": 49390, + "plugin": 49391, + "Disable": 49392, + "0000000000000000": 49393, + ")\\": 49394, + "ĠIchigo": 49395, + "println": 49396, + "rontal": 49397, + "Setup": 49398, + "Ġ��������": 49399, + "å§": 49400, + "âĸº": 49401, + "ĠPengu": 49402, + "ailability": 49403, + "Duration": 49404, + "Timeout": 49405, + "ãĢĮ": 49406, + "Ġbehav": 49407, + "Reviewed": 49408, + "Ġtoget": 49409, + "\\.": 49410, + "lished": 49411, + "Ġthous": 49412, + "Ġperpend": 49413, + "ecause": 49414, + "Layout": 49415, + "è»": 49416, + "ĠDexterity": 49417, + "unsigned": 49418, + "+=": 49419, + "[[": 49420, + "ĠRunes": 49421, + "ãĤ¦": 49422, + "};": 49423, + "})": 49424, + "FTWARE": 49425, + "ength": 49426, + "milo": 49427, + "duino": 49428, + "天": 49429, + "ĠClojure": 49430, + "ļé": 49431, + "ãĥ¥": 49432, + "gradient": 49433, + "Ġ\"\"\"": 49434, + "âĨij": 49435, + "@#": 49436, + "JSON": 49437, + "Ġproport": 49438, + "addr": 49439, + "});": 49440, + "ãĥIJ": 49441, + "ä¸ī": 49442, + "Ġtmp": 49443, + "å£": 49444, + "../": 49445, + "zsche": 49446, + "Ġâμ": 49447, + "Entity": 49448, + "æ©Ł": 49449, + "ĠâĶľâĶĢâĶĢ": 49450, + "filename": 49451, + "{{": 49452, + "@@": 49453, + "ĠSeym": 49454, + "Ġ/**": 49455, + "ĠSummoner": 49456, + "Quantity": 49457, + "ç·": 49458, + "Attach": 49459, + "Ġbool": 49460, + "Texture": 49461, + "Ġopio": 49462, + ".}": 49463, + "ãĥĭ": 49464, + "integer": 49465, + "Ġregex": 49466, + "Ġnomine": 49467, + "ription": 49468, + "ãģ®ç": 49469, + "ãĥķ": 49470, + "Ġsubparagraph": 49471, + "GGGG": 49472, + "Ġexplan": 49473, + "Header": 49474, + "Spawn": 49475, + "toggle": 49476, + "²¾": 49477, + "Abyss": 49478, + "expr": 49479, + "ĠZerg": 49480, + "ĠGrimoire": 49481, + "Contents": 49482, + "Instance": 49483, + "cyclopedia": 49484, + "ãĥĹ": 49485, + "ĠTakeru": 49486, + "=(": 49487, + "代": 49488, + "\\)": 49489, + "Ġrgb": 49490, + "htt": 49491, + "bryce": 49492, + "Ġlivest": 49493, + "ĠAnnotations": 49494, + "âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ": 49495, + "berus": 49496, + "ntil": 49497, + "Ġskelet": 49498, + "callback": 49499, + "åħī": 49500, + "Joined": 49501, + "ãĤª": 49502, + "Ġargs": 49503, + "artifacts": 49504, + "Ġå¤": 49505, + "ÃĽ": 49506, + "ãĥŀ": 49507, + "Streamer": 49508, + "}\"": 49509, + "Ġunden": 49510, + "ãĥģ": 49511, + "Īè": 49512, + "ãĥ£": 49513, + "Ġ0004": 49514, + "Ġ\\'": 49515, + "ãĤ°": 49516, + "ĠCONFIG": 49517, + "Ġ#####": 49518, + "``": 49519, + "anguage": 49520, + "Ġ*)": 49521, + "Template": 49522, + "MODE": 49523, + "Ġ00000000": 49524, + "'';": 49525, + ">": 49625, + "Ġlvl": 49626, + "Footnote": 49627, + "Iter": 49628, + "####": 49629, + "ãĥij": 49630, + "ĠCarbuncle": 49631, + "Ġ[+]": 49632, + "Ġmathemat": 49633, + "Allows": 49634, + "Ġ4090": 49635, + "Async": 49636, + "ģ«": 49637, + "Ͻ": 49638, + "))))": 49639, + "á½": 49640, + "Ġcx": 49641, + "Ġansw": 49642, + "{\"": 49643, + "ãĥŁ": 49644, + "addons": 49645, + "Filename": 49646, + "Appearances": 49647, + "ĠãĢĮ": 49648, + "Ġaddr": 49649, + "Ġcharact": 49650, + "glomer": 49651, + "Advertisements": 49652, + "Ġdracon": 49653, + "ĠFenrir": 49654, + "Ġ();": 49655, + "ĠCitiz": 49656, + "acebook": 49657, + "Ġparams": 49658, + "]=": 49659, + "Ġsubscript": 49660, + "Ġentreprene": 49661, + "tnc": 49662, + "iversal": 49663, + "Ġmillenn": 49664, + "ithub": 49665, + "/>": 49666, + "Ġ\"{": 49667, + "Frameworks": 49668, + "avorite": 49669, + "Ġ])": 49670, + "Constructed": 49671, + "fml": 49672, + "ãĥį": 49673, + "################################": 49674, + "-|": 49675, + "¥ŀ": 49676, + "Ġwithd": 49677, + "ĠCth": 49678, + "AppData": 49679, + "Msg": 49680, + ":{": 49681, + "ãĤ¨": 49682, + "Ġtuple": 49683, + "ç¥ŀ": 49684, + "Ġintrins": 49685, + "ĠCooldown": 49686, + "ategory": 49687, + "^{": 49688, + "ãĥĬ": 49689, + "''''": 49690, + "çͰ": 49691, + "ĠDEBUG": 49692, + "Ġcannabin": 49693, + "ocobo": 49694, + "Invalid": 49695, + "ãĥĢ": 49696, + "Compat": 49697, + "Ġ({": 49698, + "Removed": 49699, + "Ġconvol": 49700, + "}:": 49701, + "interstitial": 49702, + "Ġ\"": 49721, + "initialized": 49722, + "Ġexting": 49723, + "Poké": 49724, + "Parameters": 49725, + "¶ħ": 49726, + "########": 49727, + "NULL": 49728, + "ãĥĩ": 49729, + "groupon": 49730, + "\\-": 49731, + "ãĥı": 49732, + "ãĤ±": 49733, + "Ġsubsequ": 49734, + "ccording": 49735, + "ĠMODULE": 49736, + "ĠProtoss": 49737, + "\"},{\"": 49738, + "Ġ..............": 49739, + "Integer": 49740, + "endif": 49741, + "ãĥĻ": 49742, + "parser": 49743, + "lambda": 49744, + "Ġcarbohyd": 49745, + "ĠUnloaded": 49746, + "_{": 49747, + "âĸ¬âĸ¬": 49748, + "Ġdebian": 49749, + "]}": 49750, + "ãĤ¶": 49751, + "Parameter": 49752, + "ãĤ£": 49753, + "ãĤ»": 49754, + "Ġ$_": 49755, + "İĭ": 49756, + "Ġiterator": 49757, + "ãĤ¬": 49758, + "WINDOWS": 49759, + "CONCLUS": 49760, + "Ġ\"\\": 49761, + "umbn": 49762, + "(&": 49763, + "ãĥ©ãĥ³": 49764, + "usercontent": 49765, + "ometimes": 49766, + "METHOD": 49767, + "ãĥ¢": 49768, + "potion": 49769, + "ãĥ¯": 49770, + "everal": 49771, + "Ġweap": 49772, + "minecraft": 49773, + "================================": 49774, + "printf": 49775, + "ĠShinra": 49776, + "Ġreluct": 49777, + "\\\",": 49778, + "Runtime": 49779, + "xff": 49780, + "ĠAbyssal": 49781, + "akeru": 49782, + "Ġ\\(\\": 49783, + "\"/>": 49784, + "efficients": 49785, + "Ü": 49786, + "avascript": 49787, + "Ġbehavi": 49788, + "++;": 49789, + "=#": 49790, + "Attributes": 49791, + "âĵĺ": 49792, + "lvl": 49793, + "¬¼": 49794, + "/**": 49795, + "Gameplay": 49796, + "ĠLeilan": 49797, + ">)": 49798, + "=\"/": 49799, + "Ġ));": 49800, + "ãĥĨãĤ£": 49801, + "ġ": 49802, + ".": 49836, + "DEBUG": 49837, + "âĶģ": 49838, + "ãĢı": 49839, + "WithNo": 49840, + "Redditor": 49841, + "ĠâĶľ": 49842, + "Ġfmt": 49843, + "ãĢİ": 49844, + "Ġmsec": 49845, + "ĪĴ": 49846, + "eatures": 49847, + "itially": 49848, + "\"\"\"": 49849, + "ãĥ¼ãĤ¯": 49850, + "Textures": 49851, + "\"},": 49852, + "\"><": 49858, + "||||": 49859, + "ß": 49860, + "iterator": 49861, + "è£ħ": 49862, + "Ĥª": 49863, + "ojure": 49864, + "ãħĭãħĭ": 49865, + "ãĥ¼ãĥ³": 49866, + "Ġprintln": 49867, + "Ġ][": 49868, + "âĸĪâĸĪ": 49869, + "âķIJ": 49870, + "\\\":": 49871, + "senal": 49872, + "é¾į": 49873, + "é¾": 49874, + "Ġcryst": 49875, + "ãĥķãĤ¡": 49876, + "ĠCosponsors": 49877, + "ãĤ·ãĥ£": 49878, + "Magikarp": 49879, + "ĠMagicka": 49880, + "âĸĪâĸĪâĸĪâĸĪ": 49881, + ",,,,,,,,": 49882, + "vertisement": 49883, + "âĶĢâĶĢâĶĢâĶĢ": 49884, + "ãĥķãĤ©": 49885, + "luaj": 49886, + "CLASSIFIED": 49887, + ".''.": 49888, + "byss": 49889, + "Ġ{:": 49890, + "ĠNanto": 49891, + "Ġptr": 49892, + "Ġ%%": 49893, + "Ġteasp": 49894, + "[_": 49895, + "ãĥ¤": 49896, + "ħĭ": 49897, + "ŃĶ": 49898, + "Ġpci": 49899, + "Ġ\"<": 49900, + "GGGGGGGG": 49901, + "æĪ¦": 49902, + "--+": 49903, + "ãĤ®": 49904, + "Ġ())": 49905, + "âĸ¬": 49906, + "Ġsizeof": 49907, + "}}}": 49908, + ";;;;;;;;": 49909, + ">]": 49910, + "âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ": 49911, + "Vaults": 49912, + "Ġistg": 49913, + "Ġnewcom": 49914, + "=]": 49915, + "¿½": 49916, + "ĵĺ": 49917, + "{\\": 49918, + "Args": 49919, + "Ġexha": 49920, + "(\\": 49921, + "Ġunnecess": 49922, + "\"}],\"": 49923, + "ĠUNCLASSIFIED": 49924, + ">(": 49925, + "ãĤ¢ãĥ«": 49926, + "æ©": 49927, + "70710": 49928, + "Ń·": 49929, + "ãĥ¼ãĥĨãĤ£": 49930, + "ĠSakuya": 49931, + "ãĥĥãĥī": 49932, + "ĠPyrrha": 49933, + "escription": 49934, + "VIDIA": 49935, + "================================================================": 49936, + "Ġlooph": 49937, + "=~": 49938, + "Ġcumbers": 49939, + "Ġ)]": 49940, + "govtrack": 49941, + "ĠãĤµ": 49942, + "Ġsubur": 49943, + "Þ": 49944, + "Ġâī¡": 49945, + "Interstitial": 49946, + "ãĥ¼ãĥĨ": 49947, + "Ġgobl": 49948, + "ãĥīãĥ©": 49949, + "oldown": 49950, + "ģĸ": 49951, + "Depths": 49952, + "Ġ());": 49953, + "Ġ._": 49954, + "20439": 49955, + "Ġç¥ŀ": 49956, + "ãģ®å®": 49957, + "ãĤ¼": 49958, + "Ġ$\\": 49959, + "âĹ¼": 49960, + "Ġencount": 49961, + "Ġ":48457,"Ġstreng":48458,"agascar":48459,"guyen":48460,"((":48461,")[":48462,"ĠNorn":48463,"Ġhippocamp":48464,"Ġ¯":48465,"îĢ":48466,"Connection":48467,"PATH":48468,"mbuds":48469,"ĠShards":48470,"Ġadvoc":48471,"Ġsimulac":48472,"âĸij":48473,"!?\"":48474,"ĠPotion":48475,"Ġamulet":48476,"ĠFnatic":48477,"Ġcryptoc":48478,"wav":48479,"radius":48480,"pkg":48481,"ĠMFT":48482,"æĢ":48483,"Ġtoile":48484,"Items":48485,"ifference":48486,"errors":48487,"ĠCelt":48488,"Ġunpop":48489,"ilogy":48490,"6666":48491,"hesda":48492,"Instruct":48493,"å·":48494,"Materials":48495,"ettings":48496,"Percent":48497,"Ġresistor":48498,"tymology":48499,"Ġdeprecated":48500,"Ġgrep":48501,"ĠWRITE":48502,"Ġtriv":48503,"Ġscrut":48504,"[/":48505,"anyl":48506,"skirts":48507,"MSN":48508,"ĠCodec":48509,"ecd":48510,"Anth":48511,"){":48512,"%]":48513,"veyard":48514,"aspberry":48515,"ãĢ":48516,"Reward":48517,"rha":48518,"Stretch":48519,"]-":48520,"Prev":48521,"Context":48522,"Ġlinux":48523,"HAHA":48524,"perties":48525,"ĠVIDE":48526,"Domain":48527,"Ġmurd":48528,"ĠLegions":48529,"apache":48530,"æŃ":48531,"Pause":48532,"Temperature":48533,"ufact":48534,"igslist":48535,"ĠRetrieved":48536,"èª":48537,"ãģĮ":48538,"Ingredients":48539,"ruary":48540,"dyl":48541,"Alias":48542,"ĠÎĶ":48543,"Ġinval":48544,"amsung":48545,"!--":48546,"olean":48547,"æī":48548,"ãģ¯":48549,"Ġcoefficients":48550,"ĠDHCP":48551,"âĨĴ":48552,"utonium":48553,":[":48554,"âĹ":48555,"cli":48556,"Container":48557,"å¼":48558,"nexus":48559,"SOURCE":48560,"Ò":48561,"=/":48562,"Ġmysql":48563,"ĠGained":48564,"Ġ/*":48565,"uncture":48566,"Ġstatically":48567,"âĸł":48568,"æĺ¯":48569,"æ°":48570,"estamp":48571,"Cache":48572,"ulkan":48573,"staking":48574,"apter":48575,"ãģ¾":48576,"Ġμg":48577,"Ġtremend":48578,"ĠPiercing":48579,"naissance":48580,"ĠHealer":48581,"Enabled":48582,"éģ":48583,"âĸ":48584,"ĠThumbnails":48585,"Ġhither":48586,"Format":48587,"utherland":48588,"íķ":48589,"Ġdestro":48590,"fff":48591,"execute":48592,"msg":48593,"romancer":48594,"ĠCanaver":48595,"ĠVaults":48596,"oided":48597,"iage":48598,"Ġimg":48599,"summary":48600,"]);":48601,"ĠABE":48602,"ĠGamergate":48603,"utherford":48604,"Ġoverwrite":48605,"enment":48606,"æķ":48607,"Ġsystemd":48608,"tif":48609,"]).":48610,"ãĤ¤":48611,"Widget":48612,"======":48613,"(-":48614,"Ġ\"+":48615,"ĠIncarnation":48616,"æĥ":48617,"���":48618,"GUI":48619,"èĥ":48620,"forums":48621,"Ġrunes":48622,"Ġâī¤":48623,"Ġdefic":48624,"Distance":48625,"directory":48626,"ĠHorus":48627,"iltr":48628,"ortium":48629,"Ġ./":48630,"bda":48631,"owship":48632,"ĠâĨij":48633,"}.":48634,"åĩ":48635,"1027":48636,"Weapons":48637,"lucent":48638,"Ġauth":48639,";;":48640,"Recommended":48641,"Ġsurv":48642,"Ġvm":48643,"ĠStronghold":48644,"Ġparan":48645,"ĠTrance":48646,"æĺ":48647,"Ġsovere":48648,"Ġcorrid":48649,"ĠPwr":48650,"Ġ[/":48651,"Ġseq":48652,"Population":48653,"Ġ[];":48654,"Ġreferen":48655,"ĠInstr":48656,"ĠStamina":48657,"kernel":48658,"Python":48659,"-+":48660,"Ġallele":48661,"éĽ":48662,"isode":48663,"ä¸į":48664,"otonin":48665,"modules":48666,"Notable":48667,"Spell":48668,"\\\\":48669,"Pref":48670,"Ġdatas":48671,"setup":48672,"Ġhapl":48673,"Height":48674,"åĭ":48675,"ãģ£":48676,"]),":48677,"Handle":48678,"umenthal":48679,"Package":48680,"Ġenthus":48681,"Ġunsus":48682,"Narr":48683,"Examples":48684,"FAQ":48685,"REDACTED":48686,"Ġnotor":48687,"Enable":48688,"Pattern":48689,"aeda":48690,">.":48691,"CHECK":48692,"Ġ����":48693,"Ġ'.":48694,"Ġãĥ":48695,"append":48696,"����":48697,"gemony":48698,"terness":48699,"ĠHaku":48700,"NVIDIA":48701,"queue":48702,"Bind":48703,"Ġneigh":48704,"armor":48705,"retty":48706,"LOD":48707,"plugins":48708,"Ġ/>":48709,"TYPE":48710,"Ġ4096":48711,"-------":48712,"Preview":48713,"FML":48714,"Ġproletarian":48715,"zees":48716,"enfranch":48717,"ãģĨ":48718,"Ctrl":48719,"Module":48720,"ĠSurviv":48721,"ĠStarcraft":48722,"rored":48723,"reddit":48724,"Ġrul":48725,"Ġtx":48726,"Ġmage":48727,"Sword":48728,"Ġ~/":48729,"Effects":48730,"éļ":48731,"ä¹":48732,"Sensor":48733,"Solution":48734,"ãģĻ":48735,"Arcade":48736,"Ġpredec":48737,"Values":48738,"Length":48739,"Ġfortun":48740,"ttp":48741,"\"[":48742,"tmp":48743,"ĠBerserker":48744,"åĨ":48745,"ositories":48746,"Ġcouncill":48747,"ffff":48748,"));":48749,"Recipe":48750,"ĠASCII":48751,"âĦ¢:":48752,"ä":48753,"Ġhorm":48754,"=>":48755,"sers":48756,"ãģĭ":48757,"Recommend":48758,"['":48759,"agame":48760,"Animation":48761,"aucuses":48762,"Discussion":48763,"Ġhelicop":48764,"å¿":48765,"Float":48766,"Component":48767,"instance":48768,"Ġfoo":48769,"localhost":48770,"=-":48771,"Offset":48772,"Psy":48773,"ĠGohan":48774,"buquerque":48775,"Ġdefe":48776,"chwitz":48777,"parse":48778,"Ġdors":48779,"Ġspons":48780,"Ġasync":48781,"agonists":48782,"Ġindo":48783,".>>":48784,"ĠDisciple":48785,"Ġfilename":48786,"rency":48787,"ĠDise":48788,"Ġ\"/":48789,"template":48790,"ãĤ¹":48791,"swers":48792,"Ġ++":48793,"Ġ[(":48794,"thora":48795,"ĠDepths":48796,"livious":48797,"Ġdisadvant":48798,"foundland":48799,"Upload":48800,"Ġ§§":48801,"Ġsophistic":48802,";}":48803,"izont":48804,"\"}":48805,"estial":48806,"Ranked":48807,"ĠOccupations":48808,"LEASE":48809,"ĠOgre":48810,"folder":48811,"Plot":48812,"farious":48813,"Ġsuscept":48814,"Types":48815,"Discuss":48816,"Ġ'/":48817,"æµ":48818,"earable":48819,"æ³":48820,"Tile":48821,"iatus":48822,"åŃ":48823,"Ġreperto":48824,"Helper":48825,"Returns":48826,"ä¸Ĭ":48827,"imaru":48828,"Ġreq":48829,"Ġdissatisf":48830,"multipl":48831,"}{":48832,"-[":48833,"itial":48834,"*/":48835,"Config":48836,"Example":48837,"ĠjQuery":48838,"Mods":48839,"ĠGPIO":48840,"Ġlaun":48841,"layout":48842,"cised":48843,"Ġ......":48844,"+++":48845,"prototype":48846,"Exception":48847,"Ġsubsections":48848,"Ġresemb":48849,"Ġâĩ":48850,"ĠPubMed":48851,"username":48852,"Ġaggro":48853,"éĥ":48854,"Ġ};":48855,"ĠMages":48856,"ryu":48857,"apons":48858,"Optional":48859,"ĠAncients":48860,"ãĤĬ":48861,"Quotes":48862,"oaded":48863,"Ġsuspic":48864,"inline":48865,"omial":48866,"ĠMahjong":48867,"auntlets":48868,"Ġanarchism":48869,"Ġsubclass":48870,"ĠMLG":48871,"...]":48872,"Dialog":48873,"uphem":48874,"Ġrecursive":48875,"7601":48876,"frac":48877,"Else":48878,"ĠSeverus":48879,"},{\"":48880,"ĠCLIENT":48881,"Ġjavascript":48882,"sama":48883,"ĠLearns":48884,"ãĤĤ":48885,"Upgrade":48886,"Listener":48887,"Ġsnipp":48888,"Ġrune":48889,"ĠTTL":48890,"ertation":48891,"olicy":48892,"=\"\"":48893,"«ĺ":48894,"Ġexpr":48895,"ovych":48896,"Ġãģ":48897,"_-_":48898,"munition":48899,"////":48900,"func":48901,">>>>":48902,"Provider":48903,"Ïī":48904,"BUG":48905,"Ġ[-":48906,"Ġarrang":48907,"merce":48908,"ãĥ":48909,"incarn":48910,"Valid":48911,"ĠAether":48912,"ãĤĵ":48913,"ĠUTF":48914,"ĠMonstrous":48915,"ãĤĮ":48916,"hedon":48917,"áµ":48918,":#":48919,"ĠFrieza":48920,"padding":48921,"Reviewer":48922,"Ġpsychiat":48923,"yrinth":48924,"ĠâĶĤ":48925,"hillary":48926,"Static":48927,"Newsletter":48928,"Avg":48929,"Ġfn":48930,"Topic":48931,"choes":48932,"Ġnewsp":48933,"á¸":48934,"Ġ[+":48935,"~~~~~~~~~~~~~~~~":48936,":]":48937,"apego":48938,"buf":48939,"Translation":48940,"ById":48941,"Ġmmol":48942,"ãĥ¼ãĥ":48943,"å½":48944,"ãĤī":48945,"Ġparser":48946,"ãĥª":48947,"`,":48948,"Lair":48949,")}":48950,"ypes":48951,"adobe":48952,"Ġancest":48953,"ernel":48954,"ĠNULL":48955,"ç«":48956,"anguages":48957,"Increases":48958,"æĦ":48959,"utorial":48960,"ithmetic":48961,"dll":48962,"ĠArcane":48963,"çī":48964,"Ġtc":48965,"urtles":48966,"èĪ":48967,"Bytes":48968,"Slot":48969,"ĠBahá":48970,"Weapon":48971,"widget":48972,"querque":48973,"Ġembodiments":48974,"å¥":48975,"WARN":48976,"swer":48977,"thumbnails":48978,"FFFF":48979,"inguishable":48980,"Ġâī":48981,"Ġ${":48982,"AAAAAAAA":48983,"Conclusion":48984,"ĻĤ":48985,"disable":48986,"Rect":48987,"Ġsubp":48988,"Ġ().":48989,"ĠDetected":48990,"èĢ":48991,"[]":48992,"Ġcoerc":48993,"ĠmM":48994,"recated":48995,"fusc":48996,"ĠSorce":48997,"çĶŁ":48998,").[":48999,"Ġ})":49000,"mobi":49001,"yip":49002,"Acknowled":49003,"ternity":49004,"iqueness":49005,"ython":49006,"><":49007,"Ġstd":49008,"Url":49009,"Ġnamespace":49010,"Ġtion":49011,"oother":49012,"Ó":49013,"Ġhemor":49014,"Ġrg":49015,"ventory":49016,"ãĤ¢":49017,"anamo":49018,"Socket":49019,"Topics":49020,"apeshifter":49021,"gnu":49022,"Ġdetrim":49023,"`.":49024,"romeda":49025,"çIJ":49026,"Ġlambda":49027,"Compan":49028,"Variable":49029,"Ġusb":49030,"ĠAdamant":49031,"ournal":49032,"Ġcovari":49033,"ãĥ©":49034,"éĸ":49035,"åİ":49036,"otaur":49037,"Ġ(),":49038,"Marginal":49039,"ãģı":49040,"Ġphysic":49041,"adeon":49042,"RESULTS":49043,"200000":49044,"ãģį":49045,"udeb":49046,"ãģĵ":49047,"COMPLE":49048,"Ġmsg":49049,"ghazi":49050,"/*":49051,"ĠDeity":49052,"Ġdisapp":49053,"Availability":49054,"Ġillum":49055,"à©":49056,"ptives":49057,",âĢĶ":49058,"chnology":49059,"Ġaccur":49060,"Ġapi":49061,"Obj":49062,"ãĤ«":49063,"ãĤ¸":49064,"ä¹ĭ":49065,"ËĪ":49066,"Ġtcp":49067,"Required":49068,".<":49069,"\".[":49070,"Ġ~/.":49071,"Ġobser":49072,"RFC":49073,"Ġintegers":49074,"åī":49075,"Installation":49076,"Ô":49077,"ó":49078,"csv":49079,"ãĥ«":49080,"ĠNoticed":49081,"âĸĵ":49082,"Tumblr":49083,"Reply":49084,"||":49085,"Ġconclud":49086,"Ġ))":49087,"ebin":49088,"sql":49089,"Closure":49090,"++++":49091,"],[":49092,"âĹı":49093,"Ġprolet":49094,"Ġ>=":49095,"estinal":49096,"Ġ[*":49097,"ĠInquisitor":49098,"Ġcmd":49099,"FINE":49100,"CRIP":49101,"Ġvertex":49102,"TeX":49103,"///":49104,"Ö¼":49105,"iscons":49106,"Ġmyster":49107,"Changed":49108,"timeout":49109,"irtual":49110,"Methods":49111,"Ġcerts":49112,"texture":49113,"Roaming":49114,"Proxy":49115,"Override":49116,"éĹ":49117,"utf":49118,"python":49119,"ĠRarity":49120,"ilitarian":49121,"çľ":49122,"().":49123,"æł":49124,"Ġbuf":49125,"åij":49126,"çķ":49127,"Ġ*.":49128,"umerable":49129,"~~~~":49130,"å¦":49131,"Ġsimultane":49132,"Ġjson":49133,"Requires":49134,"Ġperl":49135,"Interface":49136,"rupal":49137,":":49242,"itialized":49243,"HTTP":49244,"Trivia":49245,"Sov":49246,"wrapper":49247,"={":49248,"ĠAzerb":49249,"aeper":49250,"Ġneighb":49251,"initions":49252,"Ġsts":49253,"ĠSasuke":49254,"#$":49255,"uliffe":49256,"æĸ¹":49257,"++++++++++++++++":49258,"ĠElven":49259,"ãģĤ":49260,"Ġartif":49261,"Folder":49262,"Ġà¨":49263,"åĤ":49264,"Ġphyl":49265,"uggest":49266,"blance":49267,"ãģł":49268,"Requirements":49269,"Usage":49270,"Ġinitialized":49271,"ã쮿":49272,"conservancy":49273,"ĠReincarn":49274,")|":49275,"Ġantioxid":49276,"ĠClicker":49277,"Ġunlaw":49278,"Ġ\\(":49279,"ãĥĪ":49280,"Ġ[*]":49281,"Characters":49282,"////////":49283,"ãĢIJ":49284,"ãĤ·":49285,"webkit":49286,"ãĢij":49287,"Ġxp":49288,"alkyrie":49289,"Console":49290,"());":49291,"ĠKorra":49292,"\"))":49293,"oooooooooooooooo":49294,"Timer":49295,"////////////////":49296,"yout":49297,"engeance":49298,"emetery":49299,"Ġmages":49300,"mods":49301,"Null":49302,"Ġphilos":49303,"ascript":49304,"Ġaddon":49305,"ĠâĸĪ":49306,"emale":49307,"----------------------------------------------------------------":49308,"Ġ\\\\":49309,"=[":49310,"ĠParables":49311,"ãĥĨ":49312,"VALUE":49313,"Ġ@@":49314,"Ġuint":49315,"${":49316,"cpp":49317,"%%":49318,"Ġ(âĪĴ":49319,"utils":49320,"prefix":49321,"å°Ĩ":49322,"ãĥŃ":49323,"Completed":49324,"Ġgoto":49325,"ãĤ¯":49326,"Winged":49327,"perty":49328,"[\"":49329,"ãĥİ":49330,"ĠScythe":49331,"Ġæľ":49332,"Ġ!=":49333,"Buffer":49334,"docker":49335,"ĠWATCHED":49336,"èĢħ":49337,"())":49338,"Ġdst":49339,"SIZE":49340,"ĠDemonic":49341,"Ġresil":49342,"ãĤ¿":49343,"Ġpione":49344,"cpu":49345,"++)":49346,"TEXT":49347,"Ġdiscrep":49348,"debian":49349,"quished":49350,"Ġacknow":49351,"Ġtrave":49352,"Ġgcc":49353,"Catalog":49354,"ctrl":49355,"ĠMoroc":49356,"Ġcpu":49357,"Ġ];":49358,"ĠSorceress":49359,"Introduced":49360,"Frames":49361,"Ġcondem":49362,"¶æ":49363,"~~~~~~~~":49364,"ĠEmacs":49365,"][/":49366,"Ġglim":49367,"Init":49368,"ĠPrimordial":49369,"ãĥĥ":49370,"Ġ+=":49371,"Ġblat":49372,"à¼":49373,"------------------------------------------------":49374,"gpu":49375,"ãĥĥãĥĪ":49376,"Ġxml":49377,"Ġboolean":49378,"References":49379,"Ġ?)":49380,"Ġsatell":49381,"Queue":49382,"Ġpestic":49383,"Ġ}}":49384,"Attribute":49385,"Ġdx":49386,"ĠDefin":49387,"Synopsis":49388,"..................":49389,"ãĥ¬":49390,"plugin":49391,"Disable":49392,"0000000000000000":49393,")\\":49394,"ĠIchigo":49395,"println":49396,"rontal":49397,"Setup":49398,"Ġ��������":49399,"å§":49400,"âĸº":49401,"ĠPengu":49402,"ailability":49403,"Duration":49404,"Timeout":49405,"ãĢĮ":49406,"Ġbehav":49407,"Reviewed":49408,"Ġtoget":49409,"\\.":49410,"lished":49411,"Ġthous":49412,"Ġperpend":49413,"ecause":49414,"Layout":49415,"è»":49416,"ĠDexterity":49417,"unsigned":49418,"+=":49419,"[[":49420,"ĠRunes":49421,"ãĤ¦":49422,"};":49423,"})":49424,"FTWARE":49425,"ength":49426,"milo":49427,"duino":49428,"天":49429,"ĠClojure":49430,"ļé":49431,"ãĥ¥":49432,"gradient":49433,"Ġ\"\"\"":49434,"âĨij":49435,"@#":49436,"JSON":49437,"Ġproport":49438,"addr":49439,"});":49440,"ãĥIJ":49441,"ä¸ī":49442,"Ġtmp":49443,"å£":49444,"../":49445,"zsche":49446,"Ġâμ":49447,"Entity":49448,"æ©Ł":49449,"ĠâĶľâĶĢâĶĢ":49450,"filename":49451,"{{":49452,"@@":49453,"ĠSeym":49454,"Ġ/**":49455,"ĠSummoner":49456,"Quantity":49457,"ç·":49458,"Attach":49459,"Ġbool":49460,"Texture":49461,"Ġopio":49462,".}":49463,"ãĥĭ":49464,"integer":49465,"Ġregex":49466,"Ġnomine":49467,"ription":49468,"ãģ®ç":49469,"ãĥķ":49470,"Ġsubparagraph":49471,"GGGG":49472,"Ġexplan":49473,"Header":49474,"Spawn":49475,"toggle":49476,"²¾":49477,"Abyss":49478,"expr":49479,"ĠZerg":49480,"ĠGrimoire":49481,"Contents":49482,"Instance":49483,"cyclopedia":49484,"ãĥĹ":49485,"ĠTakeru":49486,"=(":49487,"代":49488,"\\)":49489,"Ġrgb":49490,"htt":49491,"bryce":49492,"Ġlivest":49493,"ĠAnnotations":49494,"âĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢâĶĢ":49495,"berus":49496,"ntil":49497,"Ġskelet":49498,"callback":49499,"åħī":49500,"Joined":49501,"ãĤª":49502,"Ġargs":49503,"artifacts":49504,"Ġå¤":49505,"ÃĽ":49506,"ãĥŀ":49507,"Streamer":49508,"}\"":49509,"Ġunden":49510,"ãĥģ":49511,"Īè":49512,"ãĥ£":49513,"Ġ0004":49514,"Ġ\\'":49515,"ãĤ°":49516,"ĠCONFIG":49517,"Ġ#####":49518,"``":49519,"anguage":49520,"Ġ*)":49521,"Template":49522,"MODE":49523,"Ġ00000000":49524,"'';":49525,">":49625,"Ġlvl":49626,"Footnote":49627,"Iter":49628,"####":49629,"ãĥij":49630,"ĠCarbuncle":49631,"Ġ[+]":49632,"Ġmathemat":49633,"Allows":49634,"Ġ4090":49635,"Async":49636,"ģ«":49637,"Ͻ":49638,"))))":49639,"á½":49640,"Ġcx":49641,"Ġansw":49642,"{\"":49643,"ãĥŁ":49644,"addons":49645,"Filename":49646,"Appearances":49647,"ĠãĢĮ":49648,"Ġaddr":49649,"Ġcharact":49650,"glomer":49651,"Advertisements":49652,"Ġdracon":49653,"ĠFenrir":49654,"Ġ();":49655,"ĠCitiz":49656,"acebook":49657,"Ġparams":49658,"]=":49659,"Ġsubscript":49660,"Ġentreprene":49661,"tnc":49662,"iversal":49663,"Ġmillenn":49664,"ithub":49665,"/>":49666,"Ġ\"{":49667,"Frameworks":49668,"avorite":49669,"Ġ])":49670,"Constructed":49671,"fml":49672,"ãĥį":49673,"################################":49674,"-|":49675,"¥ŀ":49676,"Ġwithd":49677,"ĠCth":49678,"AppData":49679,"Msg":49680,":{":49681,"ãĤ¨":49682,"Ġtuple":49683,"ç¥ŀ":49684,"Ġintrins":49685,"ĠCooldown":49686,"ategory":49687,"^{":49688,"ãĥĬ":49689,"''''":49690,"çͰ":49691,"ĠDEBUG":49692,"Ġcannabin":49693,"ocobo":49694,"Invalid":49695,"ãĥĢ":49696,"Compat":49697,"Ġ({":49698,"Removed":49699,"Ġconvol":49700,"}:":49701,"interstitial":49702,"Ġ\"":49721,"initialized":49722,"Ġexting":49723,"Poké":49724,"Parameters":49725,"¶ħ":49726,"########":49727,"NULL":49728,"ãĥĩ":49729,"groupon":49730,"\\-":49731,"ãĥı":49732,"ãĤ±":49733,"Ġsubsequ":49734,"ccording":49735,"ĠMODULE":49736,"ĠProtoss":49737,"\"},{\"":49738,"Ġ..............":49739,"Integer":49740,"endif":49741,"ãĥĻ":49742,"parser":49743,"lambda":49744,"Ġcarbohyd":49745,"ĠUnloaded":49746,"_{":49747,"âĸ¬âĸ¬":49748,"Ġdebian":49749,"]}":49750,"ãĤ¶":49751,"Parameter":49752,"ãĤ£":49753,"ãĤ»":49754,"Ġ$_":49755,"İĭ":49756,"Ġiterator":49757,"ãĤ¬":49758,"WINDOWS":49759,"CONCLUS":49760,"Ġ\"\\":49761,"umbn":49762,"(&":49763,"ãĥ©ãĥ³":49764,"usercontent":49765,"ometimes":49766,"METHOD":49767,"ãĥ¢":49768,"potion":49769,"ãĥ¯":49770,"everal":49771,"Ġweap":49772,"minecraft":49773,"================================":49774,"printf":49775,"ĠShinra":49776,"Ġreluct":49777,"\\\",":49778,"Runtime":49779,"xff":49780,"ĠAbyssal":49781,"akeru":49782,"Ġ\\(\\":49783,"\"/>":49784,"efficients":49785,"Ü":49786,"avascript":49787,"Ġbehavi":49788,"++;":49789,"=#":49790,"Attributes":49791,"âĵĺ":49792,"lvl":49793,"¬¼":49794,"/**":49795,"Gameplay":49796,"ĠLeilan":49797,">)":49798,"=\"/":49799,"Ġ));":49800,"ãĥĨãĤ£":49801,"ġ":49802,".":49836,"DEBUG":49837,"âĶģ":49838,"ãĢı":49839,"WithNo":49840,"Redditor":49841,"ĠâĶľ":49842,"Ġfmt":49843,"ãĢİ":49844,"Ġmsec":49845,"ĪĴ":49846,"eatures":49847,"itially":49848,"\"\"\"":49849,"ãĥ¼ãĤ¯":49850,"Textures":49851,"\"},":49852,"\"><":49858,"||||":49859,"ß":49860,"iterator":49861,"è£ħ":49862,"Ĥª":49863,"ojure":49864,"ãħĭãħĭ":49865,"ãĥ¼ãĥ³":49866,"Ġprintln":49867,"Ġ][":49868,"âĸĪâĸĪ":49869,"âķIJ":49870,"\\\":":49871,"senal":49872,"é¾į":49873,"é¾":49874,"Ġcryst":49875,"ãĥķãĤ¡":49876,"ĠCosponsors":49877,"ãĤ·ãĥ£":49878,"Magikarp":49879,"ĠMagicka":49880,"âĸĪâĸĪâĸĪâĸĪ":49881,",,,,,,,,":49882,"vertisement":49883,"âĶĢâĶĢâĶĢâĶĢ":49884,"ãĥķãĤ©":49885,"luaj":49886,"CLASSIFIED":49887,".''.":49888,"byss":49889,"Ġ{:":49890,"ĠNanto":49891,"Ġptr":49892,"Ġ%%":49893,"Ġteasp":49894,"[_":49895,"ãĥ¤":49896,"ħĭ":49897,"ŃĶ":49898,"Ġpci":49899,"Ġ\"<":49900,"GGGGGGGG":49901,"æĪ¦":49902,"--+":49903,"ãĤ®":49904,"Ġ())":49905,"âĸ¬":49906,"Ġsizeof":49907,"}}}":49908,";;;;;;;;":49909,">]":49910,"âĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪâĸĪ":49911,"Vaults":49912,"Ġistg":49913,"Ġnewcom":49914,"=]":49915,"¿½":49916,"ĵĺ":49917,"{\\":49918,"Args":49919,"Ġexha":49920,"(\\":49921,"Ġunnecess":49922,"\"}],\"":49923,"ĠUNCLASSIFIED":49924,">(":49925,"ãĤ¢ãĥ«":49926,"æ©":49927,"70710":49928,"Ń·":49929,"ãĥ¼ãĥĨãĤ£":49930,"ĠSakuya":49931,"ãĥĥãĥī":49932,"ĠPyrrha":49933,"escription":49934,"VIDIA":49935,"================================================================":49936,"Ġlooph":49937,"=~":49938,"Ġcumbers":49939,"Ġ)]":49940,"govtrack":49941,"ĠãĤµ":49942,"Ġsubur":49943,"Þ":49944,"Ġâī¡":49945,"Interstitial":49946,"ãĥ¼ãĥĨ":49947,"Ġgobl":49948,"ãĥīãĥ©":49949,"oldown":49950,"ģĸ":49951,"Depths":49952,"Ġ());":49953,"Ġ._":49954,"20439":49955,"Ġç¥ŀ":49956,"ãģ®å®":49957,"ãĤ¼":49958,"Ġ$\\":49959,"âĹ¼":49960,"Ġencount":49961,"Ġ